diff --git "a/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" "b/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" --- "a/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" +++ "b/wandb/run-20220323_165914-1vl16ira/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0753, "train/learning_rate": 4.057803468208092e-05, "train/epoch": 4.48, "train/global_step": 2000, "_runtime": 24113, "_timestamp": 1648078867, "_step": 2003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 3.0, 5.0, 8.0, 9.0, 12.0, 17.0, 26.0, 26.0, 27.0, 32.0, 39.0, 49.0, 63.0, 61.0, 74.0, 81.0, 73.0, 68.0, 64.0, 53.0, 39.0, 38.0, 31.0, 21.0, 20.0, 16.0, 13.0, 8.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6806318163871765, -0.6569727063179016, -0.6333135962486267, -0.6096544861793518, -0.5859953761100769, -0.562336266040802, -0.5386772155761719, -0.515018105506897, -0.4913589656352997, -0.4676998555660248, -0.4440407454967499, -0.42038166522979736, -0.39672255516052246, -0.37306344509124756, -0.34940433502197266, -0.32574522495269775, -0.30208611488342285, -0.27842700481414795, -0.25476789474487305, -0.23110879957675934, -0.20744968950748444, -0.18379057943820953, -0.16013148427009583, -0.13647237420082092, -0.11281326413154602, -0.08915415406227112, -0.06549505144357681, -0.04183594882488251, -0.018176838755607605, 0.005482271313667297, 0.029141366481781006, 0.05280047655105591, 0.07645964622497559, 0.10011875629425049, 0.1237778589129448, 0.1474369615316391, 0.171096071600914, 0.1947551816701889, 0.2184142768383026, 0.24207338690757751, 0.2657324969768524, 0.2893916070461273, 0.3130507171154022, 0.33670979738235474, 0.36036890745162964, 0.38402801752090454, 0.40768712759017944, 0.43134623765945435, 0.45500534772872925, 0.47866445779800415, 0.502323567867279, 0.525982677936554, 0.5496417880058289, 0.5733008980751038, 0.5969599485397339, 0.6206190586090088, 0.6442781686782837, 0.6679372787475586, 0.6915963888168335, 0.7152554988861084, 0.7389146089553833, 0.7625737190246582, 0.7862328290939331, 0.809891939163208, 0.8335510492324829]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 9.0, 3.0, 2.0, 9.0, 12.0, 14.0, 14.0, 9.0, 18.0, 20.0, 25.0, 27.0, 32.0, 43.0, 35.0, 29.0, 40.0, 43.0, 43.0, 53.0, 36.0, 47.0, 55.0, 43.0, 38.0, 40.0, 40.0, 35.0, 29.0, 26.0, 26.0, 19.0, 16.0, 9.0, 12.0, 12.0, 9.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.9462643265724182, -0.9208422303199768, -0.8954201340675354, -0.869998037815094, -0.8445758819580078, -0.8191537857055664, -0.793731689453125, -0.7683095932006836, -0.7428874969482422, -0.7174654006958008, -0.6920433044433594, -0.666621208190918, -0.6411991119384766, -0.6157770156860352, -0.590354859828949, -0.5649327635765076, -0.5395106673240662, -0.5140885710716248, -0.48866647481918335, -0.46324434876441956, -0.43782225251197815, -0.41240015625953674, -0.38697803020477295, -0.36155593395233154, -0.33613383769989014, -0.31071174144744873, -0.2852896451950073, -0.25986751914024353, -0.23444542288780212, -0.20902332663536072, -0.18360121548175812, -0.15817910432815552, -0.1327570080757141, -0.10733490437269211, -0.0819128006696701, -0.0564906969666481, -0.0310685932636261, -0.005646497011184692, 0.019775614142417908, 0.04519772529602051, 0.07061982154846191, 0.09604192525148392, 0.12146402895450592, 0.14688614010810852, 0.17230823636054993, 0.19773033261299133, 0.22315244376659393, 0.24857455492019653, 0.27399665117263794, 0.29941874742507935, 0.32484084367752075, 0.35026296973228455, 0.37568506598472595, 0.40110716223716736, 0.42652928829193115, 0.45195138454437256, 0.47737348079681396, 0.5027955770492554, 0.5282176733016968, 0.5536397695541382, 0.5790618658065796, 0.604483962059021, 0.6299061179161072, 0.6553282141685486, 0.68075031042099]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 7.0, 6.0, 19.0, 23.0, 33.0, 33.0, 68.0, 90.0, 135.0, 189.0, 318.0, 411.0, 668.0, 1049.0, 1595.0, 2768.0, 4825.0, 8997.0, 18311.0, 47448.0, 159914.0, 656301.0, 1878380.0, 1022497.0, 264309.0, 74301.0, 25533.0, 11584.0, 5859.0, 3321.0, 1924.0, 1188.0, 774.0, 445.0, 289.0, 195.0, 147.0, 102.0, 76.0, 39.0, 30.0, 25.0, 24.0, 8.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3505859375, -1.306549072265625, -1.26251220703125, -1.218475341796875, -1.1744384765625, -1.130401611328125, -1.08636474609375, -1.042327880859375, -0.998291015625, -0.954254150390625, -0.91021728515625, -0.866180419921875, -0.8221435546875, -0.778106689453125, -0.73406982421875, -0.690032958984375, -0.64599609375, -0.601959228515625, -0.55792236328125, -0.513885498046875, -0.4698486328125, -0.425811767578125, -0.38177490234375, -0.337738037109375, -0.293701171875, -0.249664306640625, -0.20562744140625, -0.161590576171875, -0.1175537109375, -0.073516845703125, -0.02947998046875, 0.014556884765625, 0.05859375, 0.102630615234375, 0.14666748046875, 0.190704345703125, 0.2347412109375, 0.278778076171875, 0.32281494140625, 0.366851806640625, 0.410888671875, 0.454925537109375, 0.49896240234375, 0.542999267578125, 0.5870361328125, 0.631072998046875, 0.67510986328125, 0.719146728515625, 0.76318359375, 0.807220458984375, 0.85125732421875, 0.895294189453125, 0.9393310546875, 0.983367919921875, 1.02740478515625, 1.071441650390625, 1.115478515625, 1.159515380859375, 1.20355224609375, 1.247589111328125, 1.2916259765625, 1.335662841796875, 1.37969970703125, 1.423736572265625, 1.4677734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 5.0, 5.0, 12.0, 9.0, 12.0, 13.0, 17.0, 20.0, 19.0, 19.0, 25.0, 32.0, 38.0, 27.0, 34.0, 35.0, 43.0, 40.0, 37.0, 39.0, 44.0, 59.0, 40.0, 31.0, 33.0, 35.0, 37.0, 34.0, 29.0, 27.0, 23.0, 20.0, 22.0, 16.0, 7.0, 14.0, 8.0, 9.0, 4.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1624908447265625, -1.124786376953125, -1.0870819091796875, -1.04937744140625, -1.0116729736328125, -0.973968505859375, -0.9362640380859375, -0.8985595703125, -0.8608551025390625, -0.823150634765625, -0.7854461669921875, -0.74774169921875, -0.7100372314453125, -0.672332763671875, -0.6346282958984375, -0.596923828125, -0.5592193603515625, -0.521514892578125, -0.4838104248046875, -0.44610595703125, -0.4084014892578125, -0.370697021484375, -0.3329925537109375, -0.2952880859375, -0.2575836181640625, -0.219879150390625, -0.1821746826171875, -0.14447021484375, -0.1067657470703125, -0.069061279296875, -0.0313568115234375, 0.00634765625, 0.0440521240234375, 0.081756591796875, 0.1194610595703125, 0.15716552734375, 0.1948699951171875, 0.232574462890625, 0.2702789306640625, 0.3079833984375, 0.3456878662109375, 0.383392333984375, 0.4210968017578125, 0.45880126953125, 0.4965057373046875, 0.534210205078125, 0.5719146728515625, 0.609619140625, 0.6473236083984375, 0.685028076171875, 0.7227325439453125, 0.76043701171875, 0.7981414794921875, 0.835845947265625, 0.8735504150390625, 0.9112548828125, 0.9489593505859375, 0.986663818359375, 1.0243682861328125, 1.06207275390625, 1.0997772216796875, 1.137481689453125, 1.1751861572265625, 1.212890625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 19.0, 41.0, 189.0, 2834.0, 4190048.0, 950.0, 110.0, 39.0, 15.0, 11.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.875, -34.7666015625, -33.658203125, -32.5498046875, -31.44140625, -30.3330078125, -29.224609375, -28.1162109375, -27.0078125, -25.8994140625, -24.791015625, -23.6826171875, -22.57421875, -21.4658203125, -20.357421875, -19.2490234375, -18.140625, -17.0322265625, -15.923828125, -14.8154296875, -13.70703125, -12.5986328125, -11.490234375, -10.3818359375, -9.2734375, -8.1650390625, -7.056640625, -5.9482421875, -4.83984375, -3.7314453125, -2.623046875, -1.5146484375, -0.40625, 0.7021484375, 1.810546875, 2.9189453125, 4.02734375, 5.1357421875, 6.244140625, 7.3525390625, 8.4609375, 9.5693359375, 10.677734375, 11.7861328125, 12.89453125, 14.0029296875, 15.111328125, 16.2197265625, 17.328125, 18.4365234375, 19.544921875, 20.6533203125, 21.76171875, 22.8701171875, 23.978515625, 25.0869140625, 26.1953125, 27.3037109375, 28.412109375, 29.5205078125, 30.62890625, 31.7373046875, 32.845703125, 33.9541015625, 35.0625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 17.0, 23.0, 46.0, 127.0, 181.0, 482.0, 1236.0, 1133.0, 410.0, 197.0, 105.0, 51.0, 19.0, 18.0, 12.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.0605316162109375, -1.027313232421875, -0.9940948486328125, -0.96087646484375, -0.9276580810546875, -0.894439697265625, -0.8612213134765625, -0.8280029296875, -0.7947845458984375, -0.761566162109375, -0.7283477783203125, -0.69512939453125, -0.6619110107421875, -0.628692626953125, -0.5954742431640625, -0.562255859375, -0.5290374755859375, -0.495819091796875, -0.4626007080078125, -0.42938232421875, -0.3961639404296875, -0.362945556640625, -0.3297271728515625, -0.2965087890625, -0.2632904052734375, -0.230072021484375, -0.1968536376953125, -0.16363525390625, -0.1304168701171875, -0.097198486328125, -0.0639801025390625, -0.03076171875, 0.0024566650390625, 0.035675048828125, 0.0688934326171875, 0.10211181640625, 0.1353302001953125, 0.168548583984375, 0.2017669677734375, 0.2349853515625, 0.2682037353515625, 0.301422119140625, 0.3346405029296875, 0.36785888671875, 0.4010772705078125, 0.434295654296875, 0.4675140380859375, 0.500732421875, 0.5339508056640625, 0.567169189453125, 0.6003875732421875, 0.63360595703125, 0.6668243408203125, 0.700042724609375, 0.7332611083984375, 0.7664794921875, 0.7996978759765625, 0.832916259765625, 0.8661346435546875, 0.89935302734375, 0.9325714111328125, 0.965789794921875, 0.9990081787109375, 1.0322265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 9.0, 13.0, 8.0, 12.0, 19.0, 15.0, 19.0, 18.0, 32.0, 36.0, 37.0, 44.0, 49.0, 55.0, 68.0, 50.0, 48.0, 49.0, 53.0, 58.0, 39.0, 45.0, 42.0, 27.0, 31.0, 19.0, 21.0, 10.0, 11.0, 4.0, 11.0, 4.0, 4.0, 6.0, 7.0, 4.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3254849910736084, -1.283860206604004, -1.242235541343689, -1.2006107568740845, -1.15898597240448, -1.117361307144165, -1.0757365226745605, -1.034111738204956, -0.9924870133399963, -0.9508622884750366, -0.9092375040054321, -0.8676127791404724, -0.8259880542755127, -0.7843632698059082, -0.7427385449409485, -0.7011138200759888, -0.6594890356063843, -0.6178643107414246, -0.5762395262718201, -0.5346148014068604, -0.49299004673957825, -0.45136529207229614, -0.4097405672073364, -0.3681158125400543, -0.3264910578727722, -0.2848663032054901, -0.2432415634393692, -0.2016168236732483, -0.1599920690059662, -0.11836731433868408, -0.07674257457256317, -0.03511783480644226, 0.006506800651550293, 0.0481315478682518, 0.08975629508495331, 0.13138103485107422, 0.17300578951835632, 0.21463054418563843, 0.25625526905059814, 0.29788002371788025, 0.33950477838516235, 0.38112953305244446, 0.42275428771972656, 0.4643790125846863, 0.506003737449646, 0.5476285219192505, 0.5892532467842102, 0.6308779716491699, 0.6725027561187744, 0.7141274809837341, 0.7557522654533386, 0.7973769903182983, 0.8390017747879028, 0.8806264996528625, 0.9222512245178223, 0.9638760089874268, 1.0055007934570312, 1.0471255779266357, 1.0887502431869507, 1.1303750276565552, 1.1719998121261597, 1.2136244773864746, 1.255249261856079, 1.2968740463256836, 1.3384987115859985]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 7.0, 7.0, 5.0, 5.0, 11.0, 10.0, 5.0, 12.0, 10.0, 11.0, 14.0, 22.0, 23.0, 35.0, 24.0, 18.0, 39.0, 30.0, 34.0, 31.0, 32.0, 47.0, 37.0, 42.0, 35.0, 41.0, 48.0, 44.0, 33.0, 42.0, 29.0, 36.0, 25.0, 29.0, 16.0, 18.0, 11.0, 16.0, 15.0, 21.0, 6.0, 9.0, 8.0, 6.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.209162712097168, -1.1751840114593506, -1.1412054300308228, -1.1072267293930054, -1.073248028755188, -1.0392694473266602, -1.0052907466888428, -0.9713120460510254, -0.9373334050178528, -0.9033547639846802, -0.8693760633468628, -0.8353974223136902, -0.8014187812805176, -0.7674400806427002, -0.7334614396095276, -0.699482798576355, -0.6655040979385376, -0.631525456905365, -0.5975467562675476, -0.563568115234375, -0.5295894145965576, -0.495610773563385, -0.4616321325302124, -0.4276534616947174, -0.3936747908592224, -0.3596961200237274, -0.3257174491882324, -0.2917388081550598, -0.2577601373195648, -0.22378146648406982, -0.18980281054973602, -0.15582415461540222, -0.12184542417526245, -0.08786676079034805, -0.053888097405433655, -0.019909434020519257, 0.014069229364395142, 0.04804790019989014, 0.08202655613422394, 0.11600521206855774, 0.14998388290405273, 0.18396255373954773, 0.21794120967388153, 0.25191986560821533, 0.2858985364437103, 0.3198772072792053, 0.35385584831237793, 0.3878345191478729, 0.4218131899833679, 0.4557918608188629, 0.4897705316543579, 0.5237491726875305, 0.5577278137207031, 0.5917065143585205, 0.6256851553916931, 0.6596637964248657, 0.6936424970626831, 0.7276211380958557, 0.7615998387336731, 0.7955784797668457, 0.8295571804046631, 0.8635358214378357, 0.8975144624710083, 0.9314931631088257, 0.9654718041419983]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 7.0, 13.0, 13.0, 15.0, 24.0, 21.0, 44.0, 67.0, 93.0, 156.0, 238.0, 350.0, 545.0, 888.0, 1422.0, 2259.0, 3576.0, 6160.0, 10237.0, 17788.0, 30648.0, 54289.0, 94808.0, 158275.0, 228825.0, 179594.0, 109455.0, 62385.0, 35589.0, 20551.0, 11862.0, 7085.0, 4161.0, 2647.0, 1652.0, 945.0, 670.0, 382.0, 261.0, 187.0, 113.0, 82.0, 60.0, 36.0, 33.0, 12.0, 14.0, 6.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.404541015625, -0.39133453369140625, -0.3781280517578125, -0.36492156982421875, -0.351715087890625, -0.33850860595703125, -0.3253021240234375, -0.31209564208984375, -0.29888916015625, -0.28568267822265625, -0.2724761962890625, -0.25926971435546875, -0.246063232421875, -0.23285675048828125, -0.2196502685546875, -0.20644378662109375, -0.1932373046875, -0.18003082275390625, -0.1668243408203125, -0.15361785888671875, -0.140411376953125, -0.12720489501953125, -0.1139984130859375, -0.10079193115234375, -0.08758544921875, -0.07437896728515625, -0.0611724853515625, -0.04796600341796875, -0.034759521484375, -0.02155303955078125, -0.0083465576171875, 0.00485992431640625, 0.01806640625, 0.03127288818359375, 0.0444793701171875, 0.05768585205078125, 0.070892333984375, 0.08409881591796875, 0.0973052978515625, 0.11051177978515625, 0.12371826171875, 0.13692474365234375, 0.1501312255859375, 0.16333770751953125, 0.176544189453125, 0.18975067138671875, 0.2029571533203125, 0.21616363525390625, 0.2293701171875, 0.24257659912109375, 0.2557830810546875, 0.26898956298828125, 0.282196044921875, 0.29540252685546875, 0.3086090087890625, 0.32181549072265625, 0.33502197265625, 0.34822845458984375, 0.3614349365234375, 0.37464141845703125, 0.387847900390625, 0.40105438232421875, 0.4142608642578125, 0.42746734619140625, 0.440673828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 11.0, 7.0, 14.0, 15.0, 14.0, 23.0, 14.0, 25.0, 27.0, 27.0, 31.0, 36.0, 36.0, 38.0, 48.0, 34.0, 41.0, 44.0, 34.0, 46.0, 41.0, 43.0, 45.0, 33.0, 48.0, 30.0, 24.0, 19.0, 21.0, 19.0, 12.0, 19.0, 15.0, 15.0, 14.0, 5.0, 3.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.88232421875, -0.8583984375, -0.83447265625, -0.810546875, -0.78662109375, -0.7626953125, -0.73876953125, -0.71484375, -0.69091796875, -0.6669921875, -0.64306640625, -0.619140625, -0.59521484375, -0.5712890625, -0.54736328125, -0.5234375, -0.49951171875, -0.4755859375, -0.45166015625, -0.427734375, -0.40380859375, -0.3798828125, -0.35595703125, -0.33203125, -0.30810546875, -0.2841796875, -0.26025390625, -0.236328125, -0.21240234375, -0.1884765625, -0.16455078125, -0.140625, -0.11669921875, -0.0927734375, -0.06884765625, -0.044921875, -0.02099609375, 0.0029296875, 0.02685546875, 0.05078125, 0.07470703125, 0.0986328125, 0.12255859375, 0.146484375, 0.17041015625, 0.1943359375, 0.21826171875, 0.2421875, 0.26611328125, 0.2900390625, 0.31396484375, 0.337890625, 0.36181640625, 0.3857421875, 0.40966796875, 0.43359375, 0.45751953125, 0.4814453125, 0.50537109375, 0.529296875, 0.55322265625, 0.5771484375, 0.60107421875, 0.625, 0.64892578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 4.0, 13.0, 20.0, 18.0, 35.0, 45.0, 69.0, 82.0, 166.0, 246.0, 464.0, 791.0, 1781.0, 4481.0, 12330.0, 39375.0, 142896.0, 435408.0, 292300.0, 81150.0, 23435.0, 7752.0, 2989.0, 1192.0, 600.0, 332.0, 194.0, 120.0, 81.0, 65.0, 36.0, 19.0, 21.0, 15.0, 5.0, 1.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.8197250366210938, -0.7947235107421875, -0.7697219848632812, -0.744720458984375, -0.7197189331054688, -0.6947174072265625, -0.6697158813476562, -0.64471435546875, -0.6197128295898438, -0.5947113037109375, -0.5697097778320312, -0.544708251953125, -0.5197067260742188, -0.4947052001953125, -0.46970367431640625, -0.4447021484375, -0.41970062255859375, -0.3946990966796875, -0.36969757080078125, -0.344696044921875, -0.31969451904296875, -0.2946929931640625, -0.26969146728515625, -0.24468994140625, -0.21968841552734375, -0.1946868896484375, -0.16968536376953125, -0.144683837890625, -0.11968231201171875, -0.0946807861328125, -0.06967926025390625, -0.044677734375, -0.01967620849609375, 0.0053253173828125, 0.03032684326171875, 0.055328369140625, 0.08032989501953125, 0.1053314208984375, 0.13033294677734375, 0.15533447265625, 0.18033599853515625, 0.2053375244140625, 0.23033905029296875, 0.255340576171875, 0.28034210205078125, 0.3053436279296875, 0.33034515380859375, 0.3553466796875, 0.38034820556640625, 0.4053497314453125, 0.43035125732421875, 0.455352783203125, 0.48035430908203125, 0.5053558349609375, 0.5303573608398438, 0.55535888671875, 0.5803604125976562, 0.6053619384765625, 0.6303634643554688, 0.655364990234375, 0.6803665161132812, 0.7053680419921875, 0.7303695678710938, 0.75537109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 7.0, 14.0, 16.0, 13.0, 17.0, 10.0, 17.0, 27.0, 30.0, 29.0, 33.0, 39.0, 43.0, 50.0, 43.0, 46.0, 50.0, 33.0, 49.0, 36.0, 48.0, 32.0, 31.0, 37.0, 31.0, 27.0, 27.0, 17.0, 21.0, 25.0, 17.0, 16.0, 8.0, 11.0, 9.0, 4.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0], "bins": [-1.84375, -1.7917327880859375, -1.739715576171875, -1.6876983642578125, -1.63568115234375, -1.5836639404296875, -1.531646728515625, -1.4796295166015625, -1.4276123046875, -1.3755950927734375, -1.323577880859375, -1.2715606689453125, -1.21954345703125, -1.1675262451171875, -1.115509033203125, -1.0634918212890625, -1.011474609375, -0.9594573974609375, -0.907440185546875, -0.8554229736328125, -0.80340576171875, -0.7513885498046875, -0.699371337890625, -0.6473541259765625, -0.5953369140625, -0.5433197021484375, -0.491302490234375, -0.4392852783203125, -0.38726806640625, -0.3352508544921875, -0.283233642578125, -0.2312164306640625, -0.17919921875, -0.1271820068359375, -0.075164794921875, -0.0231475830078125, 0.02886962890625, 0.0808868408203125, 0.132904052734375, 0.1849212646484375, 0.2369384765625, 0.2889556884765625, 0.340972900390625, 0.3929901123046875, 0.44500732421875, 0.4970245361328125, 0.549041748046875, 0.6010589599609375, 0.653076171875, 0.7050933837890625, 0.757110595703125, 0.8091278076171875, 0.86114501953125, 0.9131622314453125, 0.965179443359375, 1.0171966552734375, 1.0692138671875, 1.1212310791015625, 1.173248291015625, 1.2252655029296875, 1.27728271484375, 1.3292999267578125, 1.381317138671875, 1.4333343505859375, 1.4853515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 13.0, 19.0, 25.0, 18.0, 32.0, 38.0, 73.0, 110.0, 147.0, 265.0, 367.0, 623.0, 1117.0, 1873.0, 3477.0, 7072.0, 16281.0, 44465.0, 164571.0, 513273.0, 205531.0, 53478.0, 18707.0, 7896.0, 3772.0, 2111.0, 1148.0, 742.0, 465.0, 291.0, 145.0, 114.0, 78.0, 63.0, 32.0, 34.0, 17.0, 17.0, 15.0, 6.0, 4.0, 4.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2132568359375, -0.20690536499023438, -0.20055389404296875, -0.19420242309570312, -0.1878509521484375, -0.18149948120117188, -0.17514801025390625, -0.16879653930664062, -0.162445068359375, -0.15609359741210938, -0.14974212646484375, -0.14339065551757812, -0.1370391845703125, -0.13068771362304688, -0.12433624267578125, -0.11798477172851562, -0.11163330078125, -0.10528182983398438, -0.09893035888671875, -0.09257888793945312, -0.0862274169921875, -0.07987594604492188, -0.07352447509765625, -0.06717300415039062, -0.060821533203125, -0.054470062255859375, -0.04811859130859375, -0.041767120361328125, -0.0354156494140625, -0.029064178466796875, -0.02271270751953125, -0.016361236572265625, -0.010009765625, -0.003658294677734375, 0.00269317626953125, 0.009044647216796875, 0.0153961181640625, 0.021747589111328125, 0.02809906005859375, 0.034450531005859375, 0.040802001953125, 0.047153472900390625, 0.05350494384765625, 0.059856414794921875, 0.0662078857421875, 0.07255935668945312, 0.07891082763671875, 0.08526229858398438, 0.09161376953125, 0.09796524047851562, 0.10431671142578125, 0.11066818237304688, 0.1170196533203125, 0.12337112426757812, 0.12972259521484375, 0.13607406616210938, 0.142425537109375, 0.14877700805664062, 0.15512847900390625, 0.16147994995117188, 0.1678314208984375, 0.17418289184570312, 0.18053436279296875, 0.18688583374023438, 0.1932373046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 9.0, 14.0, 14.0, 24.0, 27.0, 47.0, 73.0, 102.0, 175.0, 174.0, 95.0, 62.0, 43.0, 34.0, 16.0, 24.0, 12.0, 10.0, 12.0, 8.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001838207244873047, -0.00017746537923812866, -0.00017111003398895264, -0.0001647546887397766, -0.00015839934349060059, -0.00015204399824142456, -0.00014568865299224854, -0.0001393333077430725, -0.00013297796249389648, -0.00012662261724472046, -0.00012026727199554443, -0.00011391192674636841, -0.00010755658149719238, -0.00010120123624801636, -9.484589099884033e-05, -8.84905457496643e-05, -8.213520050048828e-05, -7.577985525131226e-05, -6.942451000213623e-05, -6.30691647529602e-05, -5.671381950378418e-05, -5.0358474254608154e-05, -4.400312900543213e-05, -3.7647783756256104e-05, -3.129243850708008e-05, -2.4937093257904053e-05, -1.8581748008728027e-05, -1.2226402759552002e-05, -5.8710575103759766e-06, 4.842877388000488e-07, 6.839632987976074e-06, 1.31949782371521e-05, 1.9550323486328125e-05, 2.590566873550415e-05, 3.2261013984680176e-05, 3.86163592338562e-05, 4.4971704483032227e-05, 5.132704973220825e-05, 5.768239498138428e-05, 6.40377402305603e-05, 7.039308547973633e-05, 7.674843072891235e-05, 8.310377597808838e-05, 8.94591212272644e-05, 9.581446647644043e-05, 0.00010216981172561646, 0.00010852515697479248, 0.0001148805022239685, 0.00012123584747314453, 0.00012759119272232056, 0.00013394653797149658, 0.0001403018832206726, 0.00014665722846984863, 0.00015301257371902466, 0.00015936791896820068, 0.0001657232642173767, 0.00017207860946655273, 0.00017843395471572876, 0.00018478929996490479, 0.0001911446452140808, 0.00019749999046325684, 0.00020385533571243286, 0.0002102106809616089, 0.0002165660262107849, 0.00022292137145996094]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 3.0, 6.0, 8.0, 15.0, 13.0, 21.0, 26.0, 29.0, 62.0, 78.0, 144.0, 301.0, 767.0, 2810.0, 13503.0, 109328.0, 741837.0, 156812.0, 17641.0, 3492.0, 908.0, 328.0, 138.0, 83.0, 52.0, 29.0, 31.0, 20.0, 14.0, 8.0, 12.0, 9.0, 3.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3484458923339844, -0.33580780029296875, -0.3231697082519531, -0.3105316162109375, -0.2978935241699219, -0.28525543212890625, -0.2726173400878906, -0.259979248046875, -0.24734115600585938, -0.23470306396484375, -0.22206497192382812, -0.2094268798828125, -0.19678878784179688, -0.18415069580078125, -0.17151260375976562, -0.15887451171875, -0.14623641967773438, -0.13359832763671875, -0.12096023559570312, -0.1083221435546875, -0.09568405151367188, -0.08304595947265625, -0.07040786743164062, -0.057769775390625, -0.045131683349609375, -0.03249359130859375, -0.019855499267578125, -0.0072174072265625, 0.005420684814453125, 0.01805877685546875, 0.030696868896484375, 0.0433349609375, 0.055973052978515625, 0.06861114501953125, 0.08124923706054688, 0.0938873291015625, 0.10652542114257812, 0.11916351318359375, 0.13180160522460938, 0.144439697265625, 0.15707778930664062, 0.16971588134765625, 0.18235397338867188, 0.1949920654296875, 0.20763015747070312, 0.22026824951171875, 0.23290634155273438, 0.24554443359375, 0.2581825256347656, 0.27082061767578125, 0.2834587097167969, 0.2960968017578125, 0.3087348937988281, 0.32137298583984375, 0.3340110778808594, 0.346649169921875, 0.3592872619628906, 0.37192535400390625, 0.3845634460449219, 0.3972015380859375, 0.4098396301269531, 0.42247772216796875, 0.4351158142089844, 0.44775390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 10.0, 13.0, 9.0, 13.0, 23.0, 18.0, 39.0, 42.0, 47.0, 61.0, 72.0, 79.0, 75.0, 76.0, 77.0, 53.0, 47.0, 37.0, 31.0, 35.0, 24.0, 20.0, 18.0, 9.0, 11.0, 7.0, 4.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0555419921875, -0.05356311798095703, -0.05158424377441406, -0.049605369567871094, -0.047626495361328125, -0.045647621154785156, -0.04366874694824219, -0.04168987274169922, -0.03971099853515625, -0.03773212432861328, -0.03575325012207031, -0.033774375915527344, -0.031795501708984375, -0.029816627502441406, -0.027837753295898438, -0.02585887908935547, -0.0238800048828125, -0.02190113067626953, -0.019922256469726562, -0.017943382263183594, -0.015964508056640625, -0.013985633850097656, -0.012006759643554688, -0.010027885437011719, -0.00804901123046875, -0.006070137023925781, -0.0040912628173828125, -0.0021123886108398438, -0.000133514404296875, 0.0018453598022460938, 0.0038242340087890625, 0.005803108215332031, 0.007781982421875, 0.009760856628417969, 0.011739730834960938, 0.013718605041503906, 0.015697479248046875, 0.017676353454589844, 0.019655227661132812, 0.02163410186767578, 0.02361297607421875, 0.02559185028076172, 0.027570724487304688, 0.029549598693847656, 0.031528472900390625, 0.033507347106933594, 0.03548622131347656, 0.03746509552001953, 0.0394439697265625, 0.04142284393310547, 0.04340171813964844, 0.045380592346191406, 0.047359466552734375, 0.049338340759277344, 0.05131721496582031, 0.05329608917236328, 0.05527496337890625, 0.05725383758544922, 0.05923271179199219, 0.061211585998535156, 0.06319046020507812, 0.0651693344116211, 0.06714820861816406, 0.06912708282470703, 0.07110595703125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 4.0, 5.0, 15.0, 8.0, 12.0, 16.0, 21.0, 27.0, 33.0, 51.0, 61.0, 63.0, 78.0, 81.0, 75.0, 69.0, 76.0, 57.0, 39.0, 44.0, 30.0, 37.0, 28.0, 13.0, 18.0, 5.0, 11.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2740452289581299, -1.2388832569122314, -1.203721284866333, -1.1685593128204346, -1.1333973407745361, -1.0982353687286377, -1.0630733966827393, -1.0279114246368408, -0.9927495121955872, -0.9575875401496887, -0.9224255681037903, -0.8872635960578918, -0.8521016836166382, -0.8169397115707397, -0.7817777395248413, -0.7466157674789429, -0.7114537954330444, -0.676291823387146, -0.6411298513412476, -0.6059678792953491, -0.5708059072494507, -0.5356439352035522, -0.5004820227622986, -0.46532005071640015, -0.4301580786705017, -0.39499610662460327, -0.35983413457870483, -0.3246721923351288, -0.28951022028923035, -0.2543482482433319, -0.21918629109859467, -0.18402433395385742, -0.14886236190795898, -0.11370039731264114, -0.0785384327173233, -0.04337646812200546, -0.008214503526687622, 0.026947468519210815, 0.06210942566394806, 0.0972713828086853, 0.13243335485458374, 0.16759532690048218, 0.20275728404521942, 0.23791924118995667, 0.2730812132358551, 0.30824318528175354, 0.3434051275253296, 0.378567099571228, 0.41372907161712646, 0.4488910436630249, 0.48405301570892334, 0.5192149877548218, 0.5543769598007202, 0.5895389318466187, 0.6247008442878723, 0.6598628163337708, 0.6950247883796692, 0.7301867604255676, 0.7653487324714661, 0.8005107045173645, 0.8356726169586182, 0.8708345890045166, 0.905996561050415, 0.9411585330963135, 0.9763205051422119]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 11.0, 13.0, 11.0, 18.0, 18.0, 19.0, 26.0, 26.0, 34.0, 40.0, 31.0, 40.0, 35.0, 41.0, 38.0, 39.0, 44.0, 49.0, 43.0, 49.0, 44.0, 44.0, 37.0, 29.0, 28.0, 22.0, 27.0, 14.0, 17.0, 20.0, 14.0, 14.0, 18.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8446028828620911, -0.8207578659057617, -0.7969129085540771, -0.7730678915977478, -0.7492228746414185, -0.7253779172897339, -0.7015329003334045, -0.6776878833770752, -0.6538429260253906, -0.6299979090690613, -0.6061529517173767, -0.5823079347610474, -0.558462917804718, -0.5346179008483887, -0.5107729434967041, -0.48692792654037476, -0.4630829095840454, -0.43923792243003845, -0.4153929054737091, -0.39154791831970215, -0.3677029013633728, -0.34385791420936584, -0.3200129270553589, -0.29616791009902954, -0.2723229229450226, -0.24847792088985443, -0.22463291883468628, -0.20078793168067932, -0.17694292962551117, -0.15309792757034302, -0.12925294041633606, -0.10540793836116791, -0.08156293630599976, -0.0577179379761219, -0.03387293964624405, -0.010027945041656494, 0.013817057013511658, 0.03766205906867981, 0.06150704622268677, 0.08535204827785492, 0.10919705033302307, 0.13304205238819122, 0.15688705444335938, 0.18073204159736633, 0.20457704365253448, 0.22842204570770264, 0.2522670328617096, 0.27611202001571655, 0.2999570369720459, 0.32380202412605286, 0.3476470410823822, 0.37149202823638916, 0.3953370451927185, 0.41918203234672546, 0.4430270195007324, 0.46687203645706177, 0.4907170236110687, 0.5145620107650757, 0.538407027721405, 0.5622520446777344, 0.586097002029419, 0.6099420189857483, 0.6337870359420776, 0.6576319932937622, 0.6814770102500916]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 8.0, 8.0, 18.0, 20.0, 40.0, 41.0, 50.0, 104.0, 147.0, 204.0, 295.0, 380.0, 546.0, 745.0, 1115.0, 1485.0, 2154.0, 2983.0, 4195.0, 6205.0, 9548.0, 16116.0, 34261.0, 120949.0, 536578.0, 209205.0, 47216.0, 19877.0, 10922.0, 6865.0, 4661.0, 3372.0, 2365.0, 1731.0, 1150.0, 927.0, 610.0, 450.0, 315.0, 206.0, 150.0, 117.0, 65.0, 61.0, 24.0, 28.0, 18.0, 13.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.2937049865722656, -0.28345489501953125, -0.2732048034667969, -0.2629547119140625, -0.2527046203613281, -0.24245452880859375, -0.23220443725585938, -0.221954345703125, -0.21170425415039062, -0.20145416259765625, -0.19120407104492188, -0.1809539794921875, -0.17070388793945312, -0.16045379638671875, -0.15020370483398438, -0.13995361328125, -0.12970352172851562, -0.11945343017578125, -0.10920333862304688, -0.0989532470703125, -0.08870315551757812, -0.07845306396484375, -0.06820297241210938, -0.057952880859375, -0.047702789306640625, -0.03745269775390625, -0.027202606201171875, -0.0169525146484375, -0.006702423095703125, 0.00354766845703125, 0.013797760009765625, 0.0240478515625, 0.034297943115234375, 0.04454803466796875, 0.054798126220703125, 0.0650482177734375, 0.07529830932617188, 0.08554840087890625, 0.09579849243164062, 0.106048583984375, 0.11629867553710938, 0.12654876708984375, 0.13679885864257812, 0.1470489501953125, 0.15729904174804688, 0.16754913330078125, 0.17779922485351562, 0.18804931640625, 0.19829940795898438, 0.20854949951171875, 0.21879959106445312, 0.2290496826171875, 0.23929977416992188, 0.24954986572265625, 0.2597999572753906, 0.270050048828125, 0.2803001403808594, 0.29055023193359375, 0.3008003234863281, 0.3110504150390625, 0.3213005065917969, 0.33155059814453125, 0.3418006896972656, 0.35205078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 6.0, 11.0, 9.0, 12.0, 15.0, 18.0, 26.0, 19.0, 18.0, 23.0, 34.0, 31.0, 32.0, 55.0, 28.0, 42.0, 47.0, 47.0, 47.0, 47.0, 41.0, 33.0, 39.0, 35.0, 30.0, 31.0, 31.0, 27.0, 28.0, 15.0, 12.0, 10.0, 21.0, 14.0, 8.0, 10.0, 9.0, 9.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.30859375, -1.271240234375, -1.23388671875, -1.196533203125, -1.1591796875, -1.121826171875, -1.08447265625, -1.047119140625, -1.009765625, -0.972412109375, -0.93505859375, -0.897705078125, -0.8603515625, -0.822998046875, -0.78564453125, -0.748291015625, -0.7109375, -0.673583984375, -0.63623046875, -0.598876953125, -0.5615234375, -0.524169921875, -0.48681640625, -0.449462890625, -0.412109375, -0.374755859375, -0.33740234375, -0.300048828125, -0.2626953125, -0.225341796875, -0.18798828125, -0.150634765625, -0.11328125, -0.075927734375, -0.03857421875, -0.001220703125, 0.0361328125, 0.073486328125, 0.11083984375, 0.148193359375, 0.185546875, 0.222900390625, 0.26025390625, 0.297607421875, 0.3349609375, 0.372314453125, 0.40966796875, 0.447021484375, 0.484375, 0.521728515625, 0.55908203125, 0.596435546875, 0.6337890625, 0.671142578125, 0.70849609375, 0.745849609375, 0.783203125, 0.820556640625, 0.85791015625, 0.895263671875, 0.9326171875, 0.969970703125, 1.00732421875, 1.044677734375, 1.08203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 6.0, 5.0, 9.0, 23.0, 16.0, 22.0, 28.0, 43.0, 66.0, 110.0, 143.0, 271.0, 589.0, 1578.0, 5529.0, 25592.0, 626721.0, 358829.0, 21377.0, 4796.0, 1453.0, 581.0, 279.0, 161.0, 102.0, 60.0, 44.0, 37.0, 26.0, 18.0, 13.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.013671875, -0.9786529541015625, -0.943634033203125, -0.9086151123046875, -0.87359619140625, -0.8385772705078125, -0.803558349609375, -0.7685394287109375, -0.7335205078125, -0.6985015869140625, -0.663482666015625, -0.6284637451171875, -0.59344482421875, -0.5584259033203125, -0.523406982421875, -0.4883880615234375, -0.453369140625, -0.4183502197265625, -0.383331298828125, -0.3483123779296875, -0.31329345703125, -0.2782745361328125, -0.243255615234375, -0.2082366943359375, -0.1732177734375, -0.1381988525390625, -0.103179931640625, -0.0681610107421875, -0.03314208984375, 0.0018768310546875, 0.036895751953125, 0.0719146728515625, 0.10693359375, 0.1419525146484375, 0.176971435546875, 0.2119903564453125, 0.24700927734375, 0.2820281982421875, 0.317047119140625, 0.3520660400390625, 0.3870849609375, 0.4221038818359375, 0.457122802734375, 0.4921417236328125, 0.52716064453125, 0.5621795654296875, 0.597198486328125, 0.6322174072265625, 0.667236328125, 0.7022552490234375, 0.737274169921875, 0.7722930908203125, 0.80731201171875, 0.8423309326171875, 0.877349853515625, 0.9123687744140625, 0.9473876953125, 0.9824066162109375, 1.017425537109375, 1.0524444580078125, 1.08746337890625, 1.1224822998046875, 1.157501220703125, 1.1925201416015625, 1.2275390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 8.0, 7.0, 5.0, 5.0, 8.0, 7.0, 15.0, 21.0, 16.0, 20.0, 15.0, 17.0, 25.0, 22.0, 25.0, 36.0, 40.0, 40.0, 38.0, 41.0, 45.0, 51.0, 40.0, 39.0, 34.0, 38.0, 38.0, 29.0, 41.0, 33.0, 36.0, 19.0, 20.0, 18.0, 16.0, 16.0, 12.0, 7.0, 12.0, 9.0, 7.0, 5.0, 7.0, 1.0, 3.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.1328125, -1.0979156494140625, -1.063018798828125, -1.0281219482421875, -0.99322509765625, -0.9583282470703125, -0.923431396484375, -0.8885345458984375, -0.8536376953125, -0.8187408447265625, -0.783843994140625, -0.7489471435546875, -0.71405029296875, -0.6791534423828125, -0.644256591796875, -0.6093597412109375, -0.574462890625, -0.5395660400390625, -0.504669189453125, -0.4697723388671875, -0.43487548828125, -0.3999786376953125, -0.365081787109375, -0.3301849365234375, -0.2952880859375, -0.2603912353515625, -0.225494384765625, -0.1905975341796875, -0.15570068359375, -0.1208038330078125, -0.085906982421875, -0.0510101318359375, -0.01611328125, 0.0187835693359375, 0.053680419921875, 0.0885772705078125, 0.12347412109375, 0.1583709716796875, 0.193267822265625, 0.2281646728515625, 0.2630615234375, 0.2979583740234375, 0.332855224609375, 0.3677520751953125, 0.40264892578125, 0.4375457763671875, 0.472442626953125, 0.5073394775390625, 0.542236328125, 0.5771331787109375, 0.612030029296875, 0.6469268798828125, 0.68182373046875, 0.7167205810546875, 0.751617431640625, 0.7865142822265625, 0.8214111328125, 0.8563079833984375, 0.891204833984375, 0.9261016845703125, 0.96099853515625, 0.9958953857421875, 1.030792236328125, 1.0656890869140625, 1.1005859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 2.0, 10.0, 11.0, 12.0, 36.0, 44.0, 98.0, 152.0, 294.0, 631.0, 1404.0, 4629.0, 19788.0, 186056.0, 794697.0, 30803.0, 6422.0, 1935.0, 755.0, 341.0, 182.0, 85.0, 70.0, 35.0, 22.0, 11.0, 12.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360107421875, -0.3481559753417969, -0.33620452880859375, -0.3242530822753906, -0.3123016357421875, -0.3003501892089844, -0.28839874267578125, -0.2764472961425781, -0.264495849609375, -0.2525444030761719, -0.24059295654296875, -0.22864151000976562, -0.2166900634765625, -0.20473861694335938, -0.19278717041015625, -0.18083572387695312, -0.16888427734375, -0.15693283081054688, -0.14498138427734375, -0.13302993774414062, -0.1210784912109375, -0.10912704467773438, -0.09717559814453125, -0.08522415161132812, -0.073272705078125, -0.061321258544921875, -0.04936981201171875, -0.037418365478515625, -0.0254669189453125, -0.013515472412109375, -0.00156402587890625, 0.010387420654296875, 0.0223388671875, 0.034290313720703125, 0.04624176025390625, 0.058193206787109375, 0.0701446533203125, 0.08209609985351562, 0.09404754638671875, 0.10599899291992188, 0.117950439453125, 0.12990188598632812, 0.14185333251953125, 0.15380477905273438, 0.1657562255859375, 0.17770767211914062, 0.18965911865234375, 0.20161056518554688, 0.21356201171875, 0.22551345825195312, 0.23746490478515625, 0.24941635131835938, 0.2613677978515625, 0.2733192443847656, 0.28527069091796875, 0.2972221374511719, 0.309173583984375, 0.3211250305175781, 0.33307647705078125, 0.3450279235839844, 0.3569793701171875, 0.3689308166503906, 0.38088226318359375, 0.3928337097167969, 0.40478515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 6.0, 9.0, 6.0, 10.0, 14.0, 14.0, 22.0, 39.0, 59.0, 258.0, 357.0, 80.0, 52.0, 22.0, 10.0, 15.0, 9.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.437301635742188e-05, -6.254110485315323e-05, -6.070919334888458e-05, -5.8877281844615936e-05, -5.704537034034729e-05, -5.5213458836078644e-05, -5.338154733181e-05, -5.154963582754135e-05, -4.9717724323272705e-05, -4.788581281900406e-05, -4.605390131473541e-05, -4.4221989810466766e-05, -4.239007830619812e-05, -4.0558166801929474e-05, -3.872625529766083e-05, -3.689434379339218e-05, -3.5062432289123535e-05, -3.323052078485489e-05, -3.139860928058624e-05, -2.9566697776317596e-05, -2.773478627204895e-05, -2.5902874767780304e-05, -2.4070963263511658e-05, -2.223905175924301e-05, -2.0407140254974365e-05, -1.857522875070572e-05, -1.6743317246437073e-05, -1.4911405742168427e-05, -1.307949423789978e-05, -1.1247582733631134e-05, -9.415671229362488e-06, -7.5837597250938416e-06, -5.751848220825195e-06, -3.919936716556549e-06, -2.088025212287903e-06, -2.561137080192566e-07, 1.5757977962493896e-06, 3.407709300518036e-06, 5.239620804786682e-06, 7.071532309055328e-06, 8.903443813323975e-06, 1.0735355317592621e-05, 1.2567266821861267e-05, 1.4399178326129913e-05, 1.623108983039856e-05, 1.8063001334667206e-05, 1.9894912838935852e-05, 2.1726824343204498e-05, 2.3558735847473145e-05, 2.539064735174179e-05, 2.7222558856010437e-05, 2.9054470360279083e-05, 3.088638186454773e-05, 3.2718293368816376e-05, 3.455020487308502e-05, 3.638211637735367e-05, 3.8214027881622314e-05, 4.004593938589096e-05, 4.187785089015961e-05, 4.370976239442825e-05, 4.55416738986969e-05, 4.7373585402965546e-05, 4.920549690723419e-05, 5.103740841150284e-05, 5.2869319915771484e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 8.0, 7.0, 9.0, 20.0, 40.0, 44.0, 80.0, 196.0, 415.0, 1037.0, 3046.0, 12712.0, 90977.0, 880083.0, 47984.0, 8201.0, 2219.0, 768.0, 329.0, 161.0, 72.0, 46.0, 31.0, 18.0, 18.0, 10.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.411865234375, -0.39987945556640625, -0.3878936767578125, -0.37590789794921875, -0.363922119140625, -0.35193634033203125, -0.3399505615234375, -0.32796478271484375, -0.31597900390625, -0.30399322509765625, -0.2920074462890625, -0.28002166748046875, -0.268035888671875, -0.25605010986328125, -0.2440643310546875, -0.23207855224609375, -0.2200927734375, -0.20810699462890625, -0.1961212158203125, -0.18413543701171875, -0.172149658203125, -0.16016387939453125, -0.1481781005859375, -0.13619232177734375, -0.12420654296875, -0.11222076416015625, -0.1002349853515625, -0.08824920654296875, -0.076263427734375, -0.06427764892578125, -0.0522918701171875, -0.04030609130859375, -0.0283203125, -0.01633453369140625, -0.0043487548828125, 0.00763702392578125, 0.019622802734375, 0.03160858154296875, 0.0435943603515625, 0.05558013916015625, 0.06756591796875, 0.07955169677734375, 0.0915374755859375, 0.10352325439453125, 0.115509033203125, 0.12749481201171875, 0.1394805908203125, 0.15146636962890625, 0.1634521484375, 0.17543792724609375, 0.1874237060546875, 0.19940948486328125, 0.211395263671875, 0.22338104248046875, 0.2353668212890625, 0.24735260009765625, 0.25933837890625, 0.27132415771484375, 0.2833099365234375, 0.29529571533203125, 0.307281494140625, 0.31926727294921875, 0.3312530517578125, 0.34323883056640625, 0.355224609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 10.0, 16.0, 15.0, 37.0, 38.0, 57.0, 85.0, 326.0, 158.0, 90.0, 40.0, 26.0, 20.0, 12.0, 10.0, 6.0, 5.0, 12.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08623600006103516, -0.08244514465332031, -0.07865428924560547, -0.07486343383789062, -0.07107257843017578, -0.06728172302246094, -0.0634908676147461, -0.05970001220703125, -0.055909156799316406, -0.05211830139160156, -0.04832744598388672, -0.044536590576171875, -0.04074573516845703, -0.03695487976074219, -0.033164024353027344, -0.0293731689453125, -0.025582313537597656, -0.021791458129882812, -0.01800060272216797, -0.014209747314453125, -0.010418891906738281, -0.0066280364990234375, -0.0028371810913085938, 0.00095367431640625, 0.004744529724121094, 0.008535385131835938, 0.012326240539550781, 0.016117095947265625, 0.01990795135498047, 0.023698806762695312, 0.027489662170410156, 0.031280517578125, 0.035071372985839844, 0.03886222839355469, 0.04265308380126953, 0.046443939208984375, 0.05023479461669922, 0.05402565002441406, 0.057816505432128906, 0.06160736083984375, 0.0653982162475586, 0.06918907165527344, 0.07297992706298828, 0.07677078247070312, 0.08056163787841797, 0.08435249328613281, 0.08814334869384766, 0.0919342041015625, 0.09572505950927734, 0.09951591491699219, 0.10330677032470703, 0.10709762573242188, 0.11088848114013672, 0.11467933654785156, 0.1184701919555664, 0.12226104736328125, 0.1260519027709961, 0.12984275817871094, 0.13363361358642578, 0.13742446899414062, 0.14121532440185547, 0.1450061798095703, 0.14879703521728516, 0.152587890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 7.0, 21.0, 91.0, 401.0, 397.0, 89.0, 12.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8507499694824219, -1.4779772758483887, -1.105204463005066, -0.7324316501617432, -0.35965895652770996, 0.013113737106323242, 0.38588666915893555, 0.7586593627929688, 1.131432056427002, 1.5042047500610352, 1.876977562904358, 2.2497503757476807, 2.622523069381714, 2.995295763015747, 3.3680686950683594, 3.7408413887023926, 4.113614082336426, 4.486386775970459, 4.859159469604492, 5.231932640075684, 5.604704856872559, 5.97747802734375, 6.350250720977783, 6.723023414611816, 7.09579610824585, 7.468568801879883, 7.841341495513916, 8.21411418914795, 8.58688735961914, 8.959659576416016, 9.332432746887207, 9.705205917358398, 10.077978134155273, 10.450751304626465, 10.82352352142334, 11.196296691894531, 11.569068908691406, 11.941842079162598, 12.314615249633789, 12.687387466430664, 13.060159683227539, 13.43293285369873, 13.805705070495605, 14.178478240966797, 14.551250457763672, 14.924023628234863, 15.296796798706055, 15.66956901550293, 16.042343139648438, 16.415115356445312, 16.78788948059082, 17.160661697387695, 17.53343391418457, 17.906206130981445, 18.278980255126953, 18.651752471923828, 19.024524688720703, 19.397296905517578, 19.770071029663086, 20.14284324645996, 20.515615463256836, 20.88838768005371, 21.26116180419922, 21.633934020996094, 22.00670623779297]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 3.0, 9.0, 12.0, 12.0, 8.0, 18.0, 24.0, 19.0, 19.0, 27.0, 33.0, 27.0, 48.0, 34.0, 45.0, 49.0, 49.0, 46.0, 45.0, 42.0, 44.0, 34.0, 43.0, 44.0, 30.0, 37.0, 30.0, 26.0, 24.0, 26.0, 16.0, 13.0, 18.0, 7.0, 6.0, 12.0, 10.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3942344188690186, -2.3292629718780518, -2.264291763305664, -2.1993203163146973, -2.1343488693237305, -2.0693774223327637, -2.004406213760376, -1.9394347667694092, -1.874463438987732, -1.8094921112060547, -1.744520664215088, -1.6795493364334106, -1.6145780086517334, -1.5496065616607666, -1.4846352338790894, -1.419663906097412, -1.3546924591064453, -1.289721131324768, -1.2247496843338013, -1.159778356552124, -1.0948069095611572, -1.02983558177948, -0.9648642539978027, -0.8998928666114807, -0.8349214792251587, -0.7699500918388367, -0.7049787044525146, -0.6400073766708374, -0.5750359892845154, -0.5100646018981934, -0.4450932443141937, -0.3801218867301941, -0.31515026092529297, -0.25017887353897095, -0.1852075159549713, -0.12023614346981049, -0.05526477098464966, 0.009706616401672363, 0.074677973985672, 0.13964933156967163, 0.20462071895599365, 0.2695921063423157, 0.3345634639263153, 0.39953482151031494, 0.46450620889663696, 0.529477596282959, 0.5944489240646362, 0.6594203114509583, 0.7243916988372803, 0.7893630862236023, 0.8543344736099243, 0.9193058013916016, 0.9842771887779236, 1.0492485761642456, 1.1142199039459229, 1.1791913509368896, 1.244162678718567, 1.3091340065002441, 1.374105453491211, 1.4390767812728882, 1.5040481090545654, 1.5690195560455322, 1.6339908838272095, 1.6989622116088867, 1.7639336585998535]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 8.0, 13.0, 17.0, 18.0, 31.0, 41.0, 73.0, 102.0, 167.0, 290.0, 561.0, 1054.0, 2115.0, 4792.0, 12035.0, 37833.0, 251598.0, 1975228.0, 1660895.0, 195608.0, 32648.0, 10712.0, 4290.0, 1902.0, 1046.0, 518.0, 265.0, 129.0, 93.0, 49.0, 34.0, 28.0, 30.0, 19.0, 13.0, 10.0, 8.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.202667236328125, -1.15631103515625, -1.109954833984375, -1.0635986328125, -1.017242431640625, -0.97088623046875, -0.924530029296875, -0.878173828125, -0.831817626953125, -0.78546142578125, -0.739105224609375, -0.6927490234375, -0.646392822265625, -0.60003662109375, -0.553680419921875, -0.50732421875, -0.460968017578125, -0.41461181640625, -0.368255615234375, -0.3218994140625, -0.275543212890625, -0.22918701171875, -0.182830810546875, -0.136474609375, -0.090118408203125, -0.04376220703125, 0.002593994140625, 0.0489501953125, 0.095306396484375, 0.14166259765625, 0.188018798828125, 0.234375, 0.280731201171875, 0.32708740234375, 0.373443603515625, 0.4197998046875, 0.466156005859375, 0.51251220703125, 0.558868408203125, 0.605224609375, 0.651580810546875, 0.69793701171875, 0.744293212890625, 0.7906494140625, 0.837005615234375, 0.88336181640625, 0.929718017578125, 0.97607421875, 1.022430419921875, 1.06878662109375, 1.115142822265625, 1.1614990234375, 1.207855224609375, 1.25421142578125, 1.300567626953125, 1.346923828125, 1.393280029296875, 1.43963623046875, 1.485992431640625, 1.5323486328125, 1.578704833984375, 1.62506103515625, 1.671417236328125, 1.7177734375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 9.0, 11.0, 13.0, 12.0, 12.0, 23.0, 12.0, 20.0, 21.0, 32.0, 29.0, 29.0, 29.0, 37.0, 39.0, 36.0, 47.0, 34.0, 62.0, 48.0, 37.0, 50.0, 42.0, 35.0, 35.0, 31.0, 33.0, 13.0, 22.0, 17.0, 21.0, 18.0, 18.0, 13.0, 12.0, 7.0, 9.0, 4.0, 2.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.859375, -0.8345108032226562, -0.8096466064453125, -0.7847824096679688, -0.759918212890625, -0.7350540161132812, -0.7101898193359375, -0.6853256225585938, -0.66046142578125, -0.6355972290039062, -0.6107330322265625, -0.5858688354492188, -0.561004638671875, -0.5361404418945312, -0.5112762451171875, -0.48641204833984375, -0.4615478515625, -0.43668365478515625, -0.4118194580078125, -0.38695526123046875, -0.362091064453125, -0.33722686767578125, -0.3123626708984375, -0.28749847412109375, -0.26263427734375, -0.23777008056640625, -0.2129058837890625, -0.18804168701171875, -0.163177490234375, -0.13831329345703125, -0.1134490966796875, -0.08858489990234375, -0.063720703125, -0.03885650634765625, -0.0139923095703125, 0.01087188720703125, 0.035736083984375, 0.06060028076171875, 0.0854644775390625, 0.11032867431640625, 0.13519287109375, 0.16005706787109375, 0.1849212646484375, 0.20978546142578125, 0.234649658203125, 0.25951385498046875, 0.2843780517578125, 0.30924224853515625, 0.3341064453125, 0.35897064208984375, 0.3838348388671875, 0.40869903564453125, 0.433563232421875, 0.45842742919921875, 0.4832916259765625, 0.5081558227539062, 0.53302001953125, 0.5578842163085938, 0.5827484130859375, 0.6076126098632812, 0.632476806640625, 0.6573410034179688, 0.6822052001953125, 0.7070693969726562, 0.73193359375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 11.0, 25.0, 50.0, 142.0, 442.0, 3700.0, 4155145.0, 33614.0, 757.0, 209.0, 89.0, 48.0, 24.0, 9.0, 3.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.1705322265625, -7.864501953125, -7.5584716796875, -7.25244140625, -6.9464111328125, -6.640380859375, -6.3343505859375, -6.0283203125, -5.7222900390625, -5.416259765625, -5.1102294921875, -4.80419921875, -4.4981689453125, -4.192138671875, -3.8861083984375, -3.580078125, -3.2740478515625, -2.968017578125, -2.6619873046875, -2.35595703125, -2.0499267578125, -1.743896484375, -1.4378662109375, -1.1318359375, -0.8258056640625, -0.519775390625, -0.2137451171875, 0.09228515625, 0.3983154296875, 0.704345703125, 1.0103759765625, 1.31640625, 1.6224365234375, 1.928466796875, 2.2344970703125, 2.54052734375, 2.8465576171875, 3.152587890625, 3.4586181640625, 3.7646484375, 4.0706787109375, 4.376708984375, 4.6827392578125, 4.98876953125, 5.2947998046875, 5.600830078125, 5.9068603515625, 6.212890625, 6.5189208984375, 6.824951171875, 7.1309814453125, 7.43701171875, 7.7430419921875, 8.049072265625, 8.3551025390625, 8.6611328125, 8.9671630859375, 9.273193359375, 9.5792236328125, 9.88525390625, 10.1912841796875, 10.497314453125, 10.8033447265625, 11.109375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 14.0, 21.0, 51.0, 97.0, 168.0, 294.0, 692.0, 1129.0, 757.0, 410.0, 166.0, 111.0, 60.0, 42.0, 22.0, 14.0, 11.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98779296875, -0.9656448364257812, -0.9434967041015625, -0.9213485717773438, -0.899200439453125, -0.8770523071289062, -0.8549041748046875, -0.8327560424804688, -0.81060791015625, -0.7884597778320312, -0.7663116455078125, -0.7441635131835938, -0.722015380859375, -0.6998672485351562, -0.6777191162109375, -0.6555709838867188, -0.6334228515625, -0.6112747192382812, -0.5891265869140625, -0.5669784545898438, -0.544830322265625, -0.5226821899414062, -0.5005340576171875, -0.47838592529296875, -0.45623779296875, -0.43408966064453125, -0.4119415283203125, -0.38979339599609375, -0.367645263671875, -0.34549713134765625, -0.3233489990234375, -0.30120086669921875, -0.279052734375, -0.25690460205078125, -0.2347564697265625, -0.21260833740234375, -0.190460205078125, -0.16831207275390625, -0.1461639404296875, -0.12401580810546875, -0.10186767578125, -0.07971954345703125, -0.0575714111328125, -0.03542327880859375, -0.013275146484375, 0.00887298583984375, 0.0310211181640625, 0.05316925048828125, 0.0753173828125, 0.09746551513671875, 0.1196136474609375, 0.14176177978515625, 0.163909912109375, 0.18605804443359375, 0.2082061767578125, 0.23035430908203125, 0.25250244140625, 0.27465057373046875, 0.2967987060546875, 0.31894683837890625, 0.341094970703125, 0.36324310302734375, 0.3853912353515625, 0.40753936767578125, 0.4296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 11.0, 16.0, 20.0, 18.0, 38.0, 30.0, 51.0, 56.0, 49.0, 76.0, 81.0, 72.0, 90.0, 53.0, 60.0, 60.0, 32.0, 31.0, 42.0, 19.0, 22.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3727426528930664, -1.3338072299957275, -1.2948718070983887, -1.2559365034103394, -1.2170010805130005, -1.1780656576156616, -1.1391303539276123, -1.1001949310302734, -1.0612595081329346, -1.0223240852355957, -0.9833887219429016, -0.9444533586502075, -0.9055179357528687, -0.8665825128555298, -0.8276471495628357, -0.7887117862701416, -0.7497763633728027, -0.7108409404754639, -0.6719055771827698, -0.6329702138900757, -0.5940347909927368, -0.555099368095398, -0.5161640048027039, -0.4772286117076874, -0.4382932186126709, -0.3993578255176544, -0.36042243242263794, -0.32148703932762146, -0.282551646232605, -0.2436162531375885, -0.20468086004257202, -0.16574546694755554, -0.12681007385253906, -0.08787468075752258, -0.048939287662506104, -0.010003894567489624, 0.028931498527526855, 0.06786689162254333, 0.10680228471755981, 0.1457376778125763, 0.18467307090759277, 0.22360846400260925, 0.26254385709762573, 0.3014792501926422, 0.3404146432876587, 0.37935003638267517, 0.41828542947769165, 0.45722082257270813, 0.4961562156677246, 0.5350916385650635, 0.5740270018577576, 0.6129623651504517, 0.6518977880477905, 0.6908332109451294, 0.7297685742378235, 0.7687039375305176, 0.8076393604278564, 0.8465747833251953, 0.8855101466178894, 0.9244455099105835, 0.9633809328079224, 1.0023163557052612, 1.0412516593933105, 1.0801870822906494, 1.1191225051879883]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 10.0, 7.0, 14.0, 11.0, 16.0, 16.0, 14.0, 20.0, 23.0, 23.0, 23.0, 32.0, 37.0, 36.0, 29.0, 36.0, 34.0, 39.0, 44.0, 41.0, 46.0, 26.0, 33.0, 39.0, 42.0, 38.0, 27.0, 42.0, 26.0, 18.0, 20.0, 21.0, 16.0, 14.0, 19.0, 13.0, 9.0, 11.0, 12.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.872513473033905, -0.8469646573066711, -0.821415901184082, -0.7958670854568481, -0.7703182697296143, -0.7447694540023804, -0.7192206978797913, -0.6936718821525574, -0.6681231260299683, -0.6425743103027344, -0.6170255541801453, -0.5914767384529114, -0.5659279227256775, -0.5403791666030884, -0.5148303508758545, -0.4892815351486206, -0.4637327194213867, -0.4381839334964752, -0.41263511776924133, -0.38708633184432983, -0.36153751611709595, -0.33598873019218445, -0.31043994426727295, -0.28489112854003906, -0.25934234261512756, -0.23379354178905487, -0.20824474096298218, -0.18269595503807068, -0.15714715421199799, -0.1315983533859253, -0.1060495674610138, -0.0805007666349411, -0.054952025413513184, -0.02940322831273079, -0.0038544312119483948, 0.0216943621635437, 0.047243162989616394, 0.07279196381568909, 0.09834074974060059, 0.12388955056667328, 0.14943835139274597, 0.17498715221881866, 0.20053595304489136, 0.22608473896980286, 0.25163352489471436, 0.27718234062194824, 0.30273112654685974, 0.32827991247177124, 0.3538287281990051, 0.3793775141239166, 0.4049263298511505, 0.430475115776062, 0.4560239315032959, 0.4815727174282074, 0.5071215033531189, 0.5326703190803528, 0.5582190752029419, 0.5837678909301758, 0.6093166470527649, 0.6348654627799988, 0.6604142785072327, 0.6859630346298218, 0.7115118503570557, 0.7370606660842896, 0.7626094818115234]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 9.0, 20.0, 41.0, 48.0, 106.0, 164.0, 310.0, 592.0, 1170.0, 2167.0, 4669.0, 10452.0, 24395.0, 61327.0, 163482.0, 369357.0, 251295.0, 94314.0, 36581.0, 15181.0, 6507.0, 3070.0, 1552.0, 802.0, 403.0, 246.0, 111.0, 78.0, 39.0, 25.0, 10.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495849609375, -0.4797096252441406, -0.46356964111328125, -0.4474296569824219, -0.4312896728515625, -0.4151496887207031, -0.39900970458984375, -0.3828697204589844, -0.366729736328125, -0.3505897521972656, -0.33444976806640625, -0.3183097839355469, -0.3021697998046875, -0.2860298156738281, -0.26988983154296875, -0.2537498474121094, -0.23760986328125, -0.22146987915039062, -0.20532989501953125, -0.18918991088867188, -0.1730499267578125, -0.15690994262695312, -0.14076995849609375, -0.12462997436523438, -0.108489990234375, -0.09235000610351562, -0.07621002197265625, -0.060070037841796875, -0.0439300537109375, -0.027790069580078125, -0.01165008544921875, 0.004489898681640625, 0.0206298828125, 0.036769866943359375, 0.05290985107421875, 0.06904983520507812, 0.0851898193359375, 0.10132980346679688, 0.11746978759765625, 0.13360977172851562, 0.149749755859375, 0.16588973999023438, 0.18202972412109375, 0.19816970825195312, 0.2143096923828125, 0.23044967651367188, 0.24658966064453125, 0.2627296447753906, 0.27886962890625, 0.2950096130371094, 0.31114959716796875, 0.3272895812988281, 0.3434295654296875, 0.3595695495605469, 0.37570953369140625, 0.3918495178222656, 0.407989501953125, 0.4241294860839844, 0.44026947021484375, 0.4564094543457031, 0.4725494384765625, 0.4886894226074219, 0.5048294067382812, 0.5209693908691406, 0.537109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 5.0, 5.0, 9.0, 11.0, 14.0, 13.0, 9.0, 19.0, 27.0, 16.0, 19.0, 28.0, 28.0, 35.0, 30.0, 39.0, 25.0, 29.0, 36.0, 35.0, 38.0, 40.0, 32.0, 34.0, 32.0, 35.0, 34.0, 36.0, 28.0, 40.0, 33.0, 24.0, 19.0, 16.0, 13.0, 18.0, 8.0, 9.0, 11.0, 14.0, 11.0, 14.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.5283203125, -0.5119857788085938, -0.4956512451171875, -0.47931671142578125, -0.462982177734375, -0.44664764404296875, -0.4303131103515625, -0.41397857666015625, -0.39764404296875, -0.38130950927734375, -0.3649749755859375, -0.34864044189453125, -0.332305908203125, -0.31597137451171875, -0.2996368408203125, -0.28330230712890625, -0.2669677734375, -0.25063323974609375, -0.2342987060546875, -0.21796417236328125, -0.201629638671875, -0.18529510498046875, -0.1689605712890625, -0.15262603759765625, -0.13629150390625, -0.11995697021484375, -0.1036224365234375, -0.08728790283203125, -0.070953369140625, -0.05461883544921875, -0.0382843017578125, -0.02194976806640625, -0.005615234375, 0.01071929931640625, 0.0270538330078125, 0.04338836669921875, 0.059722900390625, 0.07605743408203125, 0.0923919677734375, 0.10872650146484375, 0.12506103515625, 0.14139556884765625, 0.1577301025390625, 0.17406463623046875, 0.190399169921875, 0.20673370361328125, 0.2230682373046875, 0.23940277099609375, 0.2557373046875, 0.27207183837890625, 0.2884063720703125, 0.30474090576171875, 0.321075439453125, 0.33740997314453125, 0.3537445068359375, 0.37007904052734375, 0.38641357421875, 0.40274810791015625, 0.4190826416015625, 0.43541717529296875, 0.451751708984375, 0.46808624267578125, 0.4844207763671875, 0.5007553100585938, 0.51708984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 7.0, 5.0, 13.0, 15.0, 21.0, 32.0, 36.0, 65.0, 113.0, 172.0, 313.0, 561.0, 1063.0, 2335.0, 6081.0, 18213.0, 65014.0, 270229.0, 481003.0, 147707.0, 36809.0, 11194.0, 3904.0, 1672.0, 817.0, 438.0, 255.0, 158.0, 91.0, 63.0, 48.0, 41.0, 20.0, 10.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.57275390625, -0.5531997680664062, -0.5336456298828125, -0.5140914916992188, -0.494537353515625, -0.47498321533203125, -0.4554290771484375, -0.43587493896484375, -0.41632080078125, -0.39676666259765625, -0.3772125244140625, -0.35765838623046875, -0.338104248046875, -0.31855010986328125, -0.2989959716796875, -0.27944183349609375, -0.2598876953125, -0.24033355712890625, -0.2207794189453125, -0.20122528076171875, -0.181671142578125, -0.16211700439453125, -0.1425628662109375, -0.12300872802734375, -0.10345458984375, -0.08390045166015625, -0.0643463134765625, -0.04479217529296875, -0.025238037109375, -0.00568389892578125, 0.0138702392578125, 0.03342437744140625, 0.052978515625, 0.07253265380859375, 0.0920867919921875, 0.11164093017578125, 0.131195068359375, 0.15074920654296875, 0.1703033447265625, 0.18985748291015625, 0.20941162109375, 0.22896575927734375, 0.2485198974609375, 0.26807403564453125, 0.287628173828125, 0.30718231201171875, 0.3267364501953125, 0.34629058837890625, 0.3658447265625, 0.38539886474609375, 0.4049530029296875, 0.42450714111328125, 0.444061279296875, 0.46361541748046875, 0.4831695556640625, 0.5027236938476562, 0.52227783203125, 0.5418319702148438, 0.5613861083984375, 0.5809402465820312, 0.600494384765625, 0.6200485229492188, 0.6396026611328125, 0.6591567993164062, 0.6787109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 11.0, 8.0, 8.0, 13.0, 17.0, 19.0, 27.0, 29.0, 28.0, 40.0, 33.0, 38.0, 46.0, 42.0, 39.0, 30.0, 40.0, 45.0, 42.0, 50.0, 31.0, 42.0, 40.0, 43.0, 25.0, 27.0, 35.0, 22.0, 18.0, 22.0, 19.0, 17.0, 7.0, 8.0, 6.0, 5.0, 1.0, 4.0, 7.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.193359375, -1.1558685302734375, -1.118377685546875, -1.0808868408203125, -1.04339599609375, -1.0059051513671875, -0.968414306640625, -0.9309234619140625, -0.8934326171875, -0.8559417724609375, -0.818450927734375, -0.7809600830078125, -0.74346923828125, -0.7059783935546875, -0.668487548828125, -0.6309967041015625, -0.593505859375, -0.5560150146484375, -0.518524169921875, -0.4810333251953125, -0.44354248046875, -0.4060516357421875, -0.368560791015625, -0.3310699462890625, -0.2935791015625, -0.2560882568359375, -0.218597412109375, -0.1811065673828125, -0.14361572265625, -0.1061248779296875, -0.068634033203125, -0.0311431884765625, 0.00634765625, 0.0438385009765625, 0.081329345703125, 0.1188201904296875, 0.15631103515625, 0.1938018798828125, 0.231292724609375, 0.2687835693359375, 0.3062744140625, 0.3437652587890625, 0.381256103515625, 0.4187469482421875, 0.45623779296875, 0.4937286376953125, 0.531219482421875, 0.5687103271484375, 0.606201171875, 0.6436920166015625, 0.681182861328125, 0.7186737060546875, 0.75616455078125, 0.7936553955078125, 0.831146240234375, 0.8686370849609375, 0.9061279296875, 0.9436187744140625, 0.981109619140625, 1.0186004638671875, 1.05609130859375, 1.0935821533203125, 1.131072998046875, 1.1685638427734375, 1.2060546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 10.0, 13.0, 18.0, 21.0, 44.0, 78.0, 88.0, 124.0, 213.0, 293.0, 537.0, 821.0, 1446.0, 2567.0, 5112.0, 10765.0, 26301.0, 76245.0, 257954.0, 426061.0, 157457.0, 47646.0, 17828.0, 7932.0, 3892.0, 2032.0, 1152.0, 690.0, 413.0, 256.0, 180.0, 113.0, 71.0, 47.0, 45.0, 18.0, 18.0, 16.0, 11.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11538505554199219, -0.11181259155273438, -0.10824012756347656, -0.10466766357421875, -0.10109519958496094, -0.09752273559570312, -0.09395027160644531, -0.0903778076171875, -0.08680534362792969, -0.08323287963867188, -0.07966041564941406, -0.07608795166015625, -0.07251548767089844, -0.06894302368164062, -0.06537055969238281, -0.061798095703125, -0.05822563171386719, -0.054653167724609375, -0.05108070373535156, -0.04750823974609375, -0.04393577575683594, -0.040363311767578125, -0.03679084777832031, -0.0332183837890625, -0.029645919799804688, -0.026073455810546875, -0.022500991821289062, -0.01892852783203125, -0.015356063842773438, -0.011783599853515625, -0.008211135864257812, -0.004638671875, -0.0010662078857421875, 0.002506256103515625, 0.0060787200927734375, 0.00965118408203125, 0.013223648071289062, 0.016796112060546875, 0.020368576049804688, 0.0239410400390625, 0.027513504028320312, 0.031085968017578125, 0.03465843200683594, 0.03823089599609375, 0.04180335998535156, 0.045375823974609375, 0.04894828796386719, 0.052520751953125, 0.05609321594238281, 0.059665679931640625, 0.06323814392089844, 0.06681060791015625, 0.07038307189941406, 0.07395553588867188, 0.07752799987792969, 0.0811004638671875, 0.08467292785644531, 0.08824539184570312, 0.09181785583496094, 0.09539031982421875, 0.09896278381347656, 0.10253524780273438, 0.10610771179199219, 0.10968017578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 1.0, 11.0, 5.0, 10.0, 22.0, 22.0, 24.0, 33.0, 55.0, 48.0, 94.0, 93.0, 103.0, 111.0, 85.0, 68.0, 47.0, 40.0, 21.0, 23.0, 12.0, 12.0, 11.0, 12.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-9.620189666748047e-05, -9.325612336397171e-05, -9.031035006046295e-05, -8.736457675695419e-05, -8.441880345344543e-05, -8.147303014993668e-05, -7.852725684642792e-05, -7.558148354291916e-05, -7.26357102394104e-05, -6.968993693590164e-05, -6.674416363239288e-05, -6.379839032888412e-05, -6.0852617025375366e-05, -5.790684372186661e-05, -5.496107041835785e-05, -5.201529711484909e-05, -4.906952381134033e-05, -4.6123750507831573e-05, -4.3177977204322815e-05, -4.0232203900814056e-05, -3.72864305973053e-05, -3.434065729379654e-05, -3.139488399028778e-05, -2.8449110686779022e-05, -2.5503337383270264e-05, -2.2557564079761505e-05, -1.9611790776252747e-05, -1.6666017472743988e-05, -1.372024416923523e-05, -1.0774470865726471e-05, -7.828697562217712e-06, -4.882924258708954e-06, -1.9371509552001953e-06, 1.0086223483085632e-06, 3.954395651817322e-06, 6.90016895532608e-06, 9.845942258834839e-06, 1.2791715562343597e-05, 1.5737488865852356e-05, 1.8683262169361115e-05, 2.1629035472869873e-05, 2.457480877637863e-05, 2.752058207988739e-05, 3.046635538339615e-05, 3.341212868690491e-05, 3.6357901990413666e-05, 3.9303675293922424e-05, 4.224944859743118e-05, 4.519522190093994e-05, 4.81409952044487e-05, 5.108676850795746e-05, 5.403254181146622e-05, 5.6978315114974976e-05, 5.9924088418483734e-05, 6.286986172199249e-05, 6.581563502550125e-05, 6.876140832901001e-05, 7.170718163251877e-05, 7.465295493602753e-05, 7.759872823953629e-05, 8.054450154304504e-05, 8.34902748465538e-05, 8.643604815006256e-05, 8.938182145357132e-05, 9.232759475708008e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 22.0, 22.0, 30.0, 57.0, 75.0, 130.0, 164.0, 338.0, 592.0, 1075.0, 2139.0, 4753.0, 12848.0, 42177.0, 166888.0, 460268.0, 259395.0, 66686.0, 18679.0, 6413.0, 2791.0, 1256.0, 719.0, 392.0, 238.0, 127.0, 88.0, 44.0, 45.0, 22.0, 13.0, 15.0, 7.0, 12.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.12030029296875, -0.11661720275878906, -0.11293411254882812, -0.10925102233886719, -0.10556793212890625, -0.10188484191894531, -0.09820175170898438, -0.09451866149902344, -0.0908355712890625, -0.08715248107910156, -0.08346939086914062, -0.07978630065917969, -0.07610321044921875, -0.07242012023925781, -0.06873703002929688, -0.06505393981933594, -0.061370849609375, -0.05768775939941406, -0.054004669189453125, -0.05032157897949219, -0.04663848876953125, -0.04295539855957031, -0.039272308349609375, -0.03558921813964844, -0.0319061279296875, -0.028223037719726562, -0.024539947509765625, -0.020856857299804688, -0.01717376708984375, -0.013490676879882812, -0.009807586669921875, -0.0061244964599609375, -0.00244140625, 0.0012416839599609375, 0.004924774169921875, 0.008607864379882812, 0.01229095458984375, 0.015974044799804688, 0.019657135009765625, 0.023340225219726562, 0.0270233154296875, 0.030706405639648438, 0.034389495849609375, 0.03807258605957031, 0.04175567626953125, 0.04543876647949219, 0.049121856689453125, 0.05280494689941406, 0.056488037109375, 0.06017112731933594, 0.06385421752929688, 0.06753730773925781, 0.07122039794921875, 0.07490348815917969, 0.07858657836914062, 0.08226966857910156, 0.0859527587890625, 0.08963584899902344, 0.09331893920898438, 0.09700202941894531, 0.10068511962890625, 0.10436820983886719, 0.10805130004882812, 0.11173439025878906, 0.11541748046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 10.0, 4.0, 11.0, 14.0, 16.0, 22.0, 28.0, 24.0, 28.0, 33.0, 24.0, 38.0, 63.0, 71.0, 61.0, 63.0, 77.0, 84.0, 52.0, 46.0, 40.0, 34.0, 32.0, 25.0, 20.0, 16.0, 12.0, 9.0, 8.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.03009033203125, -0.02920246124267578, -0.028314590454101562, -0.027426719665527344, -0.026538848876953125, -0.025650978088378906, -0.024763107299804688, -0.02387523651123047, -0.02298736572265625, -0.02209949493408203, -0.021211624145507812, -0.020323753356933594, -0.019435882568359375, -0.018548011779785156, -0.017660140991210938, -0.01677227020263672, -0.0158843994140625, -0.014996528625488281, -0.014108657836914062, -0.013220787048339844, -0.012332916259765625, -0.011445045471191406, -0.010557174682617188, -0.009669303894042969, -0.00878143310546875, -0.007893562316894531, -0.0070056915283203125, -0.006117820739746094, -0.005229949951171875, -0.004342079162597656, -0.0034542083740234375, -0.0025663375854492188, -0.001678466796875, -0.0007905960083007812, 9.72747802734375e-05, 0.0009851455688476562, 0.001873016357421875, 0.0027608871459960938, 0.0036487579345703125, 0.004536628723144531, 0.00542449951171875, 0.006312370300292969, 0.0072002410888671875, 0.008088111877441406, 0.008975982666015625, 0.009863853454589844, 0.010751724243164062, 0.011639595031738281, 0.0125274658203125, 0.013415336608886719, 0.014303207397460938, 0.015191078186035156, 0.016078948974609375, 0.016966819763183594, 0.017854690551757812, 0.01874256134033203, 0.01963043212890625, 0.02051830291748047, 0.021406173706054688, 0.022294044494628906, 0.023181915283203125, 0.024069786071777344, 0.024957656860351562, 0.02584552764892578, 0.0267333984375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 17.0, 20.0, 23.0, 38.0, 51.0, 67.0, 85.0, 97.0, 117.0, 109.0, 98.0, 82.0, 55.0, 42.0, 31.0, 15.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2921644449234009, -1.2579072713851929, -1.2236502170562744, -1.1893930435180664, -1.1551358699798584, -1.1208786964416504, -1.0866215229034424, -1.052364468574524, -1.018107295036316, -0.9838501214981079, -0.9495930075645447, -0.9153358936309814, -0.8810787200927734, -0.8468215465545654, -0.8125644326210022, -0.778307318687439, -0.744050145149231, -0.709792971611023, -0.6755358576774597, -0.6412787437438965, -0.6070215702056885, -0.5727643966674805, -0.5385072827339172, -0.504250168800354, -0.469992995262146, -0.4357358515262604, -0.40147870779037476, -0.36722156405448914, -0.3329644203186035, -0.2987072765827179, -0.2644501328468323, -0.23019298911094666, -0.19593572616577148, -0.16167858242988586, -0.12742143869400024, -0.09316429495811462, -0.058907151222229004, -0.024650007486343384, 0.009607136249542236, 0.043864279985427856, 0.07812142372131348, 0.1123785674571991, 0.14663571119308472, 0.18089285492897034, 0.21514999866485596, 0.24940714240074158, 0.2836642861366272, 0.3179214298725128, 0.35217857360839844, 0.38643571734428406, 0.4206928610801697, 0.4549500048160553, 0.4892071485519409, 0.5234643220901489, 0.5577214360237122, 0.5919785499572754, 0.6262357234954834, 0.6604928970336914, 0.6947500109672546, 0.7290071249008179, 0.7632642984390259, 0.7975214719772339, 0.8317785859107971, 0.8660356998443604, 0.9002928733825684]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 8.0, 6.0, 9.0, 14.0, 14.0, 17.0, 16.0, 22.0, 27.0, 23.0, 23.0, 26.0, 35.0, 37.0, 47.0, 27.0, 47.0, 42.0, 53.0, 51.0, 44.0, 36.0, 45.0, 31.0, 48.0, 39.0, 40.0, 24.0, 14.0, 22.0, 21.0, 17.0, 15.0, 19.0, 11.0, 11.0, 4.0, 4.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.661098837852478, -0.6427605152130127, -0.6244221925735474, -0.6060839295387268, -0.5877456068992615, -0.5694072842597961, -0.5510690212249756, -0.5327306985855103, -0.5143923759460449, -0.4960540533065796, -0.47771576046943665, -0.4593774676322937, -0.44103914499282837, -0.42270082235336304, -0.4043625295162201, -0.38602423667907715, -0.3676859140396118, -0.3493475914001465, -0.33100929856300354, -0.3126710057258606, -0.29433268308639526, -0.27599436044692993, -0.257656067609787, -0.23931775987148285, -0.2209794521331787, -0.20264114439487457, -0.18430283665657043, -0.1659645289182663, -0.14762622117996216, -0.12928791344165802, -0.11094960570335388, -0.09261129796504974, -0.07427304983139038, -0.05593474209308624, -0.037596434354782104, -0.019258126616477966, -0.0009198188781738281, 0.01741848886013031, 0.03575679659843445, 0.054095104336738586, 0.07243341207504272, 0.09077171981334686, 0.109110027551651, 0.12744833528995514, 0.14578664302825928, 0.16412495076656342, 0.18246325850486755, 0.2008015662431717, 0.21913987398147583, 0.23747818171977997, 0.2558164894580841, 0.27415478229522705, 0.2924931049346924, 0.3108314275741577, 0.32916972041130066, 0.3475080132484436, 0.36584633588790894, 0.38418465852737427, 0.4025229513645172, 0.42086124420166016, 0.4391995668411255, 0.4575378894805908, 0.47587618231773376, 0.4942144751548767, 0.512552797794342]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 13.0, 9.0, 21.0, 29.0, 48.0, 66.0, 85.0, 179.0, 283.0, 468.0, 797.0, 1388.0, 2389.0, 4350.0, 8713.0, 18846.0, 46860.0, 209045.0, 609900.0, 88257.0, 29786.0, 12882.0, 6368.0, 3328.0, 1850.0, 1014.0, 572.0, 353.0, 245.0, 132.0, 83.0, 59.0, 39.0, 26.0, 23.0, 11.0, 7.0, 8.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.81396484375, -0.7915191650390625, -0.769073486328125, -0.7466278076171875, -0.72418212890625, -0.7017364501953125, -0.679290771484375, -0.6568450927734375, -0.6343994140625, -0.6119537353515625, -0.589508056640625, -0.5670623779296875, -0.54461669921875, -0.5221710205078125, -0.499725341796875, -0.4772796630859375, -0.454833984375, -0.4323883056640625, -0.409942626953125, -0.3874969482421875, -0.36505126953125, -0.3426055908203125, -0.320159912109375, -0.2977142333984375, -0.2752685546875, -0.2528228759765625, -0.230377197265625, -0.2079315185546875, -0.18548583984375, -0.1630401611328125, -0.140594482421875, -0.1181488037109375, -0.095703125, -0.0732574462890625, -0.050811767578125, -0.0283660888671875, -0.00592041015625, 0.0165252685546875, 0.038970947265625, 0.0614166259765625, 0.0838623046875, 0.1063079833984375, 0.128753662109375, 0.1511993408203125, 0.17364501953125, 0.1960906982421875, 0.218536376953125, 0.2409820556640625, 0.263427734375, 0.2858734130859375, 0.308319091796875, 0.3307647705078125, 0.35321044921875, 0.3756561279296875, 0.398101806640625, 0.4205474853515625, 0.4429931640625, 0.4654388427734375, 0.487884521484375, 0.5103302001953125, 0.53277587890625, 0.5552215576171875, 0.577667236328125, 0.6001129150390625, 0.62255859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 12.0, 14.0, 13.0, 23.0, 17.0, 17.0, 39.0, 39.0, 45.0, 34.0, 41.0, 47.0, 47.0, 53.0, 50.0, 53.0, 39.0, 44.0, 42.0, 50.0, 29.0, 45.0, 29.0, 23.0, 29.0, 26.0, 21.0, 13.0, 11.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.423828125, -1.3860626220703125, -1.348297119140625, -1.3105316162109375, -1.27276611328125, -1.2350006103515625, -1.197235107421875, -1.1594696044921875, -1.1217041015625, -1.0839385986328125, -1.046173095703125, -1.0084075927734375, -0.97064208984375, -0.9328765869140625, -0.895111083984375, -0.8573455810546875, -0.819580078125, -0.7818145751953125, -0.744049072265625, -0.7062835693359375, -0.66851806640625, -0.6307525634765625, -0.592987060546875, -0.5552215576171875, -0.5174560546875, -0.4796905517578125, -0.441925048828125, -0.4041595458984375, -0.36639404296875, -0.3286285400390625, -0.290863037109375, -0.2530975341796875, -0.21533203125, -0.1775665283203125, -0.139801025390625, -0.1020355224609375, -0.06427001953125, -0.0265045166015625, 0.011260986328125, 0.0490264892578125, 0.0867919921875, 0.1245574951171875, 0.162322998046875, 0.2000885009765625, 0.23785400390625, 0.2756195068359375, 0.313385009765625, 0.3511505126953125, 0.388916015625, 0.4266815185546875, 0.464447021484375, 0.5022125244140625, 0.53997802734375, 0.5777435302734375, 0.615509033203125, 0.6532745361328125, 0.6910400390625, 0.7288055419921875, 0.766571044921875, 0.8043365478515625, 0.84210205078125, 0.8798675537109375, 0.917633056640625, 0.9553985595703125, 0.9931640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 8.0, 6.0, 4.0, 5.0, 9.0, 8.0, 20.0, 15.0, 17.0, 25.0, 29.0, 45.0, 59.0, 63.0, 90.0, 117.0, 300.0, 1770.0, 72683.0, 964612.0, 7425.0, 591.0, 167.0, 100.0, 73.0, 49.0, 47.0, 26.0, 41.0, 24.0, 20.0, 25.0, 16.0, 12.0, 13.0, 6.0, 15.0, 4.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.2442626953125, -3.136962890625, -3.0296630859375, -2.92236328125, -2.8150634765625, -2.707763671875, -2.6004638671875, -2.4931640625, -2.3858642578125, -2.278564453125, -2.1712646484375, -2.06396484375, -1.9566650390625, -1.849365234375, -1.7420654296875, -1.634765625, -1.5274658203125, -1.420166015625, -1.3128662109375, -1.20556640625, -1.0982666015625, -0.990966796875, -0.8836669921875, -0.7763671875, -0.6690673828125, -0.561767578125, -0.4544677734375, -0.34716796875, -0.2398681640625, -0.132568359375, -0.0252685546875, 0.08203125, 0.1893310546875, 0.296630859375, 0.4039306640625, 0.51123046875, 0.6185302734375, 0.725830078125, 0.8331298828125, 0.9404296875, 1.0477294921875, 1.155029296875, 1.2623291015625, 1.36962890625, 1.4769287109375, 1.584228515625, 1.6915283203125, 1.798828125, 1.9061279296875, 2.013427734375, 2.1207275390625, 2.22802734375, 2.3353271484375, 2.442626953125, 2.5499267578125, 2.6572265625, 2.7645263671875, 2.871826171875, 2.9791259765625, 3.08642578125, 3.1937255859375, 3.301025390625, 3.4083251953125, 3.515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 9.0, 12.0, 18.0, 13.0, 15.0, 24.0, 35.0, 35.0, 42.0, 52.0, 40.0, 41.0, 43.0, 50.0, 55.0, 46.0, 50.0, 38.0, 42.0, 53.0, 45.0, 41.0, 26.0, 25.0, 20.0, 18.0, 22.0, 14.0, 8.0, 11.0, 4.0, 11.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.318695068359375, -1.27410888671875, -1.229522705078125, -1.1849365234375, -1.140350341796875, -1.09576416015625, -1.051177978515625, -1.006591796875, -0.962005615234375, -0.91741943359375, -0.872833251953125, -0.8282470703125, -0.783660888671875, -0.73907470703125, -0.694488525390625, -0.64990234375, -0.605316162109375, -0.56072998046875, -0.516143798828125, -0.4715576171875, -0.426971435546875, -0.38238525390625, -0.337799072265625, -0.293212890625, -0.248626708984375, -0.20404052734375, -0.159454345703125, -0.1148681640625, -0.070281982421875, -0.02569580078125, 0.018890380859375, 0.0634765625, 0.108062744140625, 0.15264892578125, 0.197235107421875, 0.2418212890625, 0.286407470703125, 0.33099365234375, 0.375579833984375, 0.420166015625, 0.464752197265625, 0.50933837890625, 0.553924560546875, 0.5985107421875, 0.643096923828125, 0.68768310546875, 0.732269287109375, 0.77685546875, 0.821441650390625, 0.86602783203125, 0.910614013671875, 0.9552001953125, 0.999786376953125, 1.04437255859375, 1.088958740234375, 1.133544921875, 1.178131103515625, 1.22271728515625, 1.267303466796875, 1.3118896484375, 1.356475830078125, 1.40106201171875, 1.445648193359375, 1.490234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 12.0, 12.0, 34.0, 65.0, 131.0, 657.0, 8634.0, 1019668.0, 18071.0, 939.0, 155.0, 70.0, 27.0, 23.0, 8.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.377166748046875, -1.31878662109375, -1.260406494140625, -1.2020263671875, -1.143646240234375, -1.08526611328125, -1.026885986328125, -0.968505859375, -0.910125732421875, -0.85174560546875, -0.793365478515625, -0.7349853515625, -0.676605224609375, -0.61822509765625, -0.559844970703125, -0.50146484375, -0.443084716796875, -0.38470458984375, -0.326324462890625, -0.2679443359375, -0.209564208984375, -0.15118408203125, -0.092803955078125, -0.034423828125, 0.023956298828125, 0.08233642578125, 0.140716552734375, 0.1990966796875, 0.257476806640625, 0.31585693359375, 0.374237060546875, 0.4326171875, 0.490997314453125, 0.54937744140625, 0.607757568359375, 0.6661376953125, 0.724517822265625, 0.78289794921875, 0.841278076171875, 0.899658203125, 0.958038330078125, 1.01641845703125, 1.074798583984375, 1.1331787109375, 1.191558837890625, 1.24993896484375, 1.308319091796875, 1.36669921875, 1.425079345703125, 1.48345947265625, 1.541839599609375, 1.6002197265625, 1.658599853515625, 1.71697998046875, 1.775360107421875, 1.833740234375, 1.892120361328125, 1.95050048828125, 2.008880615234375, 2.0672607421875, 2.125640869140625, 2.18402099609375, 2.242401123046875, 2.30078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 10.0, 28.0, 46.0, 123.0, 385.0, 234.0, 60.0, 34.0, 31.0, 13.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.347894668579102e-05, -5.968380719423294e-05, -5.5888667702674866e-05, -5.209352821111679e-05, -4.8298388719558716e-05, -4.450324922800064e-05, -4.0708109736442566e-05, -3.691297024488449e-05, -3.3117830753326416e-05, -2.932269126176834e-05, -2.5527551770210266e-05, -2.173241227865219e-05, -1.7937272787094116e-05, -1.4142133295536041e-05, -1.0346993803977966e-05, -6.551854312419891e-06, -2.7567148208618164e-06, 1.0384246706962585e-06, 4.8335641622543335e-06, 8.628703653812408e-06, 1.2423843145370483e-05, 1.621898263692856e-05, 2.0014122128486633e-05, 2.3809261620044708e-05, 2.7604401111602783e-05, 3.139954060316086e-05, 3.519468009471893e-05, 3.898981958627701e-05, 4.278495907783508e-05, 4.658009856939316e-05, 5.037523806095123e-05, 5.417037755250931e-05, 5.796551704406738e-05, 6.176065653562546e-05, 6.555579602718353e-05, 6.935093551874161e-05, 7.314607501029968e-05, 7.694121450185776e-05, 8.073635399341583e-05, 8.453149348497391e-05, 8.832663297653198e-05, 9.212177246809006e-05, 9.591691195964813e-05, 9.971205145120621e-05, 0.00010350719094276428, 0.00010730233043432236, 0.00011109746992588043, 0.00011489260941743851, 0.00011868774890899658, 0.00012248288840055466, 0.00012627802789211273, 0.0001300731673836708, 0.00013386830687522888, 0.00013766344636678696, 0.00014145858585834503, 0.0001452537253499031, 0.00014904886484146118, 0.00015284400433301926, 0.00015663914382457733, 0.0001604342833161354, 0.00016422942280769348, 0.00016802456229925156, 0.00017181970179080963, 0.0001756148412823677, 0.00017940998077392578]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 4.0, 2.0, 3.0, 13.0, 10.0, 15.0, 27.0, 33.0, 78.0, 159.0, 646.0, 3571.0, 85740.0, 946121.0, 10376.0, 1224.0, 277.0, 101.0, 56.0, 31.0, 24.0, 13.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.185546875, -1.1475677490234375, -1.109588623046875, -1.0716094970703125, -1.03363037109375, -0.9956512451171875, -0.957672119140625, -0.9196929931640625, -0.8817138671875, -0.8437347412109375, -0.805755615234375, -0.7677764892578125, -0.72979736328125, -0.6918182373046875, -0.653839111328125, -0.6158599853515625, -0.577880859375, -0.5399017333984375, -0.501922607421875, -0.4639434814453125, -0.42596435546875, -0.3879852294921875, -0.350006103515625, -0.3120269775390625, -0.2740478515625, -0.2360687255859375, -0.198089599609375, -0.1601104736328125, -0.12213134765625, -0.0841522216796875, -0.046173095703125, -0.0081939697265625, 0.02978515625, 0.0677642822265625, 0.105743408203125, 0.1437225341796875, 0.18170166015625, 0.2196807861328125, 0.257659912109375, 0.2956390380859375, 0.3336181640625, 0.3715972900390625, 0.409576416015625, 0.4475555419921875, 0.48553466796875, 0.5235137939453125, 0.561492919921875, 0.5994720458984375, 0.637451171875, 0.6754302978515625, 0.713409423828125, 0.7513885498046875, 0.78936767578125, 0.8273468017578125, 0.865325927734375, 0.9033050537109375, 0.9412841796875, 0.9792633056640625, 1.017242431640625, 1.0552215576171875, 1.09320068359375, 1.1311798095703125, 1.169158935546875, 1.2071380615234375, 1.2451171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 11.0, 9.0, 15.0, 19.0, 36.0, 61.0, 121.0, 233.0, 227.0, 113.0, 49.0, 28.0, 28.0, 16.0, 8.0, 4.0, 5.0, 2.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.23273086547851562, -0.22522735595703125, -0.21772384643554688, -0.2102203369140625, -0.20271682739257812, -0.19521331787109375, -0.18770980834960938, -0.180206298828125, -0.17270278930664062, -0.16519927978515625, -0.15769577026367188, -0.1501922607421875, -0.14268875122070312, -0.13518524169921875, -0.12768173217773438, -0.12017822265625, -0.11267471313476562, -0.10517120361328125, -0.09766769409179688, -0.0901641845703125, -0.08266067504882812, -0.07515716552734375, -0.06765365600585938, -0.060150146484375, -0.052646636962890625, -0.04514312744140625, -0.037639617919921875, -0.0301361083984375, -0.022632598876953125, -0.01512908935546875, -0.007625579833984375, -0.0001220703125, 0.007381439208984375, 0.01488494873046875, 0.022388458251953125, 0.0298919677734375, 0.037395477294921875, 0.04489898681640625, 0.052402496337890625, 0.059906005859375, 0.06740951538085938, 0.07491302490234375, 0.08241653442382812, 0.0899200439453125, 0.09742355346679688, 0.10492706298828125, 0.11243057250976562, 0.11993408203125, 0.12743759155273438, 0.13494110107421875, 0.14244461059570312, 0.1499481201171875, 0.15745162963867188, 0.16495513916015625, 0.17245864868164062, 0.179962158203125, 0.18746566772460938, 0.19496917724609375, 0.20247268676757812, 0.2099761962890625, 0.21747970581054688, 0.22498321533203125, 0.23248672485351562, 0.239990234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 15.0, 74.0, 171.0, 347.0, 280.0, 81.0, 26.0, 10.0, 6.0, 3.0], "bins": [-12.971693992614746, -12.746723175048828, -12.521751403808594, -12.296780586242676, -12.071809768676758, -11.846837997436523, -11.621867179870605, -11.396895408630371, -11.171924591064453, -10.946953773498535, -10.7219820022583, -10.497011184692383, -10.272039413452148, -10.04706859588623, -9.822097778320312, -9.597126007080078, -9.37215518951416, -9.147184371948242, -8.922212600708008, -8.69724178314209, -8.472270965576172, -8.247299194335938, -8.02232837677002, -7.797357082366943, -7.572385787963867, -7.347414493560791, -7.122443199157715, -6.897472381591797, -6.672501087188721, -6.4475297927856445, -6.222558975219727, -5.99758768081665, -5.772615909576416, -5.54764461517334, -5.322673797607422, -5.097702503204346, -4.8727312088012695, -4.647759914398193, -4.422788619995117, -4.197817802429199, -3.972846508026123, -3.747875213623047, -3.52290415763855, -3.2979331016540527, -3.0729618072509766, -2.8479905128479004, -2.6230194568634033, -2.3980484008789062, -2.17307710647583, -1.9481059312820435, -1.7231347560882568, -1.4981635808944702, -1.2731924057006836, -1.048221230506897, -0.8232500553131104, -0.5982788801193237, -0.37330782413482666, -0.14833664894104004, 0.07663452625274658, 0.3016057014465332, 0.5265768766403198, 0.7515480518341064, 0.9765192270278931, 1.2014904022216797, 1.4264615774154663]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 3.0, 3.0, 4.0, 9.0, 7.0, 5.0, 10.0, 7.0, 21.0, 26.0, 20.0, 28.0, 24.0, 27.0, 25.0, 23.0, 44.0, 41.0, 44.0, 42.0, 52.0, 33.0, 42.0, 50.0, 35.0, 33.0, 33.0, 30.0, 39.0, 32.0, 33.0, 23.0, 27.0, 15.0, 12.0, 18.0, 16.0, 10.0, 12.0, 11.0, 8.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.615898609161377, -1.563563346862793, -1.5112279653549194, -1.4588927030563354, -1.406557321548462, -1.354222059249878, -1.301886796951294, -1.2495514154434204, -1.1972161531448364, -1.1448808908462524, -1.092545509338379, -1.040210247039795, -0.9878749251365662, -0.9355396032333374, -0.8832042813301086, -0.8308689594268799, -0.7785336375236511, -0.7261983156204224, -0.6738629937171936, -0.6215276718139648, -0.5691924095153809, -0.5168570876121521, -0.46452176570892334, -0.41218647360801697, -0.3598511517047882, -0.30751582980155945, -0.2551805377006531, -0.20284521579742432, -0.15050990879535675, -0.09817460179328918, -0.045839279890060425, 0.006496012210845947, 0.05883133411407471, 0.11116664111614227, 0.16350194811820984, 0.2158372700214386, 0.26817256212234497, 0.32050788402557373, 0.3728432059288025, 0.42517849802970886, 0.4775138199329376, 0.529849112033844, 0.5821844339370728, 0.6345197558403015, 0.6868550777435303, 0.7391903400421143, 0.7915257215499878, 0.8438609838485718, 0.8961963057518005, 0.9485316276550293, 1.0008668899536133, 1.0532022714614868, 1.1055375337600708, 1.1578729152679443, 1.2102081775665283, 1.2625434398651123, 1.3148788213729858, 1.3672140836715698, 1.4195494651794434, 1.4718847274780273, 1.5242201089859009, 1.5765553712844849, 1.6288907527923584, 1.6812260150909424, 1.7335612773895264]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 14.0, 29.0, 40.0, 55.0, 112.0, 187.0, 396.0, 951.0, 2821.0, 10947.0, 113384.0, 3317247.0, 714261.0, 26321.0, 4878.0, 1483.0, 552.0, 237.0, 137.0, 72.0, 50.0, 30.0, 20.0, 13.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3671875, -2.29486083984375, -2.2225341796875, -2.15020751953125, -2.077880859375, -2.00555419921875, -1.9332275390625, -1.86090087890625, -1.78857421875, -1.71624755859375, -1.6439208984375, -1.57159423828125, -1.499267578125, -1.42694091796875, -1.3546142578125, -1.28228759765625, -1.2099609375, -1.13763427734375, -1.0653076171875, -0.99298095703125, -0.920654296875, -0.84832763671875, -0.7760009765625, -0.70367431640625, -0.63134765625, -0.55902099609375, -0.4866943359375, -0.41436767578125, -0.342041015625, -0.26971435546875, -0.1973876953125, -0.12506103515625, -0.052734375, 0.01959228515625, 0.0919189453125, 0.16424560546875, 0.236572265625, 0.30889892578125, 0.3812255859375, 0.45355224609375, 0.52587890625, 0.59820556640625, 0.6705322265625, 0.74285888671875, 0.815185546875, 0.88751220703125, 0.9598388671875, 1.03216552734375, 1.1044921875, 1.17681884765625, 1.2491455078125, 1.32147216796875, 1.393798828125, 1.46612548828125, 1.5384521484375, 1.61077880859375, 1.68310546875, 1.75543212890625, 1.8277587890625, 1.90008544921875, 1.972412109375, 2.04473876953125, 2.1170654296875, 2.18939208984375, 2.26171875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 11.0, 12.0, 7.0, 20.0, 12.0, 13.0, 13.0, 20.0, 25.0, 22.0, 26.0, 34.0, 42.0, 38.0, 40.0, 42.0, 38.0, 32.0, 46.0, 35.0, 47.0, 33.0, 32.0, 39.0, 29.0, 32.0, 31.0, 32.0, 32.0, 23.0, 19.0, 15.0, 15.0, 15.0, 13.0, 10.0, 4.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.63037109375, -0.611663818359375, -0.59295654296875, -0.574249267578125, -0.5555419921875, -0.536834716796875, -0.51812744140625, -0.499420166015625, -0.480712890625, -0.462005615234375, -0.44329833984375, -0.424591064453125, -0.4058837890625, -0.387176513671875, -0.36846923828125, -0.349761962890625, -0.3310546875, -0.312347412109375, -0.29364013671875, -0.274932861328125, -0.2562255859375, -0.237518310546875, -0.21881103515625, -0.200103759765625, -0.181396484375, -0.162689208984375, -0.14398193359375, -0.125274658203125, -0.1065673828125, -0.087860107421875, -0.06915283203125, -0.050445556640625, -0.03173828125, -0.013031005859375, 0.00567626953125, 0.024383544921875, 0.0430908203125, 0.061798095703125, 0.08050537109375, 0.099212646484375, 0.117919921875, 0.136627197265625, 0.15533447265625, 0.174041748046875, 0.1927490234375, 0.211456298828125, 0.23016357421875, 0.248870849609375, 0.267578125, 0.286285400390625, 0.30499267578125, 0.323699951171875, 0.3424072265625, 0.361114501953125, 0.37982177734375, 0.398529052734375, 0.417236328125, 0.435943603515625, 0.45465087890625, 0.473358154296875, 0.4920654296875, 0.510772705078125, 0.52947998046875, 0.548187255859375, 0.56689453125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 5.0, 12.0, 22.0, 36.0, 70.0, 110.0, 211.0, 493.0, 1188.0, 6910.0, 310660.0, 3849290.0, 21986.0, 2000.0, 647.0, 267.0, 150.0, 79.0, 51.0, 31.0, 21.0, 12.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03125, -3.916748046875, -3.80224609375, -3.687744140625, -3.5732421875, -3.458740234375, -3.34423828125, -3.229736328125, -3.115234375, -3.000732421875, -2.88623046875, -2.771728515625, -2.6572265625, -2.542724609375, -2.42822265625, -2.313720703125, -2.19921875, -2.084716796875, -1.97021484375, -1.855712890625, -1.7412109375, -1.626708984375, -1.51220703125, -1.397705078125, -1.283203125, -1.168701171875, -1.05419921875, -0.939697265625, -0.8251953125, -0.710693359375, -0.59619140625, -0.481689453125, -0.3671875, -0.252685546875, -0.13818359375, -0.023681640625, 0.0908203125, 0.205322265625, 0.31982421875, 0.434326171875, 0.548828125, 0.663330078125, 0.77783203125, 0.892333984375, 1.0068359375, 1.121337890625, 1.23583984375, 1.350341796875, 1.46484375, 1.579345703125, 1.69384765625, 1.808349609375, 1.9228515625, 2.037353515625, 2.15185546875, 2.266357421875, 2.380859375, 2.495361328125, 2.60986328125, 2.724365234375, 2.8388671875, 2.953369140625, 3.06787109375, 3.182373046875, 3.296875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 20.0, 24.0, 34.0, 53.0, 92.0, 152.0, 337.0, 730.0, 1064.0, 735.0, 390.0, 194.0, 90.0, 60.0, 33.0, 22.0, 6.0, 13.0, 8.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.86962890625, -0.851348876953125, -0.83306884765625, -0.814788818359375, -0.7965087890625, -0.778228759765625, -0.75994873046875, -0.741668701171875, -0.723388671875, -0.705108642578125, -0.68682861328125, -0.668548583984375, -0.6502685546875, -0.631988525390625, -0.61370849609375, -0.595428466796875, -0.5771484375, -0.558868408203125, -0.54058837890625, -0.522308349609375, -0.5040283203125, -0.485748291015625, -0.46746826171875, -0.449188232421875, -0.430908203125, -0.412628173828125, -0.39434814453125, -0.376068115234375, -0.3577880859375, -0.339508056640625, -0.32122802734375, -0.302947998046875, -0.28466796875, -0.266387939453125, -0.24810791015625, -0.229827880859375, -0.2115478515625, -0.193267822265625, -0.17498779296875, -0.156707763671875, -0.138427734375, -0.120147705078125, -0.10186767578125, -0.083587646484375, -0.0653076171875, -0.047027587890625, -0.02874755859375, -0.010467529296875, 0.0078125, 0.026092529296875, 0.04437255859375, 0.062652587890625, 0.0809326171875, 0.099212646484375, 0.11749267578125, 0.135772705078125, 0.154052734375, 0.172332763671875, 0.19061279296875, 0.208892822265625, 0.2271728515625, 0.245452880859375, 0.26373291015625, 0.282012939453125, 0.30029296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 0.0, 5.0, 7.0, 6.0, 12.0, 16.0, 17.0, 19.0, 33.0, 34.0, 48.0, 38.0, 70.0, 78.0, 78.0, 86.0, 81.0, 65.0, 55.0, 60.0, 41.0, 34.0, 36.0, 21.0, 12.0, 13.0, 7.0, 7.0, 4.0, 5.0, 0.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8711289763450623, -0.8354905247688293, -0.7998520731925964, -0.7642136216163635, -0.7285751700401306, -0.6929367184638977, -0.6572983264923096, -0.6216598749160767, -0.5860214233398438, -0.5503829717636108, -0.5147445201873779, -0.479106068611145, -0.4434676170349121, -0.4078291654586792, -0.3721907436847687, -0.33655229210853577, -0.30091381072998047, -0.26527535915374756, -0.22963690757751465, -0.19399847090244293, -0.15836001932621002, -0.12272156774997711, -0.0870831310749054, -0.051444679498672485, -0.015806227922439575, 0.019832219928503036, 0.05547066777944565, 0.09110911190509796, 0.12674756348133087, 0.16238601505756378, 0.1980244517326355, 0.2336629033088684, 0.26930129528045654, 0.30493974685668945, 0.34057819843292236, 0.3762166500091553, 0.4118551015853882, 0.4474935531616211, 0.4831319749355316, 0.5187704563140869, 0.5544089078903198, 0.5900473594665527, 0.6256858110427856, 0.6613242626190186, 0.6969627141952515, 0.7326011657714844, 0.7682396173477173, 0.8038780689239502, 0.8395164608955383, 0.8751549124717712, 0.9107933640480042, 0.9464318156242371, 0.98207026720047, 1.017708659172058, 1.053347110748291, 1.088985562324524, 1.1246240139007568, 1.1602624654769897, 1.1959009170532227, 1.2315393686294556, 1.2671778202056885, 1.3028162717819214, 1.3384547233581543, 1.3740931749343872, 1.4097316265106201]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 4.0, 9.0, 10.0, 9.0, 9.0, 22.0, 11.0, 15.0, 21.0, 21.0, 19.0, 42.0, 41.0, 35.0, 37.0, 38.0, 36.0, 48.0, 41.0, 28.0, 35.0, 32.0, 48.0, 44.0, 32.0, 37.0, 32.0, 29.0, 32.0, 22.0, 23.0, 14.0, 22.0, 16.0, 13.0, 8.0, 16.0, 5.0, 15.0, 6.0, 7.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7382323145866394, -0.7154096364974976, -0.6925870180130005, -0.6697643399238586, -0.6469417214393616, -0.6241190433502197, -0.6012964248657227, -0.5784737467765808, -0.555651068687439, -0.5328283905982971, -0.5100057721138, -0.4871830940246582, -0.46436047554016113, -0.4415377974510193, -0.41871514916419983, -0.39589250087738037, -0.3730698823928833, -0.35024723410606384, -0.3274245858192444, -0.30460190773010254, -0.28177928924560547, -0.2589566111564636, -0.23613396286964417, -0.2133113145828247, -0.19048866629600525, -0.1676660180091858, -0.14484336972236633, -0.12202070653438568, -0.09919805824756622, -0.07637540996074677, -0.05355274677276611, -0.030730098485946655, -0.007907450199127197, 0.01491520181298256, 0.037737853825092316, 0.06056050956249237, 0.08338315784931183, 0.10620580613613129, 0.12902846932411194, 0.1518511176109314, 0.17467376589775085, 0.1974964141845703, 0.22031906247138977, 0.24314172565937042, 0.2659643888473511, 0.28878700733184814, 0.31160968542099, 0.33443233370780945, 0.3572549819946289, 0.38007763028144836, 0.4029002785682678, 0.42572295665740967, 0.44854557514190674, 0.4713682532310486, 0.49419090151786804, 0.5170135498046875, 0.5398361682891846, 0.5626588463783264, 0.5854814648628235, 0.6083041429519653, 0.6311267614364624, 0.6539494395256042, 0.6767721176147461, 0.6995947360992432, 0.722417414188385]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 6.0, 5.0, 12.0, 10.0, 19.0, 20.0, 56.0, 127.0, 280.0, 958.0, 4634.0, 32505.0, 581532.0, 397899.0, 25420.0, 3816.0, 777.0, 229.0, 101.0, 56.0, 29.0, 24.0, 12.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9037094116210938, -0.8674774169921875, -0.8312454223632812, -0.795013427734375, -0.7587814331054688, -0.7225494384765625, -0.6863174438476562, -0.65008544921875, -0.6138534545898438, -0.5776214599609375, -0.5413894653320312, -0.505157470703125, -0.46892547607421875, -0.4326934814453125, -0.39646148681640625, -0.3602294921875, -0.32399749755859375, -0.2877655029296875, -0.25153350830078125, -0.215301513671875, -0.17906951904296875, -0.1428375244140625, -0.10660552978515625, -0.07037353515625, -0.03414154052734375, 0.0020904541015625, 0.03832244873046875, 0.074554443359375, 0.11078643798828125, 0.1470184326171875, 0.18325042724609375, 0.219482421875, 0.25571441650390625, 0.2919464111328125, 0.32817840576171875, 0.364410400390625, 0.40064239501953125, 0.4368743896484375, 0.47310638427734375, 0.50933837890625, 0.5455703735351562, 0.5818023681640625, 0.6180343627929688, 0.654266357421875, 0.6904983520507812, 0.7267303466796875, 0.7629623413085938, 0.7991943359375, 0.8354263305664062, 0.8716583251953125, 0.9078903198242188, 0.944122314453125, 0.9803543090820312, 1.0165863037109375, 1.0528182983398438, 1.08905029296875, 1.1252822875976562, 1.1615142822265625, 1.1977462768554688, 1.233978271484375, 1.2702102661132812, 1.3064422607421875, 1.3426742553710938, 1.37890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 4.0, 4.0, 11.0, 10.0, 17.0, 17.0, 17.0, 22.0, 29.0, 35.0, 44.0, 40.0, 45.0, 44.0, 48.0, 51.0, 59.0, 40.0, 52.0, 48.0, 47.0, 44.0, 33.0, 44.0, 35.0, 30.0, 28.0, 20.0, 12.0, 19.0, 14.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.6418571472167969, -0.6245346069335938, -0.6072120666503906, -0.5898895263671875, -0.5725669860839844, -0.5552444458007812, -0.5379219055175781, -0.520599365234375, -0.5032768249511719, -0.48595428466796875, -0.4686317443847656, -0.4513092041015625, -0.4339866638183594, -0.41666412353515625, -0.3993415832519531, -0.38201904296875, -0.3646965026855469, -0.34737396240234375, -0.3300514221191406, -0.3127288818359375, -0.2954063415527344, -0.27808380126953125, -0.2607612609863281, -0.243438720703125, -0.22611618041992188, -0.20879364013671875, -0.19147109985351562, -0.1741485595703125, -0.15682601928710938, -0.13950347900390625, -0.12218093872070312, -0.1048583984375, -0.08753585815429688, -0.07021331787109375, -0.052890777587890625, -0.0355682373046875, -0.018245697021484375, -0.00092315673828125, 0.016399383544921875, 0.033721923828125, 0.051044464111328125, 0.06836700439453125, 0.08568954467773438, 0.1030120849609375, 0.12033462524414062, 0.13765716552734375, 0.15497970581054688, 0.17230224609375, 0.18962478637695312, 0.20694732666015625, 0.22426986694335938, 0.2415924072265625, 0.2589149475097656, 0.27623748779296875, 0.2935600280761719, 0.310882568359375, 0.3282051086425781, 0.34552764892578125, 0.3628501892089844, 0.3801727294921875, 0.3974952697753906, 0.41481781005859375, 0.4321403503417969, 0.449462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 13.0, 16.0, 34.0, 47.0, 75.0, 136.0, 221.0, 409.0, 842.0, 1881.0, 4794.0, 14630.0, 55447.0, 286749.0, 541152.0, 104594.0, 24911.0, 7610.0, 2677.0, 1138.0, 485.0, 255.0, 158.0, 82.0, 65.0, 30.0, 18.0, 20.0, 13.0, 4.0, 5.0, 4.0, 1.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.455078125, -0.440948486328125, -0.42681884765625, -0.412689208984375, -0.3985595703125, -0.384429931640625, -0.37030029296875, -0.356170654296875, -0.342041015625, -0.327911376953125, -0.31378173828125, -0.299652099609375, -0.2855224609375, -0.271392822265625, -0.25726318359375, -0.243133544921875, -0.22900390625, -0.214874267578125, -0.20074462890625, -0.186614990234375, -0.1724853515625, -0.158355712890625, -0.14422607421875, -0.130096435546875, -0.115966796875, -0.101837158203125, -0.08770751953125, -0.073577880859375, -0.0594482421875, -0.045318603515625, -0.03118896484375, -0.017059326171875, -0.0029296875, 0.011199951171875, 0.02532958984375, 0.039459228515625, 0.0535888671875, 0.067718505859375, 0.08184814453125, 0.095977783203125, 0.110107421875, 0.124237060546875, 0.13836669921875, 0.152496337890625, 0.1666259765625, 0.180755615234375, 0.19488525390625, 0.209014892578125, 0.22314453125, 0.237274169921875, 0.25140380859375, 0.265533447265625, 0.2796630859375, 0.293792724609375, 0.30792236328125, 0.322052001953125, 0.336181640625, 0.350311279296875, 0.36444091796875, 0.378570556640625, 0.3927001953125, 0.406829833984375, 0.42095947265625, 0.435089111328125, 0.44921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 3.0, 7.0, 5.0, 6.0, 7.0, 17.0, 17.0, 16.0, 28.0, 25.0, 30.0, 27.0, 26.0, 37.0, 29.0, 51.0, 40.0, 59.0, 44.0, 44.0, 52.0, 42.0, 36.0, 31.0, 40.0, 30.0, 25.0, 30.0, 28.0, 28.0, 26.0, 20.0, 20.0, 14.0, 8.0, 2.0, 9.0, 4.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.859375, -0.8329086303710938, -0.8064422607421875, -0.7799758911132812, -0.753509521484375, -0.7270431518554688, -0.7005767822265625, -0.6741104125976562, -0.64764404296875, -0.6211776733398438, -0.5947113037109375, -0.5682449340820312, -0.541778564453125, -0.5153121948242188, -0.4888458251953125, -0.46237945556640625, -0.4359130859375, -0.40944671630859375, -0.3829803466796875, -0.35651397705078125, -0.330047607421875, -0.30358123779296875, -0.2771148681640625, -0.25064849853515625, -0.22418212890625, -0.19771575927734375, -0.1712493896484375, -0.14478302001953125, -0.118316650390625, -0.09185028076171875, -0.0653839111328125, -0.03891754150390625, -0.012451171875, 0.01401519775390625, 0.0404815673828125, 0.06694793701171875, 0.093414306640625, 0.11988067626953125, 0.1463470458984375, 0.17281341552734375, 0.19927978515625, 0.22574615478515625, 0.2522125244140625, 0.27867889404296875, 0.305145263671875, 0.33161163330078125, 0.3580780029296875, 0.38454437255859375, 0.4110107421875, 0.43747711181640625, 0.4639434814453125, 0.49040985107421875, 0.516876220703125, 0.5433425903320312, 0.5698089599609375, 0.5962753295898438, 0.62274169921875, 0.6492080688476562, 0.6756744384765625, 0.7021408081054688, 0.728607177734375, 0.7550735473632812, 0.7815399169921875, 0.8080062866210938, 0.83447265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 7.0, 17.0, 15.0, 16.0, 41.0, 51.0, 77.0, 102.0, 184.0, 261.0, 388.0, 667.0, 1119.0, 2065.0, 3603.0, 6946.0, 14770.0, 36817.0, 114854.0, 452186.0, 289717.0, 74776.0, 26237.0, 11142.0, 5548.0, 2885.0, 1543.0, 952.0, 557.0, 334.0, 231.0, 152.0, 100.0, 45.0, 40.0, 30.0, 27.0, 7.0, 17.0, 7.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.126953125, -0.12340927124023438, -0.11986541748046875, -0.11632156372070312, -0.1127777099609375, -0.10923385620117188, -0.10569000244140625, -0.10214614868164062, -0.098602294921875, -0.09505844116210938, -0.09151458740234375, -0.08797073364257812, -0.0844268798828125, -0.08088302612304688, -0.07733917236328125, -0.07379531860351562, -0.07025146484375, -0.06670761108398438, -0.06316375732421875, -0.059619903564453125, -0.0560760498046875, -0.052532196044921875, -0.04898834228515625, -0.045444488525390625, -0.041900634765625, -0.038356781005859375, -0.03481292724609375, -0.031269073486328125, -0.0277252197265625, -0.024181365966796875, -0.02063751220703125, -0.017093658447265625, -0.0135498046875, -0.010005950927734375, -0.00646209716796875, -0.002918243408203125, 0.0006256103515625, 0.004169464111328125, 0.00771331787109375, 0.011257171630859375, 0.014801025390625, 0.018344879150390625, 0.02188873291015625, 0.025432586669921875, 0.0289764404296875, 0.032520294189453125, 0.03606414794921875, 0.039608001708984375, 0.04315185546875, 0.046695709228515625, 0.05023956298828125, 0.053783416748046875, 0.0573272705078125, 0.060871124267578125, 0.06441497802734375, 0.06795883178710938, 0.071502685546875, 0.07504653930664062, 0.07859039306640625, 0.08213424682617188, 0.0856781005859375, 0.08922195434570312, 0.09276580810546875, 0.09630966186523438, 0.099853515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 18.0, 17.0, 22.0, 36.0, 40.0, 71.0, 102.0, 173.0, 174.0, 127.0, 63.0, 49.0, 33.0, 21.0, 14.0, 3.0, 9.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00014328956604003906, -0.000139712356030941, -0.00013613514602184296, -0.0001325579360127449, -0.00012898072600364685, -0.0001254035159945488, -0.00012182630598545074, -0.00011824909597635269, -0.00011467188596725464, -0.00011109467595815659, -0.00010751746594905853, -0.00010394025593996048, -0.00010036304593086243, -9.678583592176437e-05, -9.320862591266632e-05, -8.963141590356827e-05, -8.605420589447021e-05, -8.247699588537216e-05, -7.889978587627411e-05, -7.532257586717606e-05, -7.1745365858078e-05, -6.816815584897995e-05, -6.45909458398819e-05, -6.1013735830783844e-05, -5.743652582168579e-05, -5.385931581258774e-05, -5.0282105803489685e-05, -4.670489579439163e-05, -4.312768578529358e-05, -3.9550475776195526e-05, -3.597326576709747e-05, -3.239605575799942e-05, -2.8818845748901367e-05, -2.5241635739803314e-05, -2.166442573070526e-05, -1.8087215721607208e-05, -1.4510005712509155e-05, -1.0932795703411102e-05, -7.355585694313049e-06, -3.7783756852149963e-06, -2.0116567611694336e-07, 3.3760443329811096e-06, 6.953254342079163e-06, 1.0530464351177216e-05, 1.4107674360275269e-05, 1.768488436937332e-05, 2.1262094378471375e-05, 2.4839304387569427e-05, 2.841651439666748e-05, 3.1993724405765533e-05, 3.5570934414863586e-05, 3.914814442396164e-05, 4.272535443305969e-05, 4.6302564442157745e-05, 4.98797744512558e-05, 5.345698446035385e-05, 5.7034194469451904e-05, 6.061140447854996e-05, 6.418861448764801e-05, 6.776582449674606e-05, 7.134303450584412e-05, 7.492024451494217e-05, 7.849745452404022e-05, 8.207466453313828e-05, 8.565187454223633e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 5.0, 7.0, 14.0, 12.0, 13.0, 26.0, 29.0, 45.0, 107.0, 129.0, 197.0, 276.0, 465.0, 804.0, 1481.0, 2744.0, 5815.0, 13087.0, 36983.0, 132717.0, 504480.0, 252324.0, 60480.0, 20028.0, 8107.0, 3734.0, 1856.0, 1033.0, 571.0, 314.0, 214.0, 141.0, 97.0, 51.0, 51.0, 29.0, 22.0, 16.0, 11.0, 7.0, 5.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11981201171875, -0.11591053009033203, -0.11200904846191406, -0.1081075668334961, -0.10420608520507812, -0.10030460357666016, -0.09640312194824219, -0.09250164031982422, -0.08860015869140625, -0.08469867706298828, -0.08079719543457031, -0.07689571380615234, -0.07299423217773438, -0.0690927505493164, -0.06519126892089844, -0.06128978729248047, -0.0573883056640625, -0.05348682403564453, -0.04958534240722656, -0.045683860778808594, -0.041782379150390625, -0.037880897521972656, -0.03397941589355469, -0.03007793426513672, -0.02617645263671875, -0.02227497100830078, -0.018373489379882812, -0.014472007751464844, -0.010570526123046875, -0.006669044494628906, -0.0027675628662109375, 0.0011339187622070312, 0.005035400390625, 0.008936882019042969, 0.012838363647460938, 0.016739845275878906, 0.020641326904296875, 0.024542808532714844, 0.028444290161132812, 0.03234577178955078, 0.03624725341796875, 0.04014873504638672, 0.04405021667480469, 0.047951698303222656, 0.051853179931640625, 0.055754661560058594, 0.05965614318847656, 0.06355762481689453, 0.0674591064453125, 0.07136058807373047, 0.07526206970214844, 0.0791635513305664, 0.08306503295898438, 0.08696651458740234, 0.09086799621582031, 0.09476947784423828, 0.09867095947265625, 0.10257244110107422, 0.10647392272949219, 0.11037540435791016, 0.11427688598632812, 0.1181783676147461, 0.12207984924316406, 0.12598133087158203, 0.1298828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 6.0, 5.0, 3.0, 11.0, 7.0, 15.0, 17.0, 24.0, 24.0, 48.0, 28.0, 39.0, 65.0, 78.0, 109.0, 101.0, 77.0, 75.0, 50.0, 40.0, 27.0, 29.0, 17.0, 19.0, 22.0, 14.0, 8.0, 7.0, 9.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.034271240234375, -0.03326010704040527, -0.03224897384643555, -0.03123784065246582, -0.030226707458496094, -0.029215574264526367, -0.02820444107055664, -0.027193307876586914, -0.026182174682617188, -0.02517104148864746, -0.024159908294677734, -0.023148775100708008, -0.02213764190673828, -0.021126508712768555, -0.020115375518798828, -0.0191042423248291, -0.018093109130859375, -0.01708197593688965, -0.016070842742919922, -0.015059709548950195, -0.014048576354980469, -0.013037443161010742, -0.012026309967041016, -0.011015176773071289, -0.010004043579101562, -0.008992910385131836, -0.00798177719116211, -0.006970643997192383, -0.005959510803222656, -0.00494837760925293, -0.003937244415283203, -0.0029261112213134766, -0.00191497802734375, -0.0009038448333740234, 0.00010728836059570312, 0.0011184215545654297, 0.0021295547485351562, 0.003140687942504883, 0.004151821136474609, 0.005162954330444336, 0.0061740875244140625, 0.007185220718383789, 0.008196353912353516, 0.009207487106323242, 0.010218620300292969, 0.011229753494262695, 0.012240886688232422, 0.013252019882202148, 0.014263153076171875, 0.015274286270141602, 0.016285419464111328, 0.017296552658081055, 0.01830768585205078, 0.019318819046020508, 0.020329952239990234, 0.02134108543395996, 0.022352218627929688, 0.023363351821899414, 0.02437448501586914, 0.025385618209838867, 0.026396751403808594, 0.02740788459777832, 0.028419017791748047, 0.029430150985717773, 0.0304412841796875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 3.0, 5.0, 6.0, 10.0, 7.0, 11.0, 25.0, 34.0, 45.0, 54.0, 84.0, 88.0, 128.0, 106.0, 97.0, 74.0, 46.0, 57.0, 31.0, 29.0, 19.0, 7.0, 8.0, 8.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6634179949760437, -0.6369640827178955, -0.6105102300643921, -0.5840563774108887, -0.5576024651527405, -0.5311485528945923, -0.5046947002410889, -0.47824081778526306, -0.45178693532943726, -0.42533305287361145, -0.39887917041778564, -0.37242528796195984, -0.34597140550613403, -0.3195175230503082, -0.2930636405944824, -0.2666097581386566, -0.2401558756828308, -0.213701993227005, -0.1872481107711792, -0.1607942283153534, -0.1343403458595276, -0.10788646340370178, -0.08143258094787598, -0.05497869849205017, -0.028524816036224365, -0.0020709335803985596, 0.024382948875427246, 0.05083683133125305, 0.07729071378707886, 0.10374459624290466, 0.13019847869873047, 0.15665236115455627, 0.1831061840057373, 0.2095600664615631, 0.23601394891738892, 0.2624678313732147, 0.2889217138290405, 0.31537559628486633, 0.34182947874069214, 0.36828336119651794, 0.39473724365234375, 0.42119112610816956, 0.44764500856399536, 0.47409889101982117, 0.500552773475647, 0.5270066261291504, 0.5534605383872986, 0.5799144506454468, 0.6063683032989502, 0.6328221559524536, 0.6592760682106018, 0.68572998046875, 0.7121838331222534, 0.7386376857757568, 0.765091598033905, 0.7915455102920532, 0.8179993629455566, 0.8444532155990601, 0.8709071278572083, 0.8973610401153564, 0.9238148927688599, 0.9502687454223633, 0.9767226576805115, 1.0031765699386597, 1.029630422592163]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 8.0, 0.0, 2.0, 8.0, 4.0, 3.0, 4.0, 5.0, 13.0, 16.0, 11.0, 22.0, 19.0, 15.0, 20.0, 34.0, 34.0, 37.0, 42.0, 46.0, 45.0, 39.0, 44.0, 31.0, 33.0, 44.0, 42.0, 46.0, 33.0, 42.0, 33.0, 43.0, 25.0, 24.0, 13.0, 18.0, 21.0, 12.0, 17.0, 16.0, 8.0, 7.0, 12.0, 3.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.44668665528297424, -0.4328303337097168, -0.41897398233413696, -0.4051176607608795, -0.3912613093852997, -0.37740498781204224, -0.3635486364364624, -0.34969231486320496, -0.3358359932899475, -0.32197967171669006, -0.30812332034111023, -0.2942669987678528, -0.28041064739227295, -0.2665543258190155, -0.25269800424575806, -0.23884165287017822, -0.2249853014945984, -0.21112896502017975, -0.1972726285457611, -0.18341630697250366, -0.16955995559692383, -0.15570363402366638, -0.14184729754924774, -0.1279909610748291, -0.11413462460041046, -0.10027828812599182, -0.08642195165157318, -0.07256562262773514, -0.0587092861533165, -0.04485294967889786, -0.030996620655059814, -0.017140284180641174, -0.003283977508544922, 0.010572357103228569, 0.02442869171500206, 0.0382850244641304, 0.05214136093854904, 0.06599769741296768, 0.07985402643680573, 0.09371036291122437, 0.107566699385643, 0.12142303586006165, 0.13527937233448029, 0.14913570880889893, 0.16299203038215637, 0.1768483817577362, 0.19070470333099365, 0.2045610398054123, 0.21841737627983093, 0.23227371275424957, 0.2461300492286682, 0.25998637080192566, 0.2738427221775055, 0.28769904375076294, 0.3015553951263428, 0.3154117166996002, 0.32926803827285767, 0.3431243598461151, 0.35698071122169495, 0.3708370327949524, 0.3846933841705322, 0.3985497057437897, 0.4124060273170471, 0.42626237869262695, 0.4401187300682068]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 5.0, 14.0, 20.0, 32.0, 51.0, 73.0, 136.0, 232.0, 379.0, 585.0, 959.0, 1703.0, 2927.0, 5351.0, 10019.0, 22852.0, 63509.0, 244172.0, 497001.0, 127170.0, 38603.0, 15697.0, 7459.0, 4047.0, 2236.0, 1242.0, 823.0, 467.0, 306.0, 169.0, 110.0, 64.0, 56.0, 22.0, 22.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.481201171875, -0.467559814453125, -0.45391845703125, -0.440277099609375, -0.4266357421875, -0.412994384765625, -0.39935302734375, -0.385711669921875, -0.3720703125, -0.358428955078125, -0.34478759765625, -0.331146240234375, -0.3175048828125, -0.303863525390625, -0.29022216796875, -0.276580810546875, -0.262939453125, -0.249298095703125, -0.23565673828125, -0.222015380859375, -0.2083740234375, -0.194732666015625, -0.18109130859375, -0.167449951171875, -0.15380859375, -0.140167236328125, -0.12652587890625, -0.112884521484375, -0.0992431640625, -0.085601806640625, -0.07196044921875, -0.058319091796875, -0.044677734375, -0.031036376953125, -0.01739501953125, -0.003753662109375, 0.0098876953125, 0.023529052734375, 0.03717041015625, 0.050811767578125, 0.064453125, 0.078094482421875, 0.09173583984375, 0.105377197265625, 0.1190185546875, 0.132659912109375, 0.14630126953125, 0.159942626953125, 0.173583984375, 0.187225341796875, 0.20086669921875, 0.214508056640625, 0.2281494140625, 0.241790771484375, 0.25543212890625, 0.269073486328125, 0.28271484375, 0.296356201171875, 0.30999755859375, 0.323638916015625, 0.3372802734375, 0.350921630859375, 0.36456298828125, 0.378204345703125, 0.391845703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 2.0, 8.0, 5.0, 10.0, 10.0, 15.0, 9.0, 15.0, 25.0, 18.0, 25.0, 32.0, 34.0, 35.0, 46.0, 46.0, 36.0, 46.0, 43.0, 39.0, 34.0, 41.0, 41.0, 47.0, 44.0, 27.0, 39.0, 26.0, 27.0, 23.0, 24.0, 25.0, 10.0, 16.0, 6.0, 14.0, 13.0, 5.0, 11.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.90771484375, -0.8792877197265625, -0.850860595703125, -0.8224334716796875, -0.79400634765625, -0.7655792236328125, -0.737152099609375, -0.7087249755859375, -0.6802978515625, -0.6518707275390625, -0.623443603515625, -0.5950164794921875, -0.56658935546875, -0.5381622314453125, -0.509735107421875, -0.4813079833984375, -0.452880859375, -0.4244537353515625, -0.396026611328125, -0.3675994873046875, -0.33917236328125, -0.3107452392578125, -0.282318115234375, -0.2538909912109375, -0.2254638671875, -0.1970367431640625, -0.168609619140625, -0.1401824951171875, -0.11175537109375, -0.0833282470703125, -0.054901123046875, -0.0264739990234375, 0.001953125, 0.0303802490234375, 0.058807373046875, 0.0872344970703125, 0.11566162109375, 0.1440887451171875, 0.172515869140625, 0.2009429931640625, 0.2293701171875, 0.2577972412109375, 0.286224365234375, 0.3146514892578125, 0.34307861328125, 0.3715057373046875, 0.399932861328125, 0.4283599853515625, 0.456787109375, 0.4852142333984375, 0.513641357421875, 0.5420684814453125, 0.57049560546875, 0.5989227294921875, 0.627349853515625, 0.6557769775390625, 0.6842041015625, 0.7126312255859375, 0.741058349609375, 0.7694854736328125, 0.79791259765625, 0.8263397216796875, 0.854766845703125, 0.8831939697265625, 0.91162109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 8.0, 7.0, 8.0, 6.0, 5.0, 12.0, 8.0, 11.0, 20.0, 19.0, 21.0, 22.0, 36.0, 24.0, 46.0, 44.0, 69.0, 78.0, 173.0, 1302.0, 939931.0, 105444.0, 685.0, 168.0, 90.0, 47.0, 36.0, 31.0, 35.0, 22.0, 17.0, 33.0, 18.0, 18.0, 8.0, 18.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.498046875, -3.372589111328125, -3.24713134765625, -3.121673583984375, -2.9962158203125, -2.870758056640625, -2.74530029296875, -2.619842529296875, -2.494384765625, -2.368927001953125, -2.24346923828125, -2.118011474609375, -1.9925537109375, -1.867095947265625, -1.74163818359375, -1.616180419921875, -1.49072265625, -1.365264892578125, -1.23980712890625, -1.114349365234375, -0.9888916015625, -0.863433837890625, -0.73797607421875, -0.612518310546875, -0.487060546875, -0.361602783203125, -0.23614501953125, -0.110687255859375, 0.0147705078125, 0.140228271484375, 0.26568603515625, 0.391143798828125, 0.5166015625, 0.642059326171875, 0.76751708984375, 0.892974853515625, 1.0184326171875, 1.143890380859375, 1.26934814453125, 1.394805908203125, 1.520263671875, 1.645721435546875, 1.77117919921875, 1.896636962890625, 2.0220947265625, 2.147552490234375, 2.27301025390625, 2.398468017578125, 2.52392578125, 2.649383544921875, 2.77484130859375, 2.900299072265625, 3.0257568359375, 3.151214599609375, 3.27667236328125, 3.402130126953125, 3.527587890625, 3.653045654296875, 3.77850341796875, 3.903961181640625, 4.0294189453125, 4.154876708984375, 4.28033447265625, 4.405792236328125, 4.53125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 6.0, 5.0, 8.0, 7.0, 10.0, 14.0, 22.0, 17.0, 33.0, 19.0, 25.0, 45.0, 36.0, 36.0, 46.0, 45.0, 45.0, 63.0, 34.0, 49.0, 53.0, 36.0, 52.0, 34.0, 35.0, 35.0, 24.0, 26.0, 27.0, 19.0, 20.0, 15.0, 12.0, 16.0, 2.0, 8.0, 3.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97216796875, -0.9379806518554688, -0.9037933349609375, -0.8696060180664062, -0.835418701171875, -0.8012313842773438, -0.7670440673828125, -0.7328567504882812, -0.69866943359375, -0.6644821166992188, -0.6302947998046875, -0.5961074829101562, -0.561920166015625, -0.5277328491210938, -0.4935455322265625, -0.45935821533203125, -0.4251708984375, -0.39098358154296875, -0.3567962646484375, -0.32260894775390625, -0.288421630859375, -0.25423431396484375, -0.2200469970703125, -0.18585968017578125, -0.15167236328125, -0.11748504638671875, -0.0832977294921875, -0.04911041259765625, -0.014923095703125, 0.01926422119140625, 0.0534515380859375, 0.08763885498046875, 0.121826171875, 0.15601348876953125, 0.1902008056640625, 0.22438812255859375, 0.258575439453125, 0.29276275634765625, 0.3269500732421875, 0.36113739013671875, 0.39532470703125, 0.42951202392578125, 0.4636993408203125, 0.49788665771484375, 0.532073974609375, 0.5662612915039062, 0.6004486083984375, 0.6346359252929688, 0.6688232421875, 0.7030105590820312, 0.7371978759765625, 0.7713851928710938, 0.805572509765625, 0.8397598266601562, 0.8739471435546875, 0.9081344604492188, 0.94232177734375, 0.9765090942382812, 1.0106964111328125, 1.0448837280273438, 1.079071044921875, 1.1132583618164062, 1.1474456787109375, 1.1816329956054688, 1.2158203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 1.0, 8.0, 3.0, 17.0, 11.0, 18.0, 15.0, 27.0, 50.0, 80.0, 124.0, 243.0, 641.0, 1988.0, 7806.0, 60748.0, 913001.0, 53346.0, 7261.0, 1875.0, 665.0, 261.0, 140.0, 71.0, 51.0, 40.0, 23.0, 11.0, 11.0, 2.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.413909912109375, -0.40032958984375, -0.386749267578125, -0.3731689453125, -0.359588623046875, -0.34600830078125, -0.332427978515625, -0.31884765625, -0.305267333984375, -0.29168701171875, -0.278106689453125, -0.2645263671875, -0.250946044921875, -0.23736572265625, -0.223785400390625, -0.210205078125, -0.196624755859375, -0.18304443359375, -0.169464111328125, -0.1558837890625, -0.142303466796875, -0.12872314453125, -0.115142822265625, -0.1015625, -0.087982177734375, -0.07440185546875, -0.060821533203125, -0.0472412109375, -0.033660888671875, -0.02008056640625, -0.006500244140625, 0.007080078125, 0.020660400390625, 0.03424072265625, 0.047821044921875, 0.0614013671875, 0.074981689453125, 0.08856201171875, 0.102142333984375, 0.11572265625, 0.129302978515625, 0.14288330078125, 0.156463623046875, 0.1700439453125, 0.183624267578125, 0.19720458984375, 0.210784912109375, 0.224365234375, 0.237945556640625, 0.25152587890625, 0.265106201171875, 0.2786865234375, 0.292266845703125, 0.30584716796875, 0.319427490234375, 0.3330078125, 0.346588134765625, 0.36016845703125, 0.373748779296875, 0.3873291015625, 0.400909423828125, 0.41448974609375, 0.428070068359375, 0.441650390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 15.0, 24.0, 59.0, 127.0, 317.0, 257.0, 91.0, 46.0, 21.0, 15.0, 4.0, 4.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.630752563476562e-05, -8.351728320121765e-05, -8.072704076766968e-05, -7.79367983341217e-05, -7.514655590057373e-05, -7.235631346702576e-05, -6.956607103347778e-05, -6.677582859992981e-05, -6.398558616638184e-05, -6.119534373283386e-05, -5.840510129928589e-05, -5.5614858865737915e-05, -5.282461643218994e-05, -5.003437399864197e-05, -4.7244131565093994e-05, -4.445388913154602e-05, -4.166364669799805e-05, -3.887340426445007e-05, -3.60831618309021e-05, -3.3292919397354126e-05, -3.0502676963806152e-05, -2.771243453025818e-05, -2.4922192096710205e-05, -2.213194966316223e-05, -1.9341707229614258e-05, -1.6551464796066284e-05, -1.376122236251831e-05, -1.0970979928970337e-05, -8.180737495422363e-06, -5.39049506187439e-06, -2.600252628326416e-06, 1.8998980522155762e-07, 2.9802322387695312e-06, 5.770474672317505e-06, 8.560717105865479e-06, 1.1350959539413452e-05, 1.4141201972961426e-05, 1.69314444065094e-05, 1.9721686840057373e-05, 2.2511929273605347e-05, 2.530217170715332e-05, 2.8092414140701294e-05, 3.088265657424927e-05, 3.367289900779724e-05, 3.6463141441345215e-05, 3.925338387489319e-05, 4.204362630844116e-05, 4.4833868741989136e-05, 4.762411117553711e-05, 5.041435360908508e-05, 5.320459604263306e-05, 5.599483847618103e-05, 5.8785080909729004e-05, 6.157532334327698e-05, 6.436556577682495e-05, 6.715580821037292e-05, 6.99460506439209e-05, 7.273629307746887e-05, 7.552653551101685e-05, 7.831677794456482e-05, 8.110702037811279e-05, 8.389726281166077e-05, 8.668750524520874e-05, 8.947774767875671e-05, 9.226799011230469e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 8.0, 8.0, 10.0, 8.0, 14.0, 22.0, 33.0, 50.0, 68.0, 111.0, 161.0, 306.0, 576.0, 1159.0, 2814.0, 7783.0, 30585.0, 331918.0, 612925.0, 43886.0, 9894.0, 3313.0, 1362.0, 674.0, 353.0, 169.0, 115.0, 77.0, 37.0, 26.0, 13.0, 16.0, 18.0, 10.0, 9.0, 4.0, 7.0, 3.0, 0.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.286865234375, -0.2781982421875, -0.26953125, -0.2608642578125, -0.252197265625, -0.2435302734375, -0.23486328125, -0.2261962890625, -0.217529296875, -0.2088623046875, -0.2001953125, -0.1915283203125, -0.182861328125, -0.1741943359375, -0.16552734375, -0.1568603515625, -0.148193359375, -0.1395263671875, -0.130859375, -0.1221923828125, -0.113525390625, -0.1048583984375, -0.09619140625, -0.0875244140625, -0.078857421875, -0.0701904296875, -0.0615234375, -0.0528564453125, -0.044189453125, -0.0355224609375, -0.02685546875, -0.0181884765625, -0.009521484375, -0.0008544921875, 0.0078125, 0.0164794921875, 0.025146484375, 0.0338134765625, 0.04248046875, 0.0511474609375, 0.059814453125, 0.0684814453125, 0.0771484375, 0.0858154296875, 0.094482421875, 0.1031494140625, 0.11181640625, 0.1204833984375, 0.129150390625, 0.1378173828125, 0.146484375, 0.1551513671875, 0.163818359375, 0.1724853515625, 0.18115234375, 0.1898193359375, 0.198486328125, 0.2071533203125, 0.2158203125, 0.2244873046875, 0.233154296875, 0.2418212890625, 0.25048828125, 0.2591552734375, 0.267822265625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 10.0, 23.0, 32.0, 31.0, 40.0, 73.0, 98.0, 123.0, 163.0, 82.0, 92.0, 63.0, 34.0, 32.0, 21.0, 16.0, 8.0, 10.0, 5.0, 8.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.095489501953125, -0.09210205078125, -0.088714599609375, -0.0853271484375, -0.081939697265625, -0.07855224609375, -0.075164794921875, -0.07177734375, -0.068389892578125, -0.06500244140625, -0.061614990234375, -0.0582275390625, -0.054840087890625, -0.05145263671875, -0.048065185546875, -0.044677734375, -0.041290283203125, -0.03790283203125, -0.034515380859375, -0.0311279296875, -0.027740478515625, -0.02435302734375, -0.020965576171875, -0.017578125, -0.014190673828125, -0.01080322265625, -0.007415771484375, -0.0040283203125, -0.000640869140625, 0.00274658203125, 0.006134033203125, 0.009521484375, 0.012908935546875, 0.01629638671875, 0.019683837890625, 0.0230712890625, 0.026458740234375, 0.02984619140625, 0.033233642578125, 0.03662109375, 0.040008544921875, 0.04339599609375, 0.046783447265625, 0.0501708984375, 0.053558349609375, 0.05694580078125, 0.060333251953125, 0.063720703125, 0.067108154296875, 0.07049560546875, 0.073883056640625, 0.0772705078125, 0.080657958984375, 0.08404541015625, 0.087432861328125, 0.0908203125, 0.094207763671875, 0.09759521484375, 0.100982666015625, 0.1043701171875, 0.107757568359375, 0.11114501953125, 0.114532470703125, 0.117919921875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 17.0, 48.0, 215.0, 389.0, 248.0, 64.0, 24.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.843777656555176, -10.641592979431152, -10.439409255981445, -10.237224578857422, -10.035040855407715, -9.832856178283691, -9.630672454833984, -9.428487777709961, -9.226303100585938, -9.024118423461914, -8.821934700012207, -8.619750022888184, -8.417566299438477, -8.215381622314453, -8.01319694519043, -7.811013221740723, -7.608829021453857, -7.406644821166992, -7.204460620880127, -7.002276420593262, -6.800091743469238, -6.597907543182373, -6.395723342895508, -6.193539142608643, -5.991354942321777, -5.789170742034912, -5.586986541748047, -5.384801864624023, -5.182617664337158, -4.980433464050293, -4.778249263763428, -4.5760650634765625, -4.373880386352539, -4.171696186065674, -3.9695117473602295, -3.7673275470733643, -3.56514310836792, -3.3629589080810547, -3.1607747077941895, -2.958590507507324, -2.75640606880188, -2.5542218685150146, -2.3520374298095703, -2.149853229522705, -1.9476689100265503, -1.7454845905303955, -1.5433003902435303, -1.3411160707473755, -1.1389317512512207, -0.9367474317550659, -0.7345631718635559, -0.5323789119720459, -0.3301945924758911, -0.12801027297973633, 0.0741739273071289, 0.2763582468032837, 0.4785425662994385, 0.6807268857955933, 0.8829111456871033, 1.0850954055786133, 1.287279725074768, 1.4894640445709229, 1.691648244857788, 1.8938325643539429, 2.0960168838500977]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 6.0, 5.0, 4.0, 16.0, 13.0, 16.0, 22.0, 25.0, 27.0, 33.0, 24.0, 38.0, 33.0, 40.0, 49.0, 43.0, 47.0, 53.0, 59.0, 63.0, 44.0, 40.0, 33.0, 38.0, 41.0, 26.0, 23.0, 22.0, 20.0, 26.0, 20.0, 13.0, 9.0, 9.0, 9.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4426016807556152, -1.3922669887542725, -1.3419322967529297, -1.291597604751587, -1.2412629127502441, -1.1909282207489014, -1.1405935287475586, -1.0902589559555054, -1.0399242639541626, -0.9895895719528198, -0.939254879951477, -0.8889201879501343, -0.8385855555534363, -0.7882508635520935, -0.7379161715507507, -0.6875815391540527, -0.6372467875480652, -0.5869120955467224, -0.5365774035453796, -0.48624274134635925, -0.43590807914733887, -0.3855733871459961, -0.3352386951446533, -0.28490403294563293, -0.23456934094429016, -0.18423466384410858, -0.133899986743927, -0.08356529474258423, -0.03323061764240265, 0.01710405945777893, 0.0674387514591217, 0.11777341365814209, 0.16810810565948486, 0.21844278275966644, 0.268777459859848, 0.3191121518611908, 0.3694468140602112, 0.41978150606155396, 0.47011619806289673, 0.5204508304595947, 0.5707855224609375, 0.6211202144622803, 0.671454906463623, 0.7217895984649658, 0.7721242308616638, 0.8224589228630066, 0.8727936148643494, 0.9231282472610474, 0.9734629988670349, 1.023797631263733, 1.0741323232650757, 1.1244670152664185, 1.1748017072677612, 1.225136399269104, 1.2754710912704468, 1.3258057832717896, 1.3761404752731323, 1.426475167274475, 1.4768098592758179, 1.5271445512771606, 1.5774792432785034, 1.6278138160705566, 1.6781485080718994, 1.7284832000732422, 1.778817892074585]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 12.0, 12.0, 24.0, 23.0, 27.0, 55.0, 89.0, 164.0, 242.0, 451.0, 816.0, 1678.0, 3528.0, 8466.0, 31964.0, 300981.0, 2776570.0, 973328.0, 72665.0, 13679.0, 4932.0, 2125.0, 1089.0, 559.0, 323.0, 180.0, 107.0, 48.0, 50.0, 35.0, 21.0, 6.0, 5.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.26409912109375, -1.2254638671875, -1.18682861328125, -1.148193359375, -1.10955810546875, -1.0709228515625, -1.03228759765625, -0.99365234375, -0.95501708984375, -0.9163818359375, -0.87774658203125, -0.839111328125, -0.80047607421875, -0.7618408203125, -0.72320556640625, -0.6845703125, -0.64593505859375, -0.6072998046875, -0.56866455078125, -0.530029296875, -0.49139404296875, -0.4527587890625, -0.41412353515625, -0.37548828125, -0.33685302734375, -0.2982177734375, -0.25958251953125, -0.220947265625, -0.18231201171875, -0.1436767578125, -0.10504150390625, -0.06640625, -0.02777099609375, 0.0108642578125, 0.04949951171875, 0.088134765625, 0.12677001953125, 0.1654052734375, 0.20404052734375, 0.24267578125, 0.28131103515625, 0.3199462890625, 0.35858154296875, 0.397216796875, 0.43585205078125, 0.4744873046875, 0.51312255859375, 0.5517578125, 0.59039306640625, 0.6290283203125, 0.66766357421875, 0.706298828125, 0.74493408203125, 0.7835693359375, 0.82220458984375, 0.86083984375, 0.89947509765625, 0.9381103515625, 0.97674560546875, 1.015380859375, 1.05401611328125, 1.0926513671875, 1.13128662109375, 1.169921875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 10.0, 11.0, 13.0, 12.0, 27.0, 24.0, 32.0, 34.0, 36.0, 48.0, 40.0, 53.0, 47.0, 48.0, 50.0, 63.0, 35.0, 44.0, 42.0, 58.0, 44.0, 37.0, 25.0, 25.0, 29.0, 17.0, 26.0, 8.0, 6.0, 11.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7255859375, -0.7041854858398438, -0.6827850341796875, -0.6613845825195312, -0.639984130859375, -0.6185836791992188, -0.5971832275390625, -0.5757827758789062, -0.55438232421875, -0.5329818725585938, -0.5115814208984375, -0.49018096923828125, -0.468780517578125, -0.44738006591796875, -0.4259796142578125, -0.40457916259765625, -0.3831787109375, -0.36177825927734375, -0.3403778076171875, -0.31897735595703125, -0.297576904296875, -0.27617645263671875, -0.2547760009765625, -0.23337554931640625, -0.21197509765625, -0.19057464599609375, -0.1691741943359375, -0.14777374267578125, -0.126373291015625, -0.10497283935546875, -0.0835723876953125, -0.06217193603515625, -0.040771484375, -0.01937103271484375, 0.0020294189453125, 0.02342987060546875, 0.044830322265625, 0.06623077392578125, 0.0876312255859375, 0.10903167724609375, 0.13043212890625, 0.15183258056640625, 0.1732330322265625, 0.19463348388671875, 0.216033935546875, 0.23743438720703125, 0.2588348388671875, 0.28023529052734375, 0.3016357421875, 0.32303619384765625, 0.3444366455078125, 0.36583709716796875, 0.387237548828125, 0.40863800048828125, 0.4300384521484375, 0.45143890380859375, 0.47283935546875, 0.49423980712890625, 0.5156402587890625, 0.5370407104492188, 0.558441162109375, 0.5798416137695312, 0.6012420654296875, 0.6226425170898438, 0.64404296875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 13.0, 24.0, 19.0, 42.0, 53.0, 93.0, 154.0, 314.0, 621.0, 1823.0, 7145.0, 67944.0, 3776463.0, 318583.0, 15938.0, 3066.0, 983.0, 409.0, 210.0, 125.0, 81.0, 51.0, 23.0, 24.0, 13.0, 18.0, 8.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7724609375, -1.7147369384765625, -1.657012939453125, -1.5992889404296875, -1.54156494140625, -1.4838409423828125, -1.426116943359375, -1.3683929443359375, -1.3106689453125, -1.2529449462890625, -1.195220947265625, -1.1374969482421875, -1.07977294921875, -1.0220489501953125, -0.964324951171875, -0.9066009521484375, -0.848876953125, -0.7911529541015625, -0.733428955078125, -0.6757049560546875, -0.61798095703125, -0.5602569580078125, -0.502532958984375, -0.4448089599609375, -0.3870849609375, -0.3293609619140625, -0.271636962890625, -0.2139129638671875, -0.15618896484375, -0.0984649658203125, -0.040740966796875, 0.0169830322265625, 0.07470703125, 0.1324310302734375, 0.190155029296875, 0.2478790283203125, 0.30560302734375, 0.3633270263671875, 0.421051025390625, 0.4787750244140625, 0.5364990234375, 0.5942230224609375, 0.651947021484375, 0.7096710205078125, 0.76739501953125, 0.8251190185546875, 0.882843017578125, 0.9405670166015625, 0.998291015625, 1.0560150146484375, 1.113739013671875, 1.1714630126953125, 1.22918701171875, 1.2869110107421875, 1.344635009765625, 1.4023590087890625, 1.4600830078125, 1.5178070068359375, 1.575531005859375, 1.6332550048828125, 1.69097900390625, 1.7487030029296875, 1.806427001953125, 1.8641510009765625, 1.921875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 10.0, 13.0, 9.0, 24.0, 30.0, 62.0, 67.0, 110.0, 162.0, 341.0, 606.0, 928.0, 728.0, 406.0, 221.0, 108.0, 73.0, 53.0, 42.0, 33.0, 11.0, 10.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.365966796875, -0.3544349670410156, -0.34290313720703125, -0.3313713073730469, -0.3198394775390625, -0.3083076477050781, -0.29677581787109375, -0.2852439880371094, -0.273712158203125, -0.2621803283691406, -0.25064849853515625, -0.23911666870117188, -0.2275848388671875, -0.21605300903320312, -0.20452117919921875, -0.19298934936523438, -0.18145751953125, -0.16992568969726562, -0.15839385986328125, -0.14686203002929688, -0.1353302001953125, -0.12379837036132812, -0.11226654052734375, -0.10073471069335938, -0.089202880859375, -0.07767105102539062, -0.06613922119140625, -0.054607391357421875, -0.0430755615234375, -0.031543731689453125, -0.02001190185546875, -0.008480072021484375, 0.0030517578125, 0.014583587646484375, 0.02611541748046875, 0.037647247314453125, 0.0491790771484375, 0.060710906982421875, 0.07224273681640625, 0.08377456665039062, 0.095306396484375, 0.10683822631835938, 0.11837005615234375, 0.12990188598632812, 0.1414337158203125, 0.15296554565429688, 0.16449737548828125, 0.17602920532226562, 0.18756103515625, 0.19909286499023438, 0.21062469482421875, 0.22215652465820312, 0.2336883544921875, 0.24522018432617188, 0.25675201416015625, 0.2682838439941406, 0.279815673828125, 0.2913475036621094, 0.30287933349609375, 0.3144111633300781, 0.3259429931640625, 0.3374748229980469, 0.34900665283203125, 0.3605384826660156, 0.3720703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 16.0, 6.0, 11.0, 19.0, 22.0, 38.0, 54.0, 51.0, 88.0, 90.0, 98.0, 103.0, 94.0, 83.0, 62.0, 40.0, 29.0, 27.0, 16.0, 10.0, 12.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0885906219482422, -1.0536774396896362, -1.0187643766403198, -0.9838512539863586, -0.9489381313323975, -0.9140249490737915, -0.8791118264198303, -0.8441987037658691, -0.809285581111908, -0.7743724584579468, -0.7394593358039856, -0.7045462131500244, -0.6696330308914185, -0.634719967842102, -0.5998067855834961, -0.5648936629295349, -0.5299805402755737, -0.49506741762161255, -0.46015429496765137, -0.4252411425113678, -0.3903280198574066, -0.35541489720344543, -0.32050174474716187, -0.2855886220932007, -0.2506754994392395, -0.21576237678527832, -0.18084923923015594, -0.14593610167503357, -0.11102297902107239, -0.0761098563671112, -0.04119671881198883, -0.006283581256866455, 0.028629422187805176, 0.06354255229234695, 0.09845568239688873, 0.1333688199520111, 0.1682819426059723, 0.20319506525993347, 0.23810820281505585, 0.2730213403701782, 0.3079344630241394, 0.3428475856781006, 0.37776070833206177, 0.41267386078834534, 0.4475869834423065, 0.4825001060962677, 0.5174132585525513, 0.5523263812065125, 0.5872395038604736, 0.6221526265144348, 0.657065749168396, 0.6919788718223572, 0.7268919944763184, 0.7618051767349243, 0.7967182993888855, 0.8316314220428467, 0.8665445446968079, 0.901457667350769, 0.9363707900047302, 0.9712839126586914, 1.0061970949172974, 1.0411101579666138, 1.0760233402252197, 1.1109364032745361, 1.145849585533142]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 6.0, 15.0, 10.0, 15.0, 28.0, 27.0, 28.0, 27.0, 35.0, 30.0, 36.0, 38.0, 59.0, 43.0, 48.0, 52.0, 38.0, 54.0, 35.0, 39.0, 27.0, 38.0, 38.0, 40.0, 27.0, 23.0, 30.0, 22.0, 17.0, 18.0, 15.0, 10.0, 6.0, 6.0, 1.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7659687399864197, -0.7443788647651672, -0.7227890491485596, -0.7011991739273071, -0.6796092987060547, -0.658019483089447, -0.6364296078681946, -0.6148397922515869, -0.5932499170303345, -0.571660041809082, -0.5500702261924744, -0.5284803509712219, -0.5068905353546143, -0.4853006601333618, -0.4637107849121094, -0.4421209394931793, -0.42053109407424927, -0.3989412486553192, -0.37735140323638916, -0.3557615280151367, -0.33417168259620667, -0.3125818371772766, -0.29099196195602417, -0.2694021165370941, -0.24781227111816406, -0.226222425699234, -0.20463256537914276, -0.1830427050590515, -0.16145285964012146, -0.1398630142211914, -0.11827315390110016, -0.09668329358100891, -0.07509344816207886, -0.05350359529256821, -0.031913742423057556, -0.010323889553546906, 0.011265963315963745, 0.032855816185474396, 0.054445669054985046, 0.0760355293750763, 0.09762537479400635, 0.119215227663517, 0.14080508053302765, 0.1623949408531189, 0.18398478627204895, 0.205574631690979, 0.22716449201107025, 0.2487543523311615, 0.27034419775009155, 0.2919340431690216, 0.31352388858795166, 0.3351137638092041, 0.35670360922813416, 0.3782934546470642, 0.39988332986831665, 0.4214731752872467, 0.44306302070617676, 0.4646528661251068, 0.48624271154403687, 0.5078325867652893, 0.529422402381897, 0.5510122776031494, 0.5726021528244019, 0.5941920280456543, 0.615781843662262]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 6.0, 16.0, 10.0, 22.0, 54.0, 157.0, 443.0, 1488.0, 6563.0, 41094.0, 913093.0, 73622.0, 8950.0, 2127.0, 547.0, 190.0, 65.0, 30.0, 18.0, 10.0, 9.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0400390625, -1.0036773681640625, -0.967315673828125, -0.9309539794921875, -0.89459228515625, -0.8582305908203125, -0.821868896484375, -0.7855072021484375, -0.7491455078125, -0.7127838134765625, -0.676422119140625, -0.6400604248046875, -0.60369873046875, -0.5673370361328125, -0.530975341796875, -0.4946136474609375, -0.458251953125, -0.4218902587890625, -0.385528564453125, -0.3491668701171875, -0.31280517578125, -0.2764434814453125, -0.240081787109375, -0.2037200927734375, -0.1673583984375, -0.1309967041015625, -0.094635009765625, -0.0582733154296875, -0.02191162109375, 0.0144500732421875, 0.050811767578125, 0.0871734619140625, 0.12353515625, 0.1598968505859375, 0.196258544921875, 0.2326202392578125, 0.26898193359375, 0.3053436279296875, 0.341705322265625, 0.3780670166015625, 0.4144287109375, 0.4507904052734375, 0.487152099609375, 0.5235137939453125, 0.55987548828125, 0.5962371826171875, 0.632598876953125, 0.6689605712890625, 0.705322265625, 0.7416839599609375, 0.778045654296875, 0.8144073486328125, 0.85076904296875, 0.8871307373046875, 0.923492431640625, 0.9598541259765625, 0.9962158203125, 1.0325775146484375, 1.068939208984375, 1.1053009033203125, 1.14166259765625, 1.1780242919921875, 1.214385986328125, 1.2507476806640625, 1.287109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 0.0, 4.0, 7.0, 13.0, 9.0, 19.0, 21.0, 28.0, 27.0, 37.0, 35.0, 33.0, 50.0, 53.0, 50.0, 46.0, 60.0, 58.0, 40.0, 48.0, 50.0, 31.0, 43.0, 33.0, 38.0, 40.0, 30.0, 21.0, 19.0, 18.0, 11.0, 6.0, 10.0, 1.0, 8.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.43017578125, -0.416015625, -0.40185546875, -0.3876953125, -0.37353515625, -0.359375, -0.34521484375, -0.3310546875, -0.31689453125, -0.302734375, -0.28857421875, -0.2744140625, -0.26025390625, -0.24609375, -0.23193359375, -0.2177734375, -0.20361328125, -0.189453125, -0.17529296875, -0.1611328125, -0.14697265625, -0.1328125, -0.11865234375, -0.1044921875, -0.09033203125, -0.076171875, -0.06201171875, -0.0478515625, -0.03369140625, -0.01953125, -0.00537109375, 0.0087890625, 0.02294921875, 0.037109375, 0.05126953125, 0.0654296875, 0.07958984375, 0.09375, 0.10791015625, 0.1220703125, 0.13623046875, 0.150390625, 0.16455078125, 0.1787109375, 0.19287109375, 0.20703125, 0.22119140625, 0.2353515625, 0.24951171875, 0.263671875, 0.27783203125, 0.2919921875, 0.30615234375, 0.3203125, 0.33447265625, 0.3486328125, 0.36279296875, 0.376953125, 0.39111328125, 0.4052734375, 0.41943359375, 0.43359375, 0.44775390625, 0.4619140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 4.0, 9.0, 12.0, 8.0, 13.0, 30.0, 27.0, 30.0, 81.0, 92.0, 156.0, 272.0, 442.0, 781.0, 1700.0, 3462.0, 7781.0, 20238.0, 64562.0, 326300.0, 480156.0, 96797.0, 27034.0, 9943.0, 4311.0, 1908.0, 964.0, 537.0, 330.0, 207.0, 114.0, 73.0, 51.0, 29.0, 24.0, 19.0, 12.0, 14.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.27685546875, -0.26850128173828125, -0.2601470947265625, -0.25179290771484375, -0.243438720703125, -0.23508453369140625, -0.2267303466796875, -0.21837615966796875, -0.21002197265625, -0.20166778564453125, -0.1933135986328125, -0.18495941162109375, -0.176605224609375, -0.16825103759765625, -0.1598968505859375, -0.15154266357421875, -0.1431884765625, -0.13483428955078125, -0.1264801025390625, -0.11812591552734375, -0.109771728515625, -0.10141754150390625, -0.0930633544921875, -0.08470916748046875, -0.07635498046875, -0.06800079345703125, -0.0596466064453125, -0.05129241943359375, -0.042938232421875, -0.03458404541015625, -0.0262298583984375, -0.01787567138671875, -0.009521484375, -0.00116729736328125, 0.0071868896484375, 0.01554107666015625, 0.023895263671875, 0.03224945068359375, 0.0406036376953125, 0.04895782470703125, 0.05731201171875, 0.06566619873046875, 0.0740203857421875, 0.08237457275390625, 0.090728759765625, 0.09908294677734375, 0.1074371337890625, 0.11579132080078125, 0.1241455078125, 0.13249969482421875, 0.1408538818359375, 0.14920806884765625, 0.157562255859375, 0.16591644287109375, 0.1742706298828125, 0.18262481689453125, 0.19097900390625, 0.19933319091796875, 0.2076873779296875, 0.21604156494140625, 0.224395751953125, 0.23274993896484375, 0.2411041259765625, 0.24945831298828125, 0.2578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 14.0, 10.0, 5.0, 17.0, 16.0, 19.0, 22.0, 24.0, 31.0, 40.0, 27.0, 34.0, 53.0, 48.0, 56.0, 53.0, 36.0, 50.0, 59.0, 42.0, 47.0, 37.0, 20.0, 37.0, 33.0, 35.0, 19.0, 14.0, 17.0, 13.0, 9.0, 11.0, 12.0, 10.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.751953125, -0.7288284301757812, -0.7057037353515625, -0.6825790405273438, -0.659454345703125, -0.6363296508789062, -0.6132049560546875, -0.5900802612304688, -0.56695556640625, -0.5438308715820312, -0.5207061767578125, -0.49758148193359375, -0.474456787109375, -0.45133209228515625, -0.4282073974609375, -0.40508270263671875, -0.3819580078125, -0.35883331298828125, -0.3357086181640625, -0.31258392333984375, -0.289459228515625, -0.26633453369140625, -0.2432098388671875, -0.22008514404296875, -0.19696044921875, -0.17383575439453125, -0.1507110595703125, -0.12758636474609375, -0.104461669921875, -0.08133697509765625, -0.0582122802734375, -0.03508758544921875, -0.011962890625, 0.01116180419921875, 0.0342864990234375, 0.05741119384765625, 0.080535888671875, 0.10366058349609375, 0.1267852783203125, 0.14990997314453125, 0.17303466796875, 0.19615936279296875, 0.2192840576171875, 0.24240875244140625, 0.265533447265625, 0.28865814208984375, 0.3117828369140625, 0.33490753173828125, 0.3580322265625, 0.38115692138671875, 0.4042816162109375, 0.42740631103515625, 0.450531005859375, 0.47365570068359375, 0.4967803955078125, 0.5199050903320312, 0.54302978515625, 0.5661544799804688, 0.5892791748046875, 0.6124038696289062, 0.635528564453125, 0.6586532592773438, 0.6817779541015625, 0.7049026489257812, 0.72802734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 13.0, 13.0, 17.0, 31.0, 26.0, 47.0, 86.0, 117.0, 160.0, 259.0, 419.0, 760.0, 1310.0, 2483.0, 5140.0, 11455.0, 28832.0, 90782.0, 350394.0, 394164.0, 105082.0, 32630.0, 12510.0, 5591.0, 2693.0, 1437.0, 806.0, 447.0, 268.0, 183.0, 109.0, 74.0, 55.0, 47.0, 33.0, 23.0, 10.0, 18.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.0718994140625, -0.06995916366577148, -0.06801891326904297, -0.06607866287231445, -0.06413841247558594, -0.06219816207885742, -0.060257911682128906, -0.05831766128540039, -0.056377410888671875, -0.05443716049194336, -0.052496910095214844, -0.05055665969848633, -0.04861640930175781, -0.0466761589050293, -0.04473590850830078, -0.042795658111572266, -0.04085540771484375, -0.038915157318115234, -0.03697490692138672, -0.0350346565246582, -0.03309440612792969, -0.031154155731201172, -0.029213905334472656, -0.02727365493774414, -0.025333404541015625, -0.02339315414428711, -0.021452903747558594, -0.019512653350830078, -0.017572402954101562, -0.015632152557373047, -0.013691902160644531, -0.011751651763916016, -0.0098114013671875, -0.007871150970458984, -0.005930900573730469, -0.003990650177001953, -0.0020503997802734375, -0.00011014938354492188, 0.0018301010131835938, 0.0037703514099121094, 0.005710601806640625, 0.007650852203369141, 0.009591102600097656, 0.011531352996826172, 0.013471603393554688, 0.015411853790283203, 0.01735210418701172, 0.019292354583740234, 0.02123260498046875, 0.023172855377197266, 0.02511310577392578, 0.027053356170654297, 0.028993606567382812, 0.030933856964111328, 0.032874107360839844, 0.03481435775756836, 0.036754608154296875, 0.03869485855102539, 0.040635108947753906, 0.04257535934448242, 0.04451560974121094, 0.04645586013793945, 0.04839611053466797, 0.050336360931396484, 0.052276611328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 19.0, 17.0, 17.0, 26.0, 34.0, 58.0, 78.0, 111.0, 119.0, 137.0, 106.0, 62.0, 58.0, 38.0, 20.0, 20.0, 12.0, 15.0, 8.0, 2.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.947185516357422e-05, -4.8005953431129456e-05, -4.654005169868469e-05, -4.507414996623993e-05, -4.3608248233795166e-05, -4.21423465013504e-05, -4.067644476890564e-05, -3.9210543036460876e-05, -3.774464130401611e-05, -3.627873957157135e-05, -3.481283783912659e-05, -3.3346936106681824e-05, -3.188103437423706e-05, -3.0415132641792297e-05, -2.8949230909347534e-05, -2.748332917690277e-05, -2.6017427444458008e-05, -2.4551525712013245e-05, -2.308562397956848e-05, -2.1619722247123718e-05, -2.0153820514678955e-05, -1.8687918782234192e-05, -1.722201704978943e-05, -1.5756115317344666e-05, -1.4290213584899902e-05, -1.282431185245514e-05, -1.1358410120010376e-05, -9.892508387565613e-06, -8.42660665512085e-06, -6.9607049226760864e-06, -5.494803190231323e-06, -4.02890145778656e-06, -2.562999725341797e-06, -1.0970979928970337e-06, 3.688037395477295e-07, 1.8347054719924927e-06, 3.300607204437256e-06, 4.766508936882019e-06, 6.232410669326782e-06, 7.698312401771545e-06, 9.164214134216309e-06, 1.0630115866661072e-05, 1.2096017599105835e-05, 1.3561919331550598e-05, 1.5027821063995361e-05, 1.6493722796440125e-05, 1.7959624528884888e-05, 1.942552626132965e-05, 2.0891427993774414e-05, 2.2357329726219177e-05, 2.382323145866394e-05, 2.5289133191108704e-05, 2.6755034923553467e-05, 2.822093665599823e-05, 2.9686838388442993e-05, 3.1152740120887756e-05, 3.261864185333252e-05, 3.408454358577728e-05, 3.5550445318222046e-05, 3.701634705066681e-05, 3.848224878311157e-05, 3.9948150515556335e-05, 4.14140522480011e-05, 4.287995398044586e-05, 4.4345855712890625e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 11.0, 15.0, 26.0, 37.0, 60.0, 88.0, 187.0, 394.0, 917.0, 2603.0, 8255.0, 31142.0, 186969.0, 645784.0, 136418.0, 24959.0, 6859.0, 2266.0, 809.0, 331.0, 177.0, 86.0, 53.0, 26.0, 29.0, 12.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11590576171875, -0.11263370513916016, -0.10936164855957031, -0.10608959197998047, -0.10281753540039062, -0.09954547882080078, -0.09627342224121094, -0.0930013656616211, -0.08972930908203125, -0.0864572525024414, -0.08318519592285156, -0.07991313934326172, -0.07664108276367188, -0.07336902618408203, -0.07009696960449219, -0.06682491302490234, -0.0635528564453125, -0.060280799865722656, -0.05700874328613281, -0.05373668670654297, -0.050464630126953125, -0.04719257354736328, -0.04392051696777344, -0.040648460388183594, -0.03737640380859375, -0.034104347229003906, -0.030832290649414062, -0.02756023406982422, -0.024288177490234375, -0.02101612091064453, -0.017744064331054688, -0.014472007751464844, -0.011199951171875, -0.007927894592285156, -0.0046558380126953125, -0.0013837814331054688, 0.001888275146484375, 0.005160331726074219, 0.008432388305664062, 0.011704444885253906, 0.01497650146484375, 0.018248558044433594, 0.021520614624023438, 0.02479267120361328, 0.028064727783203125, 0.03133678436279297, 0.03460884094238281, 0.037880897521972656, 0.0411529541015625, 0.044425010681152344, 0.04769706726074219, 0.05096912384033203, 0.054241180419921875, 0.05751323699951172, 0.06078529357910156, 0.0640573501586914, 0.06732940673828125, 0.0706014633178711, 0.07387351989746094, 0.07714557647705078, 0.08041763305664062, 0.08368968963623047, 0.08696174621582031, 0.09023380279541016, 0.093505859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 6.0, 15.0, 10.0, 19.0, 31.0, 34.0, 37.0, 52.0, 85.0, 84.0, 91.0, 96.0, 66.0, 64.0, 55.0, 55.0, 35.0, 30.0, 21.0, 25.0, 11.0, 10.0, 5.0, 5.0, 8.0, 2.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0198211669921875, -0.01920175552368164, -0.01858234405517578, -0.017962932586669922, -0.017343521118164062, -0.016724109649658203, -0.016104698181152344, -0.015485286712646484, -0.014865875244140625, -0.014246463775634766, -0.013627052307128906, -0.013007640838623047, -0.012388229370117188, -0.011768817901611328, -0.011149406433105469, -0.01052999496459961, -0.00991058349609375, -0.00929117202758789, -0.008671760559082031, -0.008052349090576172, -0.0074329376220703125, -0.006813526153564453, -0.006194114685058594, -0.005574703216552734, -0.004955291748046875, -0.004335880279541016, -0.0037164688110351562, -0.003097057342529297, -0.0024776458740234375, -0.0018582344055175781, -0.0012388229370117188, -0.0006194114685058594, 0.0, 0.0006194114685058594, 0.0012388229370117188, 0.0018582344055175781, 0.0024776458740234375, 0.003097057342529297, 0.0037164688110351562, 0.004335880279541016, 0.004955291748046875, 0.005574703216552734, 0.006194114685058594, 0.006813526153564453, 0.0074329376220703125, 0.008052349090576172, 0.008671760559082031, 0.00929117202758789, 0.00991058349609375, 0.01052999496459961, 0.011149406433105469, 0.011768817901611328, 0.012388229370117188, 0.013007640838623047, 0.013627052307128906, 0.014246463775634766, 0.014865875244140625, 0.015485286712646484, 0.016104698181152344, 0.016724109649658203, 0.017343521118164062, 0.017962932586669922, 0.01858234405517578, 0.01920175552368164, 0.0198211669921875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 10.0, 16.0, 29.0, 54.0, 81.0, 133.0, 146.0, 150.0, 129.0, 91.0, 50.0, 37.0, 26.0, 10.0, 8.0, 6.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9141902327537537, -0.8857532143592834, -0.8573161363601685, -0.8288791179656982, -0.8004420399665833, -0.772005021572113, -0.743567943572998, -0.7151309251785278, -0.6866939067840576, -0.6582568883895874, -0.6298198103904724, -0.6013827919960022, -0.5729457139968872, -0.544508695602417, -0.5160716772079468, -0.4876345992088318, -0.4591975510120392, -0.4307605028152466, -0.402323454618454, -0.3738864064216614, -0.34544938802719116, -0.31701233983039856, -0.28857529163360596, -0.26013827323913574, -0.23170121014118195, -0.20326416194438934, -0.17482712864875793, -0.14639008045196533, -0.11795303970575333, -0.08951599895954132, -0.06107895076274872, -0.03264191746711731, -0.004204869270324707, 0.024232173338532448, 0.0526692159473896, 0.0811062604188919, 0.10954330116510391, 0.13798034191131592, 0.16641739010810852, 0.19485442340373993, 0.22329147160053253, 0.25172850489616394, 0.28016555309295654, 0.30860260128974915, 0.33703964948654175, 0.36547666788101196, 0.39391374588012695, 0.42235076427459717, 0.45078781247138977, 0.4792248606681824, 0.5076618790626526, 0.5360989570617676, 0.5645359754562378, 0.592972993850708, 0.621410071849823, 0.6498470902442932, 0.6782841682434082, 0.7067211866378784, 0.7351582646369934, 0.7635952830314636, 0.7920323610305786, 0.8204693794250488, 0.848906397819519, 0.877343475818634, 0.9057804942131042]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 13.0, 15.0, 20.0, 21.0, 27.0, 26.0, 31.0, 40.0, 38.0, 63.0, 47.0, 55.0, 50.0, 43.0, 56.0, 47.0, 54.0, 42.0, 34.0, 45.0, 33.0, 35.0, 39.0, 29.0, 21.0, 17.0, 23.0, 7.0, 11.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44590750336647034, -0.43207022547721863, -0.4182329773902893, -0.4043956995010376, -0.3905584216117859, -0.3767211437225342, -0.36288389563560486, -0.34904661774635315, -0.33520936965942383, -0.3213720917701721, -0.3075348436832428, -0.2936975657939911, -0.2798602879047394, -0.26602303981781006, -0.25218576192855835, -0.23834848403930664, -0.22451120615005493, -0.21067394316196442, -0.1968366652727127, -0.1829994022846222, -0.16916212439537048, -0.15532486140727997, -0.14148759841918945, -0.12765032052993774, -0.11381305754184723, -0.09997578710317612, -0.086138516664505, -0.07230125367641449, -0.05846398323774338, -0.044626712799072266, -0.03078944981098175, -0.01695217937231064, -0.0031149089336395264, 0.010722359642386436, 0.0245596282184124, 0.03839689493179321, 0.052234165370464325, 0.06607143580913544, 0.07990869879722595, 0.09374596923589706, 0.10758323967456818, 0.12142051011323929, 0.1352577805519104, 0.14909504354000092, 0.16293230652809143, 0.17676958441734314, 0.19060684740543365, 0.20444411039352417, 0.21828138828277588, 0.2321186512708664, 0.2459559291601181, 0.2597931921482086, 0.2736304700374603, 0.28746771812438965, 0.30130499601364136, 0.31514227390289307, 0.3289795517921448, 0.3428168296813965, 0.3566540777683258, 0.3704913556575775, 0.3843286335468292, 0.39816588163375854, 0.41200315952301025, 0.42584043741226196, 0.4396776854991913]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 9.0, 13.0, 23.0, 52.0, 98.0, 241.0, 672.0, 2120.0, 8249.0, 49237.0, 788739.0, 176971.0, 16429.0, 3923.0, 1173.0, 347.0, 141.0, 55.0, 24.0, 15.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6357421875, -1.5912017822265625, -1.546661376953125, -1.5021209716796875, -1.45758056640625, -1.4130401611328125, -1.368499755859375, -1.3239593505859375, -1.2794189453125, -1.2348785400390625, -1.190338134765625, -1.1457977294921875, -1.10125732421875, -1.0567169189453125, -1.012176513671875, -0.9676361083984375, -0.923095703125, -0.8785552978515625, -0.834014892578125, -0.7894744873046875, -0.74493408203125, -0.7003936767578125, -0.655853271484375, -0.6113128662109375, -0.5667724609375, -0.5222320556640625, -0.477691650390625, -0.4331512451171875, -0.38861083984375, -0.3440704345703125, -0.299530029296875, -0.2549896240234375, -0.21044921875, -0.1659088134765625, -0.121368408203125, -0.0768280029296875, -0.03228759765625, 0.0122528076171875, 0.056793212890625, 0.1013336181640625, 0.1458740234375, 0.1904144287109375, 0.234954833984375, 0.2794952392578125, 0.32403564453125, 0.3685760498046875, 0.413116455078125, 0.4576568603515625, 0.502197265625, 0.5467376708984375, 0.591278076171875, 0.6358184814453125, 0.68035888671875, 0.7248992919921875, 0.769439697265625, 0.8139801025390625, 0.8585205078125, 0.9030609130859375, 0.947601318359375, 0.9921417236328125, 1.03668212890625, 1.0812225341796875, 1.125762939453125, 1.1703033447265625, 1.21484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 8.0, 18.0, 15.0, 30.0, 26.0, 38.0, 50.0, 60.0, 66.0, 66.0, 70.0, 72.0, 55.0, 65.0, 56.0, 50.0, 51.0, 45.0, 41.0, 34.0, 18.0, 25.0, 12.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.830780029296875, -0.79730224609375, -0.763824462890625, -0.7303466796875, -0.696868896484375, -0.66339111328125, -0.629913330078125, -0.596435546875, -0.562957763671875, -0.52947998046875, -0.496002197265625, -0.4625244140625, -0.429046630859375, -0.39556884765625, -0.362091064453125, -0.32861328125, -0.295135498046875, -0.26165771484375, -0.228179931640625, -0.1947021484375, -0.161224365234375, -0.12774658203125, -0.094268798828125, -0.060791015625, -0.027313232421875, 0.00616455078125, 0.039642333984375, 0.0731201171875, 0.106597900390625, 0.14007568359375, 0.173553466796875, 0.20703125, 0.240509033203125, 0.27398681640625, 0.307464599609375, 0.3409423828125, 0.374420166015625, 0.40789794921875, 0.441375732421875, 0.474853515625, 0.508331298828125, 0.54180908203125, 0.575286865234375, 0.6087646484375, 0.642242431640625, 0.67572021484375, 0.709197998046875, 0.74267578125, 0.776153564453125, 0.80963134765625, 0.843109130859375, 0.8765869140625, 0.910064697265625, 0.94354248046875, 0.977020263671875, 1.010498046875, 1.043975830078125, 1.07745361328125, 1.110931396484375, 1.1444091796875, 1.177886962890625, 1.21136474609375, 1.244842529296875, 1.2783203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 7.0, 9.0, 15.0, 15.0, 15.0, 10.0, 24.0, 21.0, 23.0, 28.0, 34.0, 42.0, 79.0, 119.0, 206.0, 538.0, 3332.0, 60119.0, 957847.0, 23132.0, 1923.0, 406.0, 145.0, 88.0, 71.0, 40.0, 41.0, 23.0, 22.0, 23.0, 20.0, 18.0, 13.0, 13.0, 18.0, 10.0, 11.0, 7.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-2.16796875, -2.102996826171875, -2.03802490234375, -1.973052978515625, -1.9080810546875, -1.843109130859375, -1.77813720703125, -1.713165283203125, -1.648193359375, -1.583221435546875, -1.51824951171875, -1.453277587890625, -1.3883056640625, -1.323333740234375, -1.25836181640625, -1.193389892578125, -1.12841796875, -1.063446044921875, -0.99847412109375, -0.933502197265625, -0.8685302734375, -0.803558349609375, -0.73858642578125, -0.673614501953125, -0.608642578125, -0.543670654296875, -0.47869873046875, -0.413726806640625, -0.3487548828125, -0.283782958984375, -0.21881103515625, -0.153839111328125, -0.0888671875, -0.023895263671875, 0.04107666015625, 0.106048583984375, 0.1710205078125, 0.235992431640625, 0.30096435546875, 0.365936279296875, 0.430908203125, 0.495880126953125, 0.56085205078125, 0.625823974609375, 0.6907958984375, 0.755767822265625, 0.82073974609375, 0.885711669921875, 0.95068359375, 1.015655517578125, 1.08062744140625, 1.145599365234375, 1.2105712890625, 1.275543212890625, 1.34051513671875, 1.405487060546875, 1.470458984375, 1.535430908203125, 1.60040283203125, 1.665374755859375, 1.7303466796875, 1.795318603515625, 1.86029052734375, 1.925262451171875, 1.990234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 11.0, 11.0, 14.0, 12.0, 16.0, 7.0, 21.0, 18.0, 11.0, 27.0, 27.0, 26.0, 30.0, 46.0, 28.0, 42.0, 46.0, 43.0, 39.0, 42.0, 40.0, 33.0, 35.0, 36.0, 38.0, 30.0, 34.0, 26.0, 27.0, 19.0, 23.0, 13.0, 16.0, 14.0, 20.0, 16.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0], "bins": [-0.66943359375, -0.64971923828125, -0.6300048828125, -0.61029052734375, -0.590576171875, -0.57086181640625, -0.5511474609375, -0.53143310546875, -0.51171875, -0.49200439453125, -0.4722900390625, -0.45257568359375, -0.432861328125, -0.41314697265625, -0.3934326171875, -0.37371826171875, -0.35400390625, -0.33428955078125, -0.3145751953125, -0.29486083984375, -0.275146484375, -0.25543212890625, -0.2357177734375, -0.21600341796875, -0.1962890625, -0.17657470703125, -0.1568603515625, -0.13714599609375, -0.117431640625, -0.09771728515625, -0.0780029296875, -0.05828857421875, -0.03857421875, -0.01885986328125, 0.0008544921875, 0.02056884765625, 0.040283203125, 0.05999755859375, 0.0797119140625, 0.09942626953125, 0.119140625, 0.13885498046875, 0.1585693359375, 0.17828369140625, 0.197998046875, 0.21771240234375, 0.2374267578125, 0.25714111328125, 0.27685546875, 0.29656982421875, 0.3162841796875, 0.33599853515625, 0.355712890625, 0.37542724609375, 0.3951416015625, 0.41485595703125, 0.4345703125, 0.45428466796875, 0.4739990234375, 0.49371337890625, 0.513427734375, 0.53314208984375, 0.5528564453125, 0.57257080078125, 0.59228515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 7.0, 16.0, 14.0, 18.0, 34.0, 56.0, 95.0, 164.0, 347.0, 726.0, 1715.0, 5344.0, 69250.0, 947123.0, 18000.0, 3370.0, 1196.0, 498.0, 256.0, 115.0, 79.0, 39.0, 26.0, 6.0, 10.0, 12.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63671875, -0.6170120239257812, -0.5973052978515625, -0.5775985717773438, -0.557891845703125, -0.5381851196289062, -0.5184783935546875, -0.49877166748046875, -0.47906494140625, -0.45935821533203125, -0.4396514892578125, -0.41994476318359375, -0.400238037109375, -0.38053131103515625, -0.3608245849609375, -0.34111785888671875, -0.3214111328125, -0.30170440673828125, -0.2819976806640625, -0.26229095458984375, -0.242584228515625, -0.22287750244140625, -0.2031707763671875, -0.18346405029296875, -0.16375732421875, -0.14405059814453125, -0.1243438720703125, -0.10463714599609375, -0.084930419921875, -0.06522369384765625, -0.0455169677734375, -0.02581024169921875, -0.006103515625, 0.01360321044921875, 0.0333099365234375, 0.05301666259765625, 0.072723388671875, 0.09243011474609375, 0.1121368408203125, 0.13184356689453125, 0.15155029296875, 0.17125701904296875, 0.1909637451171875, 0.21067047119140625, 0.230377197265625, 0.25008392333984375, 0.2697906494140625, 0.28949737548828125, 0.3092041015625, 0.32891082763671875, 0.3486175537109375, 0.36832427978515625, 0.388031005859375, 0.40773773193359375, 0.4274444580078125, 0.44715118408203125, 0.46685791015625, 0.48656463623046875, 0.5062713623046875, 0.5259780883789062, 0.545684814453125, 0.5653915405273438, 0.5850982666015625, 0.6048049926757812, 0.62451171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 30.0, 40.0, 101.0, 259.0, 270.0, 137.0, 71.0, 35.0, 22.0, 11.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.0094909965991974e-05, -4.7618523240089417e-05, -4.514213651418686e-05, -4.26657497882843e-05, -4.0189363062381744e-05, -3.771297633647919e-05, -3.523658961057663e-05, -3.276020288467407e-05, -3.0283816158771515e-05, -2.7807429432868958e-05, -2.53310427069664e-05, -2.2854655981063843e-05, -2.0378269255161285e-05, -1.7901882529258728e-05, -1.542549580335617e-05, -1.2949109077453613e-05, -1.0472722351551056e-05, -7.996335625648499e-06, -5.519948899745941e-06, -3.043562173843384e-06, -5.671754479408264e-07, 1.909211277961731e-06, 4.385598003864288e-06, 6.861984729766846e-06, 9.338371455669403e-06, 1.181475818157196e-05, 1.4291144907474518e-05, 1.6767531633377075e-05, 1.9243918359279633e-05, 2.172030508518219e-05, 2.4196691811084747e-05, 2.6673078536987305e-05, 2.9149465262889862e-05, 3.162585198879242e-05, 3.410223871469498e-05, 3.6578625440597534e-05, 3.905501216650009e-05, 4.153139889240265e-05, 4.4007785618305206e-05, 4.6484172344207764e-05, 4.896055907011032e-05, 5.143694579601288e-05, 5.3913332521915436e-05, 5.638971924781799e-05, 5.886610597372055e-05, 6.134249269962311e-05, 6.381887942552567e-05, 6.629526615142822e-05, 6.877165287733078e-05, 7.124803960323334e-05, 7.37244263291359e-05, 7.620081305503845e-05, 7.867719978094101e-05, 8.115358650684357e-05, 8.362997323274612e-05, 8.610635995864868e-05, 8.858274668455124e-05, 9.10591334104538e-05, 9.353552013635635e-05, 9.601190686225891e-05, 9.848829358816147e-05, 0.00010096468031406403, 0.00010344106703996658, 0.00010591745376586914]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 3.0, 3.0, 9.0, 7.0, 18.0, 12.0, 37.0, 45.0, 60.0, 98.0, 170.0, 275.0, 510.0, 987.0, 2306.0, 6871.0, 82382.0, 923319.0, 23758.0, 4276.0, 1643.0, 709.0, 413.0, 245.0, 121.0, 80.0, 53.0, 38.0, 30.0, 18.0, 17.0, 7.0, 8.0, 4.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4921875, -0.47540283203125, -0.4586181640625, -0.44183349609375, -0.425048828125, -0.40826416015625, -0.3914794921875, -0.37469482421875, -0.35791015625, -0.34112548828125, -0.3243408203125, -0.30755615234375, -0.290771484375, -0.27398681640625, -0.2572021484375, -0.24041748046875, -0.2236328125, -0.20684814453125, -0.1900634765625, -0.17327880859375, -0.156494140625, -0.13970947265625, -0.1229248046875, -0.10614013671875, -0.08935546875, -0.07257080078125, -0.0557861328125, -0.03900146484375, -0.022216796875, -0.00543212890625, 0.0113525390625, 0.02813720703125, 0.044921875, 0.06170654296875, 0.0784912109375, 0.09527587890625, 0.112060546875, 0.12884521484375, 0.1456298828125, 0.16241455078125, 0.17919921875, 0.19598388671875, 0.2127685546875, 0.22955322265625, 0.246337890625, 0.26312255859375, 0.2799072265625, 0.29669189453125, 0.3134765625, 0.33026123046875, 0.3470458984375, 0.36383056640625, 0.380615234375, 0.39739990234375, 0.4141845703125, 0.43096923828125, 0.44775390625, 0.46453857421875, 0.4813232421875, 0.49810791015625, 0.514892578125, 0.53167724609375, 0.5484619140625, 0.56524658203125, 0.58203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 5.0, 11.0, 21.0, 33.0, 94.0, 146.0, 276.0, 202.0, 97.0, 50.0, 21.0, 10.0, 5.0, 7.0, 1.0, 5.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.25044822692871094, -0.24381637573242188, -0.2371845245361328, -0.23055267333984375, -0.2239208221435547, -0.21728897094726562, -0.21065711975097656, -0.2040252685546875, -0.19739341735839844, -0.19076156616210938, -0.1841297149658203, -0.17749786376953125, -0.1708660125732422, -0.16423416137695312, -0.15760231018066406, -0.150970458984375, -0.14433860778808594, -0.13770675659179688, -0.1310749053955078, -0.12444305419921875, -0.11781120300292969, -0.11117935180664062, -0.10454750061035156, -0.0979156494140625, -0.09128379821777344, -0.08465194702148438, -0.07802009582519531, -0.07138824462890625, -0.06475639343261719, -0.058124542236328125, -0.05149269104003906, -0.04486083984375, -0.03822898864746094, -0.031597137451171875, -0.024965286254882812, -0.01833343505859375, -0.011701583862304688, -0.005069732666015625, 0.0015621185302734375, 0.0081939697265625, 0.014825820922851562, 0.021457672119140625, 0.028089523315429688, 0.03472137451171875, 0.04135322570800781, 0.047985076904296875, 0.05461692810058594, 0.061248779296875, 0.06788063049316406, 0.07451248168945312, 0.08114433288574219, 0.08777618408203125, 0.09440803527832031, 0.10103988647460938, 0.10767173767089844, 0.1143035888671875, 0.12093544006347656, 0.12756729125976562, 0.1341991424560547, 0.14083099365234375, 0.1474628448486328, 0.15409469604492188, 0.16072654724121094, 0.1673583984375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 13.0, 24.0, 44.0, 70.0, 165.0, 202.0, 219.0, 128.0, 67.0, 40.0, 17.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6507422924041748, -1.5635559558868408, -1.4763696193695068, -1.3891834020614624, -1.3019970655441284, -1.2148107290267944, -1.12762451171875, -1.040438175201416, -0.953251838684082, -0.866065502166748, -0.7788792252540588, -0.6916929483413696, -0.6045066118240356, -0.5173202753067017, -0.43013399839401245, -0.34294772148132324, -0.25576138496398926, -0.16857507824897766, -0.08138877153396606, 0.005797535181045532, 0.09298384189605713, 0.18017014861106873, 0.2673564553260803, 0.35454273223876953, 0.4417290687561035, 0.5289154052734375, 0.6161016821861267, 0.7032879590988159, 0.7904742956161499, 0.8776606321334839, 0.9648469090461731, 1.0520331859588623, 1.1392195224761963, 1.2264058589935303, 1.3135921955108643, 1.4007784128189087, 1.4879647493362427, 1.5751510858535767, 1.662337303161621, 1.749523639678955, 1.836709976196289, 1.923896312713623, 2.011082649230957, 2.098268985748291, 2.185455322265625, 2.27264142036438, 2.359827756881714, 2.447014093399048, 2.534200429916382, 2.621386766433716, 2.70857310295105, 2.795759439468384, 2.8829455375671387, 2.9701318740844727, 3.0573182106018066, 3.1445045471191406, 3.2316908836364746, 3.3188772201538086, 3.4060635566711426, 3.4932498931884766, 3.5804362297058105, 3.6676223278045654, 3.7548086643218994, 3.8419950008392334, 3.9291813373565674]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 7.0, 4.0, 4.0, 5.0, 12.0, 17.0, 11.0, 15.0, 16.0, 25.0, 20.0, 32.0, 45.0, 37.0, 44.0, 46.0, 47.0, 42.0, 56.0, 45.0, 46.0, 48.0, 39.0, 45.0, 34.0, 37.0, 39.0, 35.0, 27.0, 25.0, 16.0, 18.0, 11.0, 15.0, 8.0, 13.0, 5.0, 5.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3662573099136353, -1.3248897790908813, -1.2835222482681274, -1.2421547174453735, -1.2007871866226196, -1.1594196557998657, -1.1180521249771118, -1.0766847133636475, -1.0353171825408936, -0.9939496517181396, -0.9525821208953857, -0.9112145900726318, -0.8698470592498779, -0.828479528427124, -0.7871120572090149, -0.745744526386261, -0.7043769359588623, -0.6630094051361084, -0.6216418743133545, -0.5802743434906006, -0.5389068126678467, -0.49753931164741516, -0.45617181062698364, -0.41480427980422974, -0.37343674898147583, -0.3320692181587219, -0.290701687335968, -0.2493341863155365, -0.2079666554927826, -0.1665991246700287, -0.12523160874843597, -0.08386409282684326, -0.042496562004089355, -0.0011290386319160461, 0.04023848474025726, 0.08160600811243057, 0.12297353148460388, 0.1643410623073578, 0.2057085782289505, 0.2470760941505432, 0.2884436249732971, 0.329811155796051, 0.37117868661880493, 0.41254618763923645, 0.45391371846199036, 0.49528124928474426, 0.5366487503051758, 0.5780162811279297, 0.6193838119506836, 0.6607513427734375, 0.7021188735961914, 0.7434864044189453, 0.7848539352416992, 0.8262214660644531, 0.8675889372825623, 0.9089564681053162, 0.9503239989280701, 0.991691529750824, 1.033059000968933, 1.074426531791687, 1.115794062614441, 1.1571615934371948, 1.1985291242599487, 1.2398966550827026, 1.2812641859054565]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 8.0, 8.0, 13.0, 31.0, 103.0, 401.0, 2346.0, 116773.0, 4063102.0, 10359.0, 887.0, 145.0, 38.0, 23.0, 11.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.98046875, -4.853668212890625, -4.72686767578125, -4.600067138671875, -4.4732666015625, -4.346466064453125, -4.21966552734375, -4.092864990234375, -3.966064453125, -3.839263916015625, -3.71246337890625, -3.585662841796875, -3.4588623046875, -3.332061767578125, -3.20526123046875, -3.078460693359375, -2.95166015625, -2.824859619140625, -2.69805908203125, -2.571258544921875, -2.4444580078125, -2.317657470703125, -2.19085693359375, -2.064056396484375, -1.937255859375, -1.810455322265625, -1.68365478515625, -1.556854248046875, -1.4300537109375, -1.303253173828125, -1.17645263671875, -1.049652099609375, -0.9228515625, -0.796051025390625, -0.66925048828125, -0.542449951171875, -0.4156494140625, -0.288848876953125, -0.16204833984375, -0.035247802734375, 0.091552734375, 0.218353271484375, 0.34515380859375, 0.471954345703125, 0.5987548828125, 0.725555419921875, 0.85235595703125, 0.979156494140625, 1.10595703125, 1.232757568359375, 1.35955810546875, 1.486358642578125, 1.6131591796875, 1.739959716796875, 1.86676025390625, 1.993560791015625, 2.120361328125, 2.247161865234375, 2.37396240234375, 2.500762939453125, 2.6275634765625, 2.754364013671875, 2.88116455078125, 3.007965087890625, 3.134765625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 10.0, 16.0, 13.0, 21.0, 22.0, 22.0, 44.0, 43.0, 49.0, 61.0, 60.0, 70.0, 58.0, 53.0, 72.0, 52.0, 44.0, 46.0, 41.0, 41.0, 25.0, 25.0, 24.0, 18.0, 10.0, 9.0, 7.0, 6.0, 3.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7305755615234375, -0.709686279296875, -0.6887969970703125, -0.66790771484375, -0.6470184326171875, -0.626129150390625, -0.6052398681640625, -0.5843505859375, -0.5634613037109375, -0.542572021484375, -0.5216827392578125, -0.50079345703125, -0.4799041748046875, -0.459014892578125, -0.4381256103515625, -0.417236328125, -0.3963470458984375, -0.375457763671875, -0.3545684814453125, -0.33367919921875, -0.3127899169921875, -0.291900634765625, -0.2710113525390625, -0.2501220703125, -0.2292327880859375, -0.208343505859375, -0.1874542236328125, -0.16656494140625, -0.1456756591796875, -0.124786376953125, -0.1038970947265625, -0.0830078125, -0.0621185302734375, -0.041229248046875, -0.0203399658203125, 0.00054931640625, 0.0214385986328125, 0.042327880859375, 0.0632171630859375, 0.0841064453125, 0.1049957275390625, 0.125885009765625, 0.1467742919921875, 0.16766357421875, 0.1885528564453125, 0.209442138671875, 0.2303314208984375, 0.251220703125, 0.2721099853515625, 0.292999267578125, 0.3138885498046875, 0.33477783203125, 0.3556671142578125, 0.376556396484375, 0.3974456787109375, 0.4183349609375, 0.4392242431640625, 0.460113525390625, 0.4810028076171875, 0.50189208984375, 0.5227813720703125, 0.543670654296875, 0.5645599365234375, 0.58544921875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 12.0, 16.0, 14.0, 24.0, 31.0, 49.0, 77.0, 121.0, 204.0, 445.0, 1052.0, 3829.0, 24952.0, 3052600.0, 1089038.0, 17043.0, 2955.0, 889.0, 362.0, 186.0, 97.0, 65.0, 42.0, 33.0, 24.0, 24.0, 14.0, 14.0, 8.0, 5.0, 6.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.716796875, -1.661285400390625, -1.60577392578125, -1.550262451171875, -1.4947509765625, -1.439239501953125, -1.38372802734375, -1.328216552734375, -1.272705078125, -1.217193603515625, -1.16168212890625, -1.106170654296875, -1.0506591796875, -0.995147705078125, -0.93963623046875, -0.884124755859375, -0.82861328125, -0.773101806640625, -0.71759033203125, -0.662078857421875, -0.6065673828125, -0.551055908203125, -0.49554443359375, -0.440032958984375, -0.384521484375, -0.329010009765625, -0.27349853515625, -0.217987060546875, -0.1624755859375, -0.106964111328125, -0.05145263671875, 0.004058837890625, 0.0595703125, 0.115081787109375, 0.17059326171875, 0.226104736328125, 0.2816162109375, 0.337127685546875, 0.39263916015625, 0.448150634765625, 0.503662109375, 0.559173583984375, 0.61468505859375, 0.670196533203125, 0.7257080078125, 0.781219482421875, 0.83673095703125, 0.892242431640625, 0.94775390625, 1.003265380859375, 1.05877685546875, 1.114288330078125, 1.1697998046875, 1.225311279296875, 1.28082275390625, 1.336334228515625, 1.391845703125, 1.447357177734375, 1.50286865234375, 1.558380126953125, 1.6138916015625, 1.669403076171875, 1.72491455078125, 1.780426025390625, 1.8359375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 9.0, 5.0, 14.0, 11.0, 17.0, 39.0, 42.0, 100.0, 183.0, 379.0, 742.0, 1022.0, 700.0, 332.0, 185.0, 93.0, 57.0, 48.0, 28.0, 22.0, 17.0, 6.0, 9.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.25724029541015625, -0.2471466064453125, -0.23705291748046875, -0.226959228515625, -0.21686553955078125, -0.2067718505859375, -0.19667816162109375, -0.18658447265625, -0.17649078369140625, -0.1663970947265625, -0.15630340576171875, -0.146209716796875, -0.13611602783203125, -0.1260223388671875, -0.11592864990234375, -0.1058349609375, -0.09574127197265625, -0.0856475830078125, -0.07555389404296875, -0.065460205078125, -0.05536651611328125, -0.0452728271484375, -0.03517913818359375, -0.02508544921875, -0.01499176025390625, -0.0048980712890625, 0.00519561767578125, 0.015289306640625, 0.02538299560546875, 0.0354766845703125, 0.04557037353515625, 0.0556640625, 0.06575775146484375, 0.0758514404296875, 0.08594512939453125, 0.096038818359375, 0.10613250732421875, 0.1162261962890625, 0.12631988525390625, 0.13641357421875, 0.14650726318359375, 0.1566009521484375, 0.16669464111328125, 0.176788330078125, 0.18688201904296875, 0.1969757080078125, 0.20706939697265625, 0.2171630859375, 0.22725677490234375, 0.2373504638671875, 0.24744415283203125, 0.257537841796875, 0.26763153076171875, 0.2777252197265625, 0.28781890869140625, 0.29791259765625, 0.30800628662109375, 0.3180999755859375, 0.32819366455078125, 0.338287353515625, 0.34838104248046875, 0.3584747314453125, 0.36856842041015625, 0.378662109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 3.0, 6.0, 17.0, 17.0, 35.0, 50.0, 72.0, 103.0, 96.0, 102.0, 121.0, 97.0, 78.0, 67.0, 33.0, 28.0, 11.0, 16.0, 8.0, 12.0, 2.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9992645978927612, -0.9685320854187012, -0.9377995729446411, -0.9070670008659363, -0.8763344883918762, -0.8456019759178162, -0.8148694038391113, -0.7841368913650513, -0.7534043788909912, -0.7226718664169312, -0.6919393539428711, -0.6612067818641663, -0.6304742693901062, -0.5997417569160461, -0.5690091848373413, -0.5382766723632812, -0.5075441598892212, -0.47681164741516113, -0.4460791051387787, -0.41534656286239624, -0.3846140503883362, -0.3538815379142761, -0.3231489956378937, -0.29241645336151123, -0.26168394088745117, -0.23095141351222992, -0.20021888613700867, -0.16948635876178741, -0.13875383138656616, -0.10802130401134491, -0.07728877663612366, -0.046556249260902405, -0.015823781490325928, 0.014908745884895325, 0.04564127326011658, 0.07637380063533783, 0.10710632801055908, 0.13783885538578033, 0.1685713827610016, 0.19930391013622284, 0.2300364375114441, 0.26076894998550415, 0.2915014922618866, 0.32223403453826904, 0.3529665470123291, 0.38369905948638916, 0.4144316017627716, 0.44516414403915405, 0.4758966565132141, 0.5066291689872742, 0.537361741065979, 0.5680942535400391, 0.5988267660140991, 0.6295592784881592, 0.6602917909622192, 0.6910243630409241, 0.7217568755149841, 0.7524893879890442, 0.783221960067749, 0.8139544725418091, 0.8446869850158691, 0.8754194974899292, 0.9061520099639893, 0.9368845820426941, 0.9676170945167542]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 8.0, 5.0, 7.0, 6.0, 16.0, 14.0, 17.0, 16.0, 20.0, 30.0, 37.0, 41.0, 44.0, 36.0, 41.0, 43.0, 44.0, 50.0, 46.0, 55.0, 38.0, 44.0, 41.0, 42.0, 36.0, 37.0, 29.0, 21.0, 19.0, 14.0, 17.0, 16.0, 12.0, 15.0, 6.0, 7.0, 7.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-0.6784250140190125, -0.6610329747200012, -0.64364093542099, -0.6262488961219788, -0.6088568568229675, -0.5914648175239563, -0.5740727782249451, -0.5566807985305786, -0.5392887592315674, -0.5218967199325562, -0.5045046806335449, -0.4871126413345337, -0.46972060203552246, -0.45232856273651123, -0.4349365532398224, -0.41754451394081116, -0.40015244483947754, -0.3827604055404663, -0.3653683662414551, -0.34797632694244385, -0.3305842876434326, -0.3131922483444214, -0.29580023884773254, -0.2784081995487213, -0.2610161602497101, -0.24362412095069885, -0.22623208165168762, -0.20884005725383759, -0.19144801795482635, -0.17405597865581512, -0.1566639542579651, -0.13927191495895386, -0.12187981605529785, -0.10448777675628662, -0.08709574490785599, -0.06970371305942535, -0.052311673760414124, -0.03491963446140289, -0.01752760261297226, -0.00013557076454162598, 0.017256468534469604, 0.034648504108190536, 0.05204053968191147, 0.0694325715303421, 0.08682461082935333, 0.10421665012836456, 0.1216086819767952, 0.13900071382522583, 0.15639275312423706, 0.1737847924232483, 0.19117683172225952, 0.20856885612010956, 0.2259608954191208, 0.24335293471813202, 0.26074495911598206, 0.2781369984149933, 0.2955290377140045, 0.31292107701301575, 0.330313116312027, 0.3477051556110382, 0.36509716510772705, 0.3824892044067383, 0.3998812437057495, 0.41727328300476074, 0.434665322303772]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 5.0, 8.0, 14.0, 15.0, 35.0, 46.0, 53.0, 135.0, 320.0, 1299.0, 8860.0, 163509.0, 825631.0, 43640.0, 3791.0, 669.0, 230.0, 117.0, 41.0, 44.0, 25.0, 18.0, 8.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416015625, -0.4038887023925781, -0.39176177978515625, -0.3796348571777344, -0.3675079345703125, -0.3553810119628906, -0.34325408935546875, -0.3311271667480469, -0.319000244140625, -0.3068733215332031, -0.29474639892578125, -0.2826194763183594, -0.2704925537109375, -0.2583656311035156, -0.24623870849609375, -0.23411178588867188, -0.22198486328125, -0.20985794067382812, -0.19773101806640625, -0.18560409545898438, -0.1734771728515625, -0.16135025024414062, -0.14922332763671875, -0.13709640502929688, -0.124969482421875, -0.11284255981445312, -0.10071563720703125, -0.08858871459960938, -0.0764617919921875, -0.06433486938476562, -0.05220794677734375, -0.040081024169921875, -0.0279541015625, -0.015827178955078125, -0.00370025634765625, 0.008426666259765625, 0.0205535888671875, 0.032680511474609375, 0.04480743408203125, 0.056934356689453125, 0.069061279296875, 0.08118820190429688, 0.09331512451171875, 0.10544204711914062, 0.1175689697265625, 0.12969589233398438, 0.14182281494140625, 0.15394973754882812, 0.16607666015625, 0.17820358276367188, 0.19033050537109375, 0.20245742797851562, 0.2145843505859375, 0.22671127319335938, 0.23883819580078125, 0.2509651184082031, 0.263092041015625, 0.2752189636230469, 0.28734588623046875, 0.2994728088378906, 0.3115997314453125, 0.3237266540527344, 0.33585357666015625, 0.3479804992675781, 0.360107421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 10.0, 13.0, 24.0, 42.0, 48.0, 66.0, 91.0, 90.0, 119.0, 113.0, 90.0, 86.0, 54.0, 45.0, 37.0, 31.0, 16.0, 14.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.476715087890625, -0.45147705078125, -0.426239013671875, -0.4010009765625, -0.375762939453125, -0.35052490234375, -0.325286865234375, -0.300048828125, -0.274810791015625, -0.24957275390625, -0.224334716796875, -0.1990966796875, -0.173858642578125, -0.14862060546875, -0.123382568359375, -0.09814453125, -0.072906494140625, -0.04766845703125, -0.022430419921875, 0.0028076171875, 0.028045654296875, 0.05328369140625, 0.078521728515625, 0.103759765625, 0.128997802734375, 0.15423583984375, 0.179473876953125, 0.2047119140625, 0.229949951171875, 0.25518798828125, 0.280426025390625, 0.3056640625, 0.330902099609375, 0.35614013671875, 0.381378173828125, 0.4066162109375, 0.431854248046875, 0.45709228515625, 0.482330322265625, 0.507568359375, 0.532806396484375, 0.55804443359375, 0.583282470703125, 0.6085205078125, 0.633758544921875, 0.65899658203125, 0.684234619140625, 0.70947265625, 0.734710693359375, 0.75994873046875, 0.785186767578125, 0.8104248046875, 0.835662841796875, 0.86090087890625, 0.886138916015625, 0.911376953125, 0.936614990234375, 0.96185302734375, 0.987091064453125, 1.0123291015625, 1.037567138671875, 1.06280517578125, 1.088043212890625, 1.11328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 7.0, 14.0, 19.0, 21.0, 23.0, 42.0, 60.0, 93.0, 137.0, 240.0, 377.0, 698.0, 1349.0, 3044.0, 8095.0, 25305.0, 104787.0, 425710.0, 363034.0, 82464.0, 20757.0, 6802.0, 2715.0, 1194.0, 602.0, 320.0, 219.0, 134.0, 83.0, 65.0, 33.0, 20.0, 20.0, 16.0, 12.0, 2.0, 9.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12471580505371094, -0.12040328979492188, -0.11609077453613281, -0.11177825927734375, -0.10746574401855469, -0.10315322875976562, -0.09884071350097656, -0.0945281982421875, -0.09021568298339844, -0.08590316772460938, -0.08159065246582031, -0.07727813720703125, -0.07296562194824219, -0.06865310668945312, -0.06434059143066406, -0.060028076171875, -0.05571556091308594, -0.051403045654296875, -0.04709053039550781, -0.04277801513671875, -0.03846549987792969, -0.034152984619140625, -0.029840469360351562, -0.0255279541015625, -0.021215438842773438, -0.016902923583984375, -0.012590408325195312, -0.00827789306640625, -0.0039653778076171875, 0.000347137451171875, 0.0046596527099609375, 0.00897216796875, 0.013284683227539062, 0.017597198486328125, 0.021909713745117188, 0.02622222900390625, 0.030534744262695312, 0.034847259521484375, 0.03915977478027344, 0.0434722900390625, 0.04778480529785156, 0.052097320556640625, 0.05640983581542969, 0.06072235107421875, 0.06503486633300781, 0.06934738159179688, 0.07365989685058594, 0.077972412109375, 0.08228492736816406, 0.08659744262695312, 0.09090995788574219, 0.09522247314453125, 0.09953498840332031, 0.10384750366210938, 0.10816001892089844, 0.1124725341796875, 0.11678504943847656, 0.12109756469726562, 0.1254100799560547, 0.12972259521484375, 0.1340351104736328, 0.13834762573242188, 0.14266014099121094, 0.14697265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 11.0, 6.0, 7.0, 10.0, 9.0, 14.0, 13.0, 23.0, 21.0, 32.0, 38.0, 27.0, 37.0, 33.0, 34.0, 55.0, 40.0, 43.0, 40.0, 45.0, 49.0, 46.0, 50.0, 42.0, 29.0, 29.0, 20.0, 17.0, 30.0, 24.0, 21.0, 20.0, 11.0, 8.0, 10.0, 5.0, 6.0, 8.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.67578125, -0.655487060546875, -0.63519287109375, -0.614898681640625, -0.5946044921875, -0.574310302734375, -0.55401611328125, -0.533721923828125, -0.513427734375, -0.493133544921875, -0.47283935546875, -0.452545166015625, -0.4322509765625, -0.411956787109375, -0.39166259765625, -0.371368408203125, -0.35107421875, -0.330780029296875, -0.31048583984375, -0.290191650390625, -0.2698974609375, -0.249603271484375, -0.22930908203125, -0.209014892578125, -0.188720703125, -0.168426513671875, -0.14813232421875, -0.127838134765625, -0.1075439453125, -0.087249755859375, -0.06695556640625, -0.046661376953125, -0.0263671875, -0.006072998046875, 0.01422119140625, 0.034515380859375, 0.0548095703125, 0.075103759765625, 0.09539794921875, 0.115692138671875, 0.135986328125, 0.156280517578125, 0.17657470703125, 0.196868896484375, 0.2171630859375, 0.237457275390625, 0.25775146484375, 0.278045654296875, 0.29833984375, 0.318634033203125, 0.33892822265625, 0.359222412109375, 0.3795166015625, 0.399810791015625, 0.42010498046875, 0.440399169921875, 0.460693359375, 0.480987548828125, 0.50128173828125, 0.521575927734375, 0.5418701171875, 0.562164306640625, 0.58245849609375, 0.602752685546875, 0.623046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 9.0, 10.0, 15.0, 15.0, 29.0, 47.0, 65.0, 95.0, 146.0, 244.0, 392.0, 643.0, 1109.0, 1989.0, 3831.0, 8190.0, 19542.0, 53371.0, 164126.0, 380678.0, 269507.0, 89798.0, 30813.0, 12282.0, 5416.0, 2705.0, 1405.0, 803.0, 450.0, 287.0, 179.0, 109.0, 62.0, 52.0, 46.0, 21.0, 18.0, 9.0, 5.0, 8.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0270538330078125, -0.02611231803894043, -0.02517080307006836, -0.02422928810119629, -0.02328777313232422, -0.02234625816345215, -0.021404743194580078, -0.020463228225708008, -0.019521713256835938, -0.018580198287963867, -0.017638683319091797, -0.016697168350219727, -0.015755653381347656, -0.014814138412475586, -0.013872623443603516, -0.012931108474731445, -0.011989593505859375, -0.011048078536987305, -0.010106563568115234, -0.009165048599243164, -0.008223533630371094, -0.0072820186614990234, -0.006340503692626953, -0.005398988723754883, -0.0044574737548828125, -0.003515958786010742, -0.002574443817138672, -0.0016329288482666016, -0.0006914138793945312, 0.00025010108947753906, 0.0011916160583496094, 0.0021331310272216797, 0.00307464599609375, 0.00401616096496582, 0.004957675933837891, 0.005899190902709961, 0.006840705871582031, 0.0077822208404541016, 0.008723735809326172, 0.009665250778198242, 0.010606765747070312, 0.011548280715942383, 0.012489795684814453, 0.013431310653686523, 0.014372825622558594, 0.015314340591430664, 0.016255855560302734, 0.017197370529174805, 0.018138885498046875, 0.019080400466918945, 0.020021915435791016, 0.020963430404663086, 0.021904945373535156, 0.022846460342407227, 0.023787975311279297, 0.024729490280151367, 0.025671005249023438, 0.026612520217895508, 0.027554035186767578, 0.02849555015563965, 0.02943706512451172, 0.03037858009338379, 0.03132009506225586, 0.03226161003112793, 0.033203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 9.0, 13.0, 19.0, 23.0, 42.0, 39.0, 50.0, 60.0, 85.0, 80.0, 86.0, 83.0, 83.0, 79.0, 42.0, 43.0, 27.0, 19.0, 26.0, 21.0, 11.0, 10.0, 5.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5676021575927734e-05, -1.5006400644779205e-05, -1.4336779713630676e-05, -1.3667158782482147e-05, -1.2997537851333618e-05, -1.2327916920185089e-05, -1.165829598903656e-05, -1.0988675057888031e-05, -1.0319054126739502e-05, -9.649433195590973e-06, -8.979812264442444e-06, -8.310191333293915e-06, -7.640570402145386e-06, -6.970949470996857e-06, -6.301328539848328e-06, -5.631707608699799e-06, -4.9620866775512695e-06, -4.2924657464027405e-06, -3.6228448152542114e-06, -2.9532238841056824e-06, -2.2836029529571533e-06, -1.6139820218086243e-06, -9.443610906600952e-07, -2.7474015951156616e-07, 3.948807716369629e-07, 1.064501702785492e-06, 1.734122633934021e-06, 2.40374356508255e-06, 3.073364496231079e-06, 3.742985427379608e-06, 4.412606358528137e-06, 5.082227289676666e-06, 5.751848220825195e-06, 6.421469151973724e-06, 7.091090083122253e-06, 7.760711014270782e-06, 8.430331945419312e-06, 9.09995287656784e-06, 9.76957380771637e-06, 1.0439194738864899e-05, 1.1108815670013428e-05, 1.1778436601161957e-05, 1.2448057532310486e-05, 1.3117678463459015e-05, 1.3787299394607544e-05, 1.4456920325756073e-05, 1.5126541256904602e-05, 1.579616218805313e-05, 1.646578311920166e-05, 1.713540405035019e-05, 1.7805024981498718e-05, 1.8474645912647247e-05, 1.9144266843795776e-05, 1.9813887774944305e-05, 2.0483508706092834e-05, 2.1153129637241364e-05, 2.1822750568389893e-05, 2.249237149953842e-05, 2.316199243068695e-05, 2.383161336183548e-05, 2.450123429298401e-05, 2.5170855224132538e-05, 2.5840476155281067e-05, 2.6510097086429596e-05, 2.7179718017578125e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 9.0, 23.0, 23.0, 35.0, 72.0, 89.0, 119.0, 249.0, 441.0, 894.0, 2040.0, 4922.0, 13885.0, 45013.0, 156751.0, 409881.0, 288074.0, 85852.0, 25472.0, 8598.0, 3244.0, 1384.0, 662.0, 325.0, 183.0, 112.0, 64.0, 42.0, 29.0, 14.0, 12.0, 13.0, 2.0, 3.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0285797119140625, -0.0275118350982666, -0.026443958282470703, -0.025376081466674805, -0.024308204650878906, -0.023240327835083008, -0.02217245101928711, -0.02110457420349121, -0.020036697387695312, -0.018968820571899414, -0.017900943756103516, -0.016833066940307617, -0.01576519012451172, -0.01469731330871582, -0.013629436492919922, -0.012561559677124023, -0.011493682861328125, -0.010425806045532227, -0.009357929229736328, -0.00829005241394043, -0.007222175598144531, -0.006154298782348633, -0.005086421966552734, -0.004018545150756836, -0.0029506683349609375, -0.001882791519165039, -0.0008149147033691406, 0.0002529621124267578, 0.0013208389282226562, 0.0023887157440185547, 0.003456592559814453, 0.0045244693756103516, 0.00559234619140625, 0.0066602230072021484, 0.007728099822998047, 0.008795976638793945, 0.009863853454589844, 0.010931730270385742, 0.01199960708618164, 0.013067483901977539, 0.014135360717773438, 0.015203237533569336, 0.016271114349365234, 0.017338991165161133, 0.01840686798095703, 0.01947474479675293, 0.020542621612548828, 0.021610498428344727, 0.022678375244140625, 0.023746252059936523, 0.024814128875732422, 0.02588200569152832, 0.02694988250732422, 0.028017759323120117, 0.029085636138916016, 0.030153512954711914, 0.031221389770507812, 0.03228926658630371, 0.03335714340209961, 0.03442502021789551, 0.035492897033691406, 0.036560773849487305, 0.0376286506652832, 0.0386965274810791, 0.039764404296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 14.0, 19.0, 14.0, 20.0, 37.0, 20.0, 34.0, 43.0, 43.0, 52.0, 48.0, 78.0, 51.0, 59.0, 56.0, 51.0, 56.0, 49.0, 49.0, 44.0, 29.0, 23.0, 20.0, 13.0, 20.0, 14.0, 7.0, 7.0, 7.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0085906982421875, -0.008340597152709961, -0.008090496063232422, -0.007840394973754883, -0.007590293884277344, -0.007340192794799805, -0.007090091705322266, -0.0068399906158447266, -0.0065898895263671875, -0.0063397884368896484, -0.006089687347412109, -0.00583958625793457, -0.005589485168457031, -0.005339384078979492, -0.005089282989501953, -0.004839181900024414, -0.004589080810546875, -0.004338979721069336, -0.004088878631591797, -0.003838777542114258, -0.0035886764526367188, -0.0033385753631591797, -0.0030884742736816406, -0.0028383731842041016, -0.0025882720947265625, -0.0023381710052490234, -0.0020880699157714844, -0.0018379688262939453, -0.0015878677368164062, -0.0013377666473388672, -0.0010876655578613281, -0.0008375644683837891, -0.00058746337890625, -0.00033736228942871094, -8.726119995117188e-05, 0.0001628398895263672, 0.00041294097900390625, 0.0006630420684814453, 0.0009131431579589844, 0.0011632442474365234, 0.0014133453369140625, 0.0016634464263916016, 0.0019135475158691406, 0.0021636486053466797, 0.0024137496948242188, 0.002663850784301758, 0.002913951873779297, 0.003164052963256836, 0.003414154052734375, 0.003664255142211914, 0.003914356231689453, 0.004164457321166992, 0.004414558410644531, 0.00466465950012207, 0.004914760589599609, 0.0051648616790771484, 0.0054149627685546875, 0.0056650638580322266, 0.005915164947509766, 0.006165266036987305, 0.006415367126464844, 0.006665468215942383, 0.006915569305419922, 0.007165670394897461, 0.007415771484375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 25.0, 49.0, 67.0, 130.0, 156.0, 162.0, 146.0, 87.0, 56.0, 29.0, 17.0, 18.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0424214601516724, -1.016438364982605, -0.9904552102088928, -0.9644720554351807, -0.9384889602661133, -0.9125058054924011, -0.886522650718689, -0.8605395555496216, -0.8345564007759094, -0.8085732460021973, -0.7825901508331299, -0.7566069960594177, -0.7306239008903503, -0.7046407461166382, -0.6786576509475708, -0.6526744961738586, -0.6266913414001465, -0.6007081866264343, -0.5747250914573669, -0.5487419366836548, -0.5227588415145874, -0.49677568674087524, -0.4707925617694855, -0.4448094367980957, -0.4188263416290283, -0.39284321665763855, -0.3668600916862488, -0.3408769369125366, -0.31489381194114685, -0.2889106869697571, -0.2629275619983673, -0.23694442212581635, -0.21096128225326538, -0.1849781572818756, -0.15899501740932465, -0.13301189243793488, -0.10702876001596451, -0.08104562759399414, -0.05506250262260437, -0.029079362750053406, -0.0030962377786636353, 0.022886892780661583, 0.0488700233399868, 0.07485315203666687, 0.10083628445863724, 0.1268194168806076, 0.15280254185199738, 0.17878568172454834, 0.2047688066959381, 0.23075193166732788, 0.25673505663871765, 0.2827181816101074, 0.3087013363838196, 0.33468446135520935, 0.3606675863265991, 0.3866507411003113, 0.41263383626937866, 0.43861696124076843, 0.4646000862121582, 0.49058324098587036, 0.5165663361549377, 0.5425494909286499, 0.5685325860977173, 0.5945157408714294, 0.6204988956451416]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 1.0, 4.0, 5.0, 9.0, 10.0, 10.0, 14.0, 15.0, 21.0, 27.0, 27.0, 38.0, 66.0, 57.0, 37.0, 55.0, 47.0, 71.0, 57.0, 43.0, 63.0, 54.0, 42.0, 51.0, 23.0, 30.0, 17.0, 19.0, 22.0, 11.0, 11.0, 14.0, 8.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.5165902376174927, -0.5032188892364502, -0.4898475110530853, -0.47647616267204285, -0.46310481429100037, -0.4497334361076355, -0.436362087726593, -0.42299073934555054, -0.40961939096450806, -0.3962480425834656, -0.3828766644001007, -0.3695053160190582, -0.35613396763801575, -0.3427625894546509, -0.3293912410736084, -0.3160198926925659, -0.30264851450920105, -0.28927716612815857, -0.2759057879447937, -0.2625344395637512, -0.24916309118270874, -0.23579172790050507, -0.2224203646183014, -0.2090490162372589, -0.19567765295505524, -0.18230628967285156, -0.16893494129180908, -0.1555635780096054, -0.14219221472740173, -0.12882086634635925, -0.11544950306415558, -0.1020781472325325, -0.08870676159858704, -0.07533540576696396, -0.06196404621005058, -0.04859268665313721, -0.03522133082151413, -0.021849974989891052, -0.008478611707687378, 0.0048927441239356995, 0.018264099955558777, 0.031635455787181854, 0.04500681534409523, 0.058378174901008606, 0.07174953073263168, 0.08512088656425476, 0.09849224984645844, 0.11186360567808151, 0.1252349615097046, 0.13860632479190826, 0.15197767317295074, 0.16534903645515442, 0.1787203848361969, 0.19209174811840057, 0.20546311140060425, 0.21883445978164673, 0.2322058230638504, 0.24557718634605408, 0.25894853472709656, 0.2723199129104614, 0.2856912612915039, 0.2990626096725464, 0.31243395805358887, 0.32580533623695374, 0.3391766846179962]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 12.0, 3.0, 12.0, 12.0, 14.0, 18.0, 27.0, 29.0, 31.0, 99.0, 320.0, 2063.0, 43276.0, 979345.0, 21328.0, 1431.0, 257.0, 70.0, 51.0, 22.0, 19.0, 17.0, 19.0, 12.0, 13.0, 10.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.5960693359375, -1.537841796875, -1.4796142578125, -1.42138671875, -1.3631591796875, -1.304931640625, -1.2467041015625, -1.1884765625, -1.1302490234375, -1.072021484375, -1.0137939453125, -0.95556640625, -0.8973388671875, -0.839111328125, -0.7808837890625, -0.72265625, -0.6644287109375, -0.606201171875, -0.5479736328125, -0.48974609375, -0.4315185546875, -0.373291015625, -0.3150634765625, -0.2568359375, -0.1986083984375, -0.140380859375, -0.0821533203125, -0.02392578125, 0.0343017578125, 0.092529296875, 0.1507568359375, 0.208984375, 0.2672119140625, 0.325439453125, 0.3836669921875, 0.44189453125, 0.5001220703125, 0.558349609375, 0.6165771484375, 0.6748046875, 0.7330322265625, 0.791259765625, 0.8494873046875, 0.90771484375, 0.9659423828125, 1.024169921875, 1.0823974609375, 1.140625, 1.1988525390625, 1.257080078125, 1.3153076171875, 1.37353515625, 1.4317626953125, 1.489990234375, 1.5482177734375, 1.6064453125, 1.6646728515625, 1.722900390625, 1.7811279296875, 1.83935546875, 1.8975830078125, 1.955810546875, 2.0140380859375, 2.072265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 17.0, 19.0, 29.0, 40.0, 55.0, 67.0, 79.0, 78.0, 100.0, 87.0, 81.0, 81.0, 72.0, 39.0, 47.0, 30.0, 26.0, 9.0, 17.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.9453125, -1.9038925170898438, -1.8624725341796875, -1.8210525512695312, -1.779632568359375, -1.7382125854492188, -1.6967926025390625, -1.6553726196289062, -1.61395263671875, -1.5725326538085938, -1.5311126708984375, -1.4896926879882812, -1.448272705078125, -1.4068527221679688, -1.3654327392578125, -1.3240127563476562, -1.2825927734375, -1.2411727905273438, -1.1997528076171875, -1.1583328247070312, -1.116912841796875, -1.0754928588867188, -1.0340728759765625, -0.9926528930664062, -0.95123291015625, -0.9098129272460938, -0.8683929443359375, -0.8269729614257812, -0.785552978515625, -0.7441329956054688, -0.7027130126953125, -0.6612930297851562, -0.619873046875, -0.5784530639648438, -0.5370330810546875, -0.49561309814453125, -0.454193115234375, -0.41277313232421875, -0.3713531494140625, -0.32993316650390625, -0.28851318359375, -0.24709320068359375, -0.2056732177734375, -0.16425323486328125, -0.122833251953125, -0.08141326904296875, -0.0399932861328125, 0.00142669677734375, 0.0428466796875, 0.08426666259765625, 0.1256866455078125, 0.16710662841796875, 0.208526611328125, 0.24994659423828125, 0.2913665771484375, 0.33278656005859375, 0.37420654296875, 0.41562652587890625, 0.4570465087890625, 0.49846649169921875, 0.539886474609375, 0.5813064575195312, 0.6227264404296875, 0.6641464233398438, 0.70556640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 3.0, 3.0, 7.0, 19.0, 12.0, 19.0, 20.0, 27.0, 32.0, 60.0, 53.0, 78.0, 106.0, 137.0, 181.0, 292.0, 638.0, 2221.0, 19354.0, 866647.0, 149463.0, 6720.0, 1129.0, 461.0, 221.0, 160.0, 96.0, 74.0, 73.0, 46.0, 39.0, 37.0, 37.0, 16.0, 19.0, 16.0, 9.0, 4.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.330078125, -1.29290771484375, -1.2557373046875, -1.21856689453125, -1.181396484375, -1.14422607421875, -1.1070556640625, -1.06988525390625, -1.03271484375, -0.99554443359375, -0.9583740234375, -0.92120361328125, -0.884033203125, -0.84686279296875, -0.8096923828125, -0.77252197265625, -0.7353515625, -0.69818115234375, -0.6610107421875, -0.62384033203125, -0.586669921875, -0.54949951171875, -0.5123291015625, -0.47515869140625, -0.43798828125, -0.40081787109375, -0.3636474609375, -0.32647705078125, -0.289306640625, -0.25213623046875, -0.2149658203125, -0.17779541015625, -0.140625, -0.10345458984375, -0.0662841796875, -0.02911376953125, 0.008056640625, 0.04522705078125, 0.0823974609375, 0.11956787109375, 0.15673828125, 0.19390869140625, 0.2310791015625, 0.26824951171875, 0.305419921875, 0.34259033203125, 0.3797607421875, 0.41693115234375, 0.4541015625, 0.49127197265625, 0.5284423828125, 0.56561279296875, 0.602783203125, 0.63995361328125, 0.6771240234375, 0.71429443359375, 0.75146484375, 0.78863525390625, 0.8258056640625, 0.86297607421875, 0.900146484375, 0.93731689453125, 0.9744873046875, 1.01165771484375, 1.048828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 1.0, 0.0, 3.0, 13.0, 10.0, 15.0, 10.0, 15.0, 20.0, 26.0, 29.0, 34.0, 29.0, 27.0, 46.0, 35.0, 50.0, 43.0, 44.0, 46.0, 49.0, 36.0, 47.0, 47.0, 33.0, 40.0, 30.0, 30.0, 25.0, 22.0, 21.0, 25.0, 26.0, 12.0, 14.0, 16.0, 10.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.78076171875, -0.7582550048828125, -0.735748291015625, -0.7132415771484375, -0.69073486328125, -0.6682281494140625, -0.645721435546875, -0.6232147216796875, -0.6007080078125, -0.5782012939453125, -0.555694580078125, -0.5331878662109375, -0.51068115234375, -0.4881744384765625, -0.465667724609375, -0.4431610107421875, -0.420654296875, -0.3981475830078125, -0.375640869140625, -0.3531341552734375, -0.33062744140625, -0.3081207275390625, -0.285614013671875, -0.2631072998046875, -0.2406005859375, -0.2180938720703125, -0.195587158203125, -0.1730804443359375, -0.15057373046875, -0.1280670166015625, -0.105560302734375, -0.0830535888671875, -0.060546875, -0.0380401611328125, -0.015533447265625, 0.0069732666015625, 0.02947998046875, 0.0519866943359375, 0.074493408203125, 0.0970001220703125, 0.1195068359375, 0.1420135498046875, 0.164520263671875, 0.1870269775390625, 0.20953369140625, 0.2320404052734375, 0.254547119140625, 0.2770538330078125, 0.299560546875, 0.3220672607421875, 0.344573974609375, 0.3670806884765625, 0.38958740234375, 0.4120941162109375, 0.434600830078125, 0.4571075439453125, 0.4796142578125, 0.5021209716796875, 0.524627685546875, 0.5471343994140625, 0.56964111328125, 0.5921478271484375, 0.614654541015625, 0.6371612548828125, 0.65966796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 10.0, 11.0, 24.0, 29.0, 63.0, 64.0, 136.0, 281.0, 635.0, 1610.0, 5256.0, 28900.0, 892485.0, 104468.0, 10058.0, 2738.0, 934.0, 405.0, 188.0, 93.0, 52.0, 21.0, 25.0, 18.0, 11.0, 7.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.58056640625, -0.5647544860839844, -0.5489425659179688, -0.5331306457519531, -0.5173187255859375, -0.5015068054199219, -0.48569488525390625, -0.4698829650878906, -0.454071044921875, -0.4382591247558594, -0.42244720458984375, -0.4066352844238281, -0.3908233642578125, -0.3750114440917969, -0.35919952392578125, -0.3433876037597656, -0.32757568359375, -0.3117637634277344, -0.29595184326171875, -0.2801399230957031, -0.2643280029296875, -0.24851608276367188, -0.23270416259765625, -0.21689224243164062, -0.201080322265625, -0.18526840209960938, -0.16945648193359375, -0.15364456176757812, -0.1378326416015625, -0.12202072143554688, -0.10620880126953125, -0.09039688110351562, -0.0745849609375, -0.058773040771484375, -0.04296112060546875, -0.027149200439453125, -0.0113372802734375, 0.004474639892578125, 0.02028656005859375, 0.036098480224609375, 0.051910400390625, 0.06772232055664062, 0.08353424072265625, 0.09934616088867188, 0.1151580810546875, 0.13097000122070312, 0.14678192138671875, 0.16259384155273438, 0.17840576171875, 0.19421768188476562, 0.21002960205078125, 0.22584152221679688, 0.2416534423828125, 0.2574653625488281, 0.27327728271484375, 0.2890892028808594, 0.304901123046875, 0.3207130432128906, 0.33652496337890625, 0.3523368835449219, 0.3681488037109375, 0.3839607238769531, 0.39977264404296875, 0.4155845642089844, 0.431396484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 9.0, 14.0, 16.0, 30.0, 57.0, 78.0, 122.0, 169.0, 148.0, 113.0, 67.0, 35.0, 28.0, 22.0, 16.0, 15.0, 9.0, 5.0, 2.0, 4.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.713369369506836e-05, -3.584660589694977e-05, -3.455951809883118e-05, -3.3272430300712585e-05, -3.1985342502593994e-05, -3.06982547044754e-05, -2.941116690635681e-05, -2.812407910823822e-05, -2.683699131011963e-05, -2.5549903512001038e-05, -2.4262815713882446e-05, -2.2975727915763855e-05, -2.1688640117645264e-05, -2.0401552319526672e-05, -1.911446452140808e-05, -1.782737672328949e-05, -1.65402889251709e-05, -1.5253201127052307e-05, -1.3966113328933716e-05, -1.2679025530815125e-05, -1.1391937732696533e-05, -1.0104849934577942e-05, -8.81776213645935e-06, -7.530674338340759e-06, -6.243586540222168e-06, -4.956498742103577e-06, -3.6694109439849854e-06, -2.382323145866394e-06, -1.0952353477478027e-06, 1.9185245037078857e-07, 1.4789402484893799e-06, 2.766028046607971e-06, 4.0531158447265625e-06, 5.340203642845154e-06, 6.627291440963745e-06, 7.914379239082336e-06, 9.201467037200928e-06, 1.0488554835319519e-05, 1.177564263343811e-05, 1.3062730431556702e-05, 1.4349818229675293e-05, 1.5636906027793884e-05, 1.6923993825912476e-05, 1.8211081624031067e-05, 1.9498169422149658e-05, 2.078525722026825e-05, 2.207234501838684e-05, 2.3359432816505432e-05, 2.4646520614624023e-05, 2.5933608412742615e-05, 2.7220696210861206e-05, 2.8507784008979797e-05, 2.979487180709839e-05, 3.108195960521698e-05, 3.236904740333557e-05, 3.365613520145416e-05, 3.4943222999572754e-05, 3.6230310797691345e-05, 3.7517398595809937e-05, 3.880448639392853e-05, 4.009157419204712e-05, 4.137866199016571e-05, 4.26657497882843e-05, 4.395283758640289e-05, 4.5239925384521484e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 5.0, 18.0, 21.0, 37.0, 45.0, 68.0, 112.0, 183.0, 320.0, 582.0, 1401.0, 4399.0, 25733.0, 919543.0, 85067.0, 7204.0, 2023.0, 765.0, 411.0, 222.0, 104.0, 93.0, 51.0, 46.0, 19.0, 24.0, 11.0, 14.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.58251953125, -0.564697265625, -0.546875, -0.529052734375, -0.51123046875, -0.493408203125, -0.4755859375, -0.457763671875, -0.43994140625, -0.422119140625, -0.404296875, -0.386474609375, -0.36865234375, -0.350830078125, -0.3330078125, -0.315185546875, -0.29736328125, -0.279541015625, -0.26171875, -0.243896484375, -0.22607421875, -0.208251953125, -0.1904296875, -0.172607421875, -0.15478515625, -0.136962890625, -0.119140625, -0.101318359375, -0.08349609375, -0.065673828125, -0.0478515625, -0.030029296875, -0.01220703125, 0.005615234375, 0.0234375, 0.041259765625, 0.05908203125, 0.076904296875, 0.0947265625, 0.112548828125, 0.13037109375, 0.148193359375, 0.166015625, 0.183837890625, 0.20166015625, 0.219482421875, 0.2373046875, 0.255126953125, 0.27294921875, 0.290771484375, 0.30859375, 0.326416015625, 0.34423828125, 0.362060546875, 0.3798828125, 0.397705078125, 0.41552734375, 0.433349609375, 0.451171875, 0.468994140625, 0.48681640625, 0.504638671875, 0.5224609375, 0.540283203125, 0.55810546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 5.0, 10.0, 17.0, 18.0, 23.0, 52.0, 92.0, 191.0, 240.0, 147.0, 67.0, 48.0, 26.0, 19.0, 13.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15840530395507812, -0.15299224853515625, -0.14757919311523438, -0.1421661376953125, -0.13675308227539062, -0.13134002685546875, -0.12592697143554688, -0.120513916015625, -0.11510086059570312, -0.10968780517578125, -0.10427474975585938, -0.0988616943359375, -0.09344863891601562, -0.08803558349609375, -0.08262252807617188, -0.07720947265625, -0.07179641723632812, -0.06638336181640625, -0.060970306396484375, -0.0555572509765625, -0.050144195556640625, -0.04473114013671875, -0.039318084716796875, -0.033905029296875, -0.028491973876953125, -0.02307891845703125, -0.017665863037109375, -0.0122528076171875, -0.006839752197265625, -0.00142669677734375, 0.003986358642578125, 0.0093994140625, 0.014812469482421875, 0.02022552490234375, 0.025638580322265625, 0.0310516357421875, 0.036464691162109375, 0.04187774658203125, 0.047290802001953125, 0.052703857421875, 0.058116912841796875, 0.06352996826171875, 0.06894302368164062, 0.0743560791015625, 0.07976913452148438, 0.08518218994140625, 0.09059524536132812, 0.09600830078125, 0.10142135620117188, 0.10683441162109375, 0.11224746704101562, 0.1176605224609375, 0.12307357788085938, 0.12848663330078125, 0.13389968872070312, 0.139312744140625, 0.14472579956054688, 0.15013885498046875, 0.15555191040039062, 0.1609649658203125, 0.16637802124023438, 0.17179107666015625, 0.17720413208007812, 0.1826171875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 16.0, 27.0, 189.0, 510.0, 211.0, 46.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-10.072785377502441, -9.891287803649902, -9.709790229797363, -9.528292655944824, -9.346795082092285, -9.165298461914062, -8.983800888061523, -8.802303314208984, -8.620805740356445, -8.439308166503906, -8.257810592651367, -8.076313018798828, -7.894815921783447, -7.713318347930908, -7.531820774078369, -7.350323677062988, -7.168826103210449, -6.98732852935791, -6.805830955505371, -6.62433385848999, -6.442836284637451, -6.261338710784912, -6.079841136932373, -5.898344039916992, -5.716845989227295, -5.535348415374756, -5.353850841522217, -5.172353744506836, -4.990856170654297, -4.809358596801758, -4.627861022949219, -4.44636344909668, -4.264865875244141, -4.083368301391602, -3.9018709659576416, -3.7203733921051025, -3.5388760566711426, -3.3573784828186035, -3.1758809089660645, -2.9943835735321045, -2.8128862380981445, -2.6313886642456055, -2.4498913288116455, -2.2683937549591064, -2.0868964195251465, -1.9053988456726074, -1.723901391029358, -1.5424039363861084, -1.3609064817428589, -1.1794090270996094, -0.9979115724563599, -0.8164140582084656, -0.6349166035652161, -0.45341914892196655, -0.27192163467407227, -0.09042418003082275, 0.09107327461242676, 0.27257072925567627, 0.45406821370124817, 0.6355656981468201, 0.8170631527900696, 0.9985606074333191, 1.1800581216812134, 1.361555576324463, 1.5430530309677124]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 16.0, 24.0, 23.0, 25.0, 38.0, 64.0, 52.0, 71.0, 68.0, 69.0, 60.0, 73.0, 80.0, 62.0, 60.0, 41.0, 22.0, 30.0, 25.0, 25.0, 18.0, 8.0, 9.0, 8.0, 4.0, 3.0, 1.0, 3.0], "bins": [-2.7980833053588867, -2.738222360610962, -2.678361177444458, -2.618500232696533, -2.5586392879486084, -2.4987781047821045, -2.4389171600341797, -2.379056215286255, -2.319195032119751, -2.259334087371826, -2.1994729042053223, -2.1396119594573975, -2.0797510147094727, -2.0198898315429688, -1.960028886795044, -1.9001678228378296, -1.8403068780899048, -1.7804458141326904, -1.7205848693847656, -1.6607238054275513, -1.600862741470337, -1.541001796722412, -1.4811407327651978, -1.4212796688079834, -1.3614187240600586, -1.3015576601028442, -1.2416967153549194, -1.181835651397705, -1.1219745874404907, -1.0621135234832764, -1.0022525787353516, -0.9423915147781372, -0.8825305700302124, -0.8226695656776428, -0.7628085017204285, -0.7029474973678589, -0.6430864334106445, -0.583225429058075, -0.5233644247055054, -0.4635033905506134, -0.40364235639572144, -0.34378132224082947, -0.2839202880859375, -0.22405928373336792, -0.16419824957847595, -0.10433721542358398, -0.044476211071014404, 0.015384823083877563, 0.07524585723876953, 0.1351068913936615, 0.19496791064739227, 0.25482892990112305, 0.314689964056015, 0.374550998210907, 0.43441200256347656, 0.49427303671836853, 0.5541340708732605, 0.6139950752258301, 0.6738561391830444, 0.733717143535614, 0.7935781478881836, 0.853439211845398, 0.9133002161979675, 0.9731612205505371, 1.0330222845077515]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 12.0, 15.0, 18.0, 31.0, 38.0, 56.0, 120.0, 199.0, 376.0, 767.0, 2005.0, 6961.0, 44210.0, 1397688.0, 2650944.0, 77546.0, 8879.0, 2417.0, 958.0, 459.0, 217.0, 130.0, 67.0, 52.0, 28.0, 24.0, 11.0, 15.0, 7.0, 5.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.236602783203125, -1.19683837890625, -1.157073974609375, -1.1173095703125, -1.077545166015625, -1.03778076171875, -0.998016357421875, -0.958251953125, -0.918487548828125, -0.87872314453125, -0.838958740234375, -0.7991943359375, -0.759429931640625, -0.71966552734375, -0.679901123046875, -0.64013671875, -0.600372314453125, -0.56060791015625, -0.520843505859375, -0.4810791015625, -0.441314697265625, -0.40155029296875, -0.361785888671875, -0.322021484375, -0.282257080078125, -0.24249267578125, -0.202728271484375, -0.1629638671875, -0.123199462890625, -0.08343505859375, -0.043670654296875, -0.00390625, 0.035858154296875, 0.07562255859375, 0.115386962890625, 0.1551513671875, 0.194915771484375, 0.23468017578125, 0.274444580078125, 0.314208984375, 0.353973388671875, 0.39373779296875, 0.433502197265625, 0.4732666015625, 0.513031005859375, 0.55279541015625, 0.592559814453125, 0.63232421875, 0.672088623046875, 0.71185302734375, 0.751617431640625, 0.7913818359375, 0.831146240234375, 0.87091064453125, 0.910675048828125, 0.950439453125, 0.990203857421875, 1.02996826171875, 1.069732666015625, 1.1094970703125, 1.149261474609375, 1.18902587890625, 1.228790283203125, 1.2685546875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 5.0, 8.0, 16.0, 20.0, 19.0, 29.0, 37.0, 47.0, 46.0, 68.0, 68.0, 65.0, 65.0, 72.0, 75.0, 70.0, 50.0, 37.0, 34.0, 34.0, 25.0, 25.0, 9.0, 15.0, 12.0, 7.0, 4.0, 9.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.5605010986328125, -0.539459228515625, -0.5184173583984375, -0.49737548828125, -0.4763336181640625, -0.455291748046875, -0.4342498779296875, -0.4132080078125, -0.3921661376953125, -0.371124267578125, -0.3500823974609375, -0.32904052734375, -0.3079986572265625, -0.286956787109375, -0.2659149169921875, -0.244873046875, -0.2238311767578125, -0.202789306640625, -0.1817474365234375, -0.16070556640625, -0.1396636962890625, -0.118621826171875, -0.0975799560546875, -0.0765380859375, -0.0554962158203125, -0.034454345703125, -0.0134124755859375, 0.00762939453125, 0.0286712646484375, 0.049713134765625, 0.0707550048828125, 0.091796875, 0.1128387451171875, 0.133880615234375, 0.1549224853515625, 0.17596435546875, 0.1970062255859375, 0.218048095703125, 0.2390899658203125, 0.2601318359375, 0.2811737060546875, 0.302215576171875, 0.3232574462890625, 0.34429931640625, 0.3653411865234375, 0.386383056640625, 0.4074249267578125, 0.428466796875, 0.4495086669921875, 0.470550537109375, 0.4915924072265625, 0.51263427734375, 0.5336761474609375, 0.554718017578125, 0.5757598876953125, 0.5968017578125, 0.6178436279296875, 0.638885498046875, 0.6599273681640625, 0.68096923828125, 0.7020111083984375, 0.723052978515625, 0.7440948486328125, 0.76513671875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 9.0, 5.0, 11.0, 10.0, 19.0, 31.0, 55.0, 109.0, 238.0, 699.0, 2669.0, 25684.0, 3911140.0, 244054.0, 7421.0, 1370.0, 401.0, 161.0, 98.0, 37.0, 26.0, 20.0, 5.0, 8.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93701171875, -0.8775405883789062, -0.8180694580078125, -0.7585983276367188, -0.699127197265625, -0.6396560668945312, -0.5801849365234375, -0.5207138061523438, -0.46124267578125, -0.40177154541015625, -0.3423004150390625, -0.28282928466796875, -0.223358154296875, -0.16388702392578125, -0.1044158935546875, -0.04494476318359375, 0.0145263671875, 0.07399749755859375, 0.1334686279296875, 0.19293975830078125, 0.252410888671875, 0.31188201904296875, 0.3713531494140625, 0.43082427978515625, 0.49029541015625, 0.5497665405273438, 0.6092376708984375, 0.6687088012695312, 0.728179931640625, 0.7876510620117188, 0.8471221923828125, 0.9065933227539062, 0.966064453125, 1.0255355834960938, 1.0850067138671875, 1.1444778442382812, 1.203948974609375, 1.2634201049804688, 1.3228912353515625, 1.3823623657226562, 1.44183349609375, 1.5013046264648438, 1.5607757568359375, 1.6202468872070312, 1.679718017578125, 1.7391891479492188, 1.7986602783203125, 1.8581314086914062, 1.9176025390625, 1.9770736694335938, 2.0365447998046875, 2.0960159301757812, 2.155487060546875, 2.2149581909179688, 2.2744293212890625, 2.3339004516601562, 2.39337158203125, 2.4528427124023438, 2.5123138427734375, 2.5717849731445312, 2.631256103515625, 2.6907272338867188, 2.7501983642578125, 2.8096694946289062, 2.869140625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 10.0, 8.0, 21.0, 18.0, 40.0, 69.0, 116.0, 205.0, 437.0, 806.0, 1049.0, 621.0, 305.0, 149.0, 82.0, 49.0, 27.0, 19.0, 12.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.416259765625, -0.4068470001220703, -0.3974342346191406, -0.38802146911621094, -0.37860870361328125, -0.36919593811035156, -0.3597831726074219, -0.3503704071044922, -0.3409576416015625, -0.3315448760986328, -0.3221321105957031, -0.31271934509277344, -0.30330657958984375, -0.29389381408691406, -0.2844810485839844, -0.2750682830810547, -0.265655517578125, -0.2562427520751953, -0.24682998657226562, -0.23741722106933594, -0.22800445556640625, -0.21859169006347656, -0.20917892456054688, -0.1997661590576172, -0.1903533935546875, -0.1809406280517578, -0.17152786254882812, -0.16211509704589844, -0.15270233154296875, -0.14328956604003906, -0.13387680053710938, -0.12446403503417969, -0.11505126953125, -0.10563850402832031, -0.09622573852539062, -0.08681297302246094, -0.07740020751953125, -0.06798744201660156, -0.058574676513671875, -0.04916191101074219, -0.0397491455078125, -0.030336380004882812, -0.020923614501953125, -0.011510848999023438, -0.00209808349609375, 0.0073146820068359375, 0.016727447509765625, 0.026140213012695312, 0.035552978515625, 0.04496574401855469, 0.054378509521484375, 0.06379127502441406, 0.07320404052734375, 0.08261680603027344, 0.09202957153320312, 0.10144233703613281, 0.1108551025390625, 0.12026786804199219, 0.12968063354492188, 0.13909339904785156, 0.14850616455078125, 0.15791893005371094, 0.16733169555664062, 0.1767444610595703, 0.1861572265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 14.0, 10.0, 14.0, 23.0, 23.0, 39.0, 69.0, 80.0, 121.0, 128.0, 112.0, 109.0, 83.0, 59.0, 26.0, 32.0, 13.0, 11.0, 7.0, 10.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9831113219261169, -0.9531921148300171, -0.9232729077339172, -0.8933537006378174, -0.8634345531463623, -0.8335153460502625, -0.8035961389541626, -0.7736769318580627, -0.7437577247619629, -0.713838517665863, -0.6839193105697632, -0.6540001630783081, -0.6240809559822083, -0.5941617488861084, -0.5642425417900085, -0.5343233346939087, -0.5044041872024536, -0.47448498010635376, -0.4445658028125763, -0.41464659571647644, -0.384727418422699, -0.3548082113265991, -0.32488900423049927, -0.2949697971343994, -0.26505061984062195, -0.2351314276456833, -0.20521223545074463, -0.17529302835464478, -0.14537383615970612, -0.11545464396476746, -0.0855354368686676, -0.05561624467372894, -0.025697052478790283, 0.004222143441438675, 0.03414133936166763, 0.06406053900718689, 0.09397973120212555, 0.12389892339706421, 0.15381813049316406, 0.18373732268810272, 0.21365651488304138, 0.24357570707798004, 0.2734948992729187, 0.30341410636901855, 0.3333333134651184, 0.3632524907588959, 0.3931716978549957, 0.4230908751487732, 0.45301008224487305, 0.4829292893409729, 0.5128484964370728, 0.5427676439285278, 0.5726868510246277, 0.6026060581207275, 0.6325252652168274, 0.6624444723129272, 0.6923636198043823, 0.7222828269004822, 0.752202033996582, 0.7821211814880371, 0.812040388584137, 0.8419595956802368, 0.8718788027763367, 0.9017980098724365, 0.9317172169685364]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 1.0, 8.0, 5.0, 13.0, 20.0, 12.0, 20.0, 32.0, 36.0, 44.0, 47.0, 55.0, 61.0, 60.0, 73.0, 58.0, 63.0, 58.0, 63.0, 41.0, 44.0, 36.0, 27.0, 30.0, 16.0, 14.0, 17.0, 11.0, 8.0, 7.0, 1.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7302916049957275, -0.7096372246742249, -0.6889827847480774, -0.6683284044265747, -0.6476739645004272, -0.6270195841789246, -0.6063652038574219, -0.5857107639312744, -0.5650563836097717, -0.544402003288269, -0.5237475633621216, -0.5030931830406189, -0.4824387729167938, -0.46178436279296875, -0.44112998247146606, -0.420475572347641, -0.3998211622238159, -0.37916675209999084, -0.35851234197616577, -0.3378579616546631, -0.317203551530838, -0.29654914140701294, -0.27589476108551025, -0.2552403509616852, -0.2345859408378601, -0.21393153071403503, -0.19327713549137115, -0.17262274026870728, -0.1519683301448822, -0.13131392002105713, -0.11065952479839325, -0.09000512957572937, -0.0693507194519043, -0.04869631677865982, -0.028041914105415344, -0.007387511432170868, 0.013266891241073608, 0.033921293914318085, 0.05457569658756256, 0.07523009181022644, 0.09588450193405151, 0.11653890460729599, 0.13719330728054047, 0.15784770250320435, 0.17850211262702942, 0.1991565227508545, 0.21981091797351837, 0.24046531319618225, 0.2611197233200073, 0.2817741334438324, 0.30242854356765747, 0.32308292388916016, 0.34373733401298523, 0.3643917441368103, 0.385046124458313, 0.40570053458213806, 0.42635494470596313, 0.4470093548297882, 0.4676637649536133, 0.48831814527511597, 0.5089725255966187, 0.5296269655227661, 0.5502813458442688, 0.5709357261657715, 0.591590166091919]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 10.0, 20.0, 48.0, 113.0, 441.0, 2108.0, 15594.0, 963870.0, 61035.0, 4186.0, 768.0, 177.0, 75.0, 26.0, 23.0, 10.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8828125, -0.8616371154785156, -0.8404617309570312, -0.8192863464355469, -0.7981109619140625, -0.7769355773925781, -0.7557601928710938, -0.7345848083496094, -0.713409423828125, -0.6922340393066406, -0.6710586547851562, -0.6498832702636719, -0.6287078857421875, -0.6075325012207031, -0.5863571166992188, -0.5651817321777344, -0.54400634765625, -0.5228309631347656, -0.5016555786132812, -0.4804801940917969, -0.4593048095703125, -0.4381294250488281, -0.41695404052734375, -0.3957786560058594, -0.374603271484375, -0.3534278869628906, -0.33225250244140625, -0.3110771179199219, -0.2899017333984375, -0.2687263488769531, -0.24755096435546875, -0.22637557983398438, -0.2052001953125, -0.18402481079101562, -0.16284942626953125, -0.14167404174804688, -0.1204986572265625, -0.09932327270507812, -0.07814788818359375, -0.056972503662109375, -0.035797119140625, -0.014621734619140625, 0.00655364990234375, 0.027729034423828125, 0.0489044189453125, 0.07007980346679688, 0.09125518798828125, 0.11243057250976562, 0.13360595703125, 0.15478134155273438, 0.17595672607421875, 0.19713211059570312, 0.2183074951171875, 0.23948287963867188, 0.26065826416015625, 0.2818336486816406, 0.303009033203125, 0.3241844177246094, 0.34535980224609375, 0.3665351867675781, 0.3877105712890625, 0.4088859558105469, 0.43006134033203125, 0.4512367248535156, 0.472412109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 20.0, 14.0, 27.0, 30.0, 37.0, 67.0, 66.0, 78.0, 79.0, 82.0, 79.0, 81.0, 80.0, 65.0, 42.0, 36.0, 34.0, 17.0, 19.0, 12.0, 6.0, 8.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.794921875, -0.7758979797363281, -0.7568740844726562, -0.7378501892089844, -0.7188262939453125, -0.6998023986816406, -0.6807785034179688, -0.6617546081542969, -0.642730712890625, -0.6237068176269531, -0.6046829223632812, -0.5856590270996094, -0.5666351318359375, -0.5476112365722656, -0.5285873413085938, -0.5095634460449219, -0.49053955078125, -0.4715156555175781, -0.45249176025390625, -0.4334678649902344, -0.4144439697265625, -0.3954200744628906, -0.37639617919921875, -0.3573722839355469, -0.338348388671875, -0.3193244934082031, -0.30030059814453125, -0.2812767028808594, -0.2622528076171875, -0.24322891235351562, -0.22420501708984375, -0.20518112182617188, -0.1861572265625, -0.16713333129882812, -0.14810943603515625, -0.12908554077148438, -0.1100616455078125, -0.09103775024414062, -0.07201385498046875, -0.052989959716796875, -0.033966064453125, -0.014942169189453125, 0.00408172607421875, 0.023105621337890625, 0.0421295166015625, 0.061153411865234375, 0.08017730712890625, 0.09920120239257812, 0.11822509765625, 0.13724899291992188, 0.15627288818359375, 0.17529678344726562, 0.1943206787109375, 0.21334457397460938, 0.23236846923828125, 0.2513923645019531, 0.270416259765625, 0.2894401550292969, 0.30846405029296875, 0.3274879455566406, 0.3465118408203125, 0.3655357360839844, 0.38455963134765625, 0.4035835266113281, 0.422607421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 6.0, 4.0, 10.0, 9.0, 14.0, 27.0, 34.0, 35.0, 56.0, 110.0, 156.0, 283.0, 547.0, 1128.0, 2326.0, 5266.0, 15519.0, 91035.0, 605397.0, 278753.0, 32571.0, 8506.0, 3422.0, 1523.0, 784.0, 422.0, 235.0, 119.0, 78.0, 48.0, 31.0, 33.0, 12.0, 13.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.1678466796875, -0.16238784790039062, -0.15692901611328125, -0.15147018432617188, -0.1460113525390625, -0.14055252075195312, -0.13509368896484375, -0.12963485717773438, -0.124176025390625, -0.11871719360351562, -0.11325836181640625, -0.10779953002929688, -0.1023406982421875, -0.09688186645507812, -0.09142303466796875, -0.08596420288085938, -0.08050537109375, -0.07504653930664062, -0.06958770751953125, -0.06412887573242188, -0.0586700439453125, -0.053211212158203125, -0.04775238037109375, -0.042293548583984375, -0.036834716796875, -0.031375885009765625, -0.02591705322265625, -0.020458221435546875, -0.0149993896484375, -0.009540557861328125, -0.00408172607421875, 0.001377105712890625, 0.0068359375, 0.012294769287109375, 0.01775360107421875, 0.023212432861328125, 0.0286712646484375, 0.034130096435546875, 0.03958892822265625, 0.045047760009765625, 0.050506591796875, 0.055965423583984375, 0.06142425537109375, 0.06688308715820312, 0.0723419189453125, 0.07780075073242188, 0.08325958251953125, 0.08871841430664062, 0.09417724609375, 0.09963607788085938, 0.10509490966796875, 0.11055374145507812, 0.1160125732421875, 0.12147140502929688, 0.12693023681640625, 0.13238906860351562, 0.137847900390625, 0.14330673217773438, 0.14876556396484375, 0.15422439575195312, 0.1596832275390625, 0.16514205932617188, 0.17060089111328125, 0.17605972290039062, 0.1815185546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 8.0, 6.0, 9.0, 15.0, 13.0, 19.0, 17.0, 25.0, 25.0, 19.0, 34.0, 28.0, 43.0, 47.0, 31.0, 51.0, 47.0, 41.0, 52.0, 42.0, 43.0, 41.0, 41.0, 40.0, 34.0, 22.0, 29.0, 25.0, 20.0, 17.0, 13.0, 15.0, 14.0, 10.0, 8.0, 4.0, 4.0, 6.0, 10.0, 5.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6260986328125, -0.606201171875, -0.5863037109375, -0.56640625, -0.5465087890625, -0.526611328125, -0.5067138671875, -0.48681640625, -0.4669189453125, -0.447021484375, -0.4271240234375, -0.4072265625, -0.3873291015625, -0.367431640625, -0.3475341796875, -0.32763671875, -0.3077392578125, -0.287841796875, -0.2679443359375, -0.248046875, -0.2281494140625, -0.208251953125, -0.1883544921875, -0.16845703125, -0.1485595703125, -0.128662109375, -0.1087646484375, -0.0888671875, -0.0689697265625, -0.049072265625, -0.0291748046875, -0.00927734375, 0.0106201171875, 0.030517578125, 0.0504150390625, 0.0703125, 0.0902099609375, 0.110107421875, 0.1300048828125, 0.14990234375, 0.1697998046875, 0.189697265625, 0.2095947265625, 0.2294921875, 0.2493896484375, 0.269287109375, 0.2891845703125, 0.30908203125, 0.3289794921875, 0.348876953125, 0.3687744140625, 0.388671875, 0.4085693359375, 0.428466796875, 0.4483642578125, 0.46826171875, 0.4881591796875, 0.508056640625, 0.5279541015625, 0.5478515625, 0.5677490234375, 0.587646484375, 0.6075439453125, 0.62744140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 5.0, 1.0, 4.0, 7.0, 9.0, 10.0, 8.0, 17.0, 27.0, 54.0, 66.0, 101.0, 133.0, 246.0, 419.0, 653.0, 1101.0, 2072.0, 4297.0, 11986.0, 60575.0, 595790.0, 324016.0, 31437.0, 8162.0, 3348.0, 1595.0, 900.0, 536.0, 320.0, 206.0, 134.0, 94.0, 55.0, 50.0, 33.0, 25.0, 12.0, 15.0, 9.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0623779296875, -0.060355186462402344, -0.05833244323730469, -0.05630970001220703, -0.054286956787109375, -0.05226421356201172, -0.05024147033691406, -0.048218727111816406, -0.04619598388671875, -0.044173240661621094, -0.04215049743652344, -0.04012775421142578, -0.038105010986328125, -0.03608226776123047, -0.03405952453613281, -0.032036781311035156, -0.0300140380859375, -0.027991294860839844, -0.025968551635742188, -0.02394580841064453, -0.021923065185546875, -0.01990032196044922, -0.017877578735351562, -0.015854835510253906, -0.01383209228515625, -0.011809349060058594, -0.009786605834960938, -0.007763862609863281, -0.005741119384765625, -0.0037183761596679688, -0.0016956329345703125, 0.00032711029052734375, 0.002349853515625, 0.004372596740722656, 0.0063953399658203125, 0.008418083190917969, 0.010440826416015625, 0.012463569641113281, 0.014486312866210938, 0.016509056091308594, 0.01853179931640625, 0.020554542541503906, 0.022577285766601562, 0.02460002899169922, 0.026622772216796875, 0.02864551544189453, 0.030668258666992188, 0.032691001892089844, 0.0347137451171875, 0.036736488342285156, 0.03875923156738281, 0.04078197479248047, 0.042804718017578125, 0.04482746124267578, 0.04685020446777344, 0.048872947692871094, 0.05089569091796875, 0.052918434143066406, 0.05494117736816406, 0.05696392059326172, 0.058986663818359375, 0.06100940704345703, 0.06303215026855469, 0.06505489349365234, 0.06707763671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 10.0, 15.0, 52.0, 94.0, 168.0, 233.0, 208.0, 113.0, 52.0, 17.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.696846008300781e-05, -4.538148641586304e-05, -4.379451274871826e-05, -4.2207539081573486e-05, -4.062056541442871e-05, -3.9033591747283936e-05, -3.744661808013916e-05, -3.5859644412994385e-05, -3.427267074584961e-05, -3.2685697078704834e-05, -3.109872341156006e-05, -2.9511749744415283e-05, -2.7924776077270508e-05, -2.6337802410125732e-05, -2.4750828742980957e-05, -2.316385507583618e-05, -2.1576881408691406e-05, -1.998990774154663e-05, -1.8402934074401855e-05, -1.681596040725708e-05, -1.5228986740112305e-05, -1.364201307296753e-05, -1.2055039405822754e-05, -1.0468065738677979e-05, -8.881092071533203e-06, -7.294118404388428e-06, -5.707144737243652e-06, -4.120171070098877e-06, -2.5331974029541016e-06, -9.462237358093262e-07, 6.407499313354492e-07, 2.2277235984802246e-06, 3.814697265625e-06, 5.401670932769775e-06, 6.988644599914551e-06, 8.575618267059326e-06, 1.0162591934204102e-05, 1.1749565601348877e-05, 1.3336539268493652e-05, 1.4923512935638428e-05, 1.6510486602783203e-05, 1.809746026992798e-05, 1.9684433937072754e-05, 2.127140760421753e-05, 2.2858381271362305e-05, 2.444535493850708e-05, 2.6032328605651855e-05, 2.761930227279663e-05, 2.9206275939941406e-05, 3.079324960708618e-05, 3.238022327423096e-05, 3.396719694137573e-05, 3.555417060852051e-05, 3.714114427566528e-05, 3.872811794281006e-05, 4.0315091609954834e-05, 4.190206527709961e-05, 4.3489038944244385e-05, 4.507601261138916e-05, 4.6662986278533936e-05, 4.824995994567871e-05, 4.9836933612823486e-05, 5.142390727996826e-05, 5.301088094711304e-05, 5.459785461425781e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 8.0, 5.0, 6.0, 12.0, 12.0, 18.0, 22.0, 33.0, 45.0, 61.0, 102.0, 207.0, 366.0, 618.0, 1333.0, 2935.0, 7299.0, 28576.0, 239212.0, 644082.0, 98100.0, 16074.0, 4958.0, 2091.0, 1067.0, 576.0, 285.0, 173.0, 82.0, 51.0, 42.0, 27.0, 22.0, 11.0, 8.0, 8.0, 6.0, 5.0, 5.0, 0.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047882080078125, -0.04612874984741211, -0.04437541961669922, -0.04262208938598633, -0.04086875915527344, -0.03911542892456055, -0.037362098693847656, -0.035608768463134766, -0.033855438232421875, -0.032102108001708984, -0.030348777770996094, -0.028595447540283203, -0.026842117309570312, -0.025088787078857422, -0.02333545684814453, -0.02158212661743164, -0.01982879638671875, -0.01807546615600586, -0.01632213592529297, -0.014568805694580078, -0.012815475463867188, -0.011062145233154297, -0.009308815002441406, -0.007555484771728516, -0.005802154541015625, -0.004048824310302734, -0.0022954940795898438, -0.0005421638488769531, 0.0012111663818359375, 0.002964496612548828, 0.004717826843261719, 0.006471157073974609, 0.0082244873046875, 0.00997781753540039, 0.011731147766113281, 0.013484477996826172, 0.015237808227539062, 0.016991138458251953, 0.018744468688964844, 0.020497798919677734, 0.022251129150390625, 0.024004459381103516, 0.025757789611816406, 0.027511119842529297, 0.029264450073242188, 0.031017780303955078, 0.03277111053466797, 0.03452444076538086, 0.03627777099609375, 0.03803110122680664, 0.03978443145751953, 0.04153776168823242, 0.04329109191894531, 0.0450444221496582, 0.046797752380371094, 0.048551082611083984, 0.050304412841796875, 0.052057743072509766, 0.053811073303222656, 0.05556440353393555, 0.05731773376464844, 0.05907106399536133, 0.06082439422607422, 0.06257772445678711, 0.0643310546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 24.0, 17.0, 28.0, 41.0, 64.0, 76.0, 77.0, 100.0, 99.0, 103.0, 98.0, 73.0, 45.0, 33.0, 27.0, 18.0, 13.0, 6.0, 7.0, 3.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01065826416015625, -0.010280728340148926, -0.009903192520141602, -0.009525656700134277, -0.009148120880126953, -0.008770585060119629, -0.008393049240112305, -0.00801551342010498, -0.007637977600097656, -0.007260441780090332, -0.006882905960083008, -0.006505370140075684, -0.006127834320068359, -0.005750298500061035, -0.005372762680053711, -0.004995226860046387, -0.0046176910400390625, -0.004240155220031738, -0.003862619400024414, -0.00348508358001709, -0.0031075477600097656, -0.0027300119400024414, -0.002352476119995117, -0.001974940299987793, -0.0015974044799804688, -0.0012198686599731445, -0.0008423328399658203, -0.0004647970199584961, -8.726119995117188e-05, 0.00029027462005615234, 0.0006678104400634766, 0.0010453462600708008, 0.001422882080078125, 0.0018004179000854492, 0.0021779537200927734, 0.0025554895401000977, 0.002933025360107422, 0.003310561180114746, 0.0036880970001220703, 0.0040656328201293945, 0.004443168640136719, 0.004820704460144043, 0.005198240280151367, 0.005575776100158691, 0.005953311920166016, 0.00633084774017334, 0.006708383560180664, 0.007085919380187988, 0.0074634552001953125, 0.007840991020202637, 0.008218526840209961, 0.008596062660217285, 0.00897359848022461, 0.009351134300231934, 0.009728670120239258, 0.010106205940246582, 0.010483741760253906, 0.01086127758026123, 0.011238813400268555, 0.011616349220275879, 0.011993885040283203, 0.012371420860290527, 0.012748956680297852, 0.013126492500305176, 0.0135040283203125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 21.0, 30.0, 58.0, 134.0, 230.0, 232.0, 149.0, 68.0, 30.0, 15.0, 12.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8799607753753662, -0.8448159098625183, -0.8096709847450256, -0.7745261192321777, -0.7393811941146851, -0.7042363286018372, -0.6690914630889893, -0.6339465379714966, -0.5988016128540039, -0.563656747341156, -0.5285118222236633, -0.49336695671081543, -0.45822203159332275, -0.42307716608047485, -0.38793227076530457, -0.3527873754501343, -0.3176425099372864, -0.2824976146221161, -0.2473527193069458, -0.2122078388929367, -0.17706294357776642, -0.14191804826259613, -0.10677316784858704, -0.07162827253341675, -0.03648337721824646, -0.0013384856283664703, 0.03380640596151352, 0.06895129382610321, 0.1040961891412735, 0.1392410844564438, 0.17438596487045288, 0.20953086018562317, 0.24467575550079346, 0.27982065081596375, 0.31496554613113403, 0.35011041164398193, 0.3852553367614746, 0.4204002022743225, 0.4555450975894928, 0.4906899929046631, 0.5258349180221558, 0.5609797835350037, 0.5961247086524963, 0.6312695741653442, 0.6664144992828369, 0.7015593647956848, 0.7367042303085327, 0.7718491554260254, 0.8069940209388733, 0.8421388864517212, 0.8772838115692139, 0.9124286770820618, 0.9475736021995544, 0.9827184677124023, 1.017863392829895, 1.0530083179473877, 1.0881531238555908, 1.1232980489730835, 1.1584428548812866, 1.1935877799987793, 1.228732705116272, 1.2638776302337646, 1.2990224361419678, 1.3341673612594604, 1.3693122863769531]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 10.0, 14.0, 21.0, 23.0, 31.0, 32.0, 47.0, 48.0, 69.0, 74.0, 62.0, 70.0, 63.0, 68.0, 75.0, 47.0, 42.0, 34.0, 37.0, 25.0, 17.0, 14.0, 18.0, 8.0, 9.0, 7.0, 6.0, 3.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5559635758399963, -0.5412487983703613, -0.5265340805053711, -0.5118193030357361, -0.4971045255661011, -0.48238977789878845, -0.46767503023147583, -0.4529602527618408, -0.4382455050945282, -0.4235307574272156, -0.40881597995758057, -0.39410123229026794, -0.3793864846229553, -0.3646717071533203, -0.3499569594860077, -0.33524221181869507, -0.32052743434906006, -0.30581268668174744, -0.2910979092121124, -0.2763831615447998, -0.2616683840751648, -0.24695363640785217, -0.23223888874053955, -0.21752412617206573, -0.20280936360359192, -0.1880946010351181, -0.1733798384666443, -0.15866509079933167, -0.14395032823085785, -0.12923556566238403, -0.11452081054449081, -0.0998060554265976, -0.08509132266044617, -0.07037656009197235, -0.05566180497407913, -0.040947046130895615, -0.026232287287712097, -0.011517524719238281, 0.0031972303986549377, 0.017911985516548157, 0.03262674808502197, 0.04734150692820549, 0.06205626577138901, 0.07677102088928223, 0.09148578345775604, 0.10620054602622986, 0.12091530114412308, 0.1356300562620163, 0.1503448188304901, 0.16505958139896393, 0.17977434396743774, 0.19448909163475037, 0.20920385420322418, 0.223918616771698, 0.23863336443901062, 0.25334811210632324, 0.26806288957595825, 0.2827776372432709, 0.2974924147129059, 0.3122071623802185, 0.3269219398498535, 0.34163668751716614, 0.35635143518447876, 0.37106621265411377, 0.3857809603214264]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 7.0, 4.0, 8.0, 3.0, 12.0, 14.0, 30.0, 77.0, 466.0, 38485.0, 1006913.0, 2271.0, 152.0, 47.0, 13.0, 16.0, 9.0, 9.0, 6.0, 4.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.505859375, -2.402496337890625, -2.29913330078125, -2.195770263671875, -2.0924072265625, -1.989044189453125, -1.88568115234375, -1.782318115234375, -1.678955078125, -1.575592041015625, -1.47222900390625, -1.368865966796875, -1.2655029296875, -1.162139892578125, -1.05877685546875, -0.955413818359375, -0.85205078125, -0.748687744140625, -0.64532470703125, -0.541961669921875, -0.4385986328125, -0.335235595703125, -0.23187255859375, -0.128509521484375, -0.025146484375, 0.078216552734375, 0.18157958984375, 0.284942626953125, 0.3883056640625, 0.491668701171875, 0.59503173828125, 0.698394775390625, 0.8017578125, 0.905120849609375, 1.00848388671875, 1.111846923828125, 1.2152099609375, 1.318572998046875, 1.42193603515625, 1.525299072265625, 1.628662109375, 1.732025146484375, 1.83538818359375, 1.938751220703125, 2.0421142578125, 2.145477294921875, 2.24884033203125, 2.352203369140625, 2.45556640625, 2.558929443359375, 2.66229248046875, 2.765655517578125, 2.8690185546875, 2.972381591796875, 3.07574462890625, 3.179107666015625, 3.282470703125, 3.385833740234375, 3.48919677734375, 3.592559814453125, 3.6959228515625, 3.799285888671875, 3.90264892578125, 4.006011962890625, 4.109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 17.0, 24.0, 33.0, 52.0, 74.0, 101.0, 119.0, 138.0, 114.0, 94.0, 73.0, 54.0, 30.0, 24.0, 14.0, 9.0, 9.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.357452392578125, -2.30670166015625, -2.255950927734375, -2.2052001953125, -2.154449462890625, -2.10369873046875, -2.052947998046875, -2.002197265625, -1.951446533203125, -1.90069580078125, -1.849945068359375, -1.7991943359375, -1.748443603515625, -1.69769287109375, -1.646942138671875, -1.59619140625, -1.545440673828125, -1.49468994140625, -1.443939208984375, -1.3931884765625, -1.342437744140625, -1.29168701171875, -1.240936279296875, -1.190185546875, -1.139434814453125, -1.08868408203125, -1.037933349609375, -0.9871826171875, -0.936431884765625, -0.88568115234375, -0.834930419921875, -0.7841796875, -0.733428955078125, -0.68267822265625, -0.631927490234375, -0.5811767578125, -0.530426025390625, -0.47967529296875, -0.428924560546875, -0.378173828125, -0.327423095703125, -0.27667236328125, -0.225921630859375, -0.1751708984375, -0.124420166015625, -0.07366943359375, -0.022918701171875, 0.02783203125, 0.078582763671875, 0.12933349609375, 0.180084228515625, 0.2308349609375, 0.281585693359375, 0.33233642578125, 0.383087158203125, 0.433837890625, 0.484588623046875, 0.53533935546875, 0.586090087890625, 0.6368408203125, 0.687591552734375, 0.73834228515625, 0.789093017578125, 0.83984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 3.0, 4.0, 5.0, 7.0, 14.0, 11.0, 19.0, 28.0, 52.0, 87.0, 105.0, 211.0, 435.0, 1249.0, 6162.0, 127450.0, 879856.0, 28484.0, 2909.0, 727.0, 301.0, 145.0, 104.0, 54.0, 42.0, 23.0, 17.0, 11.0, 15.0, 2.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0546875, -1.02203369140625, -0.9893798828125, -0.95672607421875, -0.924072265625, -0.89141845703125, -0.8587646484375, -0.82611083984375, -0.79345703125, -0.76080322265625, -0.7281494140625, -0.69549560546875, -0.662841796875, -0.63018798828125, -0.5975341796875, -0.56488037109375, -0.5322265625, -0.49957275390625, -0.4669189453125, -0.43426513671875, -0.401611328125, -0.36895751953125, -0.3363037109375, -0.30364990234375, -0.27099609375, -0.23834228515625, -0.2056884765625, -0.17303466796875, -0.140380859375, -0.10772705078125, -0.0750732421875, -0.04241943359375, -0.009765625, 0.02288818359375, 0.0555419921875, 0.08819580078125, 0.120849609375, 0.15350341796875, 0.1861572265625, 0.21881103515625, 0.25146484375, 0.28411865234375, 0.3167724609375, 0.34942626953125, 0.382080078125, 0.41473388671875, 0.4473876953125, 0.48004150390625, 0.5126953125, 0.54534912109375, 0.5780029296875, 0.61065673828125, 0.643310546875, 0.67596435546875, 0.7086181640625, 0.74127197265625, 0.77392578125, 0.80657958984375, 0.8392333984375, 0.87188720703125, 0.904541015625, 0.93719482421875, 0.9698486328125, 1.00250244140625, 1.03515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 8.0, 8.0, 11.0, 14.0, 19.0, 22.0, 32.0, 24.0, 33.0, 25.0, 46.0, 50.0, 40.0, 50.0, 50.0, 56.0, 51.0, 58.0, 56.0, 45.0, 39.0, 38.0, 32.0, 35.0, 27.0, 20.0, 22.0, 23.0, 7.0, 10.0, 12.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7477645874023438, -0.7216033935546875, -0.6954421997070312, -0.669281005859375, -0.6431198120117188, -0.6169586181640625, -0.5907974243164062, -0.56463623046875, -0.5384750366210938, -0.5123138427734375, -0.48615264892578125, -0.459991455078125, -0.43383026123046875, -0.4076690673828125, -0.38150787353515625, -0.3553466796875, -0.32918548583984375, -0.3030242919921875, -0.27686309814453125, -0.250701904296875, -0.22454071044921875, -0.1983795166015625, -0.17221832275390625, -0.14605712890625, -0.11989593505859375, -0.0937347412109375, -0.06757354736328125, -0.041412353515625, -0.01525115966796875, 0.0109100341796875, 0.03707122802734375, 0.063232421875, 0.08939361572265625, 0.1155548095703125, 0.14171600341796875, 0.167877197265625, 0.19403839111328125, 0.2201995849609375, 0.24636077880859375, 0.27252197265625, 0.29868316650390625, 0.3248443603515625, 0.35100555419921875, 0.377166748046875, 0.40332794189453125, 0.4294891357421875, 0.45565032958984375, 0.4818115234375, 0.5079727172851562, 0.5341339111328125, 0.5602951049804688, 0.586456298828125, 0.6126174926757812, 0.6387786865234375, 0.6649398803710938, 0.69110107421875, 0.7172622680664062, 0.7434234619140625, 0.7695846557617188, 0.795745849609375, 0.8219070434570312, 0.8480682373046875, 0.8742294311523438, 0.900390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 19.0, 19.0, 26.0, 58.0, 95.0, 237.0, 513.0, 1633.0, 7818.0, 183793.0, 828288.0, 21525.0, 3002.0, 860.0, 303.0, 137.0, 74.0, 55.0, 25.0, 12.0, 11.0, 5.0, 2.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345458984375, -0.3343925476074219, -0.32332611083984375, -0.3122596740722656, -0.3011932373046875, -0.2901268005371094, -0.27906036376953125, -0.2679939270019531, -0.256927490234375, -0.24586105346679688, -0.23479461669921875, -0.22372817993164062, -0.2126617431640625, -0.20159530639648438, -0.19052886962890625, -0.17946243286132812, -0.16839599609375, -0.15732955932617188, -0.14626312255859375, -0.13519668579101562, -0.1241302490234375, -0.11306381225585938, -0.10199737548828125, -0.09093093872070312, -0.079864501953125, -0.06879806518554688, -0.05773162841796875, -0.046665191650390625, -0.0355987548828125, -0.024532318115234375, -0.01346588134765625, -0.002399444580078125, 0.0086669921875, 0.019733428955078125, 0.03079986572265625, 0.041866302490234375, 0.0529327392578125, 0.06399917602539062, 0.07506561279296875, 0.08613204956054688, 0.097198486328125, 0.10826492309570312, 0.11933135986328125, 0.13039779663085938, 0.1414642333984375, 0.15253067016601562, 0.16359710693359375, 0.17466354370117188, 0.18572998046875, 0.19679641723632812, 0.20786285400390625, 0.21892929077148438, 0.2299957275390625, 0.24106216430664062, 0.25212860107421875, 0.2631950378417969, 0.274261474609375, 0.2853279113769531, 0.29639434814453125, 0.3074607849121094, 0.3185272216796875, 0.3295936584472656, 0.34066009521484375, 0.3517265319824219, 0.36279296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 10.0, 11.0, 29.0, 39.0, 74.0, 111.0, 135.0, 194.0, 150.0, 90.0, 59.0, 33.0, 18.0, 16.0, 11.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9696693420410156e-05, -3.83937731385231e-05, -3.709085285663605e-05, -3.578793257474899e-05, -3.448501229286194e-05, -3.3182092010974884e-05, -3.187917172908783e-05, -3.0576251447200775e-05, -2.927333116531372e-05, -2.7970410883426666e-05, -2.6667490601539612e-05, -2.5364570319652557e-05, -2.4061650037765503e-05, -2.275872975587845e-05, -2.1455809473991394e-05, -2.015288919210434e-05, -1.8849968910217285e-05, -1.754704862833023e-05, -1.6244128346443176e-05, -1.4941208064556122e-05, -1.3638287782669067e-05, -1.2335367500782013e-05, -1.1032447218894958e-05, -9.729526937007904e-06, -8.42660665512085e-06, -7.123686373233795e-06, -5.820766091346741e-06, -4.517845809459686e-06, -3.214925527572632e-06, -1.9120052456855774e-06, -6.09084963798523e-07, 6.938353180885315e-07, 1.996755599975586e-06, 3.2996758818626404e-06, 4.602596163749695e-06, 5.905516445636749e-06, 7.208436727523804e-06, 8.511357009410858e-06, 9.814277291297913e-06, 1.1117197573184967e-05, 1.2420117855072021e-05, 1.3723038136959076e-05, 1.502595841884613e-05, 1.6328878700733185e-05, 1.763179898262024e-05, 1.8934719264507294e-05, 2.0237639546394348e-05, 2.1540559828281403e-05, 2.2843480110168457e-05, 2.414640039205551e-05, 2.5449320673942566e-05, 2.675224095582962e-05, 2.8055161237716675e-05, 2.935808151960373e-05, 3.0661001801490784e-05, 3.196392208337784e-05, 3.326684236526489e-05, 3.456976264715195e-05, 3.5872682929039e-05, 3.7175603210926056e-05, 3.847852349281311e-05, 3.9781443774700165e-05, 4.108436405658722e-05, 4.2387284338474274e-05, 4.369020462036133e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 13.0, 10.0, 18.0, 23.0, 41.0, 71.0, 131.0, 284.0, 829.0, 3240.0, 47736.0, 950299.0, 41443.0, 3103.0, 732.0, 280.0, 126.0, 70.0, 32.0, 25.0, 14.0, 8.0, 12.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.419189453125, -0.40666961669921875, -0.3941497802734375, -0.38162994384765625, -0.369110107421875, -0.35659027099609375, -0.3440704345703125, -0.33155059814453125, -0.31903076171875, -0.30651092529296875, -0.2939910888671875, -0.28147125244140625, -0.268951416015625, -0.25643157958984375, -0.2439117431640625, -0.23139190673828125, -0.2188720703125, -0.20635223388671875, -0.1938323974609375, -0.18131256103515625, -0.168792724609375, -0.15627288818359375, -0.1437530517578125, -0.13123321533203125, -0.11871337890625, -0.10619354248046875, -0.0936737060546875, -0.08115386962890625, -0.068634033203125, -0.05611419677734375, -0.0435943603515625, -0.03107452392578125, -0.0185546875, -0.00603485107421875, 0.0064849853515625, 0.01900482177734375, 0.031524658203125, 0.04404449462890625, 0.0565643310546875, 0.06908416748046875, 0.08160400390625, 0.09412384033203125, 0.1066436767578125, 0.11916351318359375, 0.131683349609375, 0.14420318603515625, 0.1567230224609375, 0.16924285888671875, 0.1817626953125, 0.19428253173828125, 0.2068023681640625, 0.21932220458984375, 0.231842041015625, 0.24436187744140625, 0.2568817138671875, 0.26940155029296875, 0.28192138671875, 0.29444122314453125, 0.3069610595703125, 0.31948089599609375, 0.332000732421875, 0.34452056884765625, 0.3570404052734375, 0.36956024169921875, 0.382080078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 11.0, 17.0, 31.0, 41.0, 59.0, 72.0, 87.0, 122.0, 118.0, 113.0, 91.0, 62.0, 51.0, 36.0, 26.0, 16.0, 7.0, 11.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.0911397933959961, -0.08840751647949219, -0.08567523956298828, -0.08294296264648438, -0.08021068572998047, -0.07747840881347656, -0.07474613189697266, -0.07201385498046875, -0.06928157806396484, -0.06654930114746094, -0.06381702423095703, -0.061084747314453125, -0.05835247039794922, -0.05562019348144531, -0.052887916564941406, -0.0501556396484375, -0.047423362731933594, -0.04469108581542969, -0.04195880889892578, -0.039226531982421875, -0.03649425506591797, -0.03376197814941406, -0.031029701232910156, -0.02829742431640625, -0.025565147399902344, -0.022832870483398438, -0.02010059356689453, -0.017368316650390625, -0.014636039733886719, -0.011903762817382812, -0.009171485900878906, -0.006439208984375, -0.0037069320678710938, -0.0009746551513671875, 0.0017576217651367188, 0.004489898681640625, 0.007222175598144531, 0.009954452514648438, 0.012686729431152344, 0.01541900634765625, 0.018151283264160156, 0.020883560180664062, 0.02361583709716797, 0.026348114013671875, 0.02908039093017578, 0.03181266784667969, 0.034544944763183594, 0.0372772216796875, 0.040009498596191406, 0.04274177551269531, 0.04547405242919922, 0.048206329345703125, 0.05093860626220703, 0.05367088317871094, 0.056403160095214844, 0.05913543701171875, 0.061867713928222656, 0.06459999084472656, 0.06733226776123047, 0.07006454467773438, 0.07279682159423828, 0.07552909851074219, 0.0782613754272461, 0.08099365234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 8.0, 24.0, 48.0, 90.0, 195.0, 244.0, 190.0, 104.0, 44.0, 18.0, 13.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2240744829177856, -1.1540439128875732, -1.0840132236480713, -1.0139826536178589, -0.9439519643783569, -0.8739213943481445, -0.8038907647132874, -0.7338601350784302, -0.663829505443573, -0.5937988758087158, -0.5237682461738586, -0.45373764634132385, -0.3837070167064667, -0.3136763870716095, -0.2436457872390747, -0.17361515760421753, -0.10358452796936035, -0.03355390578508377, 0.03647671639919281, 0.1065073311328888, 0.17653796076774597, 0.24656859040260315, 0.31659919023513794, 0.3866298198699951, 0.4566604495048523, 0.5266910791397095, 0.5967217087745667, 0.6667523384094238, 0.7367829084396362, 0.8068135976791382, 0.8768441677093506, 0.9468747973442078, 1.0169055461883545, 1.086936116218567, 1.1569668054580688, 1.2269973754882812, 1.2970280647277832, 1.3670586347579956, 1.437089204788208, 1.50711989402771, 1.577150583267212, 1.6471811532974243, 1.7172118425369263, 1.7872424125671387, 1.8572731018066406, 1.927303671836853, 1.9973342418670654, 2.0673649311065674, 2.1373953819274902, 2.207426071166992, 2.277456521987915, 2.347487211227417, 2.417517900466919, 2.487548589706421, 2.5575790405273438, 2.6276097297668457, 2.6976404190063477, 2.7676711082458496, 2.8377015590667725, 2.9077322483062744, 2.9777629375457764, 3.0477936267852783, 3.117824077606201, 3.187854766845703, 3.257885456085205]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 8.0, 11.0, 3.0, 15.0, 14.0, 17.0, 29.0, 38.0, 32.0, 32.0, 47.0, 50.0, 68.0, 54.0, 58.0, 78.0, 61.0, 71.0, 49.0, 38.0, 47.0, 39.0, 36.0, 27.0, 17.0, 23.0, 11.0, 11.0, 6.0, 6.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2712249755859375, -2.216845750808716, -2.162466287612915, -2.1080870628356934, -2.0537075996398926, -1.999328374862671, -1.9449490308761597, -1.8905696868896484, -1.8361904621124268, -1.7818111181259155, -1.7274317741394043, -1.6730525493621826, -1.6186732053756714, -1.5642938613891602, -1.509914517402649, -1.4555351734161377, -1.4011558294296265, -1.3467764854431152, -1.292397141456604, -1.2380177974700928, -1.183638572692871, -1.1292592287063599, -1.0748798847198486, -1.0205005407333374, -0.966121256351471, -0.9117419123649597, -0.8573626279830933, -0.802983283996582, -0.7486039400100708, -0.6942246556282043, -0.6398453116416931, -0.5854660272598267, -0.531086802482605, -0.47670748829841614, -0.4223281741142273, -0.36794883012771606, -0.3135695159435272, -0.2591902017593384, -0.20481085777282715, -0.1504315435886383, -0.09605222940444946, -0.04167290776968002, 0.012706413865089417, 0.06708574295043945, 0.1214650571346283, 0.17584437131881714, 0.23022371530532837, 0.2846030294895172, 0.33898234367370605, 0.3933616578578949, 0.44774097204208374, 0.502120316028595, 0.5564996004104614, 0.6108789443969727, 0.6652582883834839, 0.7196376323699951, 0.7740169167518616, 0.8283962607383728, 0.8827755451202393, 0.9371548891067505, 0.9915342330932617, 1.0459134578704834, 1.1002929210662842, 1.1546721458435059, 1.209051489830017]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 6.0, 4.0, 11.0, 15.0, 40.0, 51.0, 76.0, 105.0, 203.0, 461.0, 942.0, 2533.0, 8920.0, 100285.0, 3442048.0, 605934.0, 25427.0, 4521.0, 1449.0, 590.0, 272.0, 151.0, 87.0, 52.0, 32.0, 21.0, 11.0, 9.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.21685791015625, -1.1807861328125, -1.14471435546875, -1.108642578125, -1.07257080078125, -1.0364990234375, -1.00042724609375, -0.96435546875, -0.92828369140625, -0.8922119140625, -0.85614013671875, -0.820068359375, -0.78399658203125, -0.7479248046875, -0.71185302734375, -0.67578125, -0.63970947265625, -0.6036376953125, -0.56756591796875, -0.531494140625, -0.49542236328125, -0.4593505859375, -0.42327880859375, -0.38720703125, -0.35113525390625, -0.3150634765625, -0.27899169921875, -0.242919921875, -0.20684814453125, -0.1707763671875, -0.13470458984375, -0.0986328125, -0.06256103515625, -0.0264892578125, 0.00958251953125, 0.045654296875, 0.08172607421875, 0.1177978515625, 0.15386962890625, 0.18994140625, 0.22601318359375, 0.2620849609375, 0.29815673828125, 0.334228515625, 0.37030029296875, 0.4063720703125, 0.44244384765625, 0.478515625, 0.51458740234375, 0.5506591796875, 0.58673095703125, 0.622802734375, 0.65887451171875, 0.6949462890625, 0.73101806640625, 0.76708984375, 0.80316162109375, 0.8392333984375, 0.87530517578125, 0.911376953125, 0.94744873046875, 0.9835205078125, 1.01959228515625, 1.0556640625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 12.0, 25.0, 19.0, 29.0, 38.0, 42.0, 61.0, 72.0, 67.0, 70.0, 65.0, 81.0, 72.0, 55.0, 54.0, 50.0, 34.0, 35.0, 18.0, 20.0, 7.0, 11.0, 9.0, 8.0, 4.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7457237243652344, -0.7272872924804688, -0.7088508605957031, -0.6904144287109375, -0.6719779968261719, -0.6535415649414062, -0.6351051330566406, -0.616668701171875, -0.5982322692871094, -0.5797958374023438, -0.5613594055175781, -0.5429229736328125, -0.5244865417480469, -0.5060501098632812, -0.4876136779785156, -0.46917724609375, -0.4507408142089844, -0.43230438232421875, -0.4138679504394531, -0.3954315185546875, -0.3769950866699219, -0.35855865478515625, -0.3401222229003906, -0.321685791015625, -0.3032493591308594, -0.28481292724609375, -0.2663764953613281, -0.2479400634765625, -0.22950363159179688, -0.21106719970703125, -0.19263076782226562, -0.1741943359375, -0.15575790405273438, -0.13732147216796875, -0.11888504028320312, -0.1004486083984375, -0.08201217651367188, -0.06357574462890625, -0.045139312744140625, -0.026702880859375, -0.008266448974609375, 0.01016998291015625, 0.028606414794921875, 0.0470428466796875, 0.06547927856445312, 0.08391571044921875, 0.10235214233398438, 0.12078857421875, 0.13922500610351562, 0.15766143798828125, 0.17609786987304688, 0.1945343017578125, 0.21297073364257812, 0.23140716552734375, 0.24984359741210938, 0.268280029296875, 0.2867164611816406, 0.30515289306640625, 0.3235893249511719, 0.3420257568359375, 0.3604621887207031, 0.37889862060546875, 0.3973350524902344, 0.415771484375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 20.0, 18.0, 30.0, 27.0, 47.0, 68.0, 103.0, 157.0, 264.0, 386.0, 675.0, 1266.0, 2556.0, 6342.0, 19202.0, 95171.0, 1992585.0, 1950588.0, 94019.0, 18949.0, 6164.0, 2604.0, 1203.0, 708.0, 381.0, 228.0, 162.0, 93.0, 80.0, 42.0, 35.0, 23.0, 17.0, 16.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.51434326171875, -0.4959716796875, -0.47760009765625, -0.459228515625, -0.44085693359375, -0.4224853515625, -0.40411376953125, -0.3857421875, -0.36737060546875, -0.3489990234375, -0.33062744140625, -0.312255859375, -0.29388427734375, -0.2755126953125, -0.25714111328125, -0.23876953125, -0.22039794921875, -0.2020263671875, -0.18365478515625, -0.165283203125, -0.14691162109375, -0.1285400390625, -0.11016845703125, -0.091796875, -0.07342529296875, -0.0550537109375, -0.03668212890625, -0.018310546875, 6.103515625e-05, 0.0184326171875, 0.03680419921875, 0.05517578125, 0.07354736328125, 0.0919189453125, 0.11029052734375, 0.128662109375, 0.14703369140625, 0.1654052734375, 0.18377685546875, 0.2021484375, 0.22052001953125, 0.2388916015625, 0.25726318359375, 0.275634765625, 0.29400634765625, 0.3123779296875, 0.33074951171875, 0.34912109375, 0.36749267578125, 0.3858642578125, 0.40423583984375, 0.422607421875, 0.44097900390625, 0.4593505859375, 0.47772216796875, 0.49609375, 0.51446533203125, 0.5328369140625, 0.55120849609375, 0.569580078125, 0.58795166015625, 0.6063232421875, 0.62469482421875, 0.64306640625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 11.0, 9.0, 15.0, 29.0, 27.0, 28.0, 42.0, 77.0, 98.0, 152.0, 223.0, 343.0, 512.0, 670.0, 545.0, 408.0, 285.0, 152.0, 98.0, 72.0, 64.0, 45.0, 41.0, 15.0, 17.0, 23.0, 7.0, 7.0, 7.0, 8.0, 9.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13525390625, -0.13069915771484375, -0.1261444091796875, -0.12158966064453125, -0.117034912109375, -0.11248016357421875, -0.1079254150390625, -0.10337066650390625, -0.09881591796875, -0.09426116943359375, -0.0897064208984375, -0.08515167236328125, -0.080596923828125, -0.07604217529296875, -0.0714874267578125, -0.06693267822265625, -0.0623779296875, -0.05782318115234375, -0.0532684326171875, -0.04871368408203125, -0.044158935546875, -0.03960418701171875, -0.0350494384765625, -0.03049468994140625, -0.02593994140625, -0.02138519287109375, -0.0168304443359375, -0.01227569580078125, -0.007720947265625, -0.00316619873046875, 0.0013885498046875, 0.00594329833984375, 0.010498046875, 0.01505279541015625, 0.0196075439453125, 0.02416229248046875, 0.028717041015625, 0.03327178955078125, 0.0378265380859375, 0.04238128662109375, 0.04693603515625, 0.05149078369140625, 0.0560455322265625, 0.06060028076171875, 0.065155029296875, 0.06970977783203125, 0.0742645263671875, 0.07881927490234375, 0.0833740234375, 0.08792877197265625, 0.0924835205078125, 0.09703826904296875, 0.101593017578125, 0.10614776611328125, 0.1107025146484375, 0.11525726318359375, 0.11981201171875, 0.12436676025390625, 0.1289215087890625, 0.13347625732421875, 0.138031005859375, 0.14258575439453125, 0.1471405029296875, 0.15169525146484375, 0.15625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 14.0, 19.0, 20.0, 36.0, 80.0, 90.0, 133.0, 150.0, 142.0, 105.0, 83.0, 39.0, 31.0, 11.0, 21.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9516488909721375, -0.9196044206619263, -0.8875599503517151, -0.8555154800415039, -0.8234710693359375, -0.7914265394210815, -0.7593821287155151, -0.727337658405304, -0.6952931880950928, -0.6632487177848816, -0.6312042474746704, -0.5991597771644592, -0.567115306854248, -0.5350708961486816, -0.5030264258384705, -0.4709819555282593, -0.4389374852180481, -0.4068930149078369, -0.37484854459762573, -0.34280410408973694, -0.31075963377952576, -0.2787151634693146, -0.2466707080602646, -0.2146262526512146, -0.18258178234100342, -0.15053731203079224, -0.11849285662174225, -0.08644839376211166, -0.05440393090248108, -0.022359460592269897, 0.00968499481678009, 0.04172945022583008, 0.07377386093139648, 0.10581832379102707, 0.13786278665065765, 0.16990724205970764, 0.20195171236991882, 0.23399618268013, 0.2660406231880188, 0.29808509349823, 0.33012956380844116, 0.36217403411865234, 0.3942185044288635, 0.4262629449367523, 0.4583074152469635, 0.4903518855571747, 0.5223963260650635, 0.5544407963752747, 0.5864852666854858, 0.618529736995697, 0.6505742073059082, 0.6826186776161194, 0.7146631479263306, 0.746707558631897, 0.7787520289421082, 0.8107964992523193, 0.8428409695625305, 0.8748854398727417, 0.9069299101829529, 0.9389743804931641, 0.9710187911987305, 1.0030633211135864, 1.0351077318191528, 1.0671522617340088, 1.0991966724395752]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 7.0, 2.0, 8.0, 9.0, 9.0, 22.0, 19.0, 27.0, 33.0, 48.0, 39.0, 55.0, 42.0, 65.0, 68.0, 63.0, 59.0, 74.0, 57.0, 40.0, 42.0, 55.0, 34.0, 34.0, 27.0, 12.0, 15.0, 7.0, 6.0, 9.0, 10.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7626878023147583, -0.7440861463546753, -0.7254844903945923, -0.7068828344345093, -0.6882811784744263, -0.6696795225143433, -0.6510778665542603, -0.632476270198822, -0.613874614238739, -0.595272958278656, -0.576671302318573, -0.55806964635849, -0.539467990398407, -0.5208663940429688, -0.5022647380828857, -0.48366308212280273, -0.46506139636039734, -0.44645974040031433, -0.4278580844402313, -0.4092564582824707, -0.3906548023223877, -0.3720531463623047, -0.3534514904022217, -0.33484983444213867, -0.31624817848205566, -0.29764652252197266, -0.27904486656188965, -0.26044321060180664, -0.24184158444404602, -0.223239928483963, -0.20463827252388, -0.1860366314649582, -0.16743499040603638, -0.14883333444595337, -0.13023169338703156, -0.11163003742694855, -0.09302838891744614, -0.07442674040794373, -0.05582508444786072, -0.037223443388938904, -0.018621787428855896, -2.0137056708335876e-05, 0.018581513315439224, 0.037183165550231934, 0.055784814059734344, 0.07438646256923676, 0.09298811852931976, 0.11158975958824158, 0.13019141554832458, 0.1487930715084076, 0.1673947125673294, 0.18599636852741241, 0.20459800958633423, 0.22319966554641724, 0.24180132150650024, 0.26040297746658325, 0.27900463342666626, 0.29760628938674927, 0.3162079453468323, 0.3348096013069153, 0.3534112274646759, 0.3720128834247589, 0.3906145393848419, 0.40921616554260254, 0.42781782150268555]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 12.0, 8.0, 16.0, 31.0, 36.0, 49.0, 73.0, 96.0, 209.0, 409.0, 622.0, 1282.0, 2861.0, 6887.0, 18820.0, 58206.0, 185723.0, 386221.0, 257450.0, 85813.0, 26791.0, 9569.0, 3767.0, 1674.0, 848.0, 434.0, 239.0, 136.0, 89.0, 58.0, 30.0, 28.0, 15.0, 12.0, 12.0, 3.0, 3.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.07672119140625, -0.07468414306640625, -0.0726470947265625, -0.07061004638671875, -0.068572998046875, -0.06653594970703125, -0.0644989013671875, -0.06246185302734375, -0.0604248046875, -0.05838775634765625, -0.0563507080078125, -0.05431365966796875, -0.052276611328125, -0.05023956298828125, -0.0482025146484375, -0.04616546630859375, -0.04412841796875, -0.04209136962890625, -0.0400543212890625, -0.03801727294921875, -0.035980224609375, -0.03394317626953125, -0.0319061279296875, -0.02986907958984375, -0.02783203125, -0.02579498291015625, -0.0237579345703125, -0.02172088623046875, -0.019683837890625, -0.01764678955078125, -0.0156097412109375, -0.01357269287109375, -0.01153564453125, -0.00949859619140625, -0.0074615478515625, -0.00542449951171875, -0.003387451171875, -0.00135040283203125, 0.0006866455078125, 0.00272369384765625, 0.0047607421875, 0.00679779052734375, 0.0088348388671875, 0.01087188720703125, 0.012908935546875, 0.01494598388671875, 0.0169830322265625, 0.01902008056640625, 0.02105712890625, 0.02309417724609375, 0.0251312255859375, 0.02716827392578125, 0.029205322265625, 0.03124237060546875, 0.0332794189453125, 0.03531646728515625, 0.037353515625, 0.03939056396484375, 0.0414276123046875, 0.04346466064453125, 0.045501708984375, 0.04753875732421875, 0.0495758056640625, 0.05161285400390625, 0.05364990234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 6.0, 5.0, 13.0, 12.0, 16.0, 25.0, 19.0, 30.0, 45.0, 44.0, 46.0, 54.0, 54.0, 56.0, 70.0, 57.0, 60.0, 68.0, 53.0, 36.0, 44.0, 31.0, 29.0, 23.0, 21.0, 18.0, 11.0, 5.0, 11.0, 10.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.41845703125, -0.40680694580078125, -0.3951568603515625, -0.38350677490234375, -0.371856689453125, -0.36020660400390625, -0.3485565185546875, -0.33690643310546875, -0.32525634765625, -0.31360626220703125, -0.3019561767578125, -0.29030609130859375, -0.278656005859375, -0.26700592041015625, -0.2553558349609375, -0.24370574951171875, -0.2320556640625, -0.22040557861328125, -0.2087554931640625, -0.19710540771484375, -0.185455322265625, -0.17380523681640625, -0.1621551513671875, -0.15050506591796875, -0.13885498046875, -0.12720489501953125, -0.1155548095703125, -0.10390472412109375, -0.092254638671875, -0.08060455322265625, -0.0689544677734375, -0.05730438232421875, -0.045654296875, -0.03400421142578125, -0.0223541259765625, -0.01070404052734375, 0.000946044921875, 0.01259613037109375, 0.0242462158203125, 0.03589630126953125, 0.04754638671875, 0.05919647216796875, 0.0708465576171875, 0.08249664306640625, 0.094146728515625, 0.10579681396484375, 0.1174468994140625, 0.12909698486328125, 0.1407470703125, 0.15239715576171875, 0.1640472412109375, 0.17569732666015625, 0.187347412109375, 0.19899749755859375, 0.2106475830078125, 0.22229766845703125, 0.23394775390625, 0.24559783935546875, 0.2572479248046875, 0.26889801025390625, 0.280548095703125, 0.29219818115234375, 0.3038482666015625, 0.31549835205078125, 0.3271484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 28.0, 15.0, 28.0, 31.0, 57.0, 69.0, 117.0, 201.0, 329.0, 533.0, 1021.0, 2332.0, 6851.0, 25478.0, 113273.0, 398309.0, 367972.0, 98209.0, 22685.0, 6391.0, 2254.0, 992.0, 528.0, 303.0, 187.0, 108.0, 82.0, 49.0, 33.0, 21.0, 15.0, 13.0, 9.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0721435546875, -0.06965160369873047, -0.06715965270996094, -0.0646677017211914, -0.062175750732421875, -0.059683799743652344, -0.05719184875488281, -0.05469989776611328, -0.05220794677734375, -0.04971599578857422, -0.04722404479980469, -0.044732093811035156, -0.042240142822265625, -0.039748191833496094, -0.03725624084472656, -0.03476428985595703, -0.0322723388671875, -0.02978038787841797, -0.027288436889648438, -0.024796485900878906, -0.022304534912109375, -0.019812583923339844, -0.017320632934570312, -0.014828681945800781, -0.01233673095703125, -0.009844779968261719, -0.0073528289794921875, -0.004860877990722656, -0.002368927001953125, 0.00012302398681640625, 0.0026149749755859375, 0.005106925964355469, 0.007598876953125, 0.010090827941894531, 0.012582778930664062, 0.015074729919433594, 0.017566680908203125, 0.020058631896972656, 0.022550582885742188, 0.02504253387451172, 0.02753448486328125, 0.03002643585205078, 0.03251838684082031, 0.035010337829589844, 0.037502288818359375, 0.039994239807128906, 0.04248619079589844, 0.04497814178466797, 0.0474700927734375, 0.04996204376220703, 0.05245399475097656, 0.054945945739746094, 0.057437896728515625, 0.059929847717285156, 0.06242179870605469, 0.06491374969482422, 0.06740570068359375, 0.06989765167236328, 0.07238960266113281, 0.07488155364990234, 0.07737350463867188, 0.0798654556274414, 0.08235740661621094, 0.08484935760498047, 0.08734130859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 6.0, 6.0, 17.0, 11.0, 25.0, 19.0, 16.0, 23.0, 27.0, 24.0, 38.0, 38.0, 41.0, 47.0, 50.0, 56.0, 43.0, 49.0, 50.0, 33.0, 42.0, 51.0, 40.0, 34.0, 34.0, 21.0, 24.0, 20.0, 14.0, 16.0, 14.0, 12.0, 10.0, 7.0, 4.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5308990478515625, -0.512969970703125, -0.4950408935546875, -0.47711181640625, -0.4591827392578125, -0.441253662109375, -0.4233245849609375, -0.4053955078125, -0.3874664306640625, -0.369537353515625, -0.3516082763671875, -0.33367919921875, -0.3157501220703125, -0.297821044921875, -0.2798919677734375, -0.261962890625, -0.2440338134765625, -0.226104736328125, -0.2081756591796875, -0.19024658203125, -0.1723175048828125, -0.154388427734375, -0.1364593505859375, -0.1185302734375, -0.1006011962890625, -0.082672119140625, -0.0647430419921875, -0.04681396484375, -0.0288848876953125, -0.010955810546875, 0.0069732666015625, 0.02490234375, 0.0428314208984375, 0.060760498046875, 0.0786895751953125, 0.09661865234375, 0.1145477294921875, 0.132476806640625, 0.1504058837890625, 0.1683349609375, 0.1862640380859375, 0.204193115234375, 0.2221221923828125, 0.24005126953125, 0.2579803466796875, 0.275909423828125, 0.2938385009765625, 0.311767578125, 0.3296966552734375, 0.347625732421875, 0.3655548095703125, 0.38348388671875, 0.4014129638671875, 0.419342041015625, 0.4372711181640625, 0.4552001953125, 0.4731292724609375, 0.491058349609375, 0.5089874267578125, 0.52691650390625, 0.5448455810546875, 0.562774658203125, 0.5807037353515625, 0.5986328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 5.0, 12.0, 16.0, 23.0, 30.0, 59.0, 85.0, 133.0, 243.0, 431.0, 958.0, 2347.0, 7437.0, 36592.0, 373733.0, 555476.0, 55820.0, 9964.0, 2878.0, 1124.0, 519.0, 285.0, 145.0, 64.0, 60.0, 34.0, 14.0, 15.0, 10.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03033447265625, -0.029172420501708984, -0.02801036834716797, -0.026848316192626953, -0.025686264038085938, -0.024524211883544922, -0.023362159729003906, -0.02220010757446289, -0.021038055419921875, -0.01987600326538086, -0.018713951110839844, -0.017551898956298828, -0.016389846801757812, -0.015227794647216797, -0.014065742492675781, -0.012903690338134766, -0.01174163818359375, -0.010579586029052734, -0.009417533874511719, -0.008255481719970703, -0.0070934295654296875, -0.005931377410888672, -0.004769325256347656, -0.0036072731018066406, -0.002445220947265625, -0.0012831687927246094, -0.00012111663818359375, 0.0010409355163574219, 0.0022029876708984375, 0.003365039825439453, 0.004527091979980469, 0.005689144134521484, 0.0068511962890625, 0.008013248443603516, 0.009175300598144531, 0.010337352752685547, 0.011499404907226562, 0.012661457061767578, 0.013823509216308594, 0.01498556137084961, 0.016147613525390625, 0.01730966567993164, 0.018471717834472656, 0.019633769989013672, 0.020795822143554688, 0.021957874298095703, 0.02311992645263672, 0.024281978607177734, 0.02544403076171875, 0.026606082916259766, 0.02776813507080078, 0.028930187225341797, 0.030092239379882812, 0.03125429153442383, 0.032416343688964844, 0.03357839584350586, 0.034740447998046875, 0.03590250015258789, 0.037064552307128906, 0.03822660446166992, 0.03938865661621094, 0.04055070877075195, 0.04171276092529297, 0.042874813079833984, 0.044036865234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 6.0, 11.0, 17.0, 21.0, 30.0, 36.0, 48.0, 65.0, 90.0, 78.0, 97.0, 96.0, 85.0, 74.0, 77.0, 48.0, 33.0, 23.0, 16.0, 9.0, 8.0, 5.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1265277862548828e-05, -1.0806135833263397e-05, -1.0346993803977966e-05, -9.887851774692535e-06, -9.428709745407104e-06, -8.969567716121674e-06, -8.510425686836243e-06, -8.051283657550812e-06, -7.592141628265381e-06, -7.13299959897995e-06, -6.673857569694519e-06, -6.214715540409088e-06, -5.755573511123657e-06, -5.296431481838226e-06, -4.837289452552795e-06, -4.3781474232673645e-06, -3.919005393981934e-06, -3.4598633646965027e-06, -3.0007213354110718e-06, -2.541579306125641e-06, -2.08243727684021e-06, -1.623295247554779e-06, -1.1641532182693481e-06, -7.050111889839172e-07, -2.4586915969848633e-07, 2.1327286958694458e-07, 6.724148988723755e-07, 1.1315569281578064e-06, 1.5906989574432373e-06, 2.0498409867286682e-06, 2.508983016014099e-06, 2.96812504529953e-06, 3.427267074584961e-06, 3.886409103870392e-06, 4.345551133155823e-06, 4.804693162441254e-06, 5.2638351917266846e-06, 5.7229772210121155e-06, 6.182119250297546e-06, 6.641261279582977e-06, 7.100403308868408e-06, 7.559545338153839e-06, 8.01868736743927e-06, 8.477829396724701e-06, 8.936971426010132e-06, 9.396113455295563e-06, 9.855255484580994e-06, 1.0314397513866425e-05, 1.0773539543151855e-05, 1.1232681572437286e-05, 1.1691823601722717e-05, 1.2150965631008148e-05, 1.2610107660293579e-05, 1.306924968957901e-05, 1.3528391718864441e-05, 1.3987533748149872e-05, 1.4446675777435303e-05, 1.4905817806720734e-05, 1.5364959836006165e-05, 1.5824101865291595e-05, 1.6283243894577026e-05, 1.6742385923862457e-05, 1.7201527953147888e-05, 1.766066998243332e-05, 1.811981201171875e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 14.0, 17.0, 32.0, 32.0, 68.0, 106.0, 175.0, 333.0, 689.0, 1670.0, 4539.0, 17398.0, 90407.0, 464948.0, 380894.0, 66981.0, 13651.0, 3809.0, 1424.0, 609.0, 316.0, 154.0, 94.0, 57.0, 41.0, 29.0, 19.0, 7.0, 10.0, 13.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0264892578125, -0.025573253631591797, -0.024657249450683594, -0.02374124526977539, -0.022825241088867188, -0.021909236907958984, -0.02099323272705078, -0.020077228546142578, -0.019161224365234375, -0.018245220184326172, -0.01732921600341797, -0.016413211822509766, -0.015497207641601562, -0.01458120346069336, -0.013665199279785156, -0.012749195098876953, -0.01183319091796875, -0.010917186737060547, -0.010001182556152344, -0.00908517837524414, -0.008169174194335938, -0.007253170013427734, -0.006337165832519531, -0.005421161651611328, -0.004505157470703125, -0.003589153289794922, -0.0026731491088867188, -0.0017571449279785156, -0.0008411407470703125, 7.486343383789062e-05, 0.0009908676147460938, 0.0019068717956542969, 0.0028228759765625, 0.003738880157470703, 0.004654884338378906, 0.005570888519287109, 0.0064868927001953125, 0.007402896881103516, 0.008318901062011719, 0.009234905242919922, 0.010150909423828125, 0.011066913604736328, 0.011982917785644531, 0.012898921966552734, 0.013814926147460938, 0.01473093032836914, 0.015646934509277344, 0.016562938690185547, 0.01747894287109375, 0.018394947052001953, 0.019310951232910156, 0.02022695541381836, 0.021142959594726562, 0.022058963775634766, 0.02297496795654297, 0.023890972137451172, 0.024806976318359375, 0.025722980499267578, 0.02663898468017578, 0.027554988861083984, 0.028470993041992188, 0.02938699722290039, 0.030303001403808594, 0.031219005584716797, 0.032135009765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 1.0, 7.0, 11.0, 12.0, 15.0, 15.0, 24.0, 28.0, 41.0, 44.0, 70.0, 65.0, 63.0, 64.0, 68.0, 65.0, 51.0, 58.0, 76.0, 40.0, 37.0, 28.0, 21.0, 23.0, 12.0, 18.0, 9.0, 6.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0078887939453125, -0.00768965482711792, -0.00749051570892334, -0.00729137659072876, -0.00709223747253418, -0.0068930983543396, -0.0066939592361450195, -0.0064948201179504395, -0.006295680999755859, -0.006096541881561279, -0.005897402763366699, -0.005698263645172119, -0.005499124526977539, -0.005299985408782959, -0.005100846290588379, -0.004901707172393799, -0.004702568054199219, -0.004503428936004639, -0.004304289817810059, -0.0041051506996154785, -0.0039060115814208984, -0.0037068724632263184, -0.0035077333450317383, -0.003308594226837158, -0.003109455108642578, -0.002910315990447998, -0.002711176872253418, -0.002512037754058838, -0.002312898635864258, -0.0021137595176696777, -0.0019146203994750977, -0.0017154812812805176, -0.0015163421630859375, -0.0013172030448913574, -0.0011180639266967773, -0.0009189248085021973, -0.0007197856903076172, -0.0005206465721130371, -0.00032150745391845703, -0.00012236833572387695, 7.677078247070312e-05, 0.0002759099006652832, 0.0004750490188598633, 0.0006741881370544434, 0.0008733272552490234, 0.0010724663734436035, 0.0012716054916381836, 0.0014707446098327637, 0.0016698837280273438, 0.0018690228462219238, 0.002068161964416504, 0.002267301082611084, 0.002466440200805664, 0.002665579319000244, 0.0028647184371948242, 0.0030638575553894043, 0.0032629966735839844, 0.0034621357917785645, 0.0036612749099731445, 0.0038604140281677246, 0.004059553146362305, 0.004258692264556885, 0.004457831382751465, 0.004656970500946045, 0.004856109619140625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 10.0, 36.0, 56.0, 221.0, 379.0, 201.0, 65.0, 26.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7869116067886353, -0.739274263381958, -0.691636860370636, -0.643999457359314, -0.5963621139526367, -0.5487247705459595, -0.5010873675346375, -0.4534499943256378, -0.4058126211166382, -0.35817524790763855, -0.3105378746986389, -0.2629005014896393, -0.21526312828063965, -0.16762575507164001, -0.11998838186264038, -0.07235100865364075, -0.024713635444641113, 0.02292373776435852, 0.07056111097335815, 0.11819848418235779, 0.16583585739135742, 0.21347323060035706, 0.2611106038093567, 0.3087479770183563, 0.35638535022735596, 0.4040227234363556, 0.4516600966453552, 0.49929746985435486, 0.5469348430633545, 0.5945721864700317, 0.6422095894813538, 0.6898469924926758, 0.7374844551086426, 0.7851217985153198, 0.8327592015266418, 0.8803966045379639, 0.9280339479446411, 0.9756712913513184, 1.0233087539672852, 1.0709460973739624, 1.1185834407806396, 1.166220784187317, 1.2138581275939941, 1.261495590209961, 1.3091329336166382, 1.3567702770233154, 1.4044077396392822, 1.4520450830459595, 1.4996824264526367, 1.547319769859314, 1.5949571132659912, 1.642594575881958, 1.6902319192886353, 1.7378692626953125, 1.7855067253112793, 1.8331440687179565, 1.8807814121246338, 1.928418755531311, 1.9760560989379883, 2.023693561553955, 2.071331024169922, 2.1189682483673096, 2.1666057109832764, 2.214242935180664, 2.261880397796631]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 6.0, 12.0, 19.0, 16.0, 25.0, 41.0, 50.0, 60.0, 49.0, 64.0, 81.0, 69.0, 75.0, 79.0, 59.0, 50.0, 58.0, 43.0, 30.0, 32.0, 13.0, 14.0, 11.0, 6.0, 8.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.5753141641616821, -0.5615509152412415, -0.5477876663208008, -0.5340244174003601, -0.5202611684799194, -0.5064979791641235, -0.49273473024368286, -0.4789714813232422, -0.4652082324028015, -0.45144498348236084, -0.43768173456192017, -0.4239185154438019, -0.4101552665233612, -0.39639201760292053, -0.38262879848480225, -0.3688655495643616, -0.3551023006439209, -0.3413390517234802, -0.32757580280303955, -0.31381258368492126, -0.3000493347644806, -0.2862860858440399, -0.27252286672592163, -0.25875961780548096, -0.24499636888504028, -0.2312331199645996, -0.21746988594532013, -0.20370665192604065, -0.18994340300559998, -0.1761801540851593, -0.16241692006587982, -0.14865368604660034, -0.13489043712615967, -0.12112719565629959, -0.10736395418643951, -0.09360071271657944, -0.07983747124671936, -0.06607422977685928, -0.05231098830699921, -0.03854774683713913, -0.024784505367279053, -0.011021263897418976, 0.002741977572441101, 0.016505219042301178, 0.030268460512161255, 0.04403170198202133, 0.05779494345188141, 0.07155818492174149, 0.08532142639160156, 0.09908466786146164, 0.11284790933132172, 0.1266111433506012, 0.14037439227104187, 0.15413764119148254, 0.16790087521076202, 0.1816641092300415, 0.19542735815048218, 0.20919060707092285, 0.22295384109020233, 0.2367170751094818, 0.2504803240299225, 0.26424357295036316, 0.27800679206848145, 0.2917700409889221, 0.3055332899093628]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 12.0, 9.0, 13.0, 26.0, 35.0, 45.0, 99.0, 141.0, 241.0, 413.0, 792.0, 1543.0, 3529.0, 9604.0, 30846.0, 154558.0, 620106.0, 174993.0, 33869.0, 10315.0, 3847.0, 1647.0, 813.0, 429.0, 231.0, 129.0, 94.0, 47.0, 32.0, 30.0, 21.0, 8.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3671875, -0.3568534851074219, -0.34651947021484375, -0.3361854553222656, -0.3258514404296875, -0.3155174255371094, -0.30518341064453125, -0.2948493957519531, -0.284515380859375, -0.2741813659667969, -0.26384735107421875, -0.2535133361816406, -0.2431793212890625, -0.23284530639648438, -0.22251129150390625, -0.21217727661132812, -0.20184326171875, -0.19150924682617188, -0.18117523193359375, -0.17084121704101562, -0.1605072021484375, -0.15017318725585938, -0.13983917236328125, -0.12950515747070312, -0.119171142578125, -0.10883712768554688, -0.09850311279296875, -0.08816909790039062, -0.0778350830078125, -0.06750106811523438, -0.05716705322265625, -0.046833038330078125, -0.0364990234375, -0.026165008544921875, -0.01583099365234375, -0.005496978759765625, 0.0048370361328125, 0.015171051025390625, 0.02550506591796875, 0.035839080810546875, 0.046173095703125, 0.056507110595703125, 0.06684112548828125, 0.07717514038085938, 0.0875091552734375, 0.09784317016601562, 0.10817718505859375, 0.11851119995117188, 0.12884521484375, 0.13917922973632812, 0.14951324462890625, 0.15984725952148438, 0.1701812744140625, 0.18051528930664062, 0.19084930419921875, 0.20118331909179688, 0.211517333984375, 0.22185134887695312, 0.23218536376953125, 0.24251937866210938, 0.2528533935546875, 0.2631874084472656, 0.27352142333984375, 0.2838554382324219, 0.294189453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 10.0, 11.0, 11.0, 19.0, 25.0, 26.0, 36.0, 52.0, 57.0, 70.0, 75.0, 77.0, 74.0, 74.0, 87.0, 61.0, 54.0, 50.0, 29.0, 26.0, 16.0, 17.0, 11.0, 10.0, 8.0, 4.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2900390625, -1.258758544921875, -1.22747802734375, -1.196197509765625, -1.1649169921875, -1.133636474609375, -1.10235595703125, -1.071075439453125, -1.039794921875, -1.008514404296875, -0.97723388671875, -0.945953369140625, -0.9146728515625, -0.883392333984375, -0.85211181640625, -0.820831298828125, -0.78955078125, -0.758270263671875, -0.72698974609375, -0.695709228515625, -0.6644287109375, -0.633148193359375, -0.60186767578125, -0.570587158203125, -0.539306640625, -0.508026123046875, -0.47674560546875, -0.445465087890625, -0.4141845703125, -0.382904052734375, -0.35162353515625, -0.320343017578125, -0.2890625, -0.257781982421875, -0.22650146484375, -0.195220947265625, -0.1639404296875, -0.132659912109375, -0.10137939453125, -0.070098876953125, -0.038818359375, -0.007537841796875, 0.02374267578125, 0.055023193359375, 0.0863037109375, 0.117584228515625, 0.14886474609375, 0.180145263671875, 0.21142578125, 0.242706298828125, 0.27398681640625, 0.305267333984375, 0.3365478515625, 0.367828369140625, 0.39910888671875, 0.430389404296875, 0.461669921875, 0.492950439453125, 0.52423095703125, 0.555511474609375, 0.5867919921875, 0.618072509765625, 0.64935302734375, 0.680633544921875, 0.7119140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 8.0, 8.0, 10.0, 15.0, 35.0, 40.0, 57.0, 85.0, 143.0, 214.0, 371.0, 833.0, 3397.0, 43072.0, 888211.0, 103920.0, 6009.0, 1086.0, 392.0, 221.0, 126.0, 112.0, 52.0, 36.0, 31.0, 10.0, 13.0, 10.0, 3.0, 9.0, 2.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.703399658203125, -0.68365478515625, -0.663909912109375, -0.6441650390625, -0.624420166015625, -0.60467529296875, -0.584930419921875, -0.565185546875, -0.545440673828125, -0.52569580078125, -0.505950927734375, -0.4862060546875, -0.466461181640625, -0.44671630859375, -0.426971435546875, -0.4072265625, -0.387481689453125, -0.36773681640625, -0.347991943359375, -0.3282470703125, -0.308502197265625, -0.28875732421875, -0.269012451171875, -0.249267578125, -0.229522705078125, -0.20977783203125, -0.190032958984375, -0.1702880859375, -0.150543212890625, -0.13079833984375, -0.111053466796875, -0.09130859375, -0.071563720703125, -0.05181884765625, -0.032073974609375, -0.0123291015625, 0.007415771484375, 0.02716064453125, 0.046905517578125, 0.066650390625, 0.086395263671875, 0.10614013671875, 0.125885009765625, 0.1456298828125, 0.165374755859375, 0.18511962890625, 0.204864501953125, 0.224609375, 0.244354248046875, 0.26409912109375, 0.283843994140625, 0.3035888671875, 0.323333740234375, 0.34307861328125, 0.362823486328125, 0.382568359375, 0.402313232421875, 0.42205810546875, 0.441802978515625, 0.4615478515625, 0.481292724609375, 0.50103759765625, 0.520782470703125, 0.54052734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 3.0, 6.0, 9.0, 5.0, 11.0, 11.0, 14.0, 20.0, 20.0, 29.0, 16.0, 33.0, 26.0, 39.0, 34.0, 31.0, 38.0, 44.0, 41.0, 49.0, 38.0, 38.0, 31.0, 43.0, 31.0, 32.0, 35.0, 27.0, 26.0, 32.0, 23.0, 21.0, 20.0, 22.0, 19.0, 12.0, 14.0, 9.0, 10.0, 11.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.6904296875, -0.6715240478515625, -0.652618408203125, -0.6337127685546875, -0.61480712890625, -0.5959014892578125, -0.576995849609375, -0.5580902099609375, -0.5391845703125, -0.5202789306640625, -0.501373291015625, -0.4824676513671875, -0.46356201171875, -0.4446563720703125, -0.425750732421875, -0.4068450927734375, -0.387939453125, -0.3690338134765625, -0.350128173828125, -0.3312225341796875, -0.31231689453125, -0.2934112548828125, -0.274505615234375, -0.2555999755859375, -0.2366943359375, -0.2177886962890625, -0.198883056640625, -0.1799774169921875, -0.16107177734375, -0.1421661376953125, -0.123260498046875, -0.1043548583984375, -0.08544921875, -0.0665435791015625, -0.047637939453125, -0.0287322998046875, -0.00982666015625, 0.0090789794921875, 0.027984619140625, 0.0468902587890625, 0.0657958984375, 0.0847015380859375, 0.103607177734375, 0.1225128173828125, 0.14141845703125, 0.1603240966796875, 0.179229736328125, 0.1981353759765625, 0.217041015625, 0.2359466552734375, 0.254852294921875, 0.2737579345703125, 0.29266357421875, 0.3115692138671875, 0.330474853515625, 0.3493804931640625, 0.3682861328125, 0.3871917724609375, 0.406097412109375, 0.4250030517578125, 0.44390869140625, 0.4628143310546875, 0.481719970703125, 0.5006256103515625, 0.51953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 4.0, 8.0, 12.0, 7.0, 18.0, 37.0, 54.0, 171.0, 551.0, 2687.0, 74863.0, 960251.0, 8220.0, 1085.0, 337.0, 110.0, 47.0, 20.0, 17.0, 14.0, 7.0, 5.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.423828125, -0.40827178955078125, -0.3927154541015625, -0.37715911865234375, -0.361602783203125, -0.34604644775390625, -0.3304901123046875, -0.31493377685546875, -0.29937744140625, -0.28382110595703125, -0.2682647705078125, -0.25270843505859375, -0.237152099609375, -0.22159576416015625, -0.2060394287109375, -0.19048309326171875, -0.1749267578125, -0.15937042236328125, -0.1438140869140625, -0.12825775146484375, -0.112701416015625, -0.09714508056640625, -0.0815887451171875, -0.06603240966796875, -0.05047607421875, -0.03491973876953125, -0.0193634033203125, -0.00380706787109375, 0.011749267578125, 0.02730560302734375, 0.0428619384765625, 0.05841827392578125, 0.073974609375, 0.08953094482421875, 0.1050872802734375, 0.12064361572265625, 0.136199951171875, 0.15175628662109375, 0.1673126220703125, 0.18286895751953125, 0.19842529296875, 0.21398162841796875, 0.2295379638671875, 0.24509429931640625, 0.260650634765625, 0.27620697021484375, 0.2917633056640625, 0.30731964111328125, 0.3228759765625, 0.33843231201171875, 0.3539886474609375, 0.36954498291015625, 0.385101318359375, 0.40065765380859375, 0.4162139892578125, 0.43177032470703125, 0.44732666015625, 0.46288299560546875, 0.4784393310546875, 0.49399566650390625, 0.509552001953125, 0.5251083374023438, 0.5406646728515625, 0.5562210083007812, 0.57177734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 30.0, 62.0, 132.0, 297.0, 226.0, 137.0, 48.0, 26.0, 10.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.502866744995117e-05, -6.326567381620407e-05, -6.150268018245697e-05, -5.973968654870987e-05, -5.797669291496277e-05, -5.621369928121567e-05, -5.445070564746857e-05, -5.2687712013721466e-05, -5.0924718379974365e-05, -4.9161724746227264e-05, -4.7398731112480164e-05, -4.563573747873306e-05, -4.387274384498596e-05, -4.210975021123886e-05, -4.034675657749176e-05, -3.858376294374466e-05, -3.682076930999756e-05, -3.505777567625046e-05, -3.329478204250336e-05, -3.1531788408756256e-05, -2.9768794775009155e-05, -2.8005801141262054e-05, -2.6242807507514954e-05, -2.4479813873767853e-05, -2.2716820240020752e-05, -2.095382660627365e-05, -1.919083297252655e-05, -1.742783933877945e-05, -1.566484570503235e-05, -1.3901852071285248e-05, -1.2138858437538147e-05, -1.0375864803791046e-05, -8.612871170043945e-06, -6.8498775362968445e-06, -5.086883902549744e-06, -3.323890268802643e-06, -1.560896635055542e-06, 2.0209699869155884e-07, 1.9650906324386597e-06, 3.7280842661857605e-06, 5.491077899932861e-06, 7.254071533679962e-06, 9.017065167427063e-06, 1.0780058801174164e-05, 1.2543052434921265e-05, 1.4306046068668365e-05, 1.6069039702415466e-05, 1.7832033336162567e-05, 1.9595026969909668e-05, 2.135802060365677e-05, 2.312101423740387e-05, 2.488400787115097e-05, 2.664700150489807e-05, 2.8409995138645172e-05, 3.0172988772392273e-05, 3.1935982406139374e-05, 3.3698976039886475e-05, 3.5461969673633575e-05, 3.7224963307380676e-05, 3.898795694112778e-05, 4.075095057487488e-05, 4.251394420862198e-05, 4.427693784236908e-05, 4.603993147611618e-05, 4.780292510986328e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 13.0, 16.0, 20.0, 40.0, 86.0, 212.0, 519.0, 1830.0, 13702.0, 949154.0, 77703.0, 3771.0, 895.0, 298.0, 134.0, 55.0, 33.0, 14.0, 9.0, 8.0, 7.0, 8.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5537109375, -0.5401115417480469, -0.5265121459960938, -0.5129127502441406, -0.4993133544921875, -0.4857139587402344, -0.47211456298828125, -0.4585151672363281, -0.444915771484375, -0.4313163757324219, -0.41771697998046875, -0.4041175842285156, -0.3905181884765625, -0.3769187927246094, -0.36331939697265625, -0.3497200012207031, -0.33612060546875, -0.3225212097167969, -0.30892181396484375, -0.2953224182128906, -0.2817230224609375, -0.2681236267089844, -0.25452423095703125, -0.24092483520507812, -0.227325439453125, -0.21372604370117188, -0.20012664794921875, -0.18652725219726562, -0.1729278564453125, -0.15932846069335938, -0.14572906494140625, -0.13212966918945312, -0.1185302734375, -0.10493087768554688, -0.09133148193359375, -0.07773208618164062, -0.0641326904296875, -0.050533294677734375, -0.03693389892578125, -0.023334503173828125, -0.009735107421875, 0.003864288330078125, 0.01746368408203125, 0.031063079833984375, 0.0446624755859375, 0.058261871337890625, 0.07186126708984375, 0.08546066284179688, 0.09906005859375, 0.11265945434570312, 0.12625885009765625, 0.13985824584960938, 0.1534576416015625, 0.16705703735351562, 0.18065643310546875, 0.19425582885742188, 0.207855224609375, 0.22145462036132812, 0.23505401611328125, 0.24865341186523438, 0.2622528076171875, 0.2758522033691406, 0.28945159912109375, 0.3030509948730469, 0.316650390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 12.0, 27.0, 25.0, 40.0, 87.0, 98.0, 154.0, 191.0, 114.0, 99.0, 51.0, 34.0, 24.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07305908203125, -0.0703744888305664, -0.06768989562988281, -0.06500530242919922, -0.062320709228515625, -0.05963611602783203, -0.05695152282714844, -0.054266929626464844, -0.05158233642578125, -0.048897743225097656, -0.04621315002441406, -0.04352855682373047, -0.040843963623046875, -0.03815937042236328, -0.03547477722167969, -0.032790184020996094, -0.0301055908203125, -0.027420997619628906, -0.024736404418945312, -0.02205181121826172, -0.019367218017578125, -0.01668262481689453, -0.013998031616210938, -0.011313438415527344, -0.00862884521484375, -0.005944252014160156, -0.0032596588134765625, -0.0005750656127929688, 0.002109527587890625, 0.004794120788574219, 0.0074787139892578125, 0.010163307189941406, 0.012847900390625, 0.015532493591308594, 0.018217086791992188, 0.02090167999267578, 0.023586273193359375, 0.02627086639404297, 0.028955459594726562, 0.031640052795410156, 0.03432464599609375, 0.037009239196777344, 0.03969383239746094, 0.04237842559814453, 0.045063018798828125, 0.04774761199951172, 0.05043220520019531, 0.053116798400878906, 0.0558013916015625, 0.058485984802246094, 0.06117057800292969, 0.06385517120361328, 0.06653976440429688, 0.06922435760498047, 0.07190895080566406, 0.07459354400634766, 0.07727813720703125, 0.07996273040771484, 0.08264732360839844, 0.08533191680908203, 0.08801651000976562, 0.09070110321044922, 0.09338569641113281, 0.0960702896118164, 0.0987548828125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 15.0, 23.0, 62.0, 155.0, 293.0, 257.0, 114.0, 45.0, 18.0, 11.0, 3.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1709855794906616, -1.0923984050750732, -1.0138112306594849, -0.9352240562438965, -0.8566368818283081, -0.7780497074127197, -0.6994625926017761, -0.6208754181861877, -0.5422882437705994, -0.463701069355011, -0.3851138949394226, -0.3065267503261566, -0.22793957591056824, -0.14935240149497986, -0.07076525688171387, 0.007821917533874512, 0.08640909194946289, 0.16499626636505127, 0.24358342587947845, 0.32217058539390564, 0.400757759809494, 0.4793449342250824, 0.5579320788383484, 0.6365192532539368, 0.7151064276695251, 0.7936936020851135, 0.8722807765007019, 0.9508678913116455, 1.0294550657272339, 1.1080422401428223, 1.1866294145584106, 1.265216588973999, 1.3438036441802979, 1.4223908185958862, 1.5009779930114746, 1.579565167427063, 1.6581523418426514, 1.7367395162582397, 1.8153266906738281, 1.893913745880127, 1.9725010395050049, 2.0510880947113037, 2.1296753883361816, 2.2082624435424805, 2.2868497371673584, 2.3654367923736572, 2.444024085998535, 2.522611141204834, 2.601198196411133, 2.6797852516174316, 2.7583725452423096, 2.8369596004486084, 2.9155468940734863, 2.994133949279785, 3.072721242904663, 3.151308298110962, 3.22989559173584, 3.3084826469421387, 3.3870699405670166, 3.4656569957733154, 3.5442442893981934, 3.622831344604492, 3.70141863822937, 3.780005693435669, 3.858592987060547]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 6.0, 11.0, 8.0, 18.0, 17.0, 18.0, 25.0, 28.0, 29.0, 34.0, 37.0, 49.0, 42.0, 54.0, 43.0, 42.0, 57.0, 38.0, 50.0, 44.0, 49.0, 43.0, 40.0, 27.0, 32.0, 28.0, 24.0, 21.0, 16.0, 11.0, 7.0, 10.0, 6.0, 11.0, 4.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.475698709487915, -1.4363240003585815, -1.3969491720199585, -1.357574462890625, -1.318199634552002, -1.2788249254226685, -1.2394500970840454, -1.200075387954712, -1.1607005596160889, -1.1213258504867554, -1.0819510221481323, -1.0425763130187988, -1.0032014846801758, -0.9638267159461975, -0.9244519472122192, -0.8850772380828857, -0.8457024693489075, -0.8063277006149292, -0.7669529318809509, -0.7275781631469727, -0.6882033944129944, -0.6488286256790161, -0.6094539165496826, -0.5700790882110596, -0.5307043790817261, -0.4913296103477478, -0.45195484161376953, -0.41258007287979126, -0.373205304145813, -0.3338305354118347, -0.29445579648017883, -0.25508102774620056, -0.2157062292098999, -0.17633146047592163, -0.13695669174194336, -0.09758193790912628, -0.05820716917514801, -0.01883240044116974, 0.02054235339164734, 0.05991712212562561, 0.09929189085960388, 0.13866665959358215, 0.17804142832756042, 0.2174161821603775, 0.2567909359931946, 0.29616570472717285, 0.3355404734611511, 0.3749152421951294, 0.41429001092910767, 0.45366477966308594, 0.4930395483970642, 0.5324143171310425, 0.5717890858650208, 0.611163854598999, 0.6505385637283325, 0.6899133920669556, 0.7292881011962891, 0.7686628699302673, 0.8080376386642456, 0.8474124073982239, 0.8867871761322021, 0.9261619448661804, 0.9655367136001587, 1.0049114227294922, 1.0442862510681152]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 17.0, 24.0, 33.0, 49.0, 67.0, 99.0, 144.0, 280.0, 538.0, 1153.0, 2708.0, 8536.0, 53176.0, 1154306.0, 2843053.0, 109906.0, 13549.0, 3748.0, 1360.0, 610.0, 352.0, 193.0, 121.0, 73.0, 50.0, 29.0, 20.0, 21.0, 14.0, 7.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.88916015625, -0.86151123046875, -0.8338623046875, -0.80621337890625, -0.778564453125, -0.75091552734375, -0.7232666015625, -0.69561767578125, -0.66796875, -0.64031982421875, -0.6126708984375, -0.58502197265625, -0.557373046875, -0.52972412109375, -0.5020751953125, -0.47442626953125, -0.44677734375, -0.41912841796875, -0.3914794921875, -0.36383056640625, -0.336181640625, -0.30853271484375, -0.2808837890625, -0.25323486328125, -0.2255859375, -0.19793701171875, -0.1702880859375, -0.14263916015625, -0.114990234375, -0.08734130859375, -0.0596923828125, -0.03204345703125, -0.00439453125, 0.02325439453125, 0.0509033203125, 0.07855224609375, 0.106201171875, 0.13385009765625, 0.1614990234375, 0.18914794921875, 0.216796875, 0.24444580078125, 0.2720947265625, 0.29974365234375, 0.327392578125, 0.35504150390625, 0.3826904296875, 0.41033935546875, 0.43798828125, 0.46563720703125, 0.4932861328125, 0.52093505859375, 0.548583984375, 0.57623291015625, 0.6038818359375, 0.63153076171875, 0.6591796875, 0.68682861328125, 0.7144775390625, 0.74212646484375, 0.769775390625, 0.79742431640625, 0.8250732421875, 0.85272216796875, 0.88037109375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 10.0, 7.0, 11.0, 22.0, 26.0, 30.0, 42.0, 36.0, 75.0, 67.0, 73.0, 76.0, 86.0, 72.0, 73.0, 73.0, 42.0, 35.0, 41.0, 30.0, 21.0, 16.0, 5.0, 4.0, 7.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6806640625, -0.6622886657714844, -0.6439132690429688, -0.6255378723144531, -0.6071624755859375, -0.5887870788574219, -0.5704116821289062, -0.5520362854003906, -0.533660888671875, -0.5152854919433594, -0.49691009521484375, -0.4785346984863281, -0.4601593017578125, -0.4417839050292969, -0.42340850830078125, -0.4050331115722656, -0.38665771484375, -0.3682823181152344, -0.34990692138671875, -0.3315315246582031, -0.3131561279296875, -0.2947807312011719, -0.27640533447265625, -0.2580299377441406, -0.239654541015625, -0.22127914428710938, -0.20290374755859375, -0.18452835083007812, -0.1661529541015625, -0.14777755737304688, -0.12940216064453125, -0.11102676391601562, -0.0926513671875, -0.07427597045898438, -0.05590057373046875, -0.037525177001953125, -0.0191497802734375, -0.000774383544921875, 0.01760101318359375, 0.035976409912109375, 0.054351806640625, 0.07272720336914062, 0.09110260009765625, 0.10947799682617188, 0.1278533935546875, 0.14622879028320312, 0.16460418701171875, 0.18297958374023438, 0.20135498046875, 0.21973037719726562, 0.23810577392578125, 0.2564811706542969, 0.2748565673828125, 0.2932319641113281, 0.31160736083984375, 0.3299827575683594, 0.348358154296875, 0.3667335510253906, 0.38510894775390625, 0.4034843444824219, 0.4218597412109375, 0.4402351379394531, 0.45861053466796875, 0.4769859313964844, 0.495361328125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 10.0, 13.0, 15.0, 41.0, 58.0, 79.0, 147.0, 267.0, 535.0, 1129.0, 3010.0, 10562.0, 76309.0, 3623765.0, 444939.0, 24489.0, 5466.0, 1874.0, 719.0, 387.0, 180.0, 100.0, 58.0, 39.0, 24.0, 22.0, 15.0, 12.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1630859375, -1.133819580078125, -1.10455322265625, -1.075286865234375, -1.0460205078125, -1.016754150390625, -0.98748779296875, -0.958221435546875, -0.928955078125, -0.899688720703125, -0.87042236328125, -0.841156005859375, -0.8118896484375, -0.782623291015625, -0.75335693359375, -0.724090576171875, -0.69482421875, -0.665557861328125, -0.63629150390625, -0.607025146484375, -0.5777587890625, -0.548492431640625, -0.51922607421875, -0.489959716796875, -0.460693359375, -0.431427001953125, -0.40216064453125, -0.372894287109375, -0.3436279296875, -0.314361572265625, -0.28509521484375, -0.255828857421875, -0.2265625, -0.197296142578125, -0.16802978515625, -0.138763427734375, -0.1094970703125, -0.080230712890625, -0.05096435546875, -0.021697998046875, 0.007568359375, 0.036834716796875, 0.06610107421875, 0.095367431640625, 0.1246337890625, 0.153900146484375, 0.18316650390625, 0.212432861328125, 0.24169921875, 0.270965576171875, 0.30023193359375, 0.329498291015625, 0.3587646484375, 0.388031005859375, 0.41729736328125, 0.446563720703125, 0.475830078125, 0.505096435546875, 0.53436279296875, 0.563629150390625, 0.5928955078125, 0.622161865234375, 0.65142822265625, 0.680694580078125, 0.7099609375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 11.0, 4.0, 11.0, 10.0, 20.0, 28.0, 46.0, 81.0, 159.0, 277.0, 509.0, 891.0, 906.0, 515.0, 261.0, 125.0, 70.0, 54.0, 28.0, 18.0, 14.0, 10.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1873779296875, -0.1801738739013672, -0.17296981811523438, -0.16576576232910156, -0.15856170654296875, -0.15135765075683594, -0.14415359497070312, -0.1369495391845703, -0.1297454833984375, -0.12254142761230469, -0.11533737182617188, -0.10813331604003906, -0.10092926025390625, -0.09372520446777344, -0.08652114868164062, -0.07931709289550781, -0.072113037109375, -0.06490898132324219, -0.057704925537109375, -0.05050086975097656, -0.04329681396484375, -0.03609275817871094, -0.028888702392578125, -0.021684646606445312, -0.0144805908203125, -0.0072765350341796875, -7.2479248046875e-05, 0.0071315765380859375, 0.01433563232421875, 0.021539688110351562, 0.028743743896484375, 0.03594779968261719, 0.04315185546875, 0.05035591125488281, 0.057559967041015625, 0.06476402282714844, 0.07196807861328125, 0.07917213439941406, 0.08637619018554688, 0.09358024597167969, 0.1007843017578125, 0.10798835754394531, 0.11519241333007812, 0.12239646911621094, 0.12960052490234375, 0.13680458068847656, 0.14400863647460938, 0.1512126922607422, 0.158416748046875, 0.1656208038330078, 0.17282485961914062, 0.18002891540527344, 0.18723297119140625, 0.19443702697753906, 0.20164108276367188, 0.2088451385498047, 0.2160491943359375, 0.2232532501220703, 0.23045730590820312, 0.23766136169433594, 0.24486541748046875, 0.25206947326660156, 0.2592735290527344, 0.2664775848388672, 0.273681640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 14.0, 15.0, 16.0, 29.0, 52.0, 73.0, 91.0, 136.0, 167.0, 116.0, 115.0, 53.0, 37.0, 25.0, 14.0, 17.0, 11.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9358514547348022, -0.9052781462669373, -0.874704897403717, -0.844131588935852, -0.8135582804679871, -0.7829849720001221, -0.7524117231369019, -0.7218384146690369, -0.6912651062011719, -0.6606917977333069, -0.6301185488700867, -0.5995452404022217, -0.5689719319343567, -0.5383986234664917, -0.5078253746032715, -0.4772520661354065, -0.4466787874698639, -0.4161055088043213, -0.3855322003364563, -0.3549589216709137, -0.3243856132030487, -0.2938123345375061, -0.2632390260696411, -0.2326657474040985, -0.20209245383739471, -0.17151916027069092, -0.14094586670398712, -0.11037258058786392, -0.07979928702116013, -0.049226000905036926, -0.01865270733833313, 0.011920586228370667, 0.04249387979507446, 0.07306717336177826, 0.10364046692848206, 0.13421374559402466, 0.16478705406188965, 0.19536033272743225, 0.22593362629413605, 0.25650691986083984, 0.28708022832870483, 0.31765350699424744, 0.3482268154621124, 0.37880009412765503, 0.40937340259552, 0.4399466812610626, 0.4705199599266052, 0.5010932683944702, 0.5316665172576904, 0.5622398257255554, 0.5928130745887756, 0.6233863830566406, 0.6539596915245056, 0.6845329999923706, 0.7151062488555908, 0.7456795573234558, 0.7762528657913208, 0.8068261742591858, 0.837399423122406, 0.867972731590271, 0.898546040058136, 0.929119348526001, 0.9596925973892212, 0.9902659058570862, 1.0208392143249512]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 6.0, 19.0, 14.0, 21.0, 32.0, 27.0, 42.0, 58.0, 49.0, 61.0, 65.0, 69.0, 67.0, 71.0, 62.0, 60.0, 67.0, 37.0, 40.0, 25.0, 29.0, 31.0, 20.0, 4.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7828695178031921, -0.7627837657928467, -0.7426980137825012, -0.7226122617721558, -0.7025264501571655, -0.6824406981468201, -0.6623549461364746, -0.6422691941261292, -0.6221834421157837, -0.6020976901054382, -0.5820119380950928, -0.5619261264801025, -0.5418403744697571, -0.5217546224594116, -0.5016688704490662, -0.4815831184387207, -0.46149733662605286, -0.4414115846157074, -0.42132580280303955, -0.4012400507926941, -0.38115429878234863, -0.3610685467720032, -0.3409827649593353, -0.32089701294898987, -0.300811231136322, -0.28072547912597656, -0.2606396973133087, -0.24055394530296326, -0.2204681932926178, -0.20038242638111115, -0.1802966594696045, -0.16021090745925903, -0.14012515544891357, -0.12003939598798752, -0.09995363652706146, -0.07986786961555481, -0.059782110154628754, -0.0396963506937027, -0.019610583782196045, 0.00047516822814941406, 0.020560935139656067, 0.04064669460058212, 0.06073245778679848, 0.08081822097301483, 0.10090398043394089, 0.12098973989486694, 0.1410755068063736, 0.16116125881671906, 0.1812470257282257, 0.20133279263973236, 0.22141854465007782, 0.24150431156158447, 0.26159006357192993, 0.2816758155822754, 0.30176159739494324, 0.3218473494052887, 0.34193313121795654, 0.362018883228302, 0.38210466504096985, 0.4021904170513153, 0.42227616906166077, 0.4423619508743286, 0.4624477028846741, 0.48253345489501953, 0.502619206905365]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 9.0, 19.0, 27.0, 51.0, 99.0, 176.0, 341.0, 828.0, 2366.0, 9352.0, 53465.0, 412911.0, 486132.0, 67164.0, 11091.0, 2719.0, 958.0, 390.0, 203.0, 100.0, 54.0, 29.0, 16.0, 11.0, 12.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1246337890625, -0.1206207275390625, -0.116607666015625, -0.1125946044921875, -0.10858154296875, -0.1045684814453125, -0.100555419921875, -0.0965423583984375, -0.092529296875, -0.0885162353515625, -0.084503173828125, -0.0804901123046875, -0.07647705078125, -0.0724639892578125, -0.068450927734375, -0.0644378662109375, -0.0604248046875, -0.0564117431640625, -0.052398681640625, -0.0483856201171875, -0.04437255859375, -0.0403594970703125, -0.036346435546875, -0.0323333740234375, -0.0283203125, -0.0243072509765625, -0.020294189453125, -0.0162811279296875, -0.01226806640625, -0.0082550048828125, -0.004241943359375, -0.0002288818359375, 0.0037841796875, 0.0077972412109375, 0.011810302734375, 0.0158233642578125, 0.01983642578125, 0.0238494873046875, 0.027862548828125, 0.0318756103515625, 0.035888671875, 0.0399017333984375, 0.043914794921875, 0.0479278564453125, 0.05194091796875, 0.0559539794921875, 0.059967041015625, 0.0639801025390625, 0.0679931640625, 0.0720062255859375, 0.076019287109375, 0.0800323486328125, 0.08404541015625, 0.0880584716796875, 0.092071533203125, 0.0960845947265625, 0.10009765625, 0.1041107177734375, 0.108123779296875, 0.1121368408203125, 0.11614990234375, 0.1201629638671875, 0.124176025390625, 0.1281890869140625, 0.1322021484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 20.0, 11.0, 13.0, 22.0, 34.0, 29.0, 33.0, 52.0, 57.0, 64.0, 72.0, 79.0, 58.0, 78.0, 59.0, 71.0, 46.0, 52.0, 31.0, 31.0, 24.0, 21.0, 13.0, 8.0, 7.0, 7.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.64501953125, -0.6300468444824219, -0.6150741577148438, -0.6001014709472656, -0.5851287841796875, -0.5701560974121094, -0.5551834106445312, -0.5402107238769531, -0.525238037109375, -0.5102653503417969, -0.49529266357421875, -0.4803199768066406, -0.4653472900390625, -0.4503746032714844, -0.43540191650390625, -0.4204292297363281, -0.40545654296875, -0.3904838562011719, -0.37551116943359375, -0.3605384826660156, -0.3455657958984375, -0.3305931091308594, -0.31562042236328125, -0.3006477355957031, -0.285675048828125, -0.2707023620605469, -0.25572967529296875, -0.24075698852539062, -0.2257843017578125, -0.21081161499023438, -0.19583892822265625, -0.18086624145507812, -0.1658935546875, -0.15092086791992188, -0.13594818115234375, -0.12097549438476562, -0.1060028076171875, -0.09103012084960938, -0.07605743408203125, -0.061084747314453125, -0.046112060546875, -0.031139373779296875, -0.01616668701171875, -0.001194000244140625, 0.0137786865234375, 0.028751373291015625, 0.04372406005859375, 0.058696746826171875, 0.07366943359375, 0.08864212036132812, 0.10361480712890625, 0.11858749389648438, 0.1335601806640625, 0.14853286743164062, 0.16350555419921875, 0.17847824096679688, 0.193450927734375, 0.20842361450195312, 0.22339630126953125, 0.23836898803710938, 0.2533416748046875, 0.2683143615722656, 0.28328704833984375, 0.2982597351074219, 0.313232421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 6.0, 13.0, 4.0, 10.0, 19.0, 19.0, 25.0, 47.0, 67.0, 89.0, 133.0, 278.0, 506.0, 964.0, 2386.0, 7399.0, 31704.0, 166712.0, 502914.0, 264360.0, 53015.0, 11686.0, 3494.0, 1296.0, 619.0, 328.0, 166.0, 113.0, 52.0, 32.0, 22.0, 21.0, 15.0, 10.0, 10.0, 6.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0799560546875, -0.07706451416015625, -0.0741729736328125, -0.07128143310546875, -0.068389892578125, -0.06549835205078125, -0.0626068115234375, -0.05971527099609375, -0.05682373046875, -0.05393218994140625, -0.0510406494140625, -0.04814910888671875, -0.045257568359375, -0.04236602783203125, -0.0394744873046875, -0.03658294677734375, -0.03369140625, -0.03079986572265625, -0.0279083251953125, -0.02501678466796875, -0.022125244140625, -0.01923370361328125, -0.0163421630859375, -0.01345062255859375, -0.01055908203125, -0.00766754150390625, -0.0047760009765625, -0.00188446044921875, 0.001007080078125, 0.00389862060546875, 0.0067901611328125, 0.00968170166015625, 0.0125732421875, 0.01546478271484375, 0.0183563232421875, 0.02124786376953125, 0.024139404296875, 0.02703094482421875, 0.0299224853515625, 0.03281402587890625, 0.03570556640625, 0.03859710693359375, 0.0414886474609375, 0.04438018798828125, 0.047271728515625, 0.05016326904296875, 0.0530548095703125, 0.05594635009765625, 0.058837890625, 0.06172943115234375, 0.0646209716796875, 0.06751251220703125, 0.070404052734375, 0.07329559326171875, 0.0761871337890625, 0.07907867431640625, 0.08197021484375, 0.08486175537109375, 0.0877532958984375, 0.09064483642578125, 0.093536376953125, 0.09642791748046875, 0.0993194580078125, 0.10221099853515625, 0.1051025390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 10.0, 11.0, 6.0, 10.0, 15.0, 19.0, 18.0, 22.0, 23.0, 29.0, 39.0, 41.0, 37.0, 45.0, 52.0, 47.0, 54.0, 30.0, 31.0, 35.0, 52.0, 42.0, 47.0, 42.0, 37.0, 35.0, 27.0, 21.0, 12.0, 19.0, 11.0, 16.0, 15.0, 12.0, 6.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.51123046875, -0.49297332763671875, -0.4747161865234375, -0.45645904541015625, -0.438201904296875, -0.41994476318359375, -0.4016876220703125, -0.38343048095703125, -0.36517333984375, -0.34691619873046875, -0.3286590576171875, -0.31040191650390625, -0.292144775390625, -0.27388763427734375, -0.2556304931640625, -0.23737335205078125, -0.2191162109375, -0.20085906982421875, -0.1826019287109375, -0.16434478759765625, -0.146087646484375, -0.12783050537109375, -0.1095733642578125, -0.09131622314453125, -0.07305908203125, -0.05480194091796875, -0.0365447998046875, -0.01828765869140625, -3.0517578125e-05, 0.01822662353515625, 0.0364837646484375, 0.05474090576171875, 0.072998046875, 0.09125518798828125, 0.1095123291015625, 0.12776947021484375, 0.146026611328125, 0.16428375244140625, 0.1825408935546875, 0.20079803466796875, 0.21905517578125, 0.23731231689453125, 0.2555694580078125, 0.27382659912109375, 0.292083740234375, 0.31034088134765625, 0.3285980224609375, 0.34685516357421875, 0.3651123046875, 0.38336944580078125, 0.4016265869140625, 0.41988372802734375, 0.438140869140625, 0.45639801025390625, 0.4746551513671875, 0.49291229248046875, 0.51116943359375, 0.5294265747070312, 0.5476837158203125, 0.5659408569335938, 0.584197998046875, 0.6024551391601562, 0.6207122802734375, 0.6389694213867188, 0.6572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 17.0, 8.0, 25.0, 54.0, 83.0, 148.0, 331.0, 909.0, 2683.0, 12682.0, 146161.0, 769028.0, 102328.0, 10469.0, 2281.0, 738.0, 287.0, 148.0, 78.0, 38.0, 20.0, 20.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033538818359375, -0.03197431564331055, -0.030409812927246094, -0.02884531021118164, -0.027280807495117188, -0.025716304779052734, -0.02415180206298828, -0.022587299346923828, -0.021022796630859375, -0.019458293914794922, -0.01789379119873047, -0.016329288482666016, -0.014764785766601562, -0.01320028305053711, -0.011635780334472656, -0.010071277618408203, -0.00850677490234375, -0.006942272186279297, -0.005377769470214844, -0.0038132667541503906, -0.0022487640380859375, -0.0006842613220214844, 0.0008802413940429688, 0.002444744110107422, 0.004009246826171875, 0.005573749542236328, 0.007138252258300781, 0.008702754974365234, 0.010267257690429688, 0.01183176040649414, 0.013396263122558594, 0.014960765838623047, 0.0165252685546875, 0.018089771270751953, 0.019654273986816406, 0.02121877670288086, 0.022783279418945312, 0.024347782135009766, 0.02591228485107422, 0.027476787567138672, 0.029041290283203125, 0.030605792999267578, 0.03217029571533203, 0.033734798431396484, 0.03529930114746094, 0.03686380386352539, 0.038428306579589844, 0.0399928092956543, 0.04155731201171875, 0.0431218147277832, 0.044686317443847656, 0.04625082015991211, 0.04781532287597656, 0.049379825592041016, 0.05094432830810547, 0.05250883102416992, 0.054073333740234375, 0.05563783645629883, 0.05720233917236328, 0.058766841888427734, 0.06033134460449219, 0.06189584732055664, 0.0634603500366211, 0.06502485275268555, 0.06658935546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 8.0, 7.0, 6.0, 6.0, 21.0, 13.0, 33.0, 30.0, 32.0, 30.0, 42.0, 46.0, 64.0, 55.0, 75.0, 75.0, 61.0, 60.0, 47.0, 46.0, 47.0, 35.0, 27.0, 26.0, 17.0, 21.0, 14.0, 11.0, 3.0, 10.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.3053417205810547e-05, -1.2705102562904358e-05, -1.2356787919998169e-05, -1.200847327709198e-05, -1.1660158634185791e-05, -1.1311843991279602e-05, -1.0963529348373413e-05, -1.0615214705467224e-05, -1.0266900062561035e-05, -9.918585419654846e-06, -9.570270776748657e-06, -9.221956133842468e-06, -8.87364149093628e-06, -8.52532684803009e-06, -8.177012205123901e-06, -7.828697562217712e-06, -7.4803829193115234e-06, -7.1320682764053345e-06, -6.7837536334991455e-06, -6.4354389905929565e-06, -6.087124347686768e-06, -5.738809704780579e-06, -5.39049506187439e-06, -5.042180418968201e-06, -4.693865776062012e-06, -4.345551133155823e-06, -3.997236490249634e-06, -3.648921847343445e-06, -3.300607204437256e-06, -2.952292561531067e-06, -2.603977918624878e-06, -2.255663275718689e-06, -1.9073486328125e-06, -1.559033989906311e-06, -1.210719347000122e-06, -8.624047040939331e-07, -5.140900611877441e-07, -1.6577541828155518e-07, 1.825392246246338e-07, 5.308538675308228e-07, 8.791685104370117e-07, 1.2274831533432007e-06, 1.5757977962493896e-06, 1.9241124391555786e-06, 2.2724270820617676e-06, 2.6207417249679565e-06, 2.9690563678741455e-06, 3.3173710107803345e-06, 3.6656856536865234e-06, 4.014000296592712e-06, 4.362314939498901e-06, 4.71062958240509e-06, 5.058944225311279e-06, 5.407258868217468e-06, 5.755573511123657e-06, 6.103888154029846e-06, 6.452202796936035e-06, 6.800517439842224e-06, 7.148832082748413e-06, 7.497146725654602e-06, 7.845461368560791e-06, 8.19377601146698e-06, 8.542090654373169e-06, 8.890405297279358e-06, 9.238719940185547e-06]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 8.0, 7.0, 15.0, 33.0, 47.0, 79.0, 161.0, 305.0, 683.0, 2199.0, 10343.0, 83600.0, 612933.0, 300501.0, 30568.0, 4817.0, 1282.0, 458.0, 221.0, 125.0, 70.0, 30.0, 28.0, 16.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03851318359375, -0.03712654113769531, -0.035739898681640625, -0.03435325622558594, -0.03296661376953125, -0.03157997131347656, -0.030193328857421875, -0.028806686401367188, -0.0274200439453125, -0.026033401489257812, -0.024646759033203125, -0.023260116577148438, -0.02187347412109375, -0.020486831665039062, -0.019100189208984375, -0.017713546752929688, -0.016326904296875, -0.014940261840820312, -0.013553619384765625, -0.012166976928710938, -0.01078033447265625, -0.009393692016601562, -0.008007049560546875, -0.0066204071044921875, -0.0052337646484375, -0.0038471221923828125, -0.002460479736328125, -0.0010738372802734375, 0.00031280517578125, 0.0016994476318359375, 0.003086090087890625, 0.0044727325439453125, 0.005859375, 0.0072460174560546875, 0.008632659912109375, 0.010019302368164062, 0.01140594482421875, 0.012792587280273438, 0.014179229736328125, 0.015565872192382812, 0.0169525146484375, 0.018339157104492188, 0.019725799560546875, 0.021112442016601562, 0.02249908447265625, 0.023885726928710938, 0.025272369384765625, 0.026659011840820312, 0.028045654296875, 0.029432296752929688, 0.030818939208984375, 0.03220558166503906, 0.03359222412109375, 0.03497886657714844, 0.036365509033203125, 0.03775215148925781, 0.0391387939453125, 0.04052543640136719, 0.041912078857421875, 0.04329872131347656, 0.04468536376953125, 0.04607200622558594, 0.047458648681640625, 0.04884529113769531, 0.05023193359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 7.0, 13.0, 17.0, 25.0, 20.0, 31.0, 51.0, 55.0, 54.0, 50.0, 71.0, 70.0, 71.0, 61.0, 72.0, 53.0, 65.0, 49.0, 39.0, 30.0, 26.0, 17.0, 16.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00951385498046875, -0.009265720844268799, -0.009017586708068848, -0.008769452571868896, -0.008521318435668945, -0.008273184299468994, -0.008025050163269043, -0.007776916027069092, -0.007528781890869141, -0.0072806477546691895, -0.007032513618469238, -0.006784379482269287, -0.006536245346069336, -0.006288111209869385, -0.006039977073669434, -0.005791842937469482, -0.005543708801269531, -0.00529557466506958, -0.005047440528869629, -0.004799306392669678, -0.0045511722564697266, -0.004303038120269775, -0.004054903984069824, -0.003806769847869873, -0.003558635711669922, -0.0033105015754699707, -0.0030623674392700195, -0.0028142333030700684, -0.002566099166870117, -0.002317965030670166, -0.002069830894470215, -0.0018216967582702637, -0.0015735626220703125, -0.0013254284858703613, -0.0010772943496704102, -0.000829160213470459, -0.0005810260772705078, -0.00033289194107055664, -8.475780487060547e-05, 0.0001633763313293457, 0.0004115104675292969, 0.000659644603729248, 0.0009077787399291992, 0.0011559128761291504, 0.0014040470123291016, 0.0016521811485290527, 0.001900315284729004, 0.002148449420928955, 0.0023965835571289062, 0.0026447176933288574, 0.0028928518295288086, 0.0031409859657287598, 0.003389120101928711, 0.003637254238128662, 0.0038853883743286133, 0.0041335225105285645, 0.004381656646728516, 0.004629790782928467, 0.004877924919128418, 0.005126059055328369, 0.00537419319152832, 0.0056223273277282715, 0.005870461463928223, 0.006118595600128174, 0.006366729736328125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 19.0, 40.0, 99.0, 220.0, 342.0, 159.0, 66.0, 28.0, 10.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6818559169769287, -0.6402559280395508, -0.5986559391021729, -0.5570559501647949, -0.515455961227417, -0.4738559424877167, -0.43225592374801636, -0.3906559348106384, -0.3490559458732605, -0.30745595693588257, -0.26585596799850464, -0.22425594925880432, -0.1826559603214264, -0.14105597138404846, -0.09945596754550934, -0.057855963706970215, -0.016255974769592285, 0.02534402161836624, 0.06694401800632477, 0.1085440143942833, 0.15014401078224182, 0.19174399971961975, 0.23334400355815887, 0.274944007396698, 0.3165439963340759, 0.35814398527145386, 0.3997439742088318, 0.4413439929485321, 0.48294398188591003, 0.5245440006256104, 0.5661439895629883, 0.6077439785003662, 0.6493438482284546, 0.6909438371658325, 0.7325438261032104, 0.7741438150405884, 0.8157438039779663, 0.8573437929153442, 0.8989438414573669, 0.9405438303947449, 0.9821438193321228, 1.0237438678741455, 1.0653438568115234, 1.1069438457489014, 1.1485438346862793, 1.1901438236236572, 1.2317438125610352, 1.273343801498413, 1.314943790435791, 1.356543779373169, 1.3981437683105469, 1.4397437572479248, 1.4813437461853027, 1.5229437351226807, 1.5645437240600586, 1.6061437129974365, 1.6477437019348145, 1.6893436908721924, 1.7309436798095703, 1.7725436687469482, 1.8141436576843262, 1.855743646621704, 1.897343635559082, 1.93894362449646, 1.9805437326431274]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 9.0, 11.0, 21.0, 20.0, 31.0, 46.0, 51.0, 61.0, 67.0, 77.0, 94.0, 85.0, 70.0, 74.0, 77.0, 46.0, 38.0, 36.0, 28.0, 23.0, 13.0, 4.0, 7.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6080535054206848, -0.5916590690612793, -0.575264573097229, -0.5588701367378235, -0.542475700378418, -0.5260812044143677, -0.5096867680549622, -0.49329233169555664, -0.47689786553382874, -0.46050339937210083, -0.4441089630126953, -0.4277144968509674, -0.4113200306892395, -0.394925594329834, -0.3785311281681061, -0.3621366620063782, -0.34574222564697266, -0.32934775948524475, -0.31295332312583923, -0.29655885696411133, -0.2801644206047058, -0.2637699544429779, -0.24737548828125, -0.2309810370206833, -0.21458658576011658, -0.19819213449954987, -0.18179768323898315, -0.16540321707725525, -0.14900876581668854, -0.13261431455612183, -0.11621985584497452, -0.09982539713382721, -0.08343100547790527, -0.06703655421733856, -0.050642095506191254, -0.034247640520334244, -0.017853185534477234, -0.0014587342739105225, 0.014935724437236786, 0.031330183148384094, 0.047724634408950806, 0.06411908566951752, 0.08051354438066483, 0.09690800309181213, 0.11330245435237885, 0.12969690561294556, 0.14609137177467346, 0.16248582303524017, 0.17888027429580688, 0.1952747255563736, 0.2116691768169403, 0.2280636429786682, 0.24445809423923492, 0.26085254549980164, 0.27724701166152954, 0.29364144802093506, 0.31003591418266296, 0.32643038034439087, 0.3428248167037964, 0.3592192828655243, 0.3756137490272522, 0.3920081853866577, 0.4084026515483856, 0.4247971177101135, 0.44119155406951904]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 8.0, 12.0, 22.0, 30.0, 44.0, 55.0, 81.0, 115.0, 175.0, 296.0, 464.0, 848.0, 1578.0, 3338.0, 7105.0, 18278.0, 59543.0, 302516.0, 507320.0, 101492.0, 26581.0, 9697.0, 4118.0, 2026.0, 1111.0, 625.0, 332.0, 205.0, 167.0, 113.0, 64.0, 43.0, 44.0, 18.0, 21.0, 12.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.264404296875, -0.2566680908203125, -0.248931884765625, -0.2411956787109375, -0.23345947265625, -0.2257232666015625, -0.217987060546875, -0.2102508544921875, -0.2025146484375, -0.1947784423828125, -0.187042236328125, -0.1793060302734375, -0.17156982421875, -0.1638336181640625, -0.156097412109375, -0.1483612060546875, -0.140625, -0.1328887939453125, -0.125152587890625, -0.1174163818359375, -0.10968017578125, -0.1019439697265625, -0.094207763671875, -0.0864715576171875, -0.0787353515625, -0.0709991455078125, -0.063262939453125, -0.0555267333984375, -0.04779052734375, -0.0400543212890625, -0.032318115234375, -0.0245819091796875, -0.016845703125, -0.0091094970703125, -0.001373291015625, 0.0063629150390625, 0.01409912109375, 0.0218353271484375, 0.029571533203125, 0.0373077392578125, 0.0450439453125, 0.0527801513671875, 0.060516357421875, 0.0682525634765625, 0.07598876953125, 0.0837249755859375, 0.091461181640625, 0.0991973876953125, 0.10693359375, 0.1146697998046875, 0.122406005859375, 0.1301422119140625, 0.13787841796875, 0.1456146240234375, 0.153350830078125, 0.1610870361328125, 0.1688232421875, 0.1765594482421875, 0.184295654296875, 0.1920318603515625, 0.19976806640625, 0.2075042724609375, 0.215240478515625, 0.2229766845703125, 0.230712890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 12.0, 6.0, 5.0, 7.0, 16.0, 19.0, 15.0, 27.0, 45.0, 58.0, 60.0, 65.0, 82.0, 80.0, 77.0, 83.0, 61.0, 54.0, 60.0, 39.0, 36.0, 32.0, 20.0, 16.0, 13.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2177734375, -1.1866302490234375, -1.155487060546875, -1.1243438720703125, -1.09320068359375, -1.0620574951171875, -1.030914306640625, -0.9997711181640625, -0.9686279296875, -0.9374847412109375, -0.906341552734375, -0.8751983642578125, -0.84405517578125, -0.8129119873046875, -0.781768798828125, -0.7506256103515625, -0.719482421875, -0.6883392333984375, -0.657196044921875, -0.6260528564453125, -0.59490966796875, -0.5637664794921875, -0.532623291015625, -0.5014801025390625, -0.4703369140625, -0.4391937255859375, -0.408050537109375, -0.3769073486328125, -0.34576416015625, -0.3146209716796875, -0.283477783203125, -0.2523345947265625, -0.22119140625, -0.1900482177734375, -0.158905029296875, -0.1277618408203125, -0.09661865234375, -0.0654754638671875, -0.034332275390625, -0.0031890869140625, 0.0279541015625, 0.0590972900390625, 0.090240478515625, 0.1213836669921875, 0.15252685546875, 0.1836700439453125, 0.214813232421875, 0.2459564208984375, 0.277099609375, 0.3082427978515625, 0.339385986328125, 0.3705291748046875, 0.40167236328125, 0.4328155517578125, 0.463958740234375, 0.4951019287109375, 0.5262451171875, 0.5573883056640625, 0.588531494140625, 0.6196746826171875, 0.65081787109375, 0.6819610595703125, 0.713104248046875, 0.7442474365234375, 0.775390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 10.0, 11.0, 11.0, 22.0, 26.0, 24.0, 49.0, 59.0, 91.0, 152.0, 231.0, 451.0, 950.0, 3470.0, 27856.0, 835774.0, 167305.0, 8775.0, 1706.0, 663.0, 328.0, 186.0, 117.0, 75.0, 58.0, 41.0, 30.0, 25.0, 15.0, 7.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.562286376953125, -0.54400634765625, -0.525726318359375, -0.5074462890625, -0.489166259765625, -0.47088623046875, -0.452606201171875, -0.434326171875, -0.416046142578125, -0.39776611328125, -0.379486083984375, -0.3612060546875, -0.342926025390625, -0.32464599609375, -0.306365966796875, -0.2880859375, -0.269805908203125, -0.25152587890625, -0.233245849609375, -0.2149658203125, -0.196685791015625, -0.17840576171875, -0.160125732421875, -0.141845703125, -0.123565673828125, -0.10528564453125, -0.087005615234375, -0.0687255859375, -0.050445556640625, -0.03216552734375, -0.013885498046875, 0.00439453125, 0.022674560546875, 0.04095458984375, 0.059234619140625, 0.0775146484375, 0.095794677734375, 0.11407470703125, 0.132354736328125, 0.150634765625, 0.168914794921875, 0.18719482421875, 0.205474853515625, 0.2237548828125, 0.242034912109375, 0.26031494140625, 0.278594970703125, 0.296875, 0.315155029296875, 0.33343505859375, 0.351715087890625, 0.3699951171875, 0.388275146484375, 0.40655517578125, 0.424835205078125, 0.443115234375, 0.461395263671875, 0.47967529296875, 0.497955322265625, 0.5162353515625, 0.534515380859375, 0.55279541015625, 0.571075439453125, 0.58935546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 3.0, 9.0, 10.0, 15.0, 19.0, 24.0, 28.0, 30.0, 24.0, 47.0, 53.0, 56.0, 54.0, 46.0, 40.0, 52.0, 46.0, 49.0, 50.0, 42.0, 50.0, 41.0, 24.0, 26.0, 18.0, 22.0, 18.0, 12.0, 14.0, 13.0, 11.0, 9.0, 13.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.684356689453125, -0.65924072265625, -0.634124755859375, -0.6090087890625, -0.583892822265625, -0.55877685546875, -0.533660888671875, -0.508544921875, -0.483428955078125, -0.45831298828125, -0.433197021484375, -0.4080810546875, -0.382965087890625, -0.35784912109375, -0.332733154296875, -0.3076171875, -0.282501220703125, -0.25738525390625, -0.232269287109375, -0.2071533203125, -0.182037353515625, -0.15692138671875, -0.131805419921875, -0.106689453125, -0.081573486328125, -0.05645751953125, -0.031341552734375, -0.0062255859375, 0.018890380859375, 0.04400634765625, 0.069122314453125, 0.09423828125, 0.119354248046875, 0.14447021484375, 0.169586181640625, 0.1947021484375, 0.219818115234375, 0.24493408203125, 0.270050048828125, 0.295166015625, 0.320281982421875, 0.34539794921875, 0.370513916015625, 0.3956298828125, 0.420745849609375, 0.44586181640625, 0.470977783203125, 0.49609375, 0.521209716796875, 0.54632568359375, 0.571441650390625, 0.5965576171875, 0.621673583984375, 0.64678955078125, 0.671905517578125, 0.697021484375, 0.722137451171875, 0.74725341796875, 0.772369384765625, 0.7974853515625, 0.822601318359375, 0.84771728515625, 0.872833251953125, 0.89794921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 12.0, 38.0, 93.0, 229.0, 562.0, 2368.0, 52206.0, 981662.0, 9558.0, 1179.0, 340.0, 141.0, 83.0, 33.0, 22.0, 12.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.32645416259765625, -0.3135528564453125, -0.30065155029296875, -0.287750244140625, -0.27484893798828125, -0.2619476318359375, -0.24904632568359375, -0.23614501953125, -0.22324371337890625, -0.2103424072265625, -0.19744110107421875, -0.184539794921875, -0.17163848876953125, -0.1587371826171875, -0.14583587646484375, -0.1329345703125, -0.12003326416015625, -0.1071319580078125, -0.09423065185546875, -0.081329345703125, -0.06842803955078125, -0.0555267333984375, -0.04262542724609375, -0.02972412109375, -0.01682281494140625, -0.0039215087890625, 0.00897979736328125, 0.021881103515625, 0.03478240966796875, 0.0476837158203125, 0.06058502197265625, 0.073486328125, 0.08638763427734375, 0.0992889404296875, 0.11219024658203125, 0.125091552734375, 0.13799285888671875, 0.1508941650390625, 0.16379547119140625, 0.17669677734375, 0.18959808349609375, 0.2024993896484375, 0.21540069580078125, 0.228302001953125, 0.24120330810546875, 0.2541046142578125, 0.26700592041015625, 0.2799072265625, 0.29280853271484375, 0.3057098388671875, 0.31861114501953125, 0.331512451171875, 0.34441375732421875, 0.3573150634765625, 0.37021636962890625, 0.38311767578125, 0.39601898193359375, 0.4089202880859375, 0.42182159423828125, 0.434722900390625, 0.44762420654296875, 0.4605255126953125, 0.47342681884765625, 0.486328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 4.0, 21.0, 20.0, 43.0, 96.0, 163.0, 231.0, 168.0, 108.0, 53.0, 31.0, 23.0, 9.0, 6.0, 1.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1604042053222656e-05, -4.040449857711792e-05, -3.9204955101013184e-05, -3.800541162490845e-05, -3.680586814880371e-05, -3.5606324672698975e-05, -3.440678119659424e-05, -3.32072377204895e-05, -3.2007694244384766e-05, -3.080815076828003e-05, -2.9608607292175293e-05, -2.8409063816070557e-05, -2.720952033996582e-05, -2.6009976863861084e-05, -2.4810433387756348e-05, -2.361088991165161e-05, -2.2411346435546875e-05, -2.121180295944214e-05, -2.0012259483337402e-05, -1.8812716007232666e-05, -1.761317253112793e-05, -1.6413629055023193e-05, -1.5214085578918457e-05, -1.401454210281372e-05, -1.2814998626708984e-05, -1.1615455150604248e-05, -1.0415911674499512e-05, -9.216368198394775e-06, -8.016824722290039e-06, -6.817281246185303e-06, -5.617737770080566e-06, -4.41819429397583e-06, -3.2186508178710938e-06, -2.0191073417663574e-06, -8.195638656616211e-07, 3.7997961044311523e-07, 1.5795230865478516e-06, 2.779066562652588e-06, 3.978610038757324e-06, 5.1781535148620605e-06, 6.377696990966797e-06, 7.577240467071533e-06, 8.77678394317627e-06, 9.976327419281006e-06, 1.1175870895385742e-05, 1.2375414371490479e-05, 1.3574957847595215e-05, 1.4774501323699951e-05, 1.5974044799804688e-05, 1.7173588275909424e-05, 1.837313175201416e-05, 1.9572675228118896e-05, 2.0772218704223633e-05, 2.197176218032837e-05, 2.3171305656433105e-05, 2.4370849132537842e-05, 2.5570392608642578e-05, 2.6769936084747314e-05, 2.796947956085205e-05, 2.9169023036956787e-05, 3.0368566513061523e-05, 3.156810998916626e-05, 3.2767653465270996e-05, 3.396719694137573e-05, 3.516674041748047e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 15.0, 19.0, 36.0, 103.0, 253.0, 590.0, 2161.0, 16140.0, 945827.0, 77776.0, 4065.0, 974.0, 331.0, 146.0, 56.0, 27.0, 12.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37548828125, -0.36400604248046875, -0.3525238037109375, -0.34104156494140625, -0.329559326171875, -0.31807708740234375, -0.3065948486328125, -0.29511260986328125, -0.28363037109375, -0.27214813232421875, -0.2606658935546875, -0.24918365478515625, -0.237701416015625, -0.22621917724609375, -0.2147369384765625, -0.20325469970703125, -0.1917724609375, -0.18029022216796875, -0.1688079833984375, -0.15732574462890625, -0.145843505859375, -0.13436126708984375, -0.1228790283203125, -0.11139678955078125, -0.09991455078125, -0.08843231201171875, -0.0769500732421875, -0.06546783447265625, -0.053985595703125, -0.04250335693359375, -0.0310211181640625, -0.01953887939453125, -0.008056640625, 0.00342559814453125, 0.0149078369140625, 0.02639007568359375, 0.037872314453125, 0.04935455322265625, 0.0608367919921875, 0.07231903076171875, 0.08380126953125, 0.09528350830078125, 0.1067657470703125, 0.11824798583984375, 0.129730224609375, 0.14121246337890625, 0.1526947021484375, 0.16417694091796875, 0.1756591796875, 0.18714141845703125, 0.1986236572265625, 0.21010589599609375, 0.221588134765625, 0.23307037353515625, 0.2445526123046875, 0.25603485107421875, 0.26751708984375, 0.27899932861328125, 0.2904815673828125, 0.30196380615234375, 0.313446044921875, 0.32492828369140625, 0.3364105224609375, 0.34789276123046875, 0.359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 20.0, 13.0, 30.0, 35.0, 64.0, 75.0, 102.0, 144.0, 136.0, 94.0, 76.0, 48.0, 42.0, 18.0, 18.0, 15.0, 14.0, 8.0, 10.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0614013671875, -0.0595860481262207, -0.057770729064941406, -0.05595541000366211, -0.05414009094238281, -0.052324771881103516, -0.05050945281982422, -0.04869413375854492, -0.046878814697265625, -0.04506349563598633, -0.04324817657470703, -0.041432857513427734, -0.03961753845214844, -0.03780221939086914, -0.035986900329589844, -0.03417158126831055, -0.03235626220703125, -0.030540943145751953, -0.028725624084472656, -0.02691030502319336, -0.025094985961914062, -0.023279666900634766, -0.02146434783935547, -0.019649028778076172, -0.017833709716796875, -0.016018390655517578, -0.014203071594238281, -0.012387752532958984, -0.010572433471679688, -0.00875711441040039, -0.006941795349121094, -0.005126476287841797, -0.0033111572265625, -0.0014958381652832031, 0.00031948089599609375, 0.0021347999572753906, 0.0039501190185546875, 0.005765438079833984, 0.007580757141113281, 0.009396076202392578, 0.011211395263671875, 0.013026714324951172, 0.014842033386230469, 0.016657352447509766, 0.018472671508789062, 0.02028799057006836, 0.022103309631347656, 0.023918628692626953, 0.02573394775390625, 0.027549266815185547, 0.029364585876464844, 0.03117990493774414, 0.03299522399902344, 0.034810543060302734, 0.03662586212158203, 0.03844118118286133, 0.040256500244140625, 0.04207181930541992, 0.04388713836669922, 0.045702457427978516, 0.04751777648925781, 0.04933309555053711, 0.051148414611816406, 0.0529637336730957, 0.054779052734375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 24.0, 49.0, 118.0, 250.0, 294.0, 153.0, 60.0, 25.0, 7.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.325191497802734, -4.2423810958862305, -4.159570693969727, -4.076760292053223, -3.9939498901367188, -3.911139488220215, -3.828329086303711, -3.745518922805786, -3.6627085208892822, -3.5798981189727783, -3.4970877170562744, -3.4142773151397705, -3.3314669132232666, -3.248656749725342, -3.165846347808838, -3.083035945892334, -3.00022554397583, -2.917415142059326, -2.8346047401428223, -2.7517943382263184, -2.6689839363098145, -2.5861735343933105, -2.5033631324768066, -2.420552968978882, -2.337742328643799, -2.254931926727295, -2.172121524810791, -2.089311122894287, -2.006500720977783, -1.9236904382705688, -1.840880036354065, -1.7580697536468506, -1.6752595901489258, -1.5924491882324219, -1.509638786315918, -1.426828384399414, -1.3440181016921997, -1.2612076997756958, -1.178397297859192, -1.0955870151519775, -1.012776494026184, -0.9299660921096802, -0.847155749797821, -0.7643453478813171, -0.681535005569458, -0.5987246036529541, -0.5159142017364502, -0.43310385942459106, -0.35029345750808716, -0.26748308539390564, -0.18467269837856293, -0.10186231136322021, -0.019051939249038696, 0.06375843286514282, 0.14656883478164673, 0.22937917709350586, 0.31218957901000977, 0.3949999511241913, 0.4778103232383728, 0.5606207251548767, 0.6434310674667358, 0.7262414693832397, 0.8090518712997437, 0.8918622136116028, 0.9746726155281067]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 10.0, 8.0, 12.0, 13.0, 13.0, 10.0, 13.0, 23.0, 23.0, 27.0, 29.0, 28.0, 24.0, 30.0, 37.0, 30.0, 32.0, 38.0, 40.0, 42.0, 31.0, 30.0, 31.0, 27.0, 30.0, 32.0, 22.0, 42.0, 43.0, 32.0, 31.0, 15.0, 19.0, 25.0, 11.0, 20.0, 11.0, 9.0, 12.0, 10.0, 10.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.0858317613601685, -1.0538185834884644, -1.0218055248260498, -0.9897923469543457, -0.9577792286872864, -0.925766110420227, -0.893752932548523, -0.8617398142814636, -0.8297266960144043, -0.797713577747345, -0.7657003998756409, -0.7336872816085815, -0.7016741633415222, -0.6696610450744629, -0.6376478672027588, -0.6056347489356995, -0.5736215710639954, -0.541608452796936, -0.5095952749252319, -0.4775821566581726, -0.4455690383911133, -0.41355589032173157, -0.38154274225234985, -0.3495296239852905, -0.3175164759159088, -0.2855033278465271, -0.2534902095794678, -0.22147706151008606, -0.18946392834186554, -0.15745079517364502, -0.1254376471042633, -0.09342451393604279, -0.06141132116317749, -0.029398184269666672, 0.0026149526238441467, 0.034628093242645264, 0.06664122641086578, 0.0986543595790863, 0.13066750764846802, 0.16268064081668854, 0.19469377398490906, 0.22670690715312958, 0.2587200403213501, 0.2907331883907318, 0.3227463364601135, 0.35475945472717285, 0.38677260279655457, 0.4187857508659363, 0.4507988691329956, 0.4828120172023773, 0.514825165271759, 0.5468382835388184, 0.5788514018058777, 0.610864520072937, 0.6428776979446411, 0.6748908162117004, 0.7069039344787598, 0.7389170527458191, 0.7709302306175232, 0.8029433488845825, 0.8349564671516418, 0.8669695854187012, 0.8989827632904053, 0.9309958815574646, 0.9630090594291687]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 12.0, 16.0, 19.0, 26.0, 43.0, 67.0, 80.0, 149.0, 265.0, 564.0, 1018.0, 2368.0, 7524.0, 56850.0, 2650885.0, 1424657.0, 38456.0, 6953.0, 2275.0, 909.0, 469.0, 250.0, 165.0, 75.0, 61.0, 41.0, 31.0, 12.0, 10.0, 6.0, 8.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9794921875, -0.9444122314453125, -0.909332275390625, -0.8742523193359375, -0.83917236328125, -0.8040924072265625, -0.769012451171875, -0.7339324951171875, -0.6988525390625, -0.6637725830078125, -0.628692626953125, -0.5936126708984375, -0.55853271484375, -0.5234527587890625, -0.488372802734375, -0.4532928466796875, -0.418212890625, -0.3831329345703125, -0.348052978515625, -0.3129730224609375, -0.27789306640625, -0.2428131103515625, -0.207733154296875, -0.1726531982421875, -0.1375732421875, -0.1024932861328125, -0.067413330078125, -0.0323333740234375, 0.00274658203125, 0.0378265380859375, 0.072906494140625, 0.1079864501953125, 0.14306640625, 0.1781463623046875, 0.213226318359375, 0.2483062744140625, 0.28338623046875, 0.3184661865234375, 0.353546142578125, 0.3886260986328125, 0.4237060546875, 0.4587860107421875, 0.493865966796875, 0.5289459228515625, 0.56402587890625, 0.5991058349609375, 0.634185791015625, 0.6692657470703125, 0.704345703125, 0.7394256591796875, 0.774505615234375, 0.8095855712890625, 0.84466552734375, 0.8797454833984375, 0.914825439453125, 0.9499053955078125, 0.9849853515625, 1.0200653076171875, 1.055145263671875, 1.0902252197265625, 1.12530517578125, 1.1603851318359375, 1.195465087890625, 1.2305450439453125, 1.265625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 16.0, 19.0, 15.0, 25.0, 36.0, 35.0, 45.0, 73.0, 83.0, 93.0, 91.0, 79.0, 83.0, 74.0, 52.0, 43.0, 35.0, 29.0, 11.0, 22.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0], "bins": [-0.86767578125, -0.8485832214355469, -0.8294906616210938, -0.8103981018066406, -0.7913055419921875, -0.7722129821777344, -0.7531204223632812, -0.7340278625488281, -0.714935302734375, -0.6958427429199219, -0.6767501831054688, -0.6576576232910156, -0.6385650634765625, -0.6194725036621094, -0.6003799438476562, -0.5812873840332031, -0.56219482421875, -0.5431022644042969, -0.5240097045898438, -0.5049171447753906, -0.4858245849609375, -0.4667320251464844, -0.44763946533203125, -0.4285469055175781, -0.409454345703125, -0.3903617858886719, -0.37126922607421875, -0.3521766662597656, -0.3330841064453125, -0.3139915466308594, -0.29489898681640625, -0.2758064270019531, -0.2567138671875, -0.23762130737304688, -0.21852874755859375, -0.19943618774414062, -0.1803436279296875, -0.16125106811523438, -0.14215850830078125, -0.12306594848632812, -0.103973388671875, -0.08488082885742188, -0.06578826904296875, -0.046695709228515625, -0.0276031494140625, -0.008510589599609375, 0.01058197021484375, 0.029674530029296875, 0.04876708984375, 0.06785964965820312, 0.08695220947265625, 0.10604476928710938, 0.1251373291015625, 0.14422988891601562, 0.16332244873046875, 0.18241500854492188, 0.201507568359375, 0.22060012817382812, 0.23969268798828125, 0.2587852478027344, 0.2778778076171875, 0.2969703674316406, 0.31606292724609375, 0.3351554870605469, 0.354248046875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 8.0, 4.0, 6.0, 19.0, 13.0, 19.0, 18.0, 41.0, 54.0, 89.0, 113.0, 190.0, 296.0, 519.0, 940.0, 1721.0, 3747.0, 8977.0, 29249.0, 190095.0, 3418819.0, 471551.0, 45640.0, 12438.0, 4743.0, 2149.0, 1115.0, 636.0, 365.0, 249.0, 154.0, 93.0, 66.0, 47.0, 24.0, 27.0, 18.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61572265625, -0.5942306518554688, -0.5727386474609375, -0.5512466430664062, -0.529754638671875, -0.5082626342773438, -0.4867706298828125, -0.46527862548828125, -0.44378662109375, -0.42229461669921875, -0.4008026123046875, -0.37931060791015625, -0.357818603515625, -0.33632659912109375, -0.3148345947265625, -0.29334259033203125, -0.2718505859375, -0.25035858154296875, -0.2288665771484375, -0.20737457275390625, -0.185882568359375, -0.16439056396484375, -0.1428985595703125, -0.12140655517578125, -0.09991455078125, -0.07842254638671875, -0.0569305419921875, -0.03543853759765625, -0.013946533203125, 0.00754547119140625, 0.0290374755859375, 0.05052947998046875, 0.072021484375, 0.09351348876953125, 0.1150054931640625, 0.13649749755859375, 0.157989501953125, 0.17948150634765625, 0.2009735107421875, 0.22246551513671875, 0.24395751953125, 0.26544952392578125, 0.2869415283203125, 0.30843353271484375, 0.329925537109375, 0.35141754150390625, 0.3729095458984375, 0.39440155029296875, 0.4158935546875, 0.43738555908203125, 0.4588775634765625, 0.48036956787109375, 0.501861572265625, 0.5233535766601562, 0.5448455810546875, 0.5663375854492188, 0.58782958984375, 0.6093215942382812, 0.6308135986328125, 0.6523056030273438, 0.673797607421875, 0.6952896118164062, 0.7167816162109375, 0.7382736206054688, 0.759765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 3.0, 8.0, 16.0, 20.0, 17.0, 31.0, 49.0, 80.0, 135.0, 286.0, 509.0, 821.0, 886.0, 508.0, 289.0, 144.0, 84.0, 43.0, 32.0, 28.0, 24.0, 13.0, 12.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259521484375, -0.25189781188964844, -0.24427413940429688, -0.2366504669189453, -0.22902679443359375, -0.2214031219482422, -0.21377944946289062, -0.20615577697753906, -0.1985321044921875, -0.19090843200683594, -0.18328475952148438, -0.1756610870361328, -0.16803741455078125, -0.1604137420654297, -0.15279006958007812, -0.14516639709472656, -0.137542724609375, -0.12991905212402344, -0.12229537963867188, -0.11467170715332031, -0.10704803466796875, -0.09942436218261719, -0.09180068969726562, -0.08417701721191406, -0.0765533447265625, -0.06892967224121094, -0.061305999755859375, -0.05368232727050781, -0.04605865478515625, -0.03843498229980469, -0.030811309814453125, -0.023187637329101562, -0.01556396484375, -0.007940292358398438, -0.000316619873046875, 0.0073070526123046875, 0.01493072509765625, 0.022554397583007812, 0.030178070068359375, 0.03780174255371094, 0.0454254150390625, 0.05304908752441406, 0.060672760009765625, 0.06829643249511719, 0.07592010498046875, 0.08354377746582031, 0.09116744995117188, 0.09879112243652344, 0.106414794921875, 0.11403846740722656, 0.12166213989257812, 0.1292858123779297, 0.13690948486328125, 0.1445331573486328, 0.15215682983398438, 0.15978050231933594, 0.1674041748046875, 0.17502784729003906, 0.18265151977539062, 0.1902751922607422, 0.19789886474609375, 0.2055225372314453, 0.21314620971679688, 0.22076988220214844, 0.2283935546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 6.0, 13.0, 16.0, 16.0, 31.0, 37.0, 74.0, 82.0, 100.0, 127.0, 122.0, 103.0, 72.0, 46.0, 50.0, 23.0, 25.0, 15.0, 8.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0084772109985352, -0.9805503487586975, -0.9526234865188599, -0.9246966242790222, -0.8967697620391846, -0.8688428997993469, -0.8409160375595093, -0.8129891157150269, -0.785062313079834, -0.7571354508399963, -0.7292085886001587, -0.701281726360321, -0.6733548641204834, -0.6454280018806458, -0.6175011396408081, -0.5895742177963257, -0.561647355556488, -0.5337204933166504, -0.5057936310768127, -0.4778667688369751, -0.44993990659713745, -0.4220130443572998, -0.39408615231513977, -0.3661592900753021, -0.3382324278354645, -0.31030556559562683, -0.2823787033557892, -0.25445181131362915, -0.2265249639749527, -0.19859810173511505, -0.1706712245941162, -0.14274436235427856, -0.11481750011444092, -0.08689063787460327, -0.05896376818418503, -0.031036898493766785, -0.003110036253929138, 0.02481682598590851, 0.05274370312690735, 0.080670565366745, 0.10859742760658264, 0.1365242898464203, 0.16445115208625793, 0.19237802922725677, 0.22030489146709442, 0.24823175370693207, 0.2761586308479309, 0.30408549308776855, 0.3320123553276062, 0.35993921756744385, 0.3878660798072815, 0.41579294204711914, 0.4437198042869568, 0.47164666652679443, 0.49957355856895447, 0.5275003910064697, 0.5554273128509521, 0.5833541750907898, 0.6112810373306274, 0.6392078995704651, 0.6671347618103027, 0.6950616240501404, 0.722988486289978, 0.7509154081344604, 0.7788422107696533]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 8.0, 12.0, 15.0, 11.0, 17.0, 17.0, 19.0, 21.0, 34.0, 43.0, 38.0, 52.0, 56.0, 54.0, 55.0, 52.0, 63.0, 48.0, 44.0, 51.0, 43.0, 35.0, 44.0, 30.0, 27.0, 25.0, 14.0, 17.0, 10.0, 16.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7128046154975891, -0.6952500343322754, -0.6776953935623169, -0.6601408123970032, -0.6425862312316895, -0.6250316500663757, -0.6074770092964172, -0.5899224281311035, -0.5723678469657898, -0.5548132658004761, -0.5372586250305176, -0.5197040438652039, -0.5021494626998901, -0.48459485173225403, -0.4670402407646179, -0.4494856595993042, -0.4319310486316681, -0.414376437664032, -0.39682185649871826, -0.37926724553108215, -0.36171266436576843, -0.3441580533981323, -0.3266034722328186, -0.3090488612651825, -0.2914942502975464, -0.2739396393299103, -0.25638505816459656, -0.23883044719696045, -0.22127586603164673, -0.20372125506401062, -0.1861666589975357, -0.1686120629310608, -0.15105748176574707, -0.13350288569927216, -0.11594828963279724, -0.09839368611574173, -0.08083909004926682, -0.0632844939827919, -0.04572989046573639, -0.028175294399261475, -0.01062069833278656, 0.006933899596333504, 0.024488497525453568, 0.04204309731721878, 0.059597693383693695, 0.07715228945016861, 0.09470689296722412, 0.11226148903369904, 0.12981608510017395, 0.14737068116664886, 0.16492527723312378, 0.1824798882007599, 0.2000344693660736, 0.21758908033370972, 0.23514367640018463, 0.25269827246665955, 0.27025288343429565, 0.28780749440193176, 0.3053620755672455, 0.3229166865348816, 0.3404712677001953, 0.3580258786678314, 0.37558048963546753, 0.39313507080078125, 0.41068965196609497]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 21.0, 46.0, 67.0, 133.0, 322.0, 817.0, 2463.0, 10488.0, 285181.0, 726959.0, 16873.0, 3455.0, 1047.0, 345.0, 161.0, 53.0, 39.0, 15.0, 17.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.251220703125, -0.2403564453125, -0.2294921875, -0.2186279296875, -0.207763671875, -0.1968994140625, -0.18603515625, -0.1751708984375, -0.164306640625, -0.1534423828125, -0.142578125, -0.1317138671875, -0.120849609375, -0.1099853515625, -0.09912109375, -0.0882568359375, -0.077392578125, -0.0665283203125, -0.0556640625, -0.0447998046875, -0.033935546875, -0.0230712890625, -0.01220703125, -0.0013427734375, 0.009521484375, 0.0203857421875, 0.03125, 0.0421142578125, 0.052978515625, 0.0638427734375, 0.07470703125, 0.0855712890625, 0.096435546875, 0.1072998046875, 0.1181640625, 0.1290283203125, 0.139892578125, 0.1507568359375, 0.16162109375, 0.1724853515625, 0.183349609375, 0.1942138671875, 0.205078125, 0.2159423828125, 0.226806640625, 0.2376708984375, 0.24853515625, 0.2593994140625, 0.270263671875, 0.2811279296875, 0.2919921875, 0.3028564453125, 0.313720703125, 0.3245849609375, 0.33544921875, 0.3463134765625, 0.357177734375, 0.3680419921875, 0.37890625, 0.3897705078125, 0.400634765625, 0.4114990234375, 0.42236328125, 0.4332275390625, 0.444091796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 7.0, 13.0, 18.0, 14.0, 22.0, 31.0, 45.0, 48.0, 50.0, 57.0, 71.0, 58.0, 72.0, 76.0, 63.0, 59.0, 49.0, 47.0, 31.0, 27.0, 29.0, 21.0, 26.0, 8.0, 8.0, 10.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5206069946289062, -0.5070343017578125, -0.49346160888671875, -0.479888916015625, -0.46631622314453125, -0.4527435302734375, -0.43917083740234375, -0.42559814453125, -0.41202545166015625, -0.3984527587890625, -0.38488006591796875, -0.371307373046875, -0.35773468017578125, -0.3441619873046875, -0.33058929443359375, -0.3170166015625, -0.30344390869140625, -0.2898712158203125, -0.27629852294921875, -0.262725830078125, -0.24915313720703125, -0.2355804443359375, -0.22200775146484375, -0.20843505859375, -0.19486236572265625, -0.1812896728515625, -0.16771697998046875, -0.154144287109375, -0.14057159423828125, -0.1269989013671875, -0.11342620849609375, -0.099853515625, -0.08628082275390625, -0.0727081298828125, -0.05913543701171875, -0.045562744140625, -0.03199005126953125, -0.0184173583984375, -0.00484466552734375, 0.00872802734375, 0.02230072021484375, 0.0358734130859375, 0.04944610595703125, 0.063018798828125, 0.07659149169921875, 0.0901641845703125, 0.10373687744140625, 0.1173095703125, 0.13088226318359375, 0.1444549560546875, 0.15802764892578125, 0.171600341796875, 0.18517303466796875, 0.1987457275390625, 0.21231842041015625, 0.22589111328125, 0.23946380615234375, 0.2530364990234375, 0.26660919189453125, 0.280181884765625, 0.29375457763671875, 0.3073272705078125, 0.32089996337890625, 0.33447265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 17.0, 36.0, 44.0, 79.0, 138.0, 270.0, 490.0, 1053.0, 2365.0, 5984.0, 21542.0, 241268.0, 679652.0, 76626.0, 11759.0, 3910.0, 1640.0, 772.0, 381.0, 205.0, 114.0, 62.0, 37.0, 31.0, 16.0, 15.0, 11.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155029296875, -0.15037155151367188, -0.14571380615234375, -0.14105606079101562, -0.1363983154296875, -0.13174057006835938, -0.12708282470703125, -0.12242507934570312, -0.117767333984375, -0.11310958862304688, -0.10845184326171875, -0.10379409790039062, -0.0991363525390625, -0.09447860717773438, -0.08982086181640625, -0.08516311645507812, -0.08050537109375, -0.07584762573242188, -0.07118988037109375, -0.06653213500976562, -0.0618743896484375, -0.057216644287109375, -0.05255889892578125, -0.047901153564453125, -0.043243408203125, -0.038585662841796875, -0.03392791748046875, -0.029270172119140625, -0.0246124267578125, -0.019954681396484375, -0.01529693603515625, -0.010639190673828125, -0.0059814453125, -0.001323699951171875, 0.00333404541015625, 0.007991790771484375, 0.0126495361328125, 0.017307281494140625, 0.02196502685546875, 0.026622772216796875, 0.031280517578125, 0.035938262939453125, 0.04059600830078125, 0.045253753662109375, 0.0499114990234375, 0.054569244384765625, 0.05922698974609375, 0.06388473510742188, 0.06854248046875, 0.07320022583007812, 0.07785797119140625, 0.08251571655273438, 0.0871734619140625, 0.09183120727539062, 0.09648895263671875, 0.10114669799804688, 0.105804443359375, 0.11046218872070312, 0.11511993408203125, 0.11977767944335938, 0.1244354248046875, 0.12909317016601562, 0.13375091552734375, 0.13840866088867188, 0.14306640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 3.0, 5.0, 7.0, 9.0, 11.0, 18.0, 20.0, 17.0, 24.0, 33.0, 28.0, 34.0, 31.0, 43.0, 44.0, 37.0, 49.0, 52.0, 32.0, 42.0, 41.0, 37.0, 42.0, 38.0, 39.0, 46.0, 31.0, 27.0, 20.0, 19.0, 20.0, 20.0, 10.0, 10.0, 15.0, 6.0, 7.0, 5.0, 5.0, 3.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.49469757080078125, -0.4766998291015625, -0.45870208740234375, -0.440704345703125, -0.42270660400390625, -0.4047088623046875, -0.38671112060546875, -0.36871337890625, -0.35071563720703125, -0.3327178955078125, -0.31472015380859375, -0.296722412109375, -0.27872467041015625, -0.2607269287109375, -0.24272918701171875, -0.2247314453125, -0.20673370361328125, -0.1887359619140625, -0.17073822021484375, -0.152740478515625, -0.13474273681640625, -0.1167449951171875, -0.09874725341796875, -0.08074951171875, -0.06275177001953125, -0.0447540283203125, -0.02675628662109375, -0.008758544921875, 0.00923919677734375, 0.0272369384765625, 0.04523468017578125, 0.063232421875, 0.08123016357421875, 0.0992279052734375, 0.11722564697265625, 0.135223388671875, 0.15322113037109375, 0.1712188720703125, 0.18921661376953125, 0.20721435546875, 0.22521209716796875, 0.2432098388671875, 0.26120758056640625, 0.279205322265625, 0.29720306396484375, 0.3152008056640625, 0.33319854736328125, 0.3511962890625, 0.36919403076171875, 0.3871917724609375, 0.40518951416015625, 0.423187255859375, 0.44118499755859375, 0.4591827392578125, 0.47718048095703125, 0.49517822265625, 0.5131759643554688, 0.5311737060546875, 0.5491714477539062, 0.567169189453125, 0.5851669311523438, 0.6031646728515625, 0.6211624145507812, 0.63916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 4.0, 10.0, 13.0, 16.0, 34.0, 58.0, 77.0, 99.0, 154.0, 243.0, 442.0, 794.0, 1399.0, 2885.0, 6113.0, 14717.0, 41666.0, 147185.0, 438263.0, 277466.0, 75499.0, 23616.0, 9204.0, 3988.0, 1987.0, 1077.0, 551.0, 355.0, 216.0, 140.0, 89.0, 58.0, 30.0, 27.0, 14.0, 12.0, 10.0, 8.0, 8.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0238494873046875, -0.023047685623168945, -0.02224588394165039, -0.021444082260131836, -0.02064228057861328, -0.019840478897094727, -0.019038677215576172, -0.018236875534057617, -0.017435073852539062, -0.016633272171020508, -0.015831470489501953, -0.015029668807983398, -0.014227867126464844, -0.013426065444946289, -0.012624263763427734, -0.01182246208190918, -0.011020660400390625, -0.01021885871887207, -0.009417057037353516, -0.008615255355834961, -0.007813453674316406, -0.0070116519927978516, -0.006209850311279297, -0.005408048629760742, -0.0046062469482421875, -0.003804445266723633, -0.003002643585205078, -0.0022008419036865234, -0.0013990402221679688, -0.0005972385406494141, 0.00020456314086914062, 0.0010063648223876953, 0.00180816650390625, 0.0026099681854248047, 0.0034117698669433594, 0.004213571548461914, 0.005015373229980469, 0.0058171749114990234, 0.006618976593017578, 0.007420778274536133, 0.008222579956054688, 0.009024381637573242, 0.009826183319091797, 0.010627985000610352, 0.011429786682128906, 0.012231588363647461, 0.013033390045166016, 0.01383519172668457, 0.014636993408203125, 0.01543879508972168, 0.016240596771240234, 0.01704239845275879, 0.017844200134277344, 0.0186460018157959, 0.019447803497314453, 0.020249605178833008, 0.021051406860351562, 0.021853208541870117, 0.022655010223388672, 0.023456811904907227, 0.02425861358642578, 0.025060415267944336, 0.02586221694946289, 0.026664018630981445, 0.0274658203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 17.0, 20.0, 29.0, 49.0, 67.0, 90.0, 119.0, 133.0, 127.0, 96.0, 89.0, 62.0, 31.0, 17.0, 14.0, 12.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-05, -1.715961843729019e-05, -1.6437843441963196e-05, -1.57160684466362e-05, -1.4994293451309204e-05, -1.4272518455982208e-05, -1.3550743460655212e-05, -1.2828968465328217e-05, -1.210719347000122e-05, -1.1385418474674225e-05, -1.0663643479347229e-05, -9.941868484020233e-06, -9.220093488693237e-06, -8.498318493366241e-06, -7.776543498039246e-06, -7.05476850271225e-06, -6.332993507385254e-06, -5.611218512058258e-06, -4.889443516731262e-06, -4.167668521404266e-06, -3.4458935260772705e-06, -2.7241185307502747e-06, -2.002343535423279e-06, -1.280568540096283e-06, -5.587935447692871e-07, 1.6298145055770874e-07, 8.847564458847046e-07, 1.6065314412117004e-06, 2.3283064365386963e-06, 3.050081431865692e-06, 3.771856427192688e-06, 4.493631422519684e-06, 5.21540641784668e-06, 5.9371814131736755e-06, 6.658956408500671e-06, 7.380731403827667e-06, 8.102506399154663e-06, 8.824281394481659e-06, 9.546056389808655e-06, 1.026783138513565e-05, 1.0989606380462646e-05, 1.1711381375789642e-05, 1.2433156371116638e-05, 1.3154931366443634e-05, 1.387670636177063e-05, 1.4598481357097626e-05, 1.532025635242462e-05, 1.6042031347751617e-05, 1.6763806343078613e-05, 1.748558133840561e-05, 1.8207356333732605e-05, 1.89291313290596e-05, 1.9650906324386597e-05, 2.0372681319713593e-05, 2.109445631504059e-05, 2.1816231310367584e-05, 2.253800630569458e-05, 2.3259781301021576e-05, 2.3981556296348572e-05, 2.4703331291675568e-05, 2.5425106287002563e-05, 2.614688128232956e-05, 2.6868656277656555e-05, 2.759043127298355e-05, 2.8312206268310547e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 7.0, 6.0, 16.0, 15.0, 26.0, 38.0, 75.0, 103.0, 151.0, 274.0, 459.0, 923.0, 1710.0, 3398.0, 7434.0, 17473.0, 46295.0, 145133.0, 386882.0, 290629.0, 92439.0, 31436.0, 12638.0, 5380.0, 2569.0, 1320.0, 678.0, 385.0, 234.0, 141.0, 85.0, 56.0, 46.0, 30.0, 18.0, 17.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0299530029296875, -0.029139280319213867, -0.028325557708740234, -0.0275118350982666, -0.02669811248779297, -0.025884389877319336, -0.025070667266845703, -0.02425694465637207, -0.023443222045898438, -0.022629499435424805, -0.021815776824951172, -0.02100205421447754, -0.020188331604003906, -0.019374608993530273, -0.01856088638305664, -0.017747163772583008, -0.016933441162109375, -0.016119718551635742, -0.01530599594116211, -0.014492273330688477, -0.013678550720214844, -0.012864828109741211, -0.012051105499267578, -0.011237382888793945, -0.010423660278320312, -0.00960993766784668, -0.008796215057373047, -0.007982492446899414, -0.007168769836425781, -0.0063550472259521484, -0.005541324615478516, -0.004727602005004883, -0.00391387939453125, -0.003100156784057617, -0.0022864341735839844, -0.0014727115631103516, -0.0006589889526367188, 0.00015473365783691406, 0.0009684562683105469, 0.0017821788787841797, 0.0025959014892578125, 0.0034096240997314453, 0.004223346710205078, 0.005037069320678711, 0.005850791931152344, 0.0066645145416259766, 0.007478237152099609, 0.008291959762573242, 0.009105682373046875, 0.009919404983520508, 0.01073312759399414, 0.011546850204467773, 0.012360572814941406, 0.013174295425415039, 0.013988018035888672, 0.014801740646362305, 0.015615463256835938, 0.01642918586730957, 0.017242908477783203, 0.018056631088256836, 0.01887035369873047, 0.0196840763092041, 0.020497798919677734, 0.021311521530151367, 0.022125244140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 5.0, 8.0, 11.0, 19.0, 17.0, 17.0, 23.0, 35.0, 33.0, 51.0, 49.0, 52.0, 71.0, 65.0, 59.0, 61.0, 60.0, 60.0, 46.0, 53.0, 31.0, 27.0, 33.0, 19.0, 12.0, 6.0, 10.0, 12.0, 7.0, 12.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0081787109375, -0.007954597473144531, -0.0077304840087890625, -0.007506370544433594, -0.007282257080078125, -0.007058143615722656, -0.0068340301513671875, -0.006609916687011719, -0.00638580322265625, -0.006161689758300781, -0.0059375762939453125, -0.005713462829589844, -0.005489349365234375, -0.005265235900878906, -0.0050411224365234375, -0.004817008972167969, -0.0045928955078125, -0.004368782043457031, -0.0041446685791015625, -0.003920555114746094, -0.003696441650390625, -0.0034723281860351562, -0.0032482147216796875, -0.0030241012573242188, -0.00279998779296875, -0.0025758743286132812, -0.0023517608642578125, -0.0021276473999023438, -0.001903533935546875, -0.0016794204711914062, -0.0014553070068359375, -0.0012311935424804688, -0.001007080078125, -0.0007829666137695312, -0.0005588531494140625, -0.00033473968505859375, -0.000110626220703125, 0.00011348724365234375, 0.0003376007080078125, 0.0005617141723632812, 0.00078582763671875, 0.0010099411010742188, 0.0012340545654296875, 0.0014581680297851562, 0.001682281494140625, 0.0019063949584960938, 0.0021305084228515625, 0.0023546218872070312, 0.0025787353515625, 0.0028028488159179688, 0.0030269622802734375, 0.0032510757446289062, 0.003475189208984375, 0.0036993026733398438, 0.0039234161376953125, 0.004147529602050781, 0.00437164306640625, 0.004595756530761719, 0.0048198699951171875, 0.005043983459472656, 0.005268096923828125, 0.005492210388183594, 0.0057163238525390625, 0.005940437316894531, 0.00616455078125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 13.0, 8.0, 21.0, 39.0, 71.0, 107.0, 187.0, 189.0, 156.0, 80.0, 39.0, 39.0, 19.0, 12.0, 4.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5792648196220398, -0.5532782077789307, -0.5272916555404663, -0.5013050436973572, -0.47531846165657043, -0.4493318796157837, -0.42334526777267456, -0.3973586857318878, -0.3713721036911011, -0.34538552165031433, -0.3193989396095276, -0.29341232776641846, -0.2674257457256317, -0.24143916368484497, -0.21545256674289703, -0.1894659698009491, -0.16347938776016235, -0.1374928057193756, -0.11150620877742767, -0.08551961928606033, -0.05953302979469299, -0.03354644775390625, -0.007559850811958313, 0.018426746129989624, 0.04441332817077637, 0.07039991766214371, 0.09638650715351105, 0.12237309664487839, 0.14835968613624573, 0.17434626817703247, 0.2003328651189804, 0.22631946206092834, 0.2523059844970703, 0.27829256653785706, 0.3042791485786438, 0.33026576042175293, 0.3562523424625397, 0.3822389245033264, 0.40822553634643555, 0.4342121183872223, 0.46019870042800903, 0.4861852824687958, 0.5121718645095825, 0.5381584763526917, 0.5641450881958008, 0.5901316404342651, 0.6161182522773743, 0.6421048641204834, 0.6680914163589478, 0.6940780282020569, 0.7200645804405212, 0.7460511922836304, 0.7720377445220947, 0.7980243563652039, 0.824010968208313, 0.8499975204467773, 0.8759841322898865, 0.9019707441329956, 0.92795729637146, 0.9539439082145691, 0.9799305200576782, 1.0059170722961426, 1.031903624534607, 1.0578902959823608, 1.0838768482208252]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 21.0, 10.0, 13.0, 15.0, 20.0, 22.0, 22.0, 39.0, 46.0, 54.0, 56.0, 54.0, 63.0, 55.0, 72.0, 51.0, 49.0, 50.0, 46.0, 51.0, 43.0, 22.0, 34.0, 17.0, 17.0, 10.0, 13.0, 9.0, 7.0, 6.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.49656617641448975, -0.48438894748687744, -0.47221168875694275, -0.46003445982933044, -0.44785720109939575, -0.43567997217178345, -0.42350274324417114, -0.41132551431655884, -0.39914825558662415, -0.38697102665901184, -0.37479376792907715, -0.36261653900146484, -0.35043931007385254, -0.33826205134391785, -0.32608482241630554, -0.31390756368637085, -0.30173033475875854, -0.28955310583114624, -0.27737584710121155, -0.26519861817359924, -0.25302135944366455, -0.24084413051605225, -0.22866690158843994, -0.21648965775966644, -0.20431241393089294, -0.19213517010211945, -0.17995792627334595, -0.16778069734573364, -0.15560345351696014, -0.14342620968818665, -0.13124898076057434, -0.11907173693180084, -0.10689452290534973, -0.09471727907657623, -0.08254004269838333, -0.07036280632019043, -0.05818556249141693, -0.04600832238793373, -0.03383108228445053, -0.02165384590625763, -0.00947660207748413, 0.002700638025999069, 0.01487787812948227, 0.02705511823296547, 0.03923235833644867, 0.05140959843993187, 0.06358683854341507, 0.07576407492160797, 0.08794131875038147, 0.10011856257915497, 0.11229579895734787, 0.12447303533554077, 0.13665027916431427, 0.14882752299308777, 0.16100475192070007, 0.17318199574947357, 0.18535923957824707, 0.19753648340702057, 0.20971372723579407, 0.22189095616340637, 0.23406819999217987, 0.24624544382095337, 0.2584226727485657, 0.270599901676178, 0.28277716040611267]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 11.0, 14.0, 15.0, 29.0, 46.0, 70.0, 136.0, 281.0, 533.0, 1722.0, 7495.0, 55191.0, 792732.0, 168249.0, 17247.0, 3116.0, 893.0, 335.0, 199.0, 99.0, 56.0, 37.0, 17.0, 17.0, 5.0, 8.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469970703125, -0.4556083679199219, -0.44124603271484375, -0.4268836975097656, -0.4125213623046875, -0.3981590270996094, -0.38379669189453125, -0.3694343566894531, -0.355072021484375, -0.3407096862792969, -0.32634735107421875, -0.3119850158691406, -0.2976226806640625, -0.2832603454589844, -0.26889801025390625, -0.2545356750488281, -0.24017333984375, -0.22581100463867188, -0.21144866943359375, -0.19708633422851562, -0.1827239990234375, -0.16836166381835938, -0.15399932861328125, -0.13963699340820312, -0.125274658203125, -0.11091232299804688, -0.09654998779296875, -0.08218765258789062, -0.0678253173828125, -0.053462982177734375, -0.03910064697265625, -0.024738311767578125, -0.0103759765625, 0.003986358642578125, 0.01834869384765625, 0.032711029052734375, 0.0470733642578125, 0.061435699462890625, 0.07579803466796875, 0.09016036987304688, 0.104522705078125, 0.11888504028320312, 0.13324737548828125, 0.14760971069335938, 0.1619720458984375, 0.17633438110351562, 0.19069671630859375, 0.20505905151367188, 0.21942138671875, 0.23378372192382812, 0.24814605712890625, 0.2625083923339844, 0.2768707275390625, 0.2912330627441406, 0.30559539794921875, 0.3199577331542969, 0.334320068359375, 0.3486824035644531, 0.36304473876953125, 0.3774070739746094, 0.3917694091796875, 0.4061317443847656, 0.42049407958984375, 0.4348564147949219, 0.44921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 7.0, 17.0, 20.0, 29.0, 23.0, 35.0, 50.0, 61.0, 67.0, 91.0, 78.0, 74.0, 73.0, 65.0, 75.0, 59.0, 38.0, 31.0, 32.0, 15.0, 17.0, 18.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.4087142944335938, -1.3760223388671875, -1.3433303833007812, -1.310638427734375, -1.2779464721679688, -1.2452545166015625, -1.2125625610351562, -1.17987060546875, -1.1471786499023438, -1.1144866943359375, -1.0817947387695312, -1.049102783203125, -1.0164108276367188, -0.9837188720703125, -0.9510269165039062, -0.9183349609375, -0.8856430053710938, -0.8529510498046875, -0.8202590942382812, -0.787567138671875, -0.7548751831054688, -0.7221832275390625, -0.6894912719726562, -0.65679931640625, -0.6241073608398438, -0.5914154052734375, -0.5587234497070312, -0.526031494140625, -0.49333953857421875, -0.4606475830078125, -0.42795562744140625, -0.395263671875, -0.36257171630859375, -0.3298797607421875, -0.29718780517578125, -0.264495849609375, -0.23180389404296875, -0.1991119384765625, -0.16641998291015625, -0.13372802734375, -0.10103607177734375, -0.0683441162109375, -0.03565216064453125, -0.002960205078125, 0.02973175048828125, 0.0624237060546875, 0.09511566162109375, 0.1278076171875, 0.16049957275390625, 0.1931915283203125, 0.22588348388671875, 0.258575439453125, 0.29126739501953125, 0.3239593505859375, 0.35665130615234375, 0.38934326171875, 0.42203521728515625, 0.4547271728515625, 0.48741912841796875, 0.520111083984375, 0.5528030395507812, 0.5854949951171875, 0.6181869506835938, 0.65087890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 9.0, 7.0, 10.0, 13.0, 18.0, 26.0, 28.0, 41.0, 43.0, 71.0, 111.0, 202.0, 396.0, 987.0, 17418.0, 1006284.0, 20733.0, 1128.0, 403.0, 199.0, 119.0, 56.0, 62.0, 36.0, 36.0, 19.0, 15.0, 16.0, 22.0, 17.0, 2.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.92724609375, -0.8958358764648438, -0.8644256591796875, -0.8330154418945312, -0.801605224609375, -0.7701950073242188, -0.7387847900390625, -0.7073745727539062, -0.67596435546875, -0.6445541381835938, -0.6131439208984375, -0.5817337036132812, -0.550323486328125, -0.5189132690429688, -0.4875030517578125, -0.45609283447265625, -0.4246826171875, -0.39327239990234375, -0.3618621826171875, -0.33045196533203125, -0.299041748046875, -0.26763153076171875, -0.2362213134765625, -0.20481109619140625, -0.17340087890625, -0.14199066162109375, -0.1105804443359375, -0.07917022705078125, -0.047760009765625, -0.01634979248046875, 0.0150604248046875, 0.04647064208984375, 0.077880859375, 0.10929107666015625, 0.1407012939453125, 0.17211151123046875, 0.203521728515625, 0.23493194580078125, 0.2663421630859375, 0.29775238037109375, 0.32916259765625, 0.36057281494140625, 0.3919830322265625, 0.42339324951171875, 0.454803466796875, 0.48621368408203125, 0.5176239013671875, 0.5490341186523438, 0.5804443359375, 0.6118545532226562, 0.6432647705078125, 0.6746749877929688, 0.706085205078125, 0.7374954223632812, 0.7689056396484375, 0.8003158569335938, 0.83172607421875, 0.8631362915039062, 0.8945465087890625, 0.9259567260742188, 0.957366943359375, 0.9887771606445312, 1.0201873779296875, 1.0515975952148438, 1.0830078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 6.0, 6.0, 13.0, 17.0, 10.0, 17.0, 15.0, 21.0, 27.0, 29.0, 40.0, 36.0, 38.0, 42.0, 48.0, 52.0, 40.0, 47.0, 50.0, 38.0, 43.0, 48.0, 43.0, 45.0, 40.0, 16.0, 27.0, 27.0, 23.0, 14.0, 15.0, 10.0, 11.0, 6.0, 6.0, 5.0, 5.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7054977416992188, -0.6815032958984375, -0.6575088500976562, -0.633514404296875, -0.6095199584960938, -0.5855255126953125, -0.5615310668945312, -0.53753662109375, -0.5135421752929688, -0.4895477294921875, -0.46555328369140625, -0.441558837890625, -0.41756439208984375, -0.3935699462890625, -0.36957550048828125, -0.3455810546875, -0.32158660888671875, -0.2975921630859375, -0.27359771728515625, -0.249603271484375, -0.22560882568359375, -0.2016143798828125, -0.17761993408203125, -0.15362548828125, -0.12963104248046875, -0.1056365966796875, -0.08164215087890625, -0.057647705078125, -0.03365325927734375, -0.0096588134765625, 0.01433563232421875, 0.038330078125, 0.06232452392578125, 0.0863189697265625, 0.11031341552734375, 0.134307861328125, 0.15830230712890625, 0.1822967529296875, 0.20629119873046875, 0.23028564453125, 0.25428009033203125, 0.2782745361328125, 0.30226898193359375, 0.326263427734375, 0.35025787353515625, 0.3742523193359375, 0.39824676513671875, 0.4222412109375, 0.44623565673828125, 0.4702301025390625, 0.49422454833984375, 0.518218994140625, 0.5422134399414062, 0.5662078857421875, 0.5902023315429688, 0.61419677734375, 0.6381912231445312, 0.6621856689453125, 0.6861801147460938, 0.710174560546875, 0.7341690063476562, 0.7581634521484375, 0.7821578979492188, 0.80615234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 13.0, 9.0, 17.0, 24.0, 39.0, 71.0, 84.0, 114.0, 239.0, 407.0, 854.0, 1944.0, 7562.0, 98039.0, 889123.0, 42146.0, 4755.0, 1521.0, 697.0, 367.0, 201.0, 115.0, 57.0, 42.0, 37.0, 16.0, 12.0, 10.0, 0.0, 6.0, 6.0, 5.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.279296875, -0.2720165252685547, -0.2647361755371094, -0.25745582580566406, -0.25017547607421875, -0.24289512634277344, -0.23561477661132812, -0.2283344268798828, -0.2210540771484375, -0.2137737274169922, -0.20649337768554688, -0.19921302795410156, -0.19193267822265625, -0.18465232849121094, -0.17737197875976562, -0.1700916290283203, -0.162811279296875, -0.1555309295654297, -0.14825057983398438, -0.14097023010253906, -0.13368988037109375, -0.12640953063964844, -0.11912918090820312, -0.11184883117675781, -0.1045684814453125, -0.09728813171386719, -0.09000778198242188, -0.08272743225097656, -0.07544708251953125, -0.06816673278808594, -0.060886383056640625, -0.05360603332519531, -0.04632568359375, -0.03904533386230469, -0.031764984130859375, -0.024484634399414062, -0.01720428466796875, -0.009923934936523438, -0.002643585205078125, 0.0046367645263671875, 0.0119171142578125, 0.019197463989257812, 0.026477813720703125, 0.03375816345214844, 0.04103851318359375, 0.04831886291503906, 0.055599212646484375, 0.06287956237792969, 0.070159912109375, 0.07744026184082031, 0.08472061157226562, 0.09200096130371094, 0.09928131103515625, 0.10656166076660156, 0.11384201049804688, 0.12112236022949219, 0.1284027099609375, 0.1356830596923828, 0.14296340942382812, 0.15024375915527344, 0.15752410888671875, 0.16480445861816406, 0.17208480834960938, 0.1793651580810547, 0.1866455078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 13.0, 31.0, 129.0, 648.0, 137.0, 37.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.226799011230469e-05, -8.87848436832428e-05, -8.530169725418091e-05, -8.181855082511902e-05, -7.833540439605713e-05, -7.485225796699524e-05, -7.136911153793335e-05, -6.788596510887146e-05, -6.440281867980957e-05, -6.091967225074768e-05, -5.743652582168579e-05, -5.39533793926239e-05, -5.047023296356201e-05, -4.698708653450012e-05, -4.350394010543823e-05, -4.002079367637634e-05, -3.653764724731445e-05, -3.3054500818252563e-05, -2.9571354389190674e-05, -2.6088207960128784e-05, -2.2605061531066895e-05, -1.9121915102005005e-05, -1.5638768672943115e-05, -1.2155622243881226e-05, -8.672475814819336e-06, -5.189329385757446e-06, -1.7061829566955566e-06, 1.776963472366333e-06, 5.260109901428223e-06, 8.743256330490112e-06, 1.2226402759552002e-05, 1.570954918861389e-05, 1.919269561767578e-05, 2.267584204673767e-05, 2.615898847579956e-05, 2.964213490486145e-05, 3.312528133392334e-05, 3.660842776298523e-05, 4.009157419204712e-05, 4.357472062110901e-05, 4.70578670501709e-05, 5.054101347923279e-05, 5.402415990829468e-05, 5.750730633735657e-05, 6.099045276641846e-05, 6.447359919548035e-05, 6.795674562454224e-05, 7.143989205360413e-05, 7.492303848266602e-05, 7.84061849117279e-05, 8.18893313407898e-05, 8.537247776985168e-05, 8.885562419891357e-05, 9.233877062797546e-05, 9.582191705703735e-05, 9.930506348609924e-05, 0.00010278820991516113, 0.00010627135634422302, 0.00010975450277328491, 0.0001132376492023468, 0.00011672079563140869, 0.00012020394206047058, 0.00012368708848953247, 0.00012717023491859436, 0.00013065338134765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 5.0, 2.0, 5.0, 12.0, 27.0, 17.0, 32.0, 35.0, 47.0, 50.0, 100.0, 138.0, 179.0, 327.0, 547.0, 1252.0, 3838.0, 24564.0, 801428.0, 199684.0, 11587.0, 2401.0, 962.0, 453.0, 255.0, 159.0, 96.0, 85.0, 63.0, 53.0, 27.0, 26.0, 31.0, 11.0, 7.0, 8.0, 6.0, 11.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.261474609375, -0.2529945373535156, -0.24451446533203125, -0.23603439331054688, -0.2275543212890625, -0.21907424926757812, -0.21059417724609375, -0.20211410522460938, -0.193634033203125, -0.18515396118164062, -0.17667388916015625, -0.16819381713867188, -0.1597137451171875, -0.15123367309570312, -0.14275360107421875, -0.13427352905273438, -0.12579345703125, -0.11731338500976562, -0.10883331298828125, -0.10035324096679688, -0.0918731689453125, -0.08339309692382812, -0.07491302490234375, -0.06643295288085938, -0.057952880859375, -0.049472808837890625, -0.04099273681640625, -0.032512664794921875, -0.0240325927734375, -0.015552520751953125, -0.00707244873046875, 0.001407623291015625, 0.0098876953125, 0.018367767333984375, 0.02684783935546875, 0.035327911376953125, 0.0438079833984375, 0.052288055419921875, 0.06076812744140625, 0.06924819946289062, 0.077728271484375, 0.08620834350585938, 0.09468841552734375, 0.10316848754882812, 0.1116485595703125, 0.12012863159179688, 0.12860870361328125, 0.13708877563476562, 0.14556884765625, 0.15404891967773438, 0.16252899169921875, 0.17100906372070312, 0.1794891357421875, 0.18796920776367188, 0.19644927978515625, 0.20492935180664062, 0.213409423828125, 0.22188949584960938, 0.23036956787109375, 0.23884963989257812, 0.2473297119140625, 0.2558097839355469, 0.26428985595703125, 0.2727699279785156, 0.28125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 3.0, 10.0, 14.0, 15.0, 38.0, 40.0, 73.0, 151.0, 309.0, 119.0, 61.0, 40.0, 35.0, 23.0, 16.0, 11.0, 12.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0845947265625, -0.08189678192138672, -0.07919883728027344, -0.07650089263916016, -0.07380294799804688, -0.0711050033569336, -0.06840705871582031, -0.06570911407470703, -0.06301116943359375, -0.06031322479248047, -0.05761528015136719, -0.054917335510253906, -0.052219390869140625, -0.049521446228027344, -0.04682350158691406, -0.04412555694580078, -0.0414276123046875, -0.03872966766357422, -0.03603172302246094, -0.033333778381347656, -0.030635833740234375, -0.027937889099121094, -0.025239944458007812, -0.02254199981689453, -0.01984405517578125, -0.01714611053466797, -0.014448165893554688, -0.011750221252441406, -0.009052276611328125, -0.006354331970214844, -0.0036563873291015625, -0.0009584426879882812, 0.001739501953125, 0.004437446594238281, 0.0071353912353515625, 0.009833335876464844, 0.012531280517578125, 0.015229225158691406, 0.017927169799804688, 0.02062511444091797, 0.02332305908203125, 0.02602100372314453, 0.028718948364257812, 0.031416893005371094, 0.034114837646484375, 0.036812782287597656, 0.03951072692871094, 0.04220867156982422, 0.0449066162109375, 0.04760456085205078, 0.05030250549316406, 0.053000450134277344, 0.055698394775390625, 0.058396339416503906, 0.06109428405761719, 0.06379222869873047, 0.06649017333984375, 0.06918811798095703, 0.07188606262207031, 0.0745840072631836, 0.07728195190429688, 0.07997989654541016, 0.08267784118652344, 0.08537578582763672, 0.08807373046875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 22.0, 37.0, 156.0, 309.0, 305.0, 112.0, 33.0, 17.0, 11.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6705989837646484, -2.5592265129089355, -2.4478540420532227, -2.3364815711975098, -2.225109100341797, -2.113736629486084, -2.002364158630371, -1.890991449356079, -1.7796189785003662, -1.6682465076446533, -1.5568740367889404, -1.4455015659332275, -1.334128975868225, -1.2227565050125122, -1.1113840341567993, -1.0000114440917969, -0.8886390924453735, -0.7772666215896606, -0.665894091129303, -0.5545216202735901, -0.4431491196155548, -0.33177661895751953, -0.22040414810180664, -0.10903161764144897, 0.002340853214263916, 0.1137133464217186, 0.22508583962917328, 0.33645832538604736, 0.44783082604408264, 0.5592033267021179, 0.6705757975578308, 0.7819483280181885, 0.8933207988739014, 1.0046932697296143, 1.1160657405853271, 1.22743821144104, 1.3388108015060425, 1.4501832723617554, 1.5615557432174683, 1.6729283332824707, 1.7843008041381836, 1.8956732749938965, 2.0070457458496094, 2.1184182167053223, 2.229790687561035, 2.341163158416748, 2.452535629272461, 2.563908338546753, 2.6752805709838867, 2.7866530418395996, 2.8980255126953125, 3.0093979835510254, 3.1207704544067383, 3.232142925262451, 3.343515396118164, 3.454888105392456, 3.566260576248169, 3.677633047103882, 3.7890055179595947, 3.9003779888153076, 4.0117506980896, 4.1231231689453125, 4.234495639801025, 4.345868110656738, 4.457240581512451]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 8.0, 11.0, 6.0, 15.0, 13.0, 15.0, 13.0, 19.0, 16.0, 25.0, 33.0, 21.0, 23.0, 29.0, 43.0, 41.0, 40.0, 45.0, 44.0, 38.0, 37.0, 46.0, 36.0, 52.0, 42.0, 52.0, 40.0, 28.0, 26.0, 24.0, 22.0, 19.0, 12.0, 12.0, 10.0, 9.0, 9.0, 8.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.3646152019500732, -1.324114441871643, -1.283613681793213, -1.2431129217147827, -1.2026121616363525, -1.1621112823486328, -1.1216105222702026, -1.0811097621917725, -1.0406090021133423, -1.000108242034912, -0.9596074819564819, -0.919106662273407, -0.8786059021949768, -0.8381051421165466, -0.7976043224334717, -0.7571035623550415, -0.7166028022766113, -0.6761020421981812, -0.635601282119751, -0.595100462436676, -0.5545997023582458, -0.5140989422798157, -0.4735981523990631, -0.43309736251831055, -0.39259660243988037, -0.3520958423614502, -0.31159505248069763, -0.27109426259994507, -0.2305935025215149, -0.19009272754192352, -0.14959195256233215, -0.10909116268157959, -0.06859052181243896, -0.028089746832847595, 0.012411028146743774, 0.052911803126335144, 0.09341257810592651, 0.13391335308551788, 0.17441412806510925, 0.21491491794586182, 0.255415678024292, 0.29591643810272217, 0.33641722798347473, 0.3769180178642273, 0.41741877794265747, 0.45791953802108765, 0.4984203279018402, 0.5389211177825928, 0.579421877861023, 0.6199226379394531, 0.6604233980178833, 0.7009242177009583, 0.7414249777793884, 0.7819257378578186, 0.8224265575408936, 0.8629273176193237, 0.9034280776977539, 0.9439288377761841, 0.9844295978546143, 1.0249303579330444, 1.0654311180114746, 1.1059319972991943, 1.1464327573776245, 1.1869335174560547, 1.2274342775344849]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 6.0, 11.0, 12.0, 10.0, 21.0, 24.0, 31.0, 40.0, 59.0, 82.0, 120.0, 169.0, 261.0, 447.0, 812.0, 1796.0, 4346.0, 14807.0, 217515.0, 3764200.0, 167604.0, 14011.0, 4076.0, 1648.0, 841.0, 464.0, 256.0, 164.0, 117.0, 85.0, 56.0, 41.0, 29.0, 35.0, 22.0, 18.0, 13.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2919921875, -1.253387451171875, -1.21478271484375, -1.176177978515625, -1.1375732421875, -1.098968505859375, -1.06036376953125, -1.021759033203125, -0.983154296875, -0.944549560546875, -0.90594482421875, -0.867340087890625, -0.8287353515625, -0.790130615234375, -0.75152587890625, -0.712921142578125, -0.67431640625, -0.635711669921875, -0.59710693359375, -0.558502197265625, -0.5198974609375, -0.481292724609375, -0.44268798828125, -0.404083251953125, -0.365478515625, -0.326873779296875, -0.28826904296875, -0.249664306640625, -0.2110595703125, -0.172454833984375, -0.13385009765625, -0.095245361328125, -0.056640625, -0.018035888671875, 0.02056884765625, 0.059173583984375, 0.0977783203125, 0.136383056640625, 0.17498779296875, 0.213592529296875, 0.252197265625, 0.290802001953125, 0.32940673828125, 0.368011474609375, 0.4066162109375, 0.445220947265625, 0.48382568359375, 0.522430419921875, 0.56103515625, 0.599639892578125, 0.63824462890625, 0.676849365234375, 0.7154541015625, 0.754058837890625, 0.79266357421875, 0.831268310546875, 0.869873046875, 0.908477783203125, 0.94708251953125, 0.985687255859375, 1.0242919921875, 1.062896728515625, 1.10150146484375, 1.140106201171875, 1.1787109375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 6.0, 3.0, 9.0, 6.0, 18.0, 18.0, 21.0, 29.0, 36.0, 31.0, 52.0, 60.0, 73.0, 49.0, 67.0, 84.0, 62.0, 74.0, 44.0, 47.0, 52.0, 37.0, 32.0, 26.0, 22.0, 11.0, 19.0, 2.0, 9.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.64208984375, -0.6264572143554688, -0.6108245849609375, -0.5951919555664062, -0.579559326171875, -0.5639266967773438, -0.5482940673828125, -0.5326614379882812, -0.51702880859375, -0.5013961791992188, -0.4857635498046875, -0.47013092041015625, -0.454498291015625, -0.43886566162109375, -0.4232330322265625, -0.40760040283203125, -0.3919677734375, -0.37633514404296875, -0.3607025146484375, -0.34506988525390625, -0.329437255859375, -0.31380462646484375, -0.2981719970703125, -0.28253936767578125, -0.26690673828125, -0.25127410888671875, -0.2356414794921875, -0.22000885009765625, -0.204376220703125, -0.18874359130859375, -0.1731109619140625, -0.15747833251953125, -0.141845703125, -0.12621307373046875, -0.1105804443359375, -0.09494781494140625, -0.079315185546875, -0.06368255615234375, -0.0480499267578125, -0.03241729736328125, -0.01678466796875, -0.00115203857421875, 0.0144805908203125, 0.03011322021484375, 0.045745849609375, 0.06137847900390625, 0.0770111083984375, 0.09264373779296875, 0.1082763671875, 0.12390899658203125, 0.1395416259765625, 0.15517425537109375, 0.170806884765625, 0.18643951416015625, 0.2020721435546875, 0.21770477294921875, 0.23333740234375, 0.24897003173828125, 0.2646026611328125, 0.28023529052734375, 0.295867919921875, 0.31150054931640625, 0.3271331787109375, 0.34276580810546875, 0.3583984375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 10.0, 13.0, 26.0, 51.0, 88.0, 147.0, 308.0, 594.0, 1350.0, 3339.0, 10480.0, 54566.0, 2890345.0, 1182696.0, 36976.0, 8227.0, 2851.0, 1132.0, 504.0, 255.0, 136.0, 66.0, 35.0, 34.0, 14.0, 10.0, 9.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.991363525390625, -0.95928955078125, -0.927215576171875, -0.8951416015625, -0.863067626953125, -0.83099365234375, -0.798919677734375, -0.766845703125, -0.734771728515625, -0.70269775390625, -0.670623779296875, -0.6385498046875, -0.606475830078125, -0.57440185546875, -0.542327880859375, -0.51025390625, -0.478179931640625, -0.44610595703125, -0.414031982421875, -0.3819580078125, -0.349884033203125, -0.31781005859375, -0.285736083984375, -0.253662109375, -0.221588134765625, -0.18951416015625, -0.157440185546875, -0.1253662109375, -0.093292236328125, -0.06121826171875, -0.029144287109375, 0.0029296875, 0.035003662109375, 0.06707763671875, 0.099151611328125, 0.1312255859375, 0.163299560546875, 0.19537353515625, 0.227447509765625, 0.259521484375, 0.291595458984375, 0.32366943359375, 0.355743408203125, 0.3878173828125, 0.419891357421875, 0.45196533203125, 0.484039306640625, 0.51611328125, 0.548187255859375, 0.58026123046875, 0.612335205078125, 0.6444091796875, 0.676483154296875, 0.70855712890625, 0.740631103515625, 0.772705078125, 0.804779052734375, 0.83685302734375, 0.868927001953125, 0.9010009765625, 0.933074951171875, 0.96514892578125, 0.997222900390625, 1.029296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 10.0, 7.0, 10.0, 29.0, 26.0, 53.0, 106.0, 212.0, 430.0, 854.0, 1076.0, 598.0, 313.0, 127.0, 66.0, 39.0, 32.0, 18.0, 12.0, 15.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.18055343627929688, -0.17165374755859375, -0.16275405883789062, -0.1538543701171875, -0.14495468139648438, -0.13605499267578125, -0.12715530395507812, -0.118255615234375, -0.10935592651367188, -0.10045623779296875, -0.09155654907226562, -0.0826568603515625, -0.07375717163085938, -0.06485748291015625, -0.055957794189453125, -0.04705810546875, -0.038158416748046875, -0.02925872802734375, -0.020359039306640625, -0.0114593505859375, -0.002559661865234375, 0.00634002685546875, 0.015239715576171875, 0.024139404296875, 0.033039093017578125, 0.04193878173828125, 0.050838470458984375, 0.0597381591796875, 0.06863784790039062, 0.07753753662109375, 0.08643722534179688, 0.0953369140625, 0.10423660278320312, 0.11313629150390625, 0.12203598022460938, 0.1309356689453125, 0.13983535766601562, 0.14873504638671875, 0.15763473510742188, 0.166534423828125, 0.17543411254882812, 0.18433380126953125, 0.19323348999023438, 0.2021331787109375, 0.21103286743164062, 0.21993255615234375, 0.22883224487304688, 0.23773193359375, 0.24663162231445312, 0.25553131103515625, 0.2644309997558594, 0.2733306884765625, 0.2822303771972656, 0.29113006591796875, 0.3000297546386719, 0.308929443359375, 0.3178291320800781, 0.32672882080078125, 0.3356285095214844, 0.3445281982421875, 0.3534278869628906, 0.36232757568359375, 0.3712272644042969, 0.380126953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 13.0, 11.0, 38.0, 54.0, 84.0, 139.0, 165.0, 182.0, 124.0, 85.0, 43.0, 30.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6381860971450806, -1.5971119403839111, -1.5560376644134521, -1.5149635076522827, -1.4738893508911133, -1.4328151941299438, -1.3917410373687744, -1.3506667613983154, -1.309592604637146, -1.2685184478759766, -1.2274441719055176, -1.1863700151443481, -1.1452958583831787, -1.1042217016220093, -1.0631475448608398, -1.0220732688903809, -0.9809991121292114, -0.939924955368042, -0.8988507390022278, -0.8577765226364136, -0.8167023658752441, -0.7756282091140747, -0.7345539927482605, -0.6934797763824463, -0.6524056196212769, -0.6113314628601074, -0.5702572464942932, -0.529183030128479, -0.48810887336730957, -0.44703468680381775, -0.4059605002403259, -0.3648863136768341, -0.32381224632263184, -0.28273805975914, -0.2416638731956482, -0.20058968663215637, -0.15951550006866455, -0.11844131350517273, -0.07736712694168091, -0.03629294037818909, 0.004781246185302734, 0.045855432748794556, 0.08692961931228638, 0.1280038058757782, 0.16907799243927002, 0.21015217900276184, 0.25122636556625366, 0.2923005521297455, 0.3333747386932373, 0.3744489252567291, 0.41552311182022095, 0.45659729838371277, 0.4976714849472046, 0.538745641708374, 0.5798198580741882, 0.6208940744400024, 0.6619682312011719, 0.7030423879623413, 0.7441166043281555, 0.7851908206939697, 0.8262649774551392, 0.8673391342163086, 0.9084133505821228, 0.949487566947937, 0.9905617237091064]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 2.0, 8.0, 8.0, 17.0, 21.0, 17.0, 23.0, 23.0, 25.0, 35.0, 45.0, 37.0, 46.0, 52.0, 53.0, 53.0, 57.0, 40.0, 48.0, 52.0, 40.0, 33.0, 37.0, 35.0, 35.0, 24.0, 22.0, 22.0, 19.0, 14.0, 14.0, 9.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6263447999954224, -0.6105846166610718, -0.594824492931366, -0.5790643095970154, -0.5633041858673096, -0.547544002532959, -0.5317838191986084, -0.5160236954689026, -0.500263512134552, -0.4845033586025238, -0.4687432050704956, -0.452983021736145, -0.4372228682041168, -0.4214627146720886, -0.40570253133773804, -0.38994237780570984, -0.37418222427368164, -0.35842207074165344, -0.34266191720962524, -0.32690173387527466, -0.31114158034324646, -0.29538142681121826, -0.2796212434768677, -0.2638610899448395, -0.24810093641281128, -0.23234078288078308, -0.2165806144475937, -0.2008204460144043, -0.1850602924823761, -0.1693001389503479, -0.1535399705171585, -0.13777980208396912, -0.12201958894729614, -0.10625942796468735, -0.09049926698207855, -0.07473910599946976, -0.05897894501686096, -0.04321878403425217, -0.02745862305164337, -0.011698462069034576, 0.004061698913574219, 0.019821859896183014, 0.03558202087879181, 0.051342181861400604, 0.0671023428440094, 0.0828625038266182, 0.09862266480922699, 0.11438282579183578, 0.13014298677444458, 0.14590314030647278, 0.16166330873966217, 0.17742347717285156, 0.19318363070487976, 0.20894378423690796, 0.22470395267009735, 0.24046412110328674, 0.25622427463531494, 0.27198442816734314, 0.28774458169937134, 0.3035047650337219, 0.3192649185657501, 0.3350250720977783, 0.3507852554321289, 0.3665454089641571, 0.3823055624961853]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 4.0, 11.0, 14.0, 13.0, 20.0, 25.0, 30.0, 44.0, 57.0, 99.0, 137.0, 228.0, 335.0, 545.0, 866.0, 1433.0, 2443.0, 4292.0, 8508.0, 20000.0, 97579.0, 657721.0, 202157.0, 28562.0, 10774.0, 5346.0, 2912.0, 1604.0, 971.0, 599.0, 376.0, 266.0, 174.0, 120.0, 84.0, 61.0, 35.0, 28.0, 23.0, 17.0, 16.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.231689453125, -0.2245941162109375, -0.217498779296875, -0.2104034423828125, -0.20330810546875, -0.1962127685546875, -0.189117431640625, -0.1820220947265625, -0.1749267578125, -0.1678314208984375, -0.160736083984375, -0.1536407470703125, -0.14654541015625, -0.1394500732421875, -0.132354736328125, -0.1252593994140625, -0.1181640625, -0.1110687255859375, -0.103973388671875, -0.0968780517578125, -0.08978271484375, -0.0826873779296875, -0.075592041015625, -0.0684967041015625, -0.0614013671875, -0.0543060302734375, -0.047210693359375, -0.0401153564453125, -0.03302001953125, -0.0259246826171875, -0.018829345703125, -0.0117340087890625, -0.004638671875, 0.0024566650390625, 0.009552001953125, 0.0166473388671875, 0.02374267578125, 0.0308380126953125, 0.037933349609375, 0.0450286865234375, 0.0521240234375, 0.0592193603515625, 0.066314697265625, 0.0734100341796875, 0.08050537109375, 0.0876007080078125, 0.094696044921875, 0.1017913818359375, 0.10888671875, 0.1159820556640625, 0.123077392578125, 0.1301727294921875, 0.13726806640625, 0.1443634033203125, 0.151458740234375, 0.1585540771484375, 0.1656494140625, 0.1727447509765625, 0.179840087890625, 0.1869354248046875, 0.19403076171875, 0.2011260986328125, 0.208221435546875, 0.2153167724609375, 0.222412109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 6.0, 10.0, 7.0, 8.0, 15.0, 16.0, 18.0, 24.0, 24.0, 26.0, 43.0, 39.0, 50.0, 32.0, 49.0, 51.0, 62.0, 49.0, 51.0, 55.0, 40.0, 46.0, 39.0, 35.0, 39.0, 32.0, 23.0, 13.0, 16.0, 21.0, 11.0, 7.0, 9.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.4248046875, -0.41359710693359375, -0.4023895263671875, -0.39118194580078125, -0.379974365234375, -0.36876678466796875, -0.3575592041015625, -0.34635162353515625, -0.33514404296875, -0.32393646240234375, -0.3127288818359375, -0.30152130126953125, -0.290313720703125, -0.27910614013671875, -0.2678985595703125, -0.25669097900390625, -0.2454833984375, -0.23427581787109375, -0.2230682373046875, -0.21186065673828125, -0.200653076171875, -0.18944549560546875, -0.1782379150390625, -0.16703033447265625, -0.15582275390625, -0.14461517333984375, -0.1334075927734375, -0.12220001220703125, -0.110992431640625, -0.09978485107421875, -0.0885772705078125, -0.07736968994140625, -0.066162109375, -0.05495452880859375, -0.0437469482421875, -0.03253936767578125, -0.021331787109375, -0.01012420654296875, 0.0010833740234375, 0.01229095458984375, 0.02349853515625, 0.03470611572265625, 0.0459136962890625, 0.05712127685546875, 0.068328857421875, 0.07953643798828125, 0.0907440185546875, 0.10195159912109375, 0.1131591796875, 0.12436676025390625, 0.1355743408203125, 0.14678192138671875, 0.157989501953125, 0.16919708251953125, 0.1804046630859375, 0.19161224365234375, 0.20281982421875, 0.21402740478515625, 0.2252349853515625, 0.23644256591796875, 0.247650146484375, 0.25885772705078125, 0.2700653076171875, 0.28127288818359375, 0.29248046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 17.0, 10.0, 25.0, 37.0, 55.0, 69.0, 133.0, 219.0, 393.0, 735.0, 1534.0, 3553.0, 10146.0, 48924.0, 518673.0, 409279.0, 39535.0, 9009.0, 3196.0, 1443.0, 706.0, 383.0, 183.0, 105.0, 56.0, 39.0, 28.0, 26.0, 14.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2452392578125, -0.23894119262695312, -0.23264312744140625, -0.22634506225585938, -0.2200469970703125, -0.21374893188476562, -0.20745086669921875, -0.20115280151367188, -0.194854736328125, -0.18855667114257812, -0.18225860595703125, -0.17596054077148438, -0.1696624755859375, -0.16336441040039062, -0.15706634521484375, -0.15076828002929688, -0.14447021484375, -0.13817214965820312, -0.13187408447265625, -0.12557601928710938, -0.1192779541015625, -0.11297988891601562, -0.10668182373046875, -0.10038375854492188, -0.094085693359375, -0.08778762817382812, -0.08148956298828125, -0.07519149780273438, -0.0688934326171875, -0.06259536743164062, -0.05629730224609375, -0.049999237060546875, -0.043701171875, -0.037403106689453125, -0.03110504150390625, -0.024806976318359375, -0.0185089111328125, -0.012210845947265625, -0.00591278076171875, 0.000385284423828125, 0.006683349609375, 0.012981414794921875, 0.01927947998046875, 0.025577545166015625, 0.0318756103515625, 0.038173675537109375, 0.04447174072265625, 0.050769805908203125, 0.05706787109375, 0.06336593627929688, 0.06966400146484375, 0.07596206665039062, 0.0822601318359375, 0.08855819702148438, 0.09485626220703125, 0.10115432739257812, 0.107452392578125, 0.11375045776367188, 0.12004852294921875, 0.12634658813476562, 0.1326446533203125, 0.13894271850585938, 0.14524078369140625, 0.15153884887695312, 0.1578369140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 2.0, 13.0, 8.0, 13.0, 12.0, 14.0, 11.0, 20.0, 24.0, 23.0, 29.0, 33.0, 60.0, 56.0, 34.0, 51.0, 50.0, 55.0, 61.0, 54.0, 50.0, 43.0, 43.0, 44.0, 29.0, 18.0, 34.0, 25.0, 18.0, 16.0, 14.0, 7.0, 6.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.76513671875, -0.7434234619140625, -0.721710205078125, -0.6999969482421875, -0.67828369140625, -0.6565704345703125, -0.634857177734375, -0.6131439208984375, -0.5914306640625, -0.5697174072265625, -0.548004150390625, -0.5262908935546875, -0.50457763671875, -0.4828643798828125, -0.461151123046875, -0.4394378662109375, -0.417724609375, -0.3960113525390625, -0.374298095703125, -0.3525848388671875, -0.33087158203125, -0.3091583251953125, -0.287445068359375, -0.2657318115234375, -0.2440185546875, -0.2223052978515625, -0.200592041015625, -0.1788787841796875, -0.15716552734375, -0.1354522705078125, -0.113739013671875, -0.0920257568359375, -0.0703125, -0.0485992431640625, -0.026885986328125, -0.0051727294921875, 0.01654052734375, 0.0382537841796875, 0.059967041015625, 0.0816802978515625, 0.1033935546875, 0.1251068115234375, 0.146820068359375, 0.1685333251953125, 0.19024658203125, 0.2119598388671875, 0.233673095703125, 0.2553863525390625, 0.277099609375, 0.2988128662109375, 0.320526123046875, 0.3422393798828125, 0.36395263671875, 0.3856658935546875, 0.407379150390625, 0.4290924072265625, 0.4508056640625, 0.4725189208984375, 0.494232177734375, 0.5159454345703125, 0.53765869140625, 0.5593719482421875, 0.581085205078125, 0.6027984619140625, 0.62451171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 10.0, 7.0, 8.0, 10.0, 17.0, 26.0, 30.0, 48.0, 62.0, 101.0, 164.0, 313.0, 522.0, 1061.0, 2329.0, 5367.0, 14875.0, 49690.0, 190960.0, 483689.0, 215705.0, 55844.0, 16462.0, 6040.0, 2547.0, 1218.0, 596.0, 291.0, 205.0, 121.0, 76.0, 54.0, 26.0, 23.0, 17.0, 20.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037841796875, -0.036806344985961914, -0.03577089309692383, -0.03473544120788574, -0.033699989318847656, -0.03266453742980957, -0.031629085540771484, -0.0305936336517334, -0.029558181762695312, -0.028522729873657227, -0.02748727798461914, -0.026451826095581055, -0.02541637420654297, -0.024380922317504883, -0.023345470428466797, -0.02231001853942871, -0.021274566650390625, -0.02023911476135254, -0.019203662872314453, -0.018168210983276367, -0.01713275909423828, -0.016097307205200195, -0.01506185531616211, -0.014026403427124023, -0.012990951538085938, -0.011955499649047852, -0.010920047760009766, -0.00988459587097168, -0.008849143981933594, -0.007813692092895508, -0.006778240203857422, -0.005742788314819336, -0.00470733642578125, -0.003671884536743164, -0.002636432647705078, -0.0016009807586669922, -0.0005655288696289062, 0.0004699230194091797, 0.0015053749084472656, 0.0025408267974853516, 0.0035762786865234375, 0.0046117305755615234, 0.005647182464599609, 0.006682634353637695, 0.007718086242675781, 0.008753538131713867, 0.009788990020751953, 0.010824441909790039, 0.011859893798828125, 0.012895345687866211, 0.013930797576904297, 0.014966249465942383, 0.01600170135498047, 0.017037153244018555, 0.01807260513305664, 0.019108057022094727, 0.020143508911132812, 0.0211789608001709, 0.022214412689208984, 0.02324986457824707, 0.024285316467285156, 0.025320768356323242, 0.026356220245361328, 0.027391672134399414, 0.0284271240234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 2.0, 2.0, 6.0, 5.0, 11.0, 12.0, 12.0, 20.0, 32.0, 33.0, 35.0, 58.0, 58.0, 86.0, 93.0, 92.0, 75.0, 72.0, 67.0, 58.0, 40.0, 37.0, 21.0, 12.0, 9.0, 6.0, 7.0, 9.0, 10.0, 4.0, 0.0, 4.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7583370208740234e-05, -1.699943095445633e-05, -1.6415491700172424e-05, -1.583155244588852e-05, -1.5247613191604614e-05, -1.466367393732071e-05, -1.4079734683036804e-05, -1.34957954287529e-05, -1.2911856174468994e-05, -1.2327916920185089e-05, -1.1743977665901184e-05, -1.1160038411617279e-05, -1.0576099157333374e-05, -9.992159903049469e-06, -9.408220648765564e-06, -8.824281394481659e-06, -8.240342140197754e-06, -7.656402885913849e-06, -7.072463631629944e-06, -6.488524377346039e-06, -5.904585123062134e-06, -5.320645868778229e-06, -4.736706614494324e-06, -4.152767360210419e-06, -3.5688281059265137e-06, -2.9848888516426086e-06, -2.4009495973587036e-06, -1.8170103430747986e-06, -1.2330710887908936e-06, -6.491318345069885e-07, -6.51925802230835e-08, 5.187466740608215e-07, 1.1026859283447266e-06, 1.6866251826286316e-06, 2.2705644369125366e-06, 2.8545036911964417e-06, 3.4384429454803467e-06, 4.022382199764252e-06, 4.606321454048157e-06, 5.190260708332062e-06, 5.774199962615967e-06, 6.358139216899872e-06, 6.942078471183777e-06, 7.526017725467682e-06, 8.109956979751587e-06, 8.693896234035492e-06, 9.277835488319397e-06, 9.861774742603302e-06, 1.0445713996887207e-05, 1.1029653251171112e-05, 1.1613592505455017e-05, 1.2197531759738922e-05, 1.2781471014022827e-05, 1.3365410268306732e-05, 1.3949349522590637e-05, 1.4533288776874542e-05, 1.5117228031158447e-05, 1.5701167285442352e-05, 1.6285106539726257e-05, 1.6869045794010162e-05, 1.7452985048294067e-05, 1.8036924302577972e-05, 1.8620863556861877e-05, 1.9204802811145782e-05, 1.9788742065429688e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 8.0, 11.0, 13.0, 24.0, 47.0, 58.0, 134.0, 278.0, 593.0, 1586.0, 5555.0, 27507.0, 178956.0, 612335.0, 184712.0, 28257.0, 5689.0, 1620.0, 579.0, 250.0, 139.0, 75.0, 45.0, 21.0, 13.0, 11.0, 3.0, 4.0, 8.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05596923828125, -0.05429887771606445, -0.052628517150878906, -0.05095815658569336, -0.04928779602050781, -0.047617435455322266, -0.04594707489013672, -0.04427671432495117, -0.042606353759765625, -0.04093599319458008, -0.03926563262939453, -0.037595272064208984, -0.03592491149902344, -0.03425455093383789, -0.032584190368652344, -0.030913829803466797, -0.02924346923828125, -0.027573108673095703, -0.025902748107910156, -0.02423238754272461, -0.022562026977539062, -0.020891666412353516, -0.01922130584716797, -0.017550945281982422, -0.015880584716796875, -0.014210224151611328, -0.012539863586425781, -0.010869503021240234, -0.009199142456054688, -0.007528781890869141, -0.005858421325683594, -0.004188060760498047, -0.0025177001953125, -0.0008473396301269531, 0.0008230209350585938, 0.0024933815002441406, 0.0041637420654296875, 0.005834102630615234, 0.007504463195800781, 0.009174823760986328, 0.010845184326171875, 0.012515544891357422, 0.014185905456542969, 0.015856266021728516, 0.017526626586914062, 0.01919698715209961, 0.020867347717285156, 0.022537708282470703, 0.02420806884765625, 0.025878429412841797, 0.027548789978027344, 0.02921915054321289, 0.030889511108398438, 0.032559871673583984, 0.03423023223876953, 0.03590059280395508, 0.037570953369140625, 0.03924131393432617, 0.04091167449951172, 0.042582035064697266, 0.04425239562988281, 0.04592275619506836, 0.047593116760253906, 0.04926347732543945, 0.050933837890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 9.0, 12.0, 9.0, 26.0, 22.0, 66.0, 65.0, 80.0, 124.0, 130.0, 115.0, 99.0, 70.0, 39.0, 40.0, 24.0, 14.0, 18.0, 10.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018798828125, -0.018285751342773438, -0.017772674560546875, -0.017259597778320312, -0.01674652099609375, -0.016233444213867188, -0.015720367431640625, -0.015207290649414062, -0.0146942138671875, -0.014181137084960938, -0.013668060302734375, -0.013154983520507812, -0.01264190673828125, -0.012128829956054688, -0.011615753173828125, -0.011102676391601562, -0.010589599609375, -0.010076522827148438, -0.009563446044921875, -0.009050369262695312, -0.00853729248046875, -0.008024215698242188, -0.007511138916015625, -0.0069980621337890625, -0.0064849853515625, -0.0059719085693359375, -0.005458831787109375, -0.0049457550048828125, -0.00443267822265625, -0.0039196014404296875, -0.003406524658203125, -0.0028934478759765625, -0.00238037109375, -0.0018672943115234375, -0.001354217529296875, -0.0008411407470703125, -0.00032806396484375, 0.0001850128173828125, 0.000698089599609375, 0.0012111663818359375, 0.0017242431640625, 0.0022373199462890625, 0.002750396728515625, 0.0032634735107421875, 0.00377655029296875, 0.0042896270751953125, 0.004802703857421875, 0.0053157806396484375, 0.005828857421875, 0.0063419342041015625, 0.006855010986328125, 0.0073680877685546875, 0.00788116455078125, 0.008394241333007812, 0.008907318115234375, 0.009420394897460938, 0.0099334716796875, 0.010446548461914062, 0.010959625244140625, 0.011472702026367188, 0.01198577880859375, 0.012498855590820312, 0.013011932373046875, 0.013525009155273438, 0.0140380859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 25.0, 51.0, 75.0, 157.0, 222.0, 232.0, 123.0, 53.0, 29.0, 10.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6343822479248047, -0.5987179279327393, -0.5630536079406738, -0.5273893475532532, -0.49172502756118774, -0.4560607075691223, -0.4203964173793793, -0.38473212718963623, -0.3490678071975708, -0.31340348720550537, -0.27773919701576233, -0.2420748919248581, -0.20641058683395386, -0.17074628174304962, -0.13508197665214539, -0.09941767156124115, -0.06375336647033691, -0.028089061379432678, 0.007575243711471558, 0.04323954880237579, 0.07890385389328003, 0.11456815898418427, 0.1502324640750885, 0.18589676916599274, 0.22156107425689697, 0.2572253942489624, 0.29288968443870544, 0.3285539746284485, 0.3642182946205139, 0.39988261461257935, 0.4355469048023224, 0.47121119499206543, 0.5068753957748413, 0.5425397157669067, 0.5782040357589722, 0.6138682961463928, 0.6495326161384583, 0.6851969361305237, 0.7208611965179443, 0.7565255165100098, 0.7921898365020752, 0.8278541564941406, 0.863518476486206, 0.8991827368736267, 0.9348470568656921, 0.9705113768577576, 1.0061756372451782, 1.0418399572372437, 1.077504277229309, 1.1131685972213745, 1.14883291721344, 1.1844972372055054, 1.2201614379882812, 1.2558257579803467, 1.291490077972412, 1.3271543979644775, 1.362818717956543, 1.3984830379486084, 1.4341473579406738, 1.4698116779327393, 1.5054759979248047, 1.5411401987075806, 1.576804518699646, 1.6124688386917114, 1.6481331586837769]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 5.0, 7.0, 8.0, 16.0, 20.0, 28.0, 22.0, 21.0, 31.0, 30.0, 46.0, 50.0, 53.0, 57.0, 53.0, 59.0, 44.0, 58.0, 42.0, 50.0, 39.0, 34.0, 40.0, 35.0, 24.0, 23.0, 20.0, 14.0, 20.0, 14.0, 8.0, 5.0, 4.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0], "bins": [-0.45456960797309875, -0.44338274002075195, -0.43219590187072754, -0.42100903391838074, -0.40982216596603394, -0.39863529801368713, -0.38744843006134033, -0.3762615919113159, -0.3650747239589691, -0.3538878560066223, -0.3427010178565979, -0.3315141499042511, -0.3203272819519043, -0.3091404139995575, -0.2979535460472107, -0.2867667078971863, -0.2755798399448395, -0.2643929719924927, -0.25320613384246826, -0.24201926589012146, -0.23083239793777466, -0.21964552998542786, -0.20845867693424225, -0.19727182388305664, -0.18608495593070984, -0.17489808797836304, -0.16371123492717743, -0.15252438187599182, -0.14133751392364502, -0.13015064597129822, -0.11896379292011261, -0.1077769324183464, -0.0965900719165802, -0.085403211414814, -0.07421635091304779, -0.06302949041128159, -0.05184262990951538, -0.040655769407749176, -0.02946890890598297, -0.018282048404216766, -0.0070951879024505615, 0.004091672599315643, 0.015278533101081848, 0.026465393602848053, 0.03765225410461426, 0.04883911460638046, 0.06002597510814667, 0.07121283560991287, 0.08239969611167908, 0.09358655661344528, 0.10477341711521149, 0.11596027761697769, 0.1271471381187439, 0.1383340060710907, 0.1495208591222763, 0.16070771217346191, 0.17189458012580872, 0.18308144807815552, 0.19426830112934113, 0.20545515418052673, 0.21664202213287354, 0.22782889008522034, 0.23901574313640594, 0.25020259618759155, 0.26138946413993835]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 6.0, 9.0, 6.0, 21.0, 20.0, 43.0, 48.0, 77.0, 147.0, 315.0, 661.0, 1790.0, 5842.0, 26897.0, 195639.0, 715486.0, 81559.0, 14204.0, 3537.0, 1170.0, 518.0, 230.0, 121.0, 86.0, 45.0, 29.0, 14.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55615234375, -0.5399398803710938, -0.5237274169921875, -0.5075149536132812, -0.491302490234375, -0.47509002685546875, -0.4588775634765625, -0.44266510009765625, -0.42645263671875, -0.41024017333984375, -0.3940277099609375, -0.37781524658203125, -0.361602783203125, -0.34539031982421875, -0.3291778564453125, -0.31296539306640625, -0.2967529296875, -0.28054046630859375, -0.2643280029296875, -0.24811553955078125, -0.231903076171875, -0.21569061279296875, -0.1994781494140625, -0.18326568603515625, -0.16705322265625, -0.15084075927734375, -0.1346282958984375, -0.11841583251953125, -0.102203369140625, -0.08599090576171875, -0.0697784423828125, -0.05356597900390625, -0.037353515625, -0.02114105224609375, -0.0049285888671875, 0.01128387451171875, 0.027496337890625, 0.04370880126953125, 0.0599212646484375, 0.07613372802734375, 0.09234619140625, 0.10855865478515625, 0.1247711181640625, 0.14098358154296875, 0.157196044921875, 0.17340850830078125, 0.1896209716796875, 0.20583343505859375, 0.2220458984375, 0.23825836181640625, 0.2544708251953125, 0.27068328857421875, 0.286895751953125, 0.30310821533203125, 0.3193206787109375, 0.33553314208984375, 0.35174560546875, 0.36795806884765625, 0.3841705322265625, 0.40038299560546875, 0.416595458984375, 0.43280792236328125, 0.4490203857421875, 0.46523284912109375, 0.4814453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 8.0, 19.0, 25.0, 31.0, 34.0, 38.0, 59.0, 66.0, 85.0, 85.0, 76.0, 96.0, 75.0, 60.0, 51.0, 45.0, 35.0, 27.0, 21.0, 23.0, 9.0, 8.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.3680572509765625, -1.335723876953125, -1.3033905029296875, -1.27105712890625, -1.2387237548828125, -1.206390380859375, -1.1740570068359375, -1.1417236328125, -1.1093902587890625, -1.077056884765625, -1.0447235107421875, -1.01239013671875, -0.9800567626953125, -0.947723388671875, -0.9153900146484375, -0.883056640625, -0.8507232666015625, -0.818389892578125, -0.7860565185546875, -0.75372314453125, -0.7213897705078125, -0.689056396484375, -0.6567230224609375, -0.6243896484375, -0.5920562744140625, -0.559722900390625, -0.5273895263671875, -0.49505615234375, -0.4627227783203125, -0.430389404296875, -0.3980560302734375, -0.36572265625, -0.3333892822265625, -0.301055908203125, -0.2687225341796875, -0.23638916015625, -0.2040557861328125, -0.171722412109375, -0.1393890380859375, -0.1070556640625, -0.0747222900390625, -0.042388916015625, -0.0100555419921875, 0.02227783203125, 0.0546112060546875, 0.086944580078125, 0.1192779541015625, 0.151611328125, 0.1839447021484375, 0.216278076171875, 0.2486114501953125, 0.28094482421875, 0.3132781982421875, 0.345611572265625, 0.3779449462890625, 0.4102783203125, 0.4426116943359375, 0.474945068359375, 0.5072784423828125, 0.53961181640625, 0.5719451904296875, 0.604278564453125, 0.6366119384765625, 0.6689453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 1.0, 2.0, 8.0, 10.0, 12.0, 14.0, 18.0, 20.0, 13.0, 37.0, 43.0, 66.0, 102.0, 128.0, 274.0, 765.0, 9976.0, 974220.0, 60531.0, 1368.0, 380.0, 193.0, 101.0, 53.0, 48.0, 45.0, 26.0, 19.0, 18.0, 8.0, 12.0, 9.0, 5.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2177734375, -1.1780853271484375, -1.138397216796875, -1.0987091064453125, -1.05902099609375, -1.0193328857421875, -0.979644775390625, -0.9399566650390625, -0.9002685546875, -0.8605804443359375, -0.820892333984375, -0.7812042236328125, -0.74151611328125, -0.7018280029296875, -0.662139892578125, -0.6224517822265625, -0.582763671875, -0.5430755615234375, -0.503387451171875, -0.4636993408203125, -0.42401123046875, -0.3843231201171875, -0.344635009765625, -0.3049468994140625, -0.2652587890625, -0.2255706787109375, -0.185882568359375, -0.1461944580078125, -0.10650634765625, -0.0668182373046875, -0.027130126953125, 0.0125579833984375, 0.05224609375, 0.0919342041015625, 0.131622314453125, 0.1713104248046875, 0.21099853515625, 0.2506866455078125, 0.290374755859375, 0.3300628662109375, 0.3697509765625, 0.4094390869140625, 0.449127197265625, 0.4888153076171875, 0.52850341796875, 0.5681915283203125, 0.607879638671875, 0.6475677490234375, 0.687255859375, 0.7269439697265625, 0.766632080078125, 0.8063201904296875, 0.84600830078125, 0.8856964111328125, 0.925384521484375, 0.9650726318359375, 1.0047607421875, 1.0444488525390625, 1.084136962890625, 1.1238250732421875, 1.16351318359375, 1.2032012939453125, 1.242889404296875, 1.2825775146484375, 1.322265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 5.0, 1.0, 5.0, 8.0, 10.0, 18.0, 12.0, 17.0, 17.0, 27.0, 36.0, 35.0, 37.0, 35.0, 45.0, 57.0, 53.0, 49.0, 48.0, 57.0, 46.0, 45.0, 39.0, 41.0, 35.0, 45.0, 24.0, 36.0, 18.0, 19.0, 13.0, 12.0, 11.0, 9.0, 7.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6863021850585938, -0.6636199951171875, -0.6409378051757812, -0.618255615234375, -0.5955734252929688, -0.5728912353515625, -0.5502090454101562, -0.52752685546875, -0.5048446655273438, -0.4821624755859375, -0.45948028564453125, -0.436798095703125, -0.41411590576171875, -0.3914337158203125, -0.36875152587890625, -0.3460693359375, -0.32338714599609375, -0.3007049560546875, -0.27802276611328125, -0.255340576171875, -0.23265838623046875, -0.2099761962890625, -0.18729400634765625, -0.16461181640625, -0.14192962646484375, -0.1192474365234375, -0.09656524658203125, -0.073883056640625, -0.05120086669921875, -0.0285186767578125, -0.00583648681640625, 0.016845703125, 0.03952789306640625, 0.0622100830078125, 0.08489227294921875, 0.107574462890625, 0.13025665283203125, 0.1529388427734375, 0.17562103271484375, 0.19830322265625, 0.22098541259765625, 0.2436676025390625, 0.26634979248046875, 0.289031982421875, 0.31171417236328125, 0.3343963623046875, 0.35707855224609375, 0.3797607421875, 0.40244293212890625, 0.4251251220703125, 0.44780731201171875, 0.470489501953125, 0.49317169189453125, 0.5158538818359375, 0.5385360717773438, 0.56121826171875, 0.5839004516601562, 0.6065826416015625, 0.6292648315429688, 0.651947021484375, 0.6746292114257812, 0.6973114013671875, 0.7199935913085938, 0.74267578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 14.0, 10.0, 18.0, 35.0, 74.0, 173.0, 455.0, 1420.0, 6534.0, 119906.0, 886633.0, 28622.0, 3229.0, 850.0, 290.0, 129.0, 64.0, 33.0, 18.0, 11.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26611328125, -0.2567100524902344, -0.24730682373046875, -0.23790359497070312, -0.2285003662109375, -0.21909713745117188, -0.20969390869140625, -0.20029067993164062, -0.190887451171875, -0.18148422241210938, -0.17208099365234375, -0.16267776489257812, -0.1532745361328125, -0.14387130737304688, -0.13446807861328125, -0.12506484985351562, -0.11566162109375, -0.10625839233398438, -0.09685516357421875, -0.08745193481445312, -0.0780487060546875, -0.06864547729492188, -0.05924224853515625, -0.049839019775390625, -0.040435791015625, -0.031032562255859375, -0.02162933349609375, -0.012226104736328125, -0.0028228759765625, 0.006580352783203125, 0.01598358154296875, 0.025386810302734375, 0.0347900390625, 0.044193267822265625, 0.05359649658203125, 0.06299972534179688, 0.0724029541015625, 0.08180618286132812, 0.09120941162109375, 0.10061264038085938, 0.110015869140625, 0.11941909790039062, 0.12882232666015625, 0.13822555541992188, 0.1476287841796875, 0.15703201293945312, 0.16643524169921875, 0.17583847045898438, 0.18524169921875, 0.19464492797851562, 0.20404815673828125, 0.21345138549804688, 0.2228546142578125, 0.23225784301757812, 0.24166107177734375, 0.2510643005371094, 0.260467529296875, 0.2698707580566406, 0.27927398681640625, 0.2886772155761719, 0.2980804443359375, 0.3074836730957031, 0.31688690185546875, 0.3262901306152344, 0.335693359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 9.0, 22.0, 20.0, 50.0, 66.0, 124.0, 204.0, 202.0, 105.0, 69.0, 30.0, 25.0, 24.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.832578659057617e-05, -3.712717443704605e-05, -3.592856228351593e-05, -3.472995012998581e-05, -3.353133797645569e-05, -3.233272582292557e-05, -3.113411366939545e-05, -2.9935501515865326e-05, -2.8736889362335205e-05, -2.7538277208805084e-05, -2.6339665055274963e-05, -2.5141052901744843e-05, -2.394244074821472e-05, -2.27438285946846e-05, -2.154521644115448e-05, -2.034660428762436e-05, -1.9147992134094238e-05, -1.7949379980564117e-05, -1.6750767827033997e-05, -1.5552155673503876e-05, -1.4353543519973755e-05, -1.3154931366443634e-05, -1.1956319212913513e-05, -1.0757707059383392e-05, -9.559094905853271e-06, -8.36048275232315e-06, -7.16187059879303e-06, -5.963258445262909e-06, -4.764646291732788e-06, -3.5660341382026672e-06, -2.3674219846725464e-06, -1.1688098311424255e-06, 2.9802322387695312e-08, 1.2284144759178162e-06, 2.427026629447937e-06, 3.625638782978058e-06, 4.824250936508179e-06, 6.0228630900382996e-06, 7.22147524356842e-06, 8.420087397098541e-06, 9.618699550628662e-06, 1.0817311704158783e-05, 1.2015923857688904e-05, 1.3214536011219025e-05, 1.4413148164749146e-05, 1.5611760318279266e-05, 1.6810372471809387e-05, 1.8008984625339508e-05, 1.920759677886963e-05, 2.040620893239975e-05, 2.160482108592987e-05, 2.280343323945999e-05, 2.4002045392990112e-05, 2.5200657546520233e-05, 2.6399269700050354e-05, 2.7597881853580475e-05, 2.8796494007110596e-05, 2.9995106160640717e-05, 3.119371831417084e-05, 3.239233046770096e-05, 3.359094262123108e-05, 3.47895547747612e-05, 3.598816692829132e-05, 3.718677908182144e-05, 3.838539123535156e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 9.0, 6.0, 10.0, 23.0, 27.0, 49.0, 102.0, 250.0, 502.0, 1272.0, 3623.0, 14584.0, 177794.0, 789875.0, 49114.0, 7454.0, 2228.0, 886.0, 388.0, 162.0, 98.0, 37.0, 23.0, 13.0, 12.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.2599658966064453, -0.2525978088378906, -0.24522972106933594, -0.23786163330078125, -0.23049354553222656, -0.22312545776367188, -0.2157573699951172, -0.2083892822265625, -0.2010211944580078, -0.19365310668945312, -0.18628501892089844, -0.17891693115234375, -0.17154884338378906, -0.16418075561523438, -0.1568126678466797, -0.149444580078125, -0.1420764923095703, -0.13470840454101562, -0.12734031677246094, -0.11997222900390625, -0.11260414123535156, -0.10523605346679688, -0.09786796569824219, -0.0904998779296875, -0.08313179016113281, -0.07576370239257812, -0.06839561462402344, -0.06102752685546875, -0.05365943908691406, -0.046291351318359375, -0.03892326354980469, -0.03155517578125, -0.024187088012695312, -0.016819000244140625, -0.009450912475585938, -0.00208282470703125, 0.0052852630615234375, 0.012653350830078125, 0.020021438598632812, 0.0273895263671875, 0.03475761413574219, 0.042125701904296875, 0.04949378967285156, 0.05686187744140625, 0.06422996520996094, 0.07159805297851562, 0.07896614074707031, 0.086334228515625, 0.09370231628417969, 0.10107040405273438, 0.10843849182128906, 0.11580657958984375, 0.12317466735839844, 0.13054275512695312, 0.1379108428955078, 0.1452789306640625, 0.1526470184326172, 0.16001510620117188, 0.16738319396972656, 0.17475128173828125, 0.18211936950683594, 0.18948745727539062, 0.1968555450439453, 0.2042236328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 12.0, 13.0, 25.0, 25.0, 46.0, 47.0, 65.0, 64.0, 89.0, 148.0, 100.0, 73.0, 73.0, 62.0, 23.0, 26.0, 16.0, 17.0, 9.0, 8.0, 4.0, 4.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061920166015625, -0.05995321273803711, -0.05798625946044922, -0.05601930618286133, -0.05405235290527344, -0.05208539962768555, -0.050118446350097656, -0.048151493072509766, -0.046184539794921875, -0.044217586517333984, -0.042250633239746094, -0.0402836799621582, -0.03831672668457031, -0.03634977340698242, -0.03438282012939453, -0.03241586685180664, -0.03044891357421875, -0.02848196029663086, -0.02651500701904297, -0.024548053741455078, -0.022581100463867188, -0.020614147186279297, -0.018647193908691406, -0.016680240631103516, -0.014713287353515625, -0.012746334075927734, -0.010779380798339844, -0.008812427520751953, -0.0068454742431640625, -0.004878520965576172, -0.0029115676879882812, -0.0009446144104003906, 0.0010223388671875, 0.0029892921447753906, 0.004956245422363281, 0.006923198699951172, 0.008890151977539062, 0.010857105255126953, 0.012824058532714844, 0.014791011810302734, 0.016757965087890625, 0.018724918365478516, 0.020691871643066406, 0.022658824920654297, 0.024625778198242188, 0.026592731475830078, 0.02855968475341797, 0.03052663803100586, 0.03249359130859375, 0.03446054458618164, 0.03642749786376953, 0.03839445114135742, 0.04036140441894531, 0.0423283576965332, 0.044295310974121094, 0.046262264251708984, 0.048229217529296875, 0.050196170806884766, 0.052163124084472656, 0.05413007736206055, 0.05609703063964844, 0.05806398391723633, 0.06003093719482422, 0.06199789047241211, 0.06396484375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 13.0, 17.0, 27.0, 47.0, 86.0, 116.0, 169.0, 185.0, 130.0, 80.0, 56.0, 23.0, 20.0, 7.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1437605619430542, -1.091931939125061, -1.0401034355163574, -0.9882748126983643, -0.9364462494850159, -0.8846176862716675, -0.8327890634536743, -0.7809605002403259, -0.7291319370269775, -0.6773033738136292, -0.6254748106002808, -0.5736461877822876, -0.5218176245689392, -0.4699890613555908, -0.41816046833992004, -0.36633187532424927, -0.3145033121109009, -0.2626747488975525, -0.2108461558818817, -0.15901757776737213, -0.10718899965286255, -0.05536043643951416, -0.003531843423843384, 0.04829674959182739, 0.10012531280517578, 0.15195389091968536, 0.20378246903419495, 0.2556110620498657, 0.3074396252632141, 0.3592681884765625, 0.4110967814922333, 0.46292537450790405, 0.5147538185119629, 0.5665823817253113, 0.6184109449386597, 0.6702395677566528, 0.7220681309700012, 0.7738966941833496, 0.8257253170013428, 0.8775538802146912, 0.9293824434280396, 0.9812110066413879, 1.0330395698547363, 1.0848681926727295, 1.1366968154907227, 1.1885253190994263, 1.2403539419174194, 1.292182445526123, 1.3440110683441162, 1.3958396911621094, 1.447668194770813, 1.4994968175888062, 1.5513253211975098, 1.603153944015503, 1.654982566833496, 1.7068111896514893, 1.7586396932601929, 1.810468316078186, 1.8622968196868896, 1.9141254425048828, 1.965954065322876, 2.017782688140869, 2.069611072540283, 2.1214396953582764, 2.1732683181762695]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 12.0, 10.0, 11.0, 11.0, 14.0, 12.0, 17.0, 10.0, 26.0, 25.0, 32.0, 34.0, 29.0, 33.0, 31.0, 50.0, 51.0, 42.0, 39.0, 32.0, 50.0, 46.0, 27.0, 38.0, 31.0, 37.0, 32.0, 32.0, 23.0, 31.0, 21.0, 20.0, 13.0, 11.0, 17.0, 13.0, 13.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.192755937576294, -1.1580311059951782, -1.123306155204773, -1.0885813236236572, -1.0538564920425415, -1.0191316604614258, -0.9844067096710205, -0.9496818780899048, -0.9149569869041443, -0.8802320957183838, -0.8455072641372681, -0.8107823729515076, -0.7760574817657471, -0.7413326501846313, -0.7066077589988708, -0.6718828678131104, -0.6371580362319946, -0.6024331450462341, -0.5677083134651184, -0.5329834222793579, -0.4982585608959198, -0.4635336995124817, -0.4288088083267212, -0.3940839469432831, -0.35935908555984497, -0.32463422417640686, -0.28990936279296875, -0.25518447160720825, -0.22045961022377014, -0.18573474884033203, -0.15100987255573273, -0.11628499627113342, -0.08156025409698486, -0.046835385262966156, -0.012110516428947449, 0.02261435240507126, 0.057339221239089966, 0.09206408262252808, 0.12678895890712738, 0.16151383519172668, 0.1962386965751648, 0.2309635579586029, 0.265688419342041, 0.3004133105278015, 0.3351381719112396, 0.36986303329467773, 0.40458792448043823, 0.43931278586387634, 0.47403764724731445, 0.508762538433075, 0.5434873700141907, 0.5782122611999512, 0.6129370927810669, 0.6476619839668274, 0.6823868751525879, 0.7171117067337036, 0.7518365979194641, 0.7865614891052246, 0.8212863206863403, 0.8560112118721008, 0.8907361030578613, 0.925460934638977, 0.9601858258247375, 0.994910717010498, 1.0296355485916138]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 9.0, 15.0, 25.0, 29.0, 55.0, 49.0, 82.0, 123.0, 221.0, 314.0, 526.0, 991.0, 1691.0, 3225.0, 6416.0, 16050.0, 83889.0, 3092828.0, 927257.0, 38699.0, 10665.0, 4806.0, 2573.0, 1412.0, 870.0, 501.0, 320.0, 186.0, 139.0, 86.0, 65.0, 36.0, 34.0, 21.0, 14.0, 9.0, 11.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96142578125, -0.9302291870117188, -0.8990325927734375, -0.8678359985351562, -0.836639404296875, -0.8054428100585938, -0.7742462158203125, -0.7430496215820312, -0.71185302734375, -0.6806564331054688, -0.6494598388671875, -0.6182632446289062, -0.587066650390625, -0.5558700561523438, -0.5246734619140625, -0.49347686767578125, -0.4622802734375, -0.43108367919921875, -0.3998870849609375, -0.36869049072265625, -0.337493896484375, -0.30629730224609375, -0.2751007080078125, -0.24390411376953125, -0.21270751953125, -0.18151092529296875, -0.1503143310546875, -0.11911773681640625, -0.087921142578125, -0.05672454833984375, -0.0255279541015625, 0.00566864013671875, 0.036865234375, 0.06806182861328125, 0.0992584228515625, 0.13045501708984375, 0.161651611328125, 0.19284820556640625, 0.2240447998046875, 0.25524139404296875, 0.28643798828125, 0.31763458251953125, 0.3488311767578125, 0.38002777099609375, 0.411224365234375, 0.44242095947265625, 0.4736175537109375, 0.5048141479492188, 0.5360107421875, 0.5672073364257812, 0.5984039306640625, 0.6296005249023438, 0.660797119140625, 0.6919937133789062, 0.7231903076171875, 0.7543869018554688, 0.78558349609375, 0.8167800903320312, 0.8479766845703125, 0.8791732788085938, 0.910369873046875, 0.9415664672851562, 0.9727630615234375, 1.0039596557617188, 1.03515625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 4.0, 6.0, 17.0, 14.0, 18.0, 24.0, 33.0, 22.0, 33.0, 40.0, 45.0, 52.0, 40.0, 38.0, 62.0, 59.0, 53.0, 60.0, 49.0, 41.0, 50.0, 34.0, 47.0, 39.0, 25.0, 22.0, 12.0, 12.0, 9.0, 8.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.392578125, -0.38175201416015625, -0.3709259033203125, -0.36009979248046875, -0.349273681640625, -0.33844757080078125, -0.3276214599609375, -0.31679534912109375, -0.30596923828125, -0.29514312744140625, -0.2843170166015625, -0.27349090576171875, -0.262664794921875, -0.25183868408203125, -0.2410125732421875, -0.23018646240234375, -0.2193603515625, -0.20853424072265625, -0.1977081298828125, -0.18688201904296875, -0.176055908203125, -0.16522979736328125, -0.1544036865234375, -0.14357757568359375, -0.13275146484375, -0.12192535400390625, -0.1110992431640625, -0.10027313232421875, -0.089447021484375, -0.07862091064453125, -0.0677947998046875, -0.05696868896484375, -0.046142578125, -0.03531646728515625, -0.0244903564453125, -0.01366424560546875, -0.002838134765625, 0.00798797607421875, 0.0188140869140625, 0.02964019775390625, 0.04046630859375, 0.05129241943359375, 0.0621185302734375, 0.07294464111328125, 0.083770751953125, 0.09459686279296875, 0.1054229736328125, 0.11624908447265625, 0.1270751953125, 0.13790130615234375, 0.1487274169921875, 0.15955352783203125, 0.170379638671875, 0.18120574951171875, 0.1920318603515625, 0.20285797119140625, 0.21368408203125, 0.22451019287109375, 0.2353363037109375, 0.24616241455078125, 0.256988525390625, 0.26781463623046875, 0.2786407470703125, 0.28946685791015625, 0.30029296875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 11.0, 11.0, 31.0, 35.0, 56.0, 110.0, 194.0, 408.0, 1031.0, 2916.0, 9871.0, 50814.0, 2868280.0, 1211245.0, 37033.0, 7990.0, 2439.0, 1000.0, 392.0, 190.0, 95.0, 38.0, 34.0, 18.0, 12.0, 5.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.13800048828125, -1.1011962890625, -1.06439208984375, -1.027587890625, -0.99078369140625, -0.9539794921875, -0.91717529296875, -0.88037109375, -0.84356689453125, -0.8067626953125, -0.76995849609375, -0.733154296875, -0.69635009765625, -0.6595458984375, -0.62274169921875, -0.5859375, -0.54913330078125, -0.5123291015625, -0.47552490234375, -0.438720703125, -0.40191650390625, -0.3651123046875, -0.32830810546875, -0.29150390625, -0.25469970703125, -0.2178955078125, -0.18109130859375, -0.144287109375, -0.10748291015625, -0.0706787109375, -0.03387451171875, 0.0029296875, 0.03973388671875, 0.0765380859375, 0.11334228515625, 0.150146484375, 0.18695068359375, 0.2237548828125, 0.26055908203125, 0.29736328125, 0.33416748046875, 0.3709716796875, 0.40777587890625, 0.444580078125, 0.48138427734375, 0.5181884765625, 0.55499267578125, 0.591796875, 0.62860107421875, 0.6654052734375, 0.70220947265625, 0.739013671875, 0.77581787109375, 0.8126220703125, 0.84942626953125, 0.88623046875, 0.92303466796875, 0.9598388671875, 0.99664306640625, 1.033447265625, 1.07025146484375, 1.1070556640625, 1.14385986328125, 1.1806640625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 8.0, 9.0, 7.0, 12.0, 24.0, 25.0, 61.0, 61.0, 86.0, 207.0, 422.0, 838.0, 986.0, 632.0, 290.0, 148.0, 77.0, 46.0, 32.0, 20.0, 13.0, 11.0, 9.0, 5.0, 6.0, 5.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.2632789611816406, -0.25458526611328125, -0.24589157104492188, -0.2371978759765625, -0.22850418090820312, -0.21981048583984375, -0.21111679077148438, -0.202423095703125, -0.19372940063476562, -0.18503570556640625, -0.17634201049804688, -0.1676483154296875, -0.15895462036132812, -0.15026092529296875, -0.14156723022460938, -0.13287353515625, -0.12417984008789062, -0.11548614501953125, -0.10679244995117188, -0.0980987548828125, -0.08940505981445312, -0.08071136474609375, -0.07201766967773438, -0.063323974609375, -0.054630279541015625, -0.04593658447265625, -0.037242889404296875, -0.0285491943359375, -0.019855499267578125, -0.01116180419921875, -0.002468109130859375, 0.0062255859375, 0.014919281005859375, 0.02361297607421875, 0.032306671142578125, 0.0410003662109375, 0.049694061279296875, 0.05838775634765625, 0.06708145141601562, 0.075775146484375, 0.08446884155273438, 0.09316253662109375, 0.10185623168945312, 0.1105499267578125, 0.11924362182617188, 0.12793731689453125, 0.13663101196289062, 0.14532470703125, 0.15401840209960938, 0.16271209716796875, 0.17140579223632812, 0.1800994873046875, 0.18879318237304688, 0.19748687744140625, 0.20618057250976562, 0.214874267578125, 0.22356796264648438, 0.23226165771484375, 0.24095535278320312, 0.2496490478515625, 0.2583427429199219, 0.26703643798828125, 0.2757301330566406, 0.284423828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 15.0, 20.0, 26.0, 32.0, 42.0, 66.0, 80.0, 111.0, 110.0, 127.0, 89.0, 74.0, 59.0, 33.0, 29.0, 21.0, 16.0, 12.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7396411299705505, -0.7150020599365234, -0.6903629899024963, -0.6657239198684692, -0.6410848498344421, -0.616445779800415, -0.5918066501617432, -0.5671675801277161, -0.542528510093689, -0.5178894400596619, -0.49325037002563477, -0.46861129999160767, -0.4439722001552582, -0.4193331301212311, -0.394694060087204, -0.3700549602508545, -0.3454159200191498, -0.3207768499851227, -0.2961377799510956, -0.2714986801147461, -0.246859610080719, -0.2222205400466919, -0.1975814700126648, -0.1729423850774765, -0.1483033150434494, -0.1236642375588417, -0.09902516007423401, -0.07438609004020691, -0.04974701255559921, -0.025107935070991516, -0.0004688650369644165, 0.024170219898223877, 0.04880928993225098, 0.07344836741685867, 0.09808744490146637, 0.12272651493549347, 0.14736559987068176, 0.17200466990470886, 0.19664373993873596, 0.22128282487392426, 0.24592189490795135, 0.27056097984313965, 0.29520004987716675, 0.31983911991119385, 0.34447818994522095, 0.36911725997924805, 0.39375633001327515, 0.41839542984962463, 0.44303449988365173, 0.46767356991767883, 0.49231263995170593, 0.5169517397880554, 0.5415908098220825, 0.5662298798561096, 0.5908689498901367, 0.6155080199241638, 0.6401470899581909, 0.664786159992218, 0.6894252300262451, 0.7140643000602722, 0.7387033700942993, 0.7633424997329712, 0.7879815101623535, 0.8126206398010254, 0.8372597098350525]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 6.0, 8.0, 13.0, 17.0, 14.0, 9.0, 18.0, 15.0, 17.0, 27.0, 17.0, 26.0, 29.0, 34.0, 29.0, 37.0, 35.0, 52.0, 45.0, 43.0, 41.0, 38.0, 45.0, 35.0, 40.0, 29.0, 32.0, 29.0, 32.0, 21.0, 27.0, 11.0, 19.0, 15.0, 21.0, 11.0, 9.0, 10.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.35865145921707153, -0.3469490110874176, -0.3352465331554413, -0.32354408502578735, -0.3118416368961334, -0.3001391589641571, -0.2884367108345032, -0.27673423290252686, -0.2650317847728729, -0.253329336643219, -0.24162687361240387, -0.22992441058158875, -0.21822194755077362, -0.2065194845199585, -0.19481703639030457, -0.18311457335948944, -0.1714121252298355, -0.15970966219902039, -0.14800721406936646, -0.13630475103855133, -0.1246022880077362, -0.11289983242750168, -0.10119737684726715, -0.08949491381645203, -0.0777924582362175, -0.06609000265598297, -0.05438753962516785, -0.04268508404493332, -0.030982624739408493, -0.019280165433883667, -0.007577709853649139, 0.004124753177165985, 0.015827208757400513, 0.02752966806292534, 0.039232127368450165, 0.05093458294868469, 0.06263704597949982, 0.07433950155973434, 0.08604195713996887, 0.097744420170784, 0.10944687575101852, 0.12114933133125305, 0.13285179436206818, 0.1445542573928833, 0.15625670552253723, 0.16795916855335236, 0.17966163158416748, 0.1913640797138214, 0.20306654274463654, 0.21476900577545166, 0.2264714539051056, 0.23817391693592072, 0.24987637996673584, 0.26157882809638977, 0.2732812762260437, 0.28498375415802, 0.29668620228767395, 0.3083886504173279, 0.3200911283493042, 0.33179357647895813, 0.34349602460861206, 0.3551985025405884, 0.3669009506702423, 0.37860339879989624, 0.39030587673187256]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 13.0, 16.0, 21.0, 34.0, 60.0, 113.0, 152.0, 273.0, 478.0, 806.0, 1434.0, 2436.0, 4741.0, 9597.0, 23414.0, 82497.0, 487162.0, 341498.0, 58060.0, 18536.0, 8106.0, 4034.0, 2175.0, 1177.0, 655.0, 412.0, 253.0, 136.0, 99.0, 61.0, 39.0, 17.0, 14.0, 12.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16552734375, -0.16033554077148438, -0.15514373779296875, -0.14995193481445312, -0.1447601318359375, -0.13956832885742188, -0.13437652587890625, -0.12918472290039062, -0.123992919921875, -0.11880111694335938, -0.11360931396484375, -0.10841751098632812, -0.1032257080078125, -0.09803390502929688, -0.09284210205078125, -0.08765029907226562, -0.08245849609375, -0.07726669311523438, -0.07207489013671875, -0.06688308715820312, -0.0616912841796875, -0.056499481201171875, -0.05130767822265625, -0.046115875244140625, -0.040924072265625, -0.035732269287109375, -0.03054046630859375, -0.025348663330078125, -0.0201568603515625, -0.014965057373046875, -0.00977325439453125, -0.004581451416015625, 0.0006103515625, 0.005802154541015625, 0.01099395751953125, 0.016185760498046875, 0.0213775634765625, 0.026569366455078125, 0.03176116943359375, 0.036952972412109375, 0.042144775390625, 0.047336578369140625, 0.05252838134765625, 0.057720184326171875, 0.0629119873046875, 0.06810379028320312, 0.07329559326171875, 0.07848739624023438, 0.08367919921875, 0.08887100219726562, 0.09406280517578125, 0.09925460815429688, 0.1044464111328125, 0.10963821411132812, 0.11483001708984375, 0.12002182006835938, 0.125213623046875, 0.13040542602539062, 0.13559722900390625, 0.14078903198242188, 0.1459808349609375, 0.15117263793945312, 0.15636444091796875, 0.16155624389648438, 0.166748046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 3.0, 4.0, 4.0, 11.0, 10.0, 12.0, 13.0, 15.0, 16.0, 20.0, 18.0, 26.0, 29.0, 24.0, 38.0, 25.0, 38.0, 40.0, 44.0, 54.0, 43.0, 47.0, 55.0, 41.0, 36.0, 30.0, 39.0, 36.0, 36.0, 31.0, 25.0, 23.0, 25.0, 17.0, 6.0, 13.0, 10.0, 10.0, 10.0, 3.0, 8.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.251953125, -0.24410247802734375, -0.2362518310546875, -0.22840118408203125, -0.220550537109375, -0.21269989013671875, -0.2048492431640625, -0.19699859619140625, -0.18914794921875, -0.18129730224609375, -0.1734466552734375, -0.16559600830078125, -0.157745361328125, -0.14989471435546875, -0.1420440673828125, -0.13419342041015625, -0.1263427734375, -0.11849212646484375, -0.1106414794921875, -0.10279083251953125, -0.094940185546875, -0.08708953857421875, -0.0792388916015625, -0.07138824462890625, -0.06353759765625, -0.05568695068359375, -0.0478363037109375, -0.03998565673828125, -0.032135009765625, -0.02428436279296875, -0.0164337158203125, -0.00858306884765625, -0.000732421875, 0.00711822509765625, 0.0149688720703125, 0.02281951904296875, 0.030670166015625, 0.03852081298828125, 0.0463714599609375, 0.05422210693359375, 0.06207275390625, 0.06992340087890625, 0.0777740478515625, 0.08562469482421875, 0.093475341796875, 0.10132598876953125, 0.1091766357421875, 0.11702728271484375, 0.1248779296875, 0.13272857666015625, 0.1405792236328125, 0.14842987060546875, 0.156280517578125, 0.16413116455078125, 0.1719818115234375, 0.17983245849609375, 0.18768310546875, 0.19553375244140625, 0.2033843994140625, 0.21123504638671875, 0.219085693359375, 0.22693634033203125, 0.2347869873046875, 0.24263763427734375, 0.25048828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 12.0, 24.0, 40.0, 72.0, 86.0, 155.0, 292.0, 561.0, 1117.0, 2646.0, 7522.0, 27081.0, 164729.0, 636907.0, 167343.0, 27418.0, 7527.0, 2682.0, 1095.0, 533.0, 269.0, 144.0, 87.0, 67.0, 40.0, 22.0, 17.0, 11.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.12115478515625, -0.11690425872802734, -0.11265373229980469, -0.10840320587158203, -0.10415267944335938, -0.09990215301513672, -0.09565162658691406, -0.0914011001586914, -0.08715057373046875, -0.0829000473022461, -0.07864952087402344, -0.07439899444580078, -0.07014846801757812, -0.06589794158935547, -0.06164741516113281, -0.057396888732910156, -0.0531463623046875, -0.048895835876464844, -0.04464530944824219, -0.04039478302001953, -0.036144256591796875, -0.03189373016357422, -0.027643203735351562, -0.023392677307128906, -0.01914215087890625, -0.014891624450683594, -0.010641098022460938, -0.006390571594238281, -0.002140045166015625, 0.0021104812622070312, 0.0063610076904296875, 0.010611534118652344, 0.014862060546875, 0.019112586975097656, 0.023363113403320312, 0.02761363983154297, 0.031864166259765625, 0.03611469268798828, 0.04036521911621094, 0.044615745544433594, 0.04886627197265625, 0.053116798400878906, 0.05736732482910156, 0.06161785125732422, 0.06586837768554688, 0.07011890411376953, 0.07436943054199219, 0.07861995697021484, 0.0828704833984375, 0.08712100982666016, 0.09137153625488281, 0.09562206268310547, 0.09987258911132812, 0.10412311553955078, 0.10837364196777344, 0.1126241683959961, 0.11687469482421875, 0.1211252212524414, 0.12537574768066406, 0.12962627410888672, 0.13387680053710938, 0.13812732696533203, 0.1423778533935547, 0.14662837982177734, 0.15087890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 10.0, 5.0, 8.0, 11.0, 13.0, 18.0, 14.0, 27.0, 25.0, 24.0, 25.0, 29.0, 31.0, 36.0, 46.0, 36.0, 51.0, 39.0, 39.0, 47.0, 50.0, 61.0, 52.0, 38.0, 36.0, 22.0, 23.0, 23.0, 26.0, 28.0, 16.0, 18.0, 11.0, 11.0, 12.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.4906730651855469, -0.47499847412109375, -0.4593238830566406, -0.4436492919921875, -0.4279747009277344, -0.41230010986328125, -0.3966255187988281, -0.380950927734375, -0.3652763366699219, -0.34960174560546875, -0.3339271545410156, -0.3182525634765625, -0.3025779724121094, -0.28690338134765625, -0.2712287902832031, -0.25555419921875, -0.23987960815429688, -0.22420501708984375, -0.20853042602539062, -0.1928558349609375, -0.17718124389648438, -0.16150665283203125, -0.14583206176757812, -0.130157470703125, -0.11448287963867188, -0.09880828857421875, -0.08313369750976562, -0.0674591064453125, -0.051784515380859375, -0.03610992431640625, -0.020435333251953125, -0.0047607421875, 0.010913848876953125, 0.02658843994140625, 0.042263031005859375, 0.0579376220703125, 0.07361221313476562, 0.08928680419921875, 0.10496139526367188, 0.120635986328125, 0.13631057739257812, 0.15198516845703125, 0.16765975952148438, 0.1833343505859375, 0.19900894165039062, 0.21468353271484375, 0.23035812377929688, 0.24603271484375, 0.2617073059082031, 0.27738189697265625, 0.2930564880371094, 0.3087310791015625, 0.3244056701660156, 0.34008026123046875, 0.3557548522949219, 0.371429443359375, 0.3871040344238281, 0.40277862548828125, 0.4184532165527344, 0.4341278076171875, 0.4498023986816406, 0.46547698974609375, 0.4811515808105469, 0.496826171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 13.0, 11.0, 20.0, 25.0, 56.0, 76.0, 146.0, 238.0, 409.0, 820.0, 1778.0, 4502.0, 13192.0, 55663.0, 367762.0, 500319.0, 77467.0, 16561.0, 5359.0, 2115.0, 913.0, 480.0, 244.0, 150.0, 85.0, 40.0, 37.0, 24.0, 18.0, 3.0, 8.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06170654296875, -0.060128211975097656, -0.05854988098144531, -0.05697154998779297, -0.055393218994140625, -0.05381488800048828, -0.05223655700683594, -0.050658226013183594, -0.04907989501953125, -0.047501564025878906, -0.04592323303222656, -0.04434490203857422, -0.042766571044921875, -0.04118824005126953, -0.03960990905761719, -0.038031578063964844, -0.0364532470703125, -0.034874916076660156, -0.03329658508300781, -0.03171825408935547, -0.030139923095703125, -0.02856159210205078, -0.026983261108398438, -0.025404930114746094, -0.02382659912109375, -0.022248268127441406, -0.020669937133789062, -0.01909160614013672, -0.017513275146484375, -0.01593494415283203, -0.014356613159179688, -0.012778282165527344, -0.011199951171875, -0.009621620178222656, -0.008043289184570312, -0.006464958190917969, -0.004886627197265625, -0.0033082962036132812, -0.0017299652099609375, -0.00015163421630859375, 0.00142669677734375, 0.0030050277709960938, 0.0045833587646484375, 0.006161689758300781, 0.007740020751953125, 0.009318351745605469, 0.010896682739257812, 0.012475013732910156, 0.0140533447265625, 0.015631675720214844, 0.017210006713867188, 0.01878833770751953, 0.020366668701171875, 0.02194499969482422, 0.023523330688476562, 0.025101661682128906, 0.02667999267578125, 0.028258323669433594, 0.029836654663085938, 0.03141498565673828, 0.032993316650390625, 0.03457164764404297, 0.03614997863769531, 0.037728309631347656, 0.039306640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 3.0, 4.0, 14.0, 12.0, 24.0, 28.0, 31.0, 47.0, 55.0, 96.0, 91.0, 117.0, 85.0, 113.0, 72.0, 62.0, 31.0, 34.0, 18.0, 12.0, 14.0, 7.0, 8.0, 0.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0265579223632812e-05, -1.9505620002746582e-05, -1.874566078186035e-05, -1.798570156097412e-05, -1.722574234008789e-05, -1.646578311920166e-05, -1.570582389831543e-05, -1.49458646774292e-05, -1.4185905456542969e-05, -1.3425946235656738e-05, -1.2665987014770508e-05, -1.1906027793884277e-05, -1.1146068572998047e-05, -1.0386109352111816e-05, -9.626150131225586e-06, -8.866190910339355e-06, -8.106231689453125e-06, -7.3462724685668945e-06, -6.586313247680664e-06, -5.826354026794434e-06, -5.066394805908203e-06, -4.306435585021973e-06, -3.546476364135742e-06, -2.7865171432495117e-06, -2.0265579223632812e-06, -1.2665987014770508e-06, -5.066394805908203e-07, 2.5331974029541016e-07, 1.0132789611816406e-06, 1.773238182067871e-06, 2.5331974029541016e-06, 3.293156623840332e-06, 4.0531158447265625e-06, 4.813075065612793e-06, 5.5730342864990234e-06, 6.332993507385254e-06, 7.092952728271484e-06, 7.852911949157715e-06, 8.612871170043945e-06, 9.372830390930176e-06, 1.0132789611816406e-05, 1.0892748832702637e-05, 1.1652708053588867e-05, 1.2412667274475098e-05, 1.3172626495361328e-05, 1.3932585716247559e-05, 1.4692544937133789e-05, 1.545250415802002e-05, 1.621246337890625e-05, 1.697242259979248e-05, 1.773238182067871e-05, 1.849234104156494e-05, 1.9252300262451172e-05, 2.0012259483337402e-05, 2.0772218704223633e-05, 2.1532177925109863e-05, 2.2292137145996094e-05, 2.3052096366882324e-05, 2.3812055587768555e-05, 2.4572014808654785e-05, 2.5331974029541016e-05, 2.6091933250427246e-05, 2.6851892471313477e-05, 2.7611851692199707e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 12.0, 27.0, 41.0, 55.0, 115.0, 143.0, 330.0, 550.0, 1159.0, 2353.0, 5433.0, 14189.0, 47621.0, 216166.0, 530180.0, 169869.0, 39122.0, 12171.0, 4764.0, 2048.0, 1057.0, 497.0, 271.0, 159.0, 71.0, 42.0, 33.0, 17.0, 21.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05126953125, -0.04968833923339844, -0.048107147216796875, -0.04652595520019531, -0.04494476318359375, -0.04336357116699219, -0.041782379150390625, -0.04020118713378906, -0.0386199951171875, -0.03703880310058594, -0.035457611083984375, -0.03387641906738281, -0.03229522705078125, -0.030714035034179688, -0.029132843017578125, -0.027551651000976562, -0.025970458984375, -0.024389266967773438, -0.022808074951171875, -0.021226882934570312, -0.01964569091796875, -0.018064498901367188, -0.016483306884765625, -0.014902114868164062, -0.0133209228515625, -0.011739730834960938, -0.010158538818359375, -0.008577346801757812, -0.00699615478515625, -0.0054149627685546875, -0.003833770751953125, -0.0022525787353515625, -0.00067138671875, 0.0009098052978515625, 0.002490997314453125, 0.0040721893310546875, 0.00565338134765625, 0.0072345733642578125, 0.008815765380859375, 0.010396957397460938, 0.0119781494140625, 0.013559341430664062, 0.015140533447265625, 0.016721725463867188, 0.01830291748046875, 0.019884109497070312, 0.021465301513671875, 0.023046493530273438, 0.024627685546875, 0.026208877563476562, 0.027790069580078125, 0.029371261596679688, 0.03095245361328125, 0.03253364562988281, 0.034114837646484375, 0.03569602966308594, 0.0372772216796875, 0.03885841369628906, 0.040439605712890625, 0.04202079772949219, 0.04360198974609375, 0.04518318176269531, 0.046764373779296875, 0.04834556579589844, 0.0499267578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 0.0, 5.0, 7.0, 12.0, 17.0, 11.0, 22.0, 29.0, 47.0, 67.0, 80.0, 69.0, 106.0, 98.0, 98.0, 87.0, 54.0, 51.0, 39.0, 16.0, 20.0, 20.0, 12.0, 7.0, 8.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01157379150390625, -0.011160612106323242, -0.010747432708740234, -0.010334253311157227, -0.009921073913574219, -0.009507894515991211, -0.009094715118408203, -0.008681535720825195, -0.008268356323242188, -0.00785517692565918, -0.007441997528076172, -0.007028818130493164, -0.006615638732910156, -0.0062024593353271484, -0.005789279937744141, -0.005376100540161133, -0.004962921142578125, -0.004549741744995117, -0.004136562347412109, -0.0037233829498291016, -0.0033102035522460938, -0.002897024154663086, -0.002483844757080078, -0.0020706653594970703, -0.0016574859619140625, -0.0012443065643310547, -0.0008311271667480469, -0.00041794776916503906, -4.76837158203125e-06, 0.00040841102600097656, 0.0008215904235839844, 0.0012347698211669922, 0.00164794921875, 0.002061128616333008, 0.0024743080139160156, 0.0028874874114990234, 0.0033006668090820312, 0.003713846206665039, 0.004127025604248047, 0.004540205001831055, 0.0049533843994140625, 0.00536656379699707, 0.005779743194580078, 0.006192922592163086, 0.006606101989746094, 0.0070192813873291016, 0.007432460784912109, 0.007845640182495117, 0.008258819580078125, 0.008671998977661133, 0.00908517837524414, 0.009498357772827148, 0.009911537170410156, 0.010324716567993164, 0.010737895965576172, 0.01115107536315918, 0.011564254760742188, 0.011977434158325195, 0.012390613555908203, 0.012803792953491211, 0.013216972351074219, 0.013630151748657227, 0.014043331146240234, 0.014456510543823242, 0.01486968994140625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 16.0, 21.0, 37.0, 51.0, 66.0, 109.0, 117.0, 144.0, 127.0, 83.0, 65.0, 34.0, 34.0, 24.0, 14.0, 11.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29080694913864136, -0.2751384973526001, -0.2594700753688812, -0.24380162358283997, -0.2281331717967987, -0.21246473491191864, -0.19679629802703857, -0.18112784624099731, -0.16545940935611725, -0.14979097247123718, -0.13412252068519592, -0.11845408380031586, -0.1027856394648552, -0.08711719512939453, -0.07144875824451447, -0.0557803139090538, -0.04011186957359314, -0.024443427100777626, -0.008774984627962112, 0.006893455982208252, 0.022561900317668915, 0.03823034465312958, 0.053898781538009644, 0.0695672258734703, 0.08523567020893097, 0.10090411454439163, 0.1165725588798523, 0.13224099576473236, 0.14790943264961243, 0.1635778844356537, 0.17924632132053375, 0.19491475820541382, 0.21058320999145508, 0.22625164687633514, 0.2419200986623764, 0.25758853554725647, 0.27325698733329773, 0.2889254093170166, 0.30459386110305786, 0.3202623128890991, 0.3359307646751404, 0.35159921646118164, 0.3672676384449005, 0.3829360902309418, 0.39860454201698303, 0.4142729640007019, 0.42994141578674316, 0.4456098675727844, 0.4612782895565033, 0.47694674134254456, 0.4926151633262634, 0.5082836151123047, 0.523952066898346, 0.5396205186843872, 0.5552889108657837, 0.570957362651825, 0.5866258144378662, 0.6022942662239075, 0.6179627180099487, 0.6336311101913452, 0.6492995619773865, 0.6649680137634277, 0.680636465549469, 0.6963049173355103, 0.7119733691215515]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 11.0, 5.0, 11.0, 7.0, 15.0, 14.0, 13.0, 23.0, 20.0, 20.0, 36.0, 30.0, 25.0, 36.0, 30.0, 39.0, 45.0, 50.0, 37.0, 46.0, 47.0, 42.0, 46.0, 42.0, 35.0, 31.0, 32.0, 35.0, 22.0, 17.0, 22.0, 15.0, 13.0, 19.0, 14.0, 7.0, 10.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.22526301443576813, -0.21805152297019958, -0.21084003150463104, -0.2036285400390625, -0.19641704857349396, -0.18920555710792542, -0.18199406564235687, -0.17478257417678833, -0.1675710827112198, -0.16035959124565125, -0.1531480997800827, -0.14593660831451416, -0.13872511684894562, -0.13151362538337708, -0.12430213391780853, -0.11709064245223999, -0.10987914353609085, -0.10266765207052231, -0.09545616060495377, -0.08824466913938522, -0.08103317767381668, -0.07382167875766754, -0.066610187292099, -0.059398699551820755, -0.05218720808625221, -0.04497571662068367, -0.03776422515511513, -0.030552731826901436, -0.023341240361332893, -0.0161297470331192, -0.00891825556755066, -0.0017067641019821167, 0.005504727363586426, 0.012716218829154968, 0.01992771029472351, 0.027139203622937202, 0.034350693225860596, 0.04156218841671944, 0.04877367988228798, 0.05598517134785652, 0.06319665908813477, 0.07040815055370331, 0.07761964201927185, 0.0848311334848404, 0.09204262495040894, 0.09925411641597748, 0.10646560788154602, 0.11367709934711456, 0.1208885982632637, 0.12810009717941284, 0.13531158864498138, 0.14252308011054993, 0.14973457157611847, 0.156946063041687, 0.16415755450725555, 0.1713690459728241, 0.17858053743839264, 0.18579202890396118, 0.19300352036952972, 0.20021501183509827, 0.2074265033006668, 0.21463799476623535, 0.2218494862318039, 0.22906097769737244, 0.23627246916294098]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 13.0, 6.0, 23.0, 31.0, 33.0, 54.0, 70.0, 104.0, 158.0, 222.0, 308.0, 470.0, 646.0, 903.0, 1384.0, 2075.0, 3486.0, 6072.0, 11691.0, 27449.0, 97874.0, 532848.0, 272007.0, 50894.0, 18298.0, 8474.0, 4674.0, 2746.0, 1745.0, 1222.0, 790.0, 514.0, 370.0, 291.0, 190.0, 112.0, 92.0, 62.0, 48.0, 40.0, 20.0, 13.0, 8.0, 10.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.380859375, -0.36887359619140625, -0.3568878173828125, -0.34490203857421875, -0.332916259765625, -0.32093048095703125, -0.3089447021484375, -0.29695892333984375, -0.28497314453125, -0.27298736572265625, -0.2610015869140625, -0.24901580810546875, -0.237030029296875, -0.22504425048828125, -0.2130584716796875, -0.20107269287109375, -0.1890869140625, -0.17710113525390625, -0.1651153564453125, -0.15312957763671875, -0.141143798828125, -0.12915802001953125, -0.1171722412109375, -0.10518646240234375, -0.09320068359375, -0.08121490478515625, -0.0692291259765625, -0.05724334716796875, -0.045257568359375, -0.03327178955078125, -0.0212860107421875, -0.00930023193359375, 0.002685546875, 0.01467132568359375, 0.0266571044921875, 0.03864288330078125, 0.050628662109375, 0.06261444091796875, 0.0746002197265625, 0.08658599853515625, 0.09857177734375, 0.11055755615234375, 0.1225433349609375, 0.13452911376953125, 0.146514892578125, 0.15850067138671875, 0.1704864501953125, 0.18247222900390625, 0.1944580078125, 0.20644378662109375, 0.2184295654296875, 0.23041534423828125, 0.242401123046875, 0.25438690185546875, 0.2663726806640625, 0.27835845947265625, 0.29034423828125, 0.30233001708984375, 0.3143157958984375, 0.32630157470703125, 0.338287353515625, 0.35027313232421875, 0.3622589111328125, 0.37424468994140625, 0.38623046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 5.0, 4.0, 6.0, 11.0, 7.0, 13.0, 13.0, 11.0, 17.0, 18.0, 21.0, 30.0, 27.0, 42.0, 27.0, 33.0, 52.0, 45.0, 47.0, 50.0, 63.0, 58.0, 53.0, 44.0, 44.0, 37.0, 45.0, 22.0, 27.0, 22.0, 17.0, 17.0, 17.0, 7.0, 14.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.51904296875, -0.50274658203125, -0.4864501953125, -0.47015380859375, -0.453857421875, -0.43756103515625, -0.4212646484375, -0.40496826171875, -0.388671875, -0.37237548828125, -0.3560791015625, -0.33978271484375, -0.323486328125, -0.30718994140625, -0.2908935546875, -0.27459716796875, -0.25830078125, -0.24200439453125, -0.2257080078125, -0.20941162109375, -0.193115234375, -0.17681884765625, -0.1605224609375, -0.14422607421875, -0.1279296875, -0.11163330078125, -0.0953369140625, -0.07904052734375, -0.062744140625, -0.04644775390625, -0.0301513671875, -0.01385498046875, 0.00244140625, 0.01873779296875, 0.0350341796875, 0.05133056640625, 0.067626953125, 0.08392333984375, 0.1002197265625, 0.11651611328125, 0.1328125, 0.14910888671875, 0.1654052734375, 0.18170166015625, 0.197998046875, 0.21429443359375, 0.2305908203125, 0.24688720703125, 0.26318359375, 0.27947998046875, 0.2957763671875, 0.31207275390625, 0.328369140625, 0.34466552734375, 0.3609619140625, 0.37725830078125, 0.3935546875, 0.40985107421875, 0.4261474609375, 0.44244384765625, 0.458740234375, 0.47503662109375, 0.4913330078125, 0.50762939453125, 0.52392578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 6.0, 12.0, 14.0, 20.0, 30.0, 35.0, 57.0, 78.0, 120.0, 184.0, 271.0, 455.0, 758.0, 1197.0, 2248.0, 4489.0, 11162.0, 36269.0, 368770.0, 553036.0, 45618.0, 12710.0, 5146.0, 2393.0, 1413.0, 737.0, 447.0, 268.0, 182.0, 141.0, 92.0, 66.0, 55.0, 26.0, 10.0, 13.0, 11.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.5050888061523438, -0.4877166748046875, -0.47034454345703125, -0.452972412109375, -0.43560028076171875, -0.4182281494140625, -0.40085601806640625, -0.38348388671875, -0.36611175537109375, -0.3487396240234375, -0.33136749267578125, -0.313995361328125, -0.29662322998046875, -0.2792510986328125, -0.26187896728515625, -0.2445068359375, -0.22713470458984375, -0.2097625732421875, -0.19239044189453125, -0.175018310546875, -0.15764617919921875, -0.1402740478515625, -0.12290191650390625, -0.10552978515625, -0.08815765380859375, -0.0707855224609375, -0.05341339111328125, -0.036041259765625, -0.01866912841796875, -0.0012969970703125, 0.01607513427734375, 0.033447265625, 0.05081939697265625, 0.0681915283203125, 0.08556365966796875, 0.102935791015625, 0.12030792236328125, 0.1376800537109375, 0.15505218505859375, 0.17242431640625, 0.18979644775390625, 0.2071685791015625, 0.22454071044921875, 0.241912841796875, 0.25928497314453125, 0.2766571044921875, 0.29402923583984375, 0.3114013671875, 0.32877349853515625, 0.3461456298828125, 0.36351776123046875, 0.380889892578125, 0.39826202392578125, 0.4156341552734375, 0.43300628662109375, 0.45037841796875, 0.46775054931640625, 0.4851226806640625, 0.5024948120117188, 0.519866943359375, 0.5372390747070312, 0.5546112060546875, 0.5719833374023438, 0.58935546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 5.0, 5.0, 10.0, 6.0, 10.0, 12.0, 14.0, 12.0, 15.0, 19.0, 31.0, 32.0, 20.0, 37.0, 49.0, 42.0, 49.0, 71.0, 54.0, 47.0, 46.0, 55.0, 42.0, 44.0, 41.0, 37.0, 34.0, 34.0, 27.0, 15.0, 17.0, 14.0, 9.0, 10.0, 12.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.493408203125, -0.4746284484863281, -0.45584869384765625, -0.4370689392089844, -0.4182891845703125, -0.3995094299316406, -0.38072967529296875, -0.3619499206542969, -0.343170166015625, -0.3243904113769531, -0.30561065673828125, -0.2868309020996094, -0.2680511474609375, -0.24927139282226562, -0.23049163818359375, -0.21171188354492188, -0.19293212890625, -0.17415237426757812, -0.15537261962890625, -0.13659286499023438, -0.1178131103515625, -0.09903335571289062, -0.08025360107421875, -0.061473846435546875, -0.042694091796875, -0.023914337158203125, -0.00513458251953125, 0.013645172119140625, 0.0324249267578125, 0.051204681396484375, 0.06998443603515625, 0.08876419067382812, 0.1075439453125, 0.12632369995117188, 0.14510345458984375, 0.16388320922851562, 0.1826629638671875, 0.20144271850585938, 0.22022247314453125, 0.23900222778320312, 0.257781982421875, 0.2765617370605469, 0.29534149169921875, 0.3141212463378906, 0.3329010009765625, 0.3516807556152344, 0.37046051025390625, 0.3892402648925781, 0.40802001953125, 0.4267997741699219, 0.44557952880859375, 0.4643592834472656, 0.4831390380859375, 0.5019187927246094, 0.5206985473632812, 0.5394783020019531, 0.558258056640625, 0.5770378112792969, 0.5958175659179688, 0.6145973205566406, 0.6333770751953125, 0.6521568298339844, 0.6709365844726562, 0.6897163391113281, 0.70849609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 8.0, 17.0, 23.0, 23.0, 39.0, 63.0, 91.0, 166.0, 244.0, 488.0, 1070.0, 2487.0, 7196.0, 38149.0, 629945.0, 336867.0, 22535.0, 5239.0, 1925.0, 860.0, 468.0, 227.0, 150.0, 85.0, 43.0, 39.0, 28.0, 19.0, 12.0, 11.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.1487751007080078, -0.14410781860351562, -0.13944053649902344, -0.13477325439453125, -0.13010597229003906, -0.12543869018554688, -0.12077140808105469, -0.1161041259765625, -0.11143684387207031, -0.10676956176757812, -0.10210227966308594, -0.09743499755859375, -0.09276771545410156, -0.08810043334960938, -0.08343315124511719, -0.078765869140625, -0.07409858703613281, -0.06943130493164062, -0.06476402282714844, -0.06009674072265625, -0.05542945861816406, -0.050762176513671875, -0.04609489440917969, -0.0414276123046875, -0.03676033020019531, -0.032093048095703125, -0.027425765991210938, -0.02275848388671875, -0.018091201782226562, -0.013423919677734375, -0.008756637573242188, -0.00408935546875, 0.0005779266357421875, 0.005245208740234375, 0.009912490844726562, 0.01457977294921875, 0.019247055053710938, 0.023914337158203125, 0.028581619262695312, 0.0332489013671875, 0.03791618347167969, 0.042583465576171875, 0.04725074768066406, 0.05191802978515625, 0.05658531188964844, 0.061252593994140625, 0.06591987609863281, 0.070587158203125, 0.07525444030761719, 0.07992172241210938, 0.08458900451660156, 0.08925628662109375, 0.09392356872558594, 0.09859085083007812, 0.10325813293457031, 0.1079254150390625, 0.11259269714355469, 0.11725997924804688, 0.12192726135253906, 0.12659454345703125, 0.13126182556152344, 0.13592910766601562, 0.1405963897705078, 0.145263671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 13.0, 22.0, 29.0, 37.0, 42.0, 77.0, 137.0, 151.0, 153.0, 102.0, 72.0, 56.0, 33.0, 23.0, 5.0, 8.0, 6.0, 12.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3663043975830078e-05, -2.2984109818935394e-05, -2.230517566204071e-05, -2.1626241505146027e-05, -2.0947307348251343e-05, -2.026837319135666e-05, -1.9589439034461975e-05, -1.891050487756729e-05, -1.8231570720672607e-05, -1.7552636563777924e-05, -1.687370240688324e-05, -1.6194768249988556e-05, -1.5515834093093872e-05, -1.4836899936199188e-05, -1.4157965779304504e-05, -1.347903162240982e-05, -1.2800097465515137e-05, -1.2121163308620453e-05, -1.1442229151725769e-05, -1.0763294994831085e-05, -1.0084360837936401e-05, -9.405426681041718e-06, -8.726492524147034e-06, -8.04755836725235e-06, -7.368624210357666e-06, -6.689690053462982e-06, -6.010755896568298e-06, -5.3318217396736145e-06, -4.652887582778931e-06, -3.973953425884247e-06, -3.295019268989563e-06, -2.616085112094879e-06, -1.9371509552001953e-06, -1.2582167983055115e-06, -5.792826414108276e-07, 9.96515154838562e-08, 7.7858567237854e-07, 1.4575198292732239e-06, 2.1364539861679077e-06, 2.8153881430625916e-06, 3.4943222999572754e-06, 4.173256456851959e-06, 4.852190613746643e-06, 5.531124770641327e-06, 6.210058927536011e-06, 6.888993084430695e-06, 7.567927241325378e-06, 8.246861398220062e-06, 8.925795555114746e-06, 9.60472971200943e-06, 1.0283663868904114e-05, 1.0962598025798798e-05, 1.1641532182693481e-05, 1.2320466339588165e-05, 1.2999400496482849e-05, 1.3678334653377533e-05, 1.4357268810272217e-05, 1.50362029671669e-05, 1.5715137124061584e-05, 1.639407128095627e-05, 1.7073005437850952e-05, 1.7751939594745636e-05, 1.843087375164032e-05, 1.9109807908535004e-05, 1.9788742065429688e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 11.0, 9.0, 26.0, 38.0, 61.0, 86.0, 146.0, 197.0, 406.0, 900.0, 2315.0, 6865.0, 28628.0, 309478.0, 627044.0, 56170.0, 10466.0, 3209.0, 1249.0, 486.0, 312.0, 158.0, 101.0, 57.0, 39.0, 28.0, 13.0, 12.0, 10.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1510009765625, -0.14615631103515625, -0.1413116455078125, -0.13646697998046875, -0.131622314453125, -0.12677764892578125, -0.1219329833984375, -0.11708831787109375, -0.11224365234375, -0.10739898681640625, -0.1025543212890625, -0.09770965576171875, -0.092864990234375, -0.08802032470703125, -0.0831756591796875, -0.07833099365234375, -0.073486328125, -0.06864166259765625, -0.0637969970703125, -0.05895233154296875, -0.054107666015625, -0.04926300048828125, -0.0444183349609375, -0.03957366943359375, -0.03472900390625, -0.02988433837890625, -0.0250396728515625, -0.02019500732421875, -0.015350341796875, -0.01050567626953125, -0.0056610107421875, -0.00081634521484375, 0.0040283203125, 0.00887298583984375, 0.0137176513671875, 0.01856231689453125, 0.023406982421875, 0.02825164794921875, 0.0330963134765625, 0.03794097900390625, 0.04278564453125, 0.04763031005859375, 0.0524749755859375, 0.05731964111328125, 0.062164306640625, 0.06700897216796875, 0.0718536376953125, 0.07669830322265625, 0.08154296875, 0.08638763427734375, 0.0912322998046875, 0.09607696533203125, 0.100921630859375, 0.10576629638671875, 0.1106109619140625, 0.11545562744140625, 0.12030029296875, 0.12514495849609375, 0.1299896240234375, 0.13483428955078125, 0.139678955078125, 0.14452362060546875, 0.1493682861328125, 0.15421295166015625, 0.1590576171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 13.0, 20.0, 18.0, 31.0, 41.0, 56.0, 83.0, 97.0, 135.0, 135.0, 85.0, 74.0, 59.0, 43.0, 30.0, 17.0, 14.0, 11.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06939697265625, -0.06728458404541016, -0.06517219543457031, -0.06305980682373047, -0.060947418212890625, -0.05883502960205078, -0.05672264099121094, -0.054610252380371094, -0.05249786376953125, -0.050385475158691406, -0.04827308654785156, -0.04616069793701172, -0.044048309326171875, -0.04193592071533203, -0.03982353210449219, -0.037711143493652344, -0.0355987548828125, -0.033486366271972656, -0.03137397766113281, -0.02926158905029297, -0.027149200439453125, -0.02503681182861328, -0.022924423217773438, -0.020812034606933594, -0.01869964599609375, -0.016587257385253906, -0.014474868774414062, -0.012362480163574219, -0.010250091552734375, -0.008137702941894531, -0.0060253143310546875, -0.003912925720214844, -0.001800537109375, 0.00031185150146484375, 0.0024242401123046875, 0.004536628723144531, 0.006649017333984375, 0.008761405944824219, 0.010873794555664062, 0.012986183166503906, 0.01509857177734375, 0.017210960388183594, 0.019323348999023438, 0.02143573760986328, 0.023548126220703125, 0.02566051483154297, 0.027772903442382812, 0.029885292053222656, 0.0319976806640625, 0.034110069274902344, 0.03622245788574219, 0.03833484649658203, 0.040447235107421875, 0.04255962371826172, 0.04467201232910156, 0.046784400939941406, 0.04889678955078125, 0.051009178161621094, 0.05312156677246094, 0.05523395538330078, 0.057346343994140625, 0.05945873260498047, 0.06157112121582031, 0.06368350982666016, 0.0657958984375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 11.0, 27.0, 46.0, 71.0, 87.0, 118.0, 135.0, 150.0, 104.0, 80.0, 52.0, 38.0, 24.0, 21.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1682071685791016, -1.131699800491333, -1.095192313194275, -1.0586849451065063, -1.0221774578094482, -0.9856700897216797, -0.9491627216339111, -0.9126552939414978, -0.8761478662490845, -0.8396404385566711, -0.8031330108642578, -0.7666256427764893, -0.7301182150840759, -0.6936107873916626, -0.657103419303894, -0.6205959916114807, -0.5840885639190674, -0.547581136226654, -0.5110737085342407, -0.47456634044647217, -0.43805891275405884, -0.4015514850616455, -0.36504408717155457, -0.3285366892814636, -0.2920292615890503, -0.25552183389663696, -0.21901443600654602, -0.18250702321529388, -0.14599961042404175, -0.10949219763278961, -0.07298478484153748, -0.03647738695144653, 2.9921531677246094e-05, 0.03653733432292938, 0.07304474711418152, 0.10955215990543365, 0.1460595726966858, 0.18256698548793793, 0.21907439827919006, 0.255581796169281, 0.29208922386169434, 0.32859665155410767, 0.3651040494441986, 0.40161144733428955, 0.4381188750267029, 0.4746263027191162, 0.5111336708068848, 0.5476410984992981, 0.5841485261917114, 0.6206559538841248, 0.6571633815765381, 0.6936707496643066, 0.73017817735672, 0.7666856050491333, 0.8031929731369019, 0.8397004008293152, 0.8762078285217285, 0.9127152562141418, 0.9492226839065552, 0.9857300519943237, 1.0222375392913818, 1.0587449073791504, 1.095252275466919, 1.1317596435546875, 1.1682671308517456]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 8.0, 7.0, 6.0, 3.0, 11.0, 8.0, 11.0, 10.0, 19.0, 16.0, 22.0, 18.0, 30.0, 24.0, 40.0, 37.0, 38.0, 41.0, 39.0, 45.0, 51.0, 39.0, 42.0, 53.0, 36.0, 37.0, 39.0, 36.0, 40.0, 28.0, 24.0, 20.0, 26.0, 25.0, 12.0, 18.0, 14.0, 4.0, 13.0, 7.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9341480731964111, -0.9063374400138855, -0.8785267472267151, -0.8507161140441895, -0.822905421257019, -0.7950947880744934, -0.7672841548919678, -0.7394734621047974, -0.711662769317627, -0.6838521361351013, -0.6560414433479309, -0.6282308101654053, -0.6004201173782349, -0.5726094841957092, -0.5447988510131836, -0.5169881582260132, -0.48917752504348755, -0.4613668620586395, -0.4335561990737915, -0.40574556589126587, -0.37793487310409546, -0.3501242399215698, -0.3223135769367218, -0.2945029139518738, -0.26669225096702576, -0.23888158798217773, -0.2110709249973297, -0.18326027691364288, -0.15544961392879486, -0.12763895094394684, -0.09982830286026001, -0.07201763987541199, -0.044206976890563965, -0.01639631763100624, 0.011414341628551483, 0.03922499716281891, 0.06703566014766693, 0.09484632313251495, 0.12265697121620178, 0.1504676342010498, 0.17827829718589783, 0.20608896017074585, 0.23389962315559387, 0.2617102861404419, 0.28952091932296753, 0.31733161211013794, 0.3451422452926636, 0.3729529082775116, 0.4007635712623596, 0.42857423424720764, 0.45638489723205566, 0.4841955304145813, 0.5120062232017517, 0.5398168563842773, 0.5676275491714478, 0.5954381823539734, 0.623248815536499, 0.6510594487190247, 0.6788701415061951, 0.7066807746887207, 0.7344914674758911, 0.7623021006584167, 0.7901127338409424, 0.8179234266281128, 0.8457341194152832]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 7.0, 12.0, 18.0, 13.0, 45.0, 51.0, 74.0, 109.0, 153.0, 228.0, 336.0, 499.0, 748.0, 1217.0, 2328.0, 5336.0, 20928.0, 502871.0, 3519834.0, 120079.0, 11352.0, 3638.0, 1613.0, 929.0, 604.0, 393.0, 250.0, 192.0, 134.0, 95.0, 53.0, 48.0, 40.0, 15.0, 11.0, 15.0, 8.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84130859375, -0.815277099609375, -0.78924560546875, -0.763214111328125, -0.7371826171875, -0.711151123046875, -0.68511962890625, -0.659088134765625, -0.633056640625, -0.607025146484375, -0.58099365234375, -0.554962158203125, -0.5289306640625, -0.502899169921875, -0.47686767578125, -0.450836181640625, -0.4248046875, -0.398773193359375, -0.37274169921875, -0.346710205078125, -0.3206787109375, -0.294647216796875, -0.26861572265625, -0.242584228515625, -0.216552734375, -0.190521240234375, -0.16448974609375, -0.138458251953125, -0.1124267578125, -0.086395263671875, -0.06036376953125, -0.034332275390625, -0.00830078125, 0.017730712890625, 0.04376220703125, 0.069793701171875, 0.0958251953125, 0.121856689453125, 0.14788818359375, 0.173919677734375, 0.199951171875, 0.225982666015625, 0.25201416015625, 0.278045654296875, 0.3040771484375, 0.330108642578125, 0.35614013671875, 0.382171630859375, 0.408203125, 0.434234619140625, 0.46026611328125, 0.486297607421875, 0.5123291015625, 0.538360595703125, 0.56439208984375, 0.590423583984375, 0.616455078125, 0.642486572265625, 0.66851806640625, 0.694549560546875, 0.7205810546875, 0.746612548828125, 0.77264404296875, 0.798675537109375, 0.82470703125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 9.0, 3.0, 3.0, 10.0, 8.0, 9.0, 20.0, 20.0, 16.0, 17.0, 29.0, 30.0, 20.0, 31.0, 33.0, 47.0, 42.0, 39.0, 35.0, 48.0, 55.0, 52.0, 45.0, 45.0, 34.0, 41.0, 38.0, 30.0, 30.0, 36.0, 23.0, 22.0, 14.0, 14.0, 12.0, 8.0, 13.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2408447265625, -0.23314857482910156, -0.22545242309570312, -0.2177562713623047, -0.21006011962890625, -0.2023639678955078, -0.19466781616210938, -0.18697166442871094, -0.1792755126953125, -0.17157936096191406, -0.16388320922851562, -0.1561870574951172, -0.14849090576171875, -0.1407947540283203, -0.13309860229492188, -0.12540245056152344, -0.117706298828125, -0.11001014709472656, -0.10231399536132812, -0.09461784362792969, -0.08692169189453125, -0.07922554016113281, -0.07152938842773438, -0.06383323669433594, -0.0561370849609375, -0.04844093322753906, -0.040744781494140625, -0.03304862976074219, -0.02535247802734375, -0.017656326293945312, -0.009960174560546875, -0.0022640228271484375, 0.00543212890625, 0.013128280639648438, 0.020824432373046875, 0.028520584106445312, 0.03621673583984375, 0.04391288757324219, 0.051609039306640625, 0.05930519104003906, 0.0670013427734375, 0.07469749450683594, 0.08239364624023438, 0.09008979797363281, 0.09778594970703125, 0.10548210144042969, 0.11317825317382812, 0.12087440490722656, 0.128570556640625, 0.13626670837402344, 0.14396286010742188, 0.1516590118408203, 0.15935516357421875, 0.1670513153076172, 0.17474746704101562, 0.18244361877441406, 0.1901397705078125, 0.19783592224121094, 0.20553207397460938, 0.2132282257080078, 0.22092437744140625, 0.2286205291748047, 0.23631668090820312, 0.24401283264160156, 0.251708984375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 3.0, 2.0, 4.0, 12.0, 8.0, 13.0, 8.0, 15.0, 38.0, 65.0, 97.0, 193.0, 451.0, 1139.0, 3539.0, 13838.0, 172799.0, 3868279.0, 117110.0, 11634.0, 3143.0, 1027.0, 401.0, 202.0, 83.0, 58.0, 38.0, 23.0, 14.0, 7.0, 16.0, 5.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7308502197265625, -0.700958251953125, -0.6710662841796875, -0.64117431640625, -0.6112823486328125, -0.581390380859375, -0.5514984130859375, -0.5216064453125, -0.4917144775390625, -0.461822509765625, -0.4319305419921875, -0.40203857421875, -0.3721466064453125, -0.342254638671875, -0.3123626708984375, -0.282470703125, -0.2525787353515625, -0.222686767578125, -0.1927947998046875, -0.16290283203125, -0.1330108642578125, -0.103118896484375, -0.0732269287109375, -0.0433349609375, -0.0134429931640625, 0.016448974609375, 0.0463409423828125, 0.07623291015625, 0.1061248779296875, 0.136016845703125, 0.1659088134765625, 0.19580078125, 0.2256927490234375, 0.255584716796875, 0.2854766845703125, 0.31536865234375, 0.3452606201171875, 0.375152587890625, 0.4050445556640625, 0.4349365234375, 0.4648284912109375, 0.494720458984375, 0.5246124267578125, 0.55450439453125, 0.5843963623046875, 0.614288330078125, 0.6441802978515625, 0.674072265625, 0.7039642333984375, 0.733856201171875, 0.7637481689453125, 0.79364013671875, 0.8235321044921875, 0.853424072265625, 0.8833160400390625, 0.9132080078125, 0.9430999755859375, 0.972991943359375, 1.0028839111328125, 1.03277587890625, 1.0626678466796875, 1.092559814453125, 1.1224517822265625, 1.15234375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 6.0, 1.0, 9.0, 11.0, 18.0, 15.0, 27.0, 50.0, 67.0, 117.0, 216.0, 330.0, 543.0, 746.0, 682.0, 485.0, 287.0, 157.0, 97.0, 54.0, 41.0, 23.0, 23.0, 13.0, 13.0, 5.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.197998046875, -0.1923084259033203, -0.18661880493164062, -0.18092918395996094, -0.17523956298828125, -0.16954994201660156, -0.16386032104492188, -0.1581707000732422, -0.1524810791015625, -0.1467914581298828, -0.14110183715820312, -0.13541221618652344, -0.12972259521484375, -0.12403297424316406, -0.11834335327148438, -0.11265373229980469, -0.106964111328125, -0.10127449035644531, -0.09558486938476562, -0.08989524841308594, -0.08420562744140625, -0.07851600646972656, -0.07282638549804688, -0.06713676452636719, -0.0614471435546875, -0.05575752258300781, -0.050067901611328125, -0.04437828063964844, -0.03868865966796875, -0.03299903869628906, -0.027309417724609375, -0.021619796752929688, -0.01593017578125, -0.010240554809570312, -0.004550933837890625, 0.0011386871337890625, 0.00682830810546875, 0.012517929077148438, 0.018207550048828125, 0.023897171020507812, 0.0295867919921875, 0.03527641296386719, 0.040966033935546875, 0.04665565490722656, 0.05234527587890625, 0.05803489685058594, 0.06372451782226562, 0.06941413879394531, 0.075103759765625, 0.08079338073730469, 0.08648300170898438, 0.09217262268066406, 0.09786224365234375, 0.10355186462402344, 0.10924148559570312, 0.11493110656738281, 0.1206207275390625, 0.1263103485107422, 0.13199996948242188, 0.13768959045410156, 0.14337921142578125, 0.14906883239746094, 0.15475845336914062, 0.1604480743408203, 0.1661376953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 18.0, 17.0, 25.0, 23.0, 53.0, 50.0, 60.0, 61.0, 61.0, 70.0, 66.0, 71.0, 48.0, 57.0, 49.0, 54.0, 46.0, 25.0, 24.0, 23.0, 26.0, 17.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.5131106376647949, -0.4995444715023041, -0.48597827553749084, -0.472412109375, -0.45884591341018677, -0.4452797472476959, -0.4317135810852051, -0.41814738512039185, -0.404581218957901, -0.39101505279541016, -0.3774488568305969, -0.3638826906681061, -0.35031652450561523, -0.336750328540802, -0.32318416237831116, -0.3096179962158203, -0.2960518002510071, -0.28248563408851624, -0.268919438123703, -0.25535327196121216, -0.24178709089756012, -0.22822090983390808, -0.21465474367141724, -0.2010885626077652, -0.18752238154411316, -0.17395620048046112, -0.16039001941680908, -0.14682385325431824, -0.1332576721906662, -0.11969149112701416, -0.10612531751394272, -0.09255914390087128, -0.07899293303489685, -0.06542675197124481, -0.05186057835817337, -0.03829440101981163, -0.02472822368144989, -0.011162042617797852, 0.00240413099527359, 0.015970304608345032, 0.02953648567199707, 0.04310266301035881, 0.05666884034872055, 0.07023501396179199, 0.08380119502544403, 0.09736737608909607, 0.11093354970216751, 0.12449972331523895, 0.138065904378891, 0.15163208544254303, 0.16519826650619507, 0.1787644326686859, 0.19233061373233795, 0.20589679479599, 0.21946296095848083, 0.23302914202213287, 0.2465953230857849, 0.26016148924827576, 0.273727685213089, 0.28729385137557983, 0.30086004734039307, 0.3144262135028839, 0.32799237966537476, 0.341558575630188, 0.35512474179267883]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 10.0, 4.0, 4.0, 6.0, 8.0, 14.0, 15.0, 14.0, 11.0, 26.0, 30.0, 31.0, 31.0, 35.0, 39.0, 52.0, 47.0, 52.0, 52.0, 53.0, 59.0, 35.0, 36.0, 39.0, 42.0, 30.0, 45.0, 32.0, 21.0, 26.0, 22.0, 14.0, 15.0, 14.0, 12.0, 12.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3394536077976227, -0.3283222019672394, -0.3171907961368561, -0.3060593903064728, -0.2949279844760895, -0.2837965786457062, -0.27266520261764526, -0.26153379678726196, -0.25040239095687866, -0.23927098512649536, -0.22813957929611206, -0.21700817346572876, -0.20587676763534546, -0.19474536180496216, -0.18361397087574005, -0.17248256504535675, -0.16135114431381226, -0.15021973848342896, -0.13908833265304565, -0.12795692682266235, -0.11682552844285965, -0.10569412261247635, -0.09456272423267365, -0.08343131840229034, -0.07229991257190704, -0.06116850674152374, -0.05003710463643074, -0.03890570253133774, -0.027774296700954437, -0.016642890870571136, -0.005511492490768433, 0.005619913339614868, 0.01675128936767578, 0.027882693335413933, 0.039014097303152084, 0.05014549940824509, 0.06127690523862839, 0.07240831106901169, 0.08353970944881439, 0.09467111527919769, 0.105802521109581, 0.1169339269399643, 0.1280653327703476, 0.1391967236995697, 0.150328129529953, 0.1614595353603363, 0.1725909411907196, 0.1837223470211029, 0.1948537528514862, 0.2059851586818695, 0.2171165645122528, 0.2282479703426361, 0.2393793761730194, 0.2505107820034027, 0.2616421580314636, 0.2727735638618469, 0.2839049696922302, 0.2950363755226135, 0.3061677813529968, 0.3172991871833801, 0.3284305930137634, 0.33956199884414673, 0.35069340467453003, 0.36182481050491333, 0.37295621633529663]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 10.0, 7.0, 11.0, 12.0, 23.0, 32.0, 42.0, 67.0, 85.0, 147.0, 256.0, 472.0, 883.0, 1737.0, 3631.0, 7986.0, 19089.0, 70396.0, 587810.0, 294063.0, 36669.0, 13428.0, 5974.0, 2811.0, 1317.0, 689.0, 362.0, 190.0, 115.0, 91.0, 47.0, 34.0, 18.0, 13.0, 14.0, 8.0, 9.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1552734375, -0.15081214904785156, -0.14635086059570312, -0.1418895721435547, -0.13742828369140625, -0.1329669952392578, -0.12850570678710938, -0.12404441833496094, -0.1195831298828125, -0.11512184143066406, -0.11066055297851562, -0.10619926452636719, -0.10173797607421875, -0.09727668762207031, -0.09281539916992188, -0.08835411071777344, -0.083892822265625, -0.07943153381347656, -0.07497024536132812, -0.07050895690917969, -0.06604766845703125, -0.06158638000488281, -0.057125091552734375, -0.05266380310058594, -0.0482025146484375, -0.04374122619628906, -0.039279937744140625, -0.03481864929199219, -0.03035736083984375, -0.025896072387695312, -0.021434783935546875, -0.016973495483398438, -0.01251220703125, -0.008050918579101562, -0.003589630126953125, 0.0008716583251953125, 0.00533294677734375, 0.009794235229492188, 0.014255523681640625, 0.018716812133789062, 0.0231781005859375, 0.027639389038085938, 0.032100677490234375, 0.03656196594238281, 0.04102325439453125, 0.04548454284667969, 0.049945831298828125, 0.05440711975097656, 0.058868408203125, 0.06332969665527344, 0.06779098510742188, 0.07225227355957031, 0.07671356201171875, 0.08117485046386719, 0.08563613891601562, 0.09009742736816406, 0.0945587158203125, 0.09902000427246094, 0.10348129272460938, 0.10794258117675781, 0.11240386962890625, 0.11686515808105469, 0.12132644653320312, 0.12578773498535156, 0.1302490234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 6.0, 11.0, 8.0, 21.0, 18.0, 17.0, 26.0, 26.0, 39.0, 49.0, 35.0, 39.0, 55.0, 55.0, 65.0, 52.0, 55.0, 49.0, 46.0, 37.0, 32.0, 44.0, 43.0, 21.0, 30.0, 16.0, 25.0, 6.0, 15.0, 15.0, 10.0, 12.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22044944763183594, -0.21250534057617188, -0.2045612335205078, -0.19661712646484375, -0.1886730194091797, -0.18072891235351562, -0.17278480529785156, -0.1648406982421875, -0.15689659118652344, -0.14895248413085938, -0.1410083770751953, -0.13306427001953125, -0.1251201629638672, -0.11717605590820312, -0.10923194885253906, -0.101287841796875, -0.09334373474121094, -0.08539962768554688, -0.07745552062988281, -0.06951141357421875, -0.06156730651855469, -0.053623199462890625, -0.04567909240722656, -0.0377349853515625, -0.029790878295898438, -0.021846771240234375, -0.013902664184570312, -0.00595855712890625, 0.0019855499267578125, 0.009929656982421875, 0.017873764038085938, 0.02581787109375, 0.03376197814941406, 0.041706085205078125, 0.04965019226074219, 0.05759429931640625, 0.06553840637207031, 0.07348251342773438, 0.08142662048339844, 0.0893707275390625, 0.09731483459472656, 0.10525894165039062, 0.11320304870605469, 0.12114715576171875, 0.1290912628173828, 0.13703536987304688, 0.14497947692871094, 0.152923583984375, 0.16086769104003906, 0.16881179809570312, 0.1767559051513672, 0.18470001220703125, 0.1926441192626953, 0.20058822631835938, 0.20853233337402344, 0.2164764404296875, 0.22442054748535156, 0.23236465454101562, 0.2403087615966797, 0.24825286865234375, 0.2561969757080078, 0.2641410827636719, 0.27208518981933594, 0.280029296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 5.0, 9.0, 10.0, 8.0, 20.0, 13.0, 24.0, 30.0, 59.0, 88.0, 165.0, 286.0, 547.0, 1194.0, 2559.0, 6373.0, 16952.0, 62180.0, 348113.0, 480289.0, 93299.0, 22361.0, 7772.0, 3263.0, 1420.0, 683.0, 348.0, 178.0, 107.0, 69.0, 52.0, 27.0, 15.0, 11.0, 9.0, 10.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08551025390625, -0.08257389068603516, -0.07963752746582031, -0.07670116424560547, -0.07376480102539062, -0.07082843780517578, -0.06789207458496094, -0.0649557113647461, -0.06201934814453125, -0.059082984924316406, -0.05614662170410156, -0.05321025848388672, -0.050273895263671875, -0.04733753204345703, -0.04440116882324219, -0.041464805603027344, -0.0385284423828125, -0.035592079162597656, -0.03265571594238281, -0.02971935272216797, -0.026782989501953125, -0.02384662628173828, -0.020910263061523438, -0.017973899841308594, -0.01503753662109375, -0.012101173400878906, -0.009164810180664062, -0.006228446960449219, -0.003292083740234375, -0.00035572052001953125, 0.0025806427001953125, 0.005517005920410156, 0.008453369140625, 0.011389732360839844, 0.014326095581054688, 0.01726245880126953, 0.020198822021484375, 0.02313518524169922, 0.026071548461914062, 0.029007911682128906, 0.03194427490234375, 0.034880638122558594, 0.03781700134277344, 0.04075336456298828, 0.043689727783203125, 0.04662609100341797, 0.04956245422363281, 0.052498817443847656, 0.0554351806640625, 0.058371543884277344, 0.06130790710449219, 0.06424427032470703, 0.06718063354492188, 0.07011699676513672, 0.07305335998535156, 0.0759897232055664, 0.07892608642578125, 0.0818624496459961, 0.08479881286621094, 0.08773517608642578, 0.09067153930664062, 0.09360790252685547, 0.09654426574707031, 0.09948062896728516, 0.1024169921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 9.0, 5.0, 11.0, 7.0, 12.0, 14.0, 13.0, 19.0, 14.0, 21.0, 25.0, 26.0, 39.0, 26.0, 23.0, 25.0, 44.0, 42.0, 44.0, 39.0, 45.0, 40.0, 40.0, 44.0, 37.0, 30.0, 39.0, 32.0, 26.0, 29.0, 30.0, 18.0, 20.0, 15.0, 17.0, 20.0, 10.0, 10.0, 8.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.47900390625, -0.4644317626953125, -0.449859619140625, -0.4352874755859375, -0.42071533203125, -0.4061431884765625, -0.391571044921875, -0.3769989013671875, -0.3624267578125, -0.3478546142578125, -0.333282470703125, -0.3187103271484375, -0.30413818359375, -0.2895660400390625, -0.274993896484375, -0.2604217529296875, -0.245849609375, -0.2312774658203125, -0.216705322265625, -0.2021331787109375, -0.18756103515625, -0.1729888916015625, -0.158416748046875, -0.1438446044921875, -0.1292724609375, -0.1147003173828125, -0.100128173828125, -0.0855560302734375, -0.07098388671875, -0.0564117431640625, -0.041839599609375, -0.0272674560546875, -0.0126953125, 0.0018768310546875, 0.016448974609375, 0.0310211181640625, 0.04559326171875, 0.0601654052734375, 0.074737548828125, 0.0893096923828125, 0.1038818359375, 0.1184539794921875, 0.133026123046875, 0.1475982666015625, 0.16217041015625, 0.1767425537109375, 0.191314697265625, 0.2058868408203125, 0.220458984375, 0.2350311279296875, 0.249603271484375, 0.2641754150390625, 0.27874755859375, 0.2933197021484375, 0.307891845703125, 0.3224639892578125, 0.3370361328125, 0.3516082763671875, 0.366180419921875, 0.3807525634765625, 0.39532470703125, 0.4098968505859375, 0.424468994140625, 0.4390411376953125, 0.45361328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 10.0, 15.0, 33.0, 20.0, 32.0, 58.0, 95.0, 144.0, 313.0, 490.0, 935.0, 1971.0, 5028.0, 19257.0, 352843.0, 629163.0, 27180.0, 6068.0, 2349.0, 1117.0, 610.0, 311.0, 186.0, 133.0, 55.0, 41.0, 28.0, 23.0, 5.0, 12.0, 8.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0780029296875, -0.07541084289550781, -0.07281875610351562, -0.07022666931152344, -0.06763458251953125, -0.06504249572753906, -0.062450408935546875, -0.05985832214355469, -0.0572662353515625, -0.05467414855957031, -0.052082061767578125, -0.04948997497558594, -0.04689788818359375, -0.04430580139160156, -0.041713714599609375, -0.03912162780761719, -0.036529541015625, -0.03393745422363281, -0.031345367431640625, -0.028753280639648438, -0.02616119384765625, -0.023569107055664062, -0.020977020263671875, -0.018384933471679688, -0.0157928466796875, -0.013200759887695312, -0.010608673095703125, -0.008016586303710938, -0.00542449951171875, -0.0028324127197265625, -0.000240325927734375, 0.0023517608642578125, 0.00494384765625, 0.0075359344482421875, 0.010128021240234375, 0.012720108032226562, 0.01531219482421875, 0.017904281616210938, 0.020496368408203125, 0.023088455200195312, 0.0256805419921875, 0.028272628784179688, 0.030864715576171875, 0.03345680236816406, 0.03604888916015625, 0.03864097595214844, 0.041233062744140625, 0.04382514953613281, 0.046417236328125, 0.04900932312011719, 0.051601409912109375, 0.05419349670410156, 0.05678558349609375, 0.05937767028808594, 0.061969757080078125, 0.06456184387207031, 0.0671539306640625, 0.06974601745605469, 0.07233810424804688, 0.07493019104003906, 0.07752227783203125, 0.08011436462402344, 0.08270645141601562, 0.08529853820800781, 0.087890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 13.0, 16.0, 44.0, 100.0, 220.0, 299.0, 171.0, 63.0, 30.0, 18.0, 14.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.540515899658203e-05, -3.3746473491191864e-05, -3.20877879858017e-05, -3.042910248041153e-05, -2.8770416975021362e-05, -2.7111731469631195e-05, -2.5453045964241028e-05, -2.379436045885086e-05, -2.2135674953460693e-05, -2.0476989448070526e-05, -1.881830394268036e-05, -1.715961843729019e-05, -1.5500932931900024e-05, -1.3842247426509857e-05, -1.218356192111969e-05, -1.0524876415729523e-05, -8.866190910339355e-06, -7.207505404949188e-06, -5.548819899559021e-06, -3.890134394168854e-06, -2.2314488887786865e-06, -5.727633833885193e-07, 1.085922122001648e-06, 2.744607627391815e-06, 4.403293132781982e-06, 6.06197863817215e-06, 7.720664143562317e-06, 9.379349648952484e-06, 1.1038035154342651e-05, 1.2696720659732819e-05, 1.4355406165122986e-05, 1.6014091670513153e-05, 1.767277717590332e-05, 1.9331462681293488e-05, 2.0990148186683655e-05, 2.2648833692073822e-05, 2.430751919746399e-05, 2.5966204702854156e-05, 2.7624890208244324e-05, 2.928357571363449e-05, 3.094226121902466e-05, 3.2600946724414825e-05, 3.425963222980499e-05, 3.591831773519516e-05, 3.757700324058533e-05, 3.9235688745975494e-05, 4.089437425136566e-05, 4.255305975675583e-05, 4.4211745262145996e-05, 4.587043076753616e-05, 4.752911627292633e-05, 4.91878017783165e-05, 5.0846487283706665e-05, 5.250517278909683e-05, 5.4163858294487e-05, 5.582254379987717e-05, 5.7481229305267334e-05, 5.91399148106575e-05, 6.079860031604767e-05, 6.245728582143784e-05, 6.4115971326828e-05, 6.577465683221817e-05, 6.743334233760834e-05, 6.90920278429985e-05, 7.075071334838867e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 6.0, 4.0, 8.0, 14.0, 18.0, 22.0, 33.0, 42.0, 77.0, 79.0, 113.0, 189.0, 226.0, 323.0, 463.0, 660.0, 930.0, 1336.0, 2190.0, 4135.0, 10672.0, 41017.0, 265869.0, 565822.0, 114769.0, 22345.0, 7250.0, 3375.0, 1953.0, 1307.0, 919.0, 657.0, 469.0, 334.0, 254.0, 203.0, 123.0, 100.0, 60.0, 64.0, 37.0, 25.0, 19.0, 12.0, 14.0, 6.0, 7.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0506591796875, -0.04909038543701172, -0.04752159118652344, -0.045952796936035156, -0.044384002685546875, -0.042815208435058594, -0.04124641418457031, -0.03967761993408203, -0.03810882568359375, -0.03654003143310547, -0.03497123718261719, -0.033402442932128906, -0.031833648681640625, -0.030264854431152344, -0.028696060180664062, -0.02712726593017578, -0.0255584716796875, -0.02398967742919922, -0.022420883178710938, -0.020852088928222656, -0.019283294677734375, -0.017714500427246094, -0.016145706176757812, -0.014576911926269531, -0.01300811767578125, -0.011439323425292969, -0.009870529174804688, -0.008301734924316406, -0.006732940673828125, -0.005164146423339844, -0.0035953521728515625, -0.0020265579223632812, -0.000457763671875, 0.0011110305786132812, 0.0026798248291015625, 0.004248619079589844, 0.005817413330078125, 0.007386207580566406, 0.008955001831054688, 0.010523796081542969, 0.01209259033203125, 0.013661384582519531, 0.015230178833007812, 0.016798973083496094, 0.018367767333984375, 0.019936561584472656, 0.021505355834960938, 0.02307415008544922, 0.0246429443359375, 0.02621173858642578, 0.027780532836914062, 0.029349327087402344, 0.030918121337890625, 0.032486915588378906, 0.03405570983886719, 0.03562450408935547, 0.03719329833984375, 0.03876209259033203, 0.04033088684082031, 0.041899681091308594, 0.043468475341796875, 0.045037269592285156, 0.04660606384277344, 0.04817485809326172, 0.04974365234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 11.0, 8.0, 11.0, 19.0, 39.0, 88.0, 129.0, 181.0, 173.0, 129.0, 81.0, 43.0, 25.0, 20.0, 7.0, 7.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02001953125, -0.01933145523071289, -0.01864337921142578, -0.017955303192138672, -0.017267227172851562, -0.016579151153564453, -0.015891075134277344, -0.015202999114990234, -0.014514923095703125, -0.013826847076416016, -0.013138771057128906, -0.012450695037841797, -0.011762619018554688, -0.011074542999267578, -0.010386466979980469, -0.00969839096069336, -0.00901031494140625, -0.00832223892211914, -0.007634162902832031, -0.006946086883544922, -0.0062580108642578125, -0.005569934844970703, -0.004881858825683594, -0.004193782806396484, -0.003505706787109375, -0.0028176307678222656, -0.0021295547485351562, -0.0014414787292480469, -0.0007534027099609375, -6.532669067382812e-05, 0.0006227493286132812, 0.0013108253479003906, 0.0019989013671875, 0.0026869773864746094, 0.0033750534057617188, 0.004063129425048828, 0.0047512054443359375, 0.005439281463623047, 0.006127357482910156, 0.006815433502197266, 0.007503509521484375, 0.008191585540771484, 0.008879661560058594, 0.009567737579345703, 0.010255813598632812, 0.010943889617919922, 0.011631965637207031, 0.01232004165649414, 0.01300811767578125, 0.01369619369506836, 0.014384269714355469, 0.015072345733642578, 0.015760421752929688, 0.016448497772216797, 0.017136573791503906, 0.017824649810791016, 0.018512725830078125, 0.019200801849365234, 0.019888877868652344, 0.020576953887939453, 0.021265029907226562, 0.021953105926513672, 0.02264118194580078, 0.02332925796508789, 0.024017333984375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 9.0, 9.0, 27.0, 26.0, 45.0, 45.0, 76.0, 79.0, 80.0, 66.0, 96.0, 83.0, 67.0, 61.0, 55.0, 39.0, 41.0, 23.0, 19.0, 13.0, 9.0, 6.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.41423943638801575, -0.40392085909843445, -0.39360228180885315, -0.38328373432159424, -0.37296515703201294, -0.36264657974243164, -0.35232800245285034, -0.34200942516326904, -0.33169084787368774, -0.32137227058410645, -0.31105369329452515, -0.30073514580726624, -0.29041656851768494, -0.28009799122810364, -0.26977941393852234, -0.25946083664894104, -0.24914228916168213, -0.23882371187210083, -0.22850514948368073, -0.21818657219409943, -0.20786800980567932, -0.19754943251609802, -0.18723085522651672, -0.17691227793693542, -0.16659371554851532, -0.15627513825893402, -0.14595657587051392, -0.13563799858093262, -0.12531942129135132, -0.11500085890293121, -0.10468228161334991, -0.09436371177434921, -0.08404512703418732, -0.07372655719518661, -0.06340798735618591, -0.053089410066604614, -0.04277084022760391, -0.03245227038860321, -0.02213369682431221, -0.01181512326002121, -0.0014965534210205078, 0.008822018280625343, 0.019140589982271194, 0.029459161683917046, 0.0397777333855629, 0.0500963032245636, 0.0604148767888546, 0.0707334503531456, 0.0810520201921463, 0.091370590031147, 0.1016891598701477, 0.112007737159729, 0.1223263069987297, 0.1326448768377304, 0.1429634541273117, 0.1532820165157318, 0.1636005938053131, 0.1739191710948944, 0.18423773348331451, 0.1945563107728958, 0.20487487316131592, 0.21519345045089722, 0.22551202774047852, 0.23583060503005981, 0.24614916741847992]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 7.0, 9.0, 13.0, 12.0, 7.0, 17.0, 17.0, 25.0, 23.0, 37.0, 46.0, 39.0, 48.0, 57.0, 55.0, 48.0, 60.0, 49.0, 48.0, 45.0, 39.0, 46.0, 34.0, 37.0, 35.0, 29.0, 27.0, 23.0, 12.0, 13.0, 10.0, 12.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2212778627872467, -0.2136402428150177, -0.2060026079416275, -0.1983649879693985, -0.1907273530960083, -0.1830897331237793, -0.1754521131515503, -0.1678144782781601, -0.1601768434047699, -0.1525392234325409, -0.1449015885591507, -0.1372639685869217, -0.1296263337135315, -0.12198871374130249, -0.11435108631849289, -0.10671345889568329, -0.09907583892345428, -0.09143821150064468, -0.08380058407783508, -0.07616296410560608, -0.06852532923221588, -0.06088770553469658, -0.05325008183717728, -0.045612454414367676, -0.037974826991558075, -0.030337199568748474, -0.022699574008584023, -0.015061948448419571, -0.00742432102560997, 0.00021330639719963074, 0.007850930094718933, 0.015488557517528534, 0.023126184940338135, 0.030763812363147736, 0.038401439785957336, 0.04603906348347664, 0.05367669090628624, 0.06131431832909584, 0.06895194202661514, 0.07658956944942474, 0.08422719687223434, 0.09186482429504395, 0.09950245171785355, 0.10714007914066315, 0.11477769911289215, 0.12241533398628235, 0.13005295395851135, 0.13769057393074036, 0.14532820880413055, 0.15296582877635956, 0.16060346364974976, 0.16824108362197876, 0.17587871849536896, 0.18351633846759796, 0.19115397334098816, 0.19879159331321716, 0.20642921328544617, 0.21406683325767517, 0.22170446813106537, 0.22934208810329437, 0.23697972297668457, 0.24461734294891357, 0.2522549629211426, 0.2598925828933716, 0.267530232667923]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 2.0, 2.0, 8.0, 9.0, 25.0, 18.0, 30.0, 45.0, 74.0, 101.0, 124.0, 195.0, 317.0, 456.0, 709.0, 1185.0, 1917.0, 3240.0, 5735.0, 10606.0, 21119.0, 47996.0, 134143.0, 373698.0, 282369.0, 91804.0, 35498.0, 16337.0, 8702.0, 4771.0, 2795.0, 1693.0, 1042.0, 609.0, 422.0, 243.0, 189.0, 121.0, 54.0, 52.0, 44.0, 12.0, 17.0, 10.0, 8.0, 4.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343994140625, -0.3324623107910156, -0.32093048095703125, -0.3093986511230469, -0.2978668212890625, -0.2863349914550781, -0.27480316162109375, -0.2632713317871094, -0.251739501953125, -0.24020767211914062, -0.22867584228515625, -0.21714401245117188, -0.2056121826171875, -0.19408035278320312, -0.18254852294921875, -0.17101669311523438, -0.15948486328125, -0.14795303344726562, -0.13642120361328125, -0.12488937377929688, -0.1133575439453125, -0.10182571411132812, -0.09029388427734375, -0.07876205444335938, -0.067230224609375, -0.055698394775390625, -0.04416656494140625, -0.032634735107421875, -0.0211029052734375, -0.009571075439453125, 0.00196075439453125, 0.013492584228515625, 0.0250244140625, 0.036556243896484375, 0.04808807373046875, 0.059619903564453125, 0.0711517333984375, 0.08268356323242188, 0.09421539306640625, 0.10574722290039062, 0.117279052734375, 0.12881088256835938, 0.14034271240234375, 0.15187454223632812, 0.1634063720703125, 0.17493820190429688, 0.18647003173828125, 0.19800186157226562, 0.20953369140625, 0.22106552124023438, 0.23259735107421875, 0.24412918090820312, 0.2556610107421875, 0.2671928405761719, 0.27872467041015625, 0.2902565002441406, 0.301788330078125, 0.3133201599121094, 0.32485198974609375, 0.3363838195800781, 0.3479156494140625, 0.3594474792480469, 0.37097930908203125, 0.3825111389160156, 0.39404296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 7.0, 9.0, 16.0, 15.0, 22.0, 26.0, 25.0, 26.0, 49.0, 51.0, 52.0, 77.0, 64.0, 65.0, 72.0, 67.0, 60.0, 42.0, 49.0, 44.0, 31.0, 27.0, 25.0, 21.0, 12.0, 10.0, 10.0, 9.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468505859375, -0.453826904296875, -0.43914794921875, -0.424468994140625, -0.4097900390625, -0.395111083984375, -0.38043212890625, -0.365753173828125, -0.35107421875, -0.336395263671875, -0.32171630859375, -0.307037353515625, -0.2923583984375, -0.277679443359375, -0.26300048828125, -0.248321533203125, -0.233642578125, -0.218963623046875, -0.20428466796875, -0.189605712890625, -0.1749267578125, -0.160247802734375, -0.14556884765625, -0.130889892578125, -0.1162109375, -0.101531982421875, -0.08685302734375, -0.072174072265625, -0.0574951171875, -0.042816162109375, -0.02813720703125, -0.013458251953125, 0.001220703125, 0.015899658203125, 0.03057861328125, 0.045257568359375, 0.0599365234375, 0.074615478515625, 0.08929443359375, 0.103973388671875, 0.11865234375, 0.133331298828125, 0.14801025390625, 0.162689208984375, 0.1773681640625, 0.192047119140625, 0.20672607421875, 0.221405029296875, 0.236083984375, 0.250762939453125, 0.26544189453125, 0.280120849609375, 0.2947998046875, 0.309478759765625, 0.32415771484375, 0.338836669921875, 0.353515625, 0.368194580078125, 0.38287353515625, 0.397552490234375, 0.4122314453125, 0.426910400390625, 0.44158935546875, 0.456268310546875, 0.470947265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 5.0, 5.0, 10.0, 4.0, 10.0, 15.0, 37.0, 37.0, 66.0, 74.0, 131.0, 177.0, 270.0, 381.0, 588.0, 802.0, 1319.0, 2031.0, 3282.0, 5526.0, 9507.0, 17779.0, 36688.0, 87350.0, 236334.0, 357568.0, 164127.0, 62373.0, 28025.0, 13996.0, 7706.0, 4482.0, 2712.0, 1759.0, 1090.0, 735.0, 504.0, 329.0, 221.0, 160.0, 131.0, 68.0, 44.0, 41.0, 21.0, 15.0, 11.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2743797302246094, -0.26433563232421875, -0.2542915344238281, -0.2442474365234375, -0.23420333862304688, -0.22415924072265625, -0.21411514282226562, -0.204071044921875, -0.19402694702148438, -0.18398284912109375, -0.17393875122070312, -0.1638946533203125, -0.15385055541992188, -0.14380645751953125, -0.13376235961914062, -0.12371826171875, -0.11367416381835938, -0.10363006591796875, -0.09358596801757812, -0.0835418701171875, -0.07349777221679688, -0.06345367431640625, -0.053409576416015625, -0.043365478515625, -0.033321380615234375, -0.02327728271484375, -0.013233184814453125, -0.0031890869140625, 0.006855010986328125, 0.01689910888671875, 0.026943206787109375, 0.0369873046875, 0.047031402587890625, 0.05707550048828125, 0.06711959838867188, 0.0771636962890625, 0.08720779418945312, 0.09725189208984375, 0.10729598999023438, 0.117340087890625, 0.12738418579101562, 0.13742828369140625, 0.14747238159179688, 0.1575164794921875, 0.16756057739257812, 0.17760467529296875, 0.18764877319335938, 0.19769287109375, 0.20773696899414062, 0.21778106689453125, 0.22782516479492188, 0.2378692626953125, 0.24791336059570312, 0.25795745849609375, 0.2680015563964844, 0.278045654296875, 0.2880897521972656, 0.29813385009765625, 0.3081779479980469, 0.3182220458984375, 0.3282661437988281, 0.33831024169921875, 0.3483543395996094, 0.3583984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 9.0, 7.0, 18.0, 11.0, 13.0, 12.0, 23.0, 26.0, 38.0, 30.0, 27.0, 28.0, 50.0, 46.0, 48.0, 57.0, 54.0, 49.0, 59.0, 44.0, 50.0, 42.0, 41.0, 23.0, 23.0, 24.0, 17.0, 25.0, 14.0, 15.0, 19.0, 14.0, 10.0, 7.0, 8.0, 1.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.366455078125, -0.3543052673339844, -0.34215545654296875, -0.3300056457519531, -0.3178558349609375, -0.3057060241699219, -0.29355621337890625, -0.2814064025878906, -0.269256591796875, -0.2571067810058594, -0.24495697021484375, -0.23280715942382812, -0.2206573486328125, -0.20850753784179688, -0.19635772705078125, -0.18420791625976562, -0.17205810546875, -0.15990829467773438, -0.14775848388671875, -0.13560867309570312, -0.1234588623046875, -0.11130905151367188, -0.09915924072265625, -0.08700942993164062, -0.074859619140625, -0.06270980834960938, -0.05055999755859375, -0.038410186767578125, -0.0262603759765625, -0.014110565185546875, -0.00196075439453125, 0.010189056396484375, 0.0223388671875, 0.034488677978515625, 0.04663848876953125, 0.058788299560546875, 0.0709381103515625, 0.08308792114257812, 0.09523773193359375, 0.10738754272460938, 0.119537353515625, 0.13168716430664062, 0.14383697509765625, 0.15598678588867188, 0.1681365966796875, 0.18028640747070312, 0.19243621826171875, 0.20458602905273438, 0.21673583984375, 0.22888565063476562, 0.24103546142578125, 0.2531852722167969, 0.2653350830078125, 0.2774848937988281, 0.28963470458984375, 0.3017845153808594, 0.313934326171875, 0.3260841369628906, 0.33823394775390625, 0.3503837585449219, 0.3625335693359375, 0.3746833801269531, 0.38683319091796875, 0.3989830017089844, 0.4111328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 3.0, 6.0, 11.0, 14.0, 21.0, 29.0, 40.0, 60.0, 80.0, 158.0, 203.0, 292.0, 401.0, 586.0, 828.0, 1376.0, 2376.0, 4316.0, 9881.0, 27535.0, 114496.0, 489776.0, 297924.0, 64104.0, 18075.0, 7077.0, 3465.0, 1899.0, 1104.0, 753.0, 502.0, 372.0, 235.0, 181.0, 128.0, 78.0, 52.0, 40.0, 23.0, 21.0, 15.0, 8.0, 2.0, 4.0, 10.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11944580078125, -0.1156911849975586, -0.11193656921386719, -0.10818195343017578, -0.10442733764648438, -0.10067272186279297, -0.09691810607910156, -0.09316349029541016, -0.08940887451171875, -0.08565425872802734, -0.08189964294433594, -0.07814502716064453, -0.07439041137695312, -0.07063579559326172, -0.06688117980957031, -0.0631265640258789, -0.0593719482421875, -0.055617332458496094, -0.05186271667480469, -0.04810810089111328, -0.044353485107421875, -0.04059886932373047, -0.03684425354003906, -0.033089637756347656, -0.02933502197265625, -0.025580406188964844, -0.021825790405273438, -0.01807117462158203, -0.014316558837890625, -0.010561943054199219, -0.0068073272705078125, -0.0030527114868164062, 0.000701904296875, 0.004456520080566406, 0.008211135864257812, 0.011965751647949219, 0.015720367431640625, 0.01947498321533203, 0.023229598999023438, 0.026984214782714844, 0.03073883056640625, 0.034493446350097656, 0.03824806213378906, 0.04200267791748047, 0.045757293701171875, 0.04951190948486328, 0.05326652526855469, 0.057021141052246094, 0.0607757568359375, 0.0645303726196289, 0.06828498840332031, 0.07203960418701172, 0.07579421997070312, 0.07954883575439453, 0.08330345153808594, 0.08705806732177734, 0.09081268310546875, 0.09456729888916016, 0.09832191467285156, 0.10207653045654297, 0.10583114624023438, 0.10958576202392578, 0.11334037780761719, 0.1170949935913086, 0.120849609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 8.0, 2.0, 16.0, 16.0, 23.0, 40.0, 97.0, 112.0, 217.0, 162.0, 115.0, 69.0, 52.0, 24.0, 12.0, 8.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.285573959350586e-05, -4.16608527302742e-05, -4.046596586704254e-05, -3.927107900381088e-05, -3.8076192140579224e-05, -3.6881305277347565e-05, -3.5686418414115906e-05, -3.449153155088425e-05, -3.329664468765259e-05, -3.210175782442093e-05, -3.090687096118927e-05, -2.971198409795761e-05, -2.8517097234725952e-05, -2.7322210371494293e-05, -2.6127323508262634e-05, -2.4932436645030975e-05, -2.3737549781799316e-05, -2.2542662918567657e-05, -2.1347776055336e-05, -2.015288919210434e-05, -1.895800232887268e-05, -1.7763115465641022e-05, -1.6568228602409363e-05, -1.5373341739177704e-05, -1.4178454875946045e-05, -1.2983568012714386e-05, -1.1788681149482727e-05, -1.0593794286251068e-05, -9.39890742301941e-06, -8.20402055978775e-06, -7.009133696556091e-06, -5.814246833324432e-06, -4.6193599700927734e-06, -3.4244731068611145e-06, -2.2295862436294556e-06, -1.0346993803977966e-06, 1.601874828338623e-07, 1.3550743460655212e-06, 2.54996120929718e-06, 3.744848072528839e-06, 4.939734935760498e-06, 6.134621798992157e-06, 7.329508662223816e-06, 8.524395525455475e-06, 9.719282388687134e-06, 1.0914169251918793e-05, 1.2109056115150452e-05, 1.330394297838211e-05, 1.449882984161377e-05, 1.569371670484543e-05, 1.6888603568077087e-05, 1.8083490431308746e-05, 1.9278377294540405e-05, 2.0473264157772064e-05, 2.1668151021003723e-05, 2.2863037884235382e-05, 2.405792474746704e-05, 2.52528116106987e-05, 2.644769847393036e-05, 2.7642585337162018e-05, 2.8837472200393677e-05, 3.0032359063625336e-05, 3.1227245926856995e-05, 3.2422132790088654e-05, 3.361701965332031e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 2.0, 16.0, 10.0, 11.0, 27.0, 37.0, 54.0, 76.0, 82.0, 124.0, 163.0, 218.0, 319.0, 495.0, 703.0, 1031.0, 1635.0, 2818.0, 5300.0, 12683.0, 40428.0, 194934.0, 564876.0, 163246.0, 35260.0, 11495.0, 5137.0, 2611.0, 1517.0, 912.0, 637.0, 509.0, 334.0, 240.0, 158.0, 114.0, 89.0, 69.0, 46.0, 45.0, 25.0, 14.0, 14.0, 3.0, 12.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1304931640625, -0.1262073516845703, -0.12192153930664062, -0.11763572692871094, -0.11334991455078125, -0.10906410217285156, -0.10477828979492188, -0.10049247741699219, -0.0962066650390625, -0.09192085266113281, -0.08763504028320312, -0.08334922790527344, -0.07906341552734375, -0.07477760314941406, -0.07049179077148438, -0.06620597839355469, -0.061920166015625, -0.05763435363769531, -0.053348541259765625, -0.04906272888183594, -0.04477691650390625, -0.04049110412597656, -0.036205291748046875, -0.03191947937011719, -0.0276336669921875, -0.023347854614257812, -0.019062042236328125, -0.014776229858398438, -0.01049041748046875, -0.0062046051025390625, -0.001918792724609375, 0.0023670196533203125, 0.00665283203125, 0.010938644409179688, 0.015224456787109375, 0.019510269165039062, 0.02379608154296875, 0.028081893920898438, 0.032367706298828125, 0.03665351867675781, 0.0409393310546875, 0.04522514343261719, 0.049510955810546875, 0.05379676818847656, 0.05808258056640625, 0.06236839294433594, 0.06665420532226562, 0.07094001770019531, 0.075225830078125, 0.07951164245605469, 0.08379745483398438, 0.08808326721191406, 0.09236907958984375, 0.09665489196777344, 0.10094070434570312, 0.10522651672363281, 0.1095123291015625, 0.11379814147949219, 0.11808395385742188, 0.12236976623535156, 0.12665557861328125, 0.13094139099121094, 0.13522720336914062, 0.1395130157470703, 0.143798828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 5.0, 6.0, 10.0, 15.0, 19.0, 30.0, 52.0, 62.0, 89.0, 100.0, 132.0, 126.0, 89.0, 64.0, 42.0, 44.0, 27.0, 17.0, 16.0, 15.0, 5.0, 3.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10980224609375, -0.10697650909423828, -0.10415077209472656, -0.10132503509521484, -0.09849929809570312, -0.0956735610961914, -0.09284782409667969, -0.09002208709716797, -0.08719635009765625, -0.08437061309814453, -0.08154487609863281, -0.0787191390991211, -0.07589340209960938, -0.07306766510009766, -0.07024192810058594, -0.06741619110107422, -0.0645904541015625, -0.06176471710205078, -0.05893898010253906, -0.056113243103027344, -0.053287506103515625, -0.050461769104003906, -0.04763603210449219, -0.04481029510498047, -0.04198455810546875, -0.03915882110595703, -0.03633308410644531, -0.033507347106933594, -0.030681610107421875, -0.027855873107910156, -0.025030136108398438, -0.02220439910888672, -0.019378662109375, -0.01655292510986328, -0.013727188110351562, -0.010901451110839844, -0.008075714111328125, -0.005249977111816406, -0.0024242401123046875, 0.00040149688720703125, 0.00322723388671875, 0.006052970886230469, 0.008878707885742188, 0.011704444885253906, 0.014530181884765625, 0.017355918884277344, 0.020181655883789062, 0.02300739288330078, 0.0258331298828125, 0.02865886688232422, 0.03148460388183594, 0.034310340881347656, 0.037136077880859375, 0.039961814880371094, 0.04278755187988281, 0.04561328887939453, 0.04843902587890625, 0.05126476287841797, 0.05409049987792969, 0.056916236877441406, 0.059741973876953125, 0.06256771087646484, 0.06539344787597656, 0.06821918487548828, 0.071044921875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 8.0, 15.0, 21.0, 39.0, 72.0, 79.0, 124.0, 101.0, 116.0, 109.0, 92.0, 75.0, 46.0, 24.0, 21.0, 14.0, 13.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7622910141944885, -0.7332448959350586, -0.7041987776756287, -0.6751526594161987, -0.6461066007614136, -0.6170604228973389, -0.5880143642425537, -0.5589682459831238, -0.5299221277236938, -0.5008760094642639, -0.471829891204834, -0.44278380274772644, -0.4137376844882965, -0.3846915662288666, -0.35564547777175903, -0.3265993595123291, -0.29755324125289917, -0.26850712299346924, -0.2394610196352005, -0.21041491627693176, -0.18136879801750183, -0.1523226797580719, -0.12327657639980316, -0.09423047304153442, -0.06518435478210449, -0.03613824397325516, -0.007092133164405823, 0.021953977644443512, 0.05100008845329285, 0.08004620671272278, 0.10909231007099152, 0.13813841342926025, 0.1671844720840454, 0.19623059034347534, 0.22527669370174408, 0.2543227970600128, 0.28336891531944275, 0.3124150335788727, 0.3414611220359802, 0.37050724029541016, 0.3995533585548401, 0.42859947681427, 0.45764559507369995, 0.4866916835308075, 0.515737771987915, 0.5447839498519897, 0.5738300085067749, 0.6028761267662048, 0.6319222450256348, 0.6609683632850647, 0.6900144815444946, 0.7190605998039246, 0.7481067180633545, 0.7771527767181396, 0.8061988949775696, 0.8352450132369995, 0.8642911314964294, 0.8933372497558594, 0.9223833680152893, 0.9514294862747192, 0.9804755449295044, 1.009521722793579, 1.0385677814483643, 1.0676138401031494, 1.0966600179672241]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 6.0, 17.0, 13.0, 7.0, 17.0, 9.0, 19.0, 30.0, 26.0, 21.0, 32.0, 36.0, 42.0, 43.0, 38.0, 38.0, 39.0, 41.0, 47.0, 36.0, 40.0, 37.0, 35.0, 37.0, 32.0, 27.0, 17.0, 30.0, 18.0, 17.0, 20.0, 20.0, 20.0, 12.0, 11.0, 15.0, 4.0, 4.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5655021071434021, -0.547374963760376, -0.5292478203773499, -0.5111206769943237, -0.49299356341362, -0.47486642003059387, -0.45673927664756775, -0.438612163066864, -0.4204850196838379, -0.40235787630081177, -0.38423073291778564, -0.3661035895347595, -0.3479764759540558, -0.32984933257102966, -0.31172218918800354, -0.2935950756072998, -0.2754679024219513, -0.25734075903892517, -0.23921363055706024, -0.22108648717403412, -0.2029593586921692, -0.18483221530914307, -0.16670507192611694, -0.14857794344425201, -0.1304508000612259, -0.11232366412878036, -0.09419652819633484, -0.07606938481330872, -0.05794224888086319, -0.039815112948417664, -0.02168796956539154, -0.0035608410835266113, 0.014566302299499512, 0.03269343823194504, 0.05082057788968086, 0.06894771754741669, 0.08707485347986221, 0.10520198941230774, 0.12332913279533386, 0.1414562612771988, 0.15958340466022491, 0.17771054804325104, 0.19583767652511597, 0.2139648199081421, 0.2320919632911682, 0.25021910667419434, 0.26834625005722046, 0.2864733636379242, 0.3046005070209503, 0.32272765040397644, 0.34085479378700256, 0.3589819073677063, 0.3771090507507324, 0.39523619413375854, 0.41336333751678467, 0.4314904808998108, 0.4496176242828369, 0.46774476766586304, 0.48587191104888916, 0.5039990544319153, 0.5221261978149414, 0.5402532815933228, 0.5583804845809937, 0.576507568359375, 0.5946347117424011]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 8.0, 11.0, 19.0, 18.0, 23.0, 36.0, 47.0, 48.0, 38.0, 56.0, 87.0, 127.0, 230.0, 480.0, 931.0, 2729.0, 10647.0, 1023141.0, 7871.0, 2166.0, 802.0, 363.0, 187.0, 126.0, 85.0, 56.0, 46.0, 47.0, 40.0, 29.0, 18.0, 16.0, 14.0, 10.0, 9.0, 10.0, 6.0, 9.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2355692386627197, -1.1974384784698486, -1.1593077182769775, -1.1211769580841064, -1.0830461978912354, -1.0449154376983643, -1.0067846775054932, -0.9686539769172668, -0.9305232167243958, -0.8923924565315247, -0.8542616963386536, -0.8161309361457825, -0.7780002355575562, -0.7398694753646851, -0.701738715171814, -0.6636079549789429, -0.6254771947860718, -0.5873464345932007, -0.5492156744003296, -0.5110849142074585, -0.4729541838169098, -0.4348234236240387, -0.39669269323349, -0.3585619330406189, -0.3204311728477478, -0.2823004126548767, -0.2441696673631668, -0.2060389220714569, -0.16790816187858582, -0.12977740168571472, -0.09164665639400482, -0.05351591110229492, -0.015385031700134277, 0.02274572104215622, 0.060876473784446716, 0.09900722652673721, 0.1371379792690277, 0.1752687394618988, 0.2133994847536087, 0.2515302300453186, 0.2896609902381897, 0.3277917504310608, 0.3659225106239319, 0.4040532410144806, 0.4421840012073517, 0.4803147614002228, 0.5184454917907715, 0.5565762519836426, 0.5947070121765137, 0.6328377723693848, 0.6709685325622559, 0.709099292755127, 0.747230052947998, 0.7853608131408691, 0.8234915137290955, 0.8616222739219666, 0.8997530341148376, 0.9378837943077087, 0.9760145545005798, 1.0141452550888062, 1.0522760152816772, 1.0904067754745483, 1.1285375356674194, 1.1666682958602905, 1.2047990560531616]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 7.0, 33.0, 129.0, 407.0, 1372.0, 4788.0, 51450024.0, 10344.0, 2225.0, 689.0, 191.0, 68.0, 23.0, 9.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.197341918945312, -14.70218563079834, -14.207029342651367, -13.711874008178711, -13.216717720031738, -12.721561431884766, -12.22640609741211, -11.731249809265137, -11.236093521118164, -10.740937232971191, -10.245780944824219, -9.750625610351562, -9.25546932220459, -8.760313034057617, -8.265157699584961, -7.770001411437988, -7.274845123291016, -6.779688835144043, -6.2845330238342285, -5.789377212524414, -5.294220924377441, -4.799064636230469, -4.303908824920654, -3.8087527751922607, -3.313596725463867, -2.8184406757354736, -2.32328462600708, -1.8281285762786865, -1.332972526550293, -0.8378164768218994, -0.34266042709350586, 0.1524956226348877, 0.6476516723632812, 1.1428077220916748, 1.6379637718200684, 2.133119821548462, 2.6282758712768555, 3.123431921005249, 3.6185879707336426, 4.113743782043457, 4.60890007019043, 5.104056358337402, 5.599212169647217, 6.094367980957031, 6.589524269104004, 7.084680557250977, 7.579836368560791, 8.074992179870605, 8.570148468017578, 9.06530475616455, 9.560461044311523, 10.05561637878418, 10.550772666931152, 11.045928955078125, 11.541084289550781, 12.036240577697754, 12.531396865844727, 13.0265531539917, 13.521709442138672, 14.016864776611328, 14.5120210647583, 15.007177352905273, 15.50233268737793, 15.997488975524902, 16.492645263671875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 10.0, 16.0, 28.0, 38.0, 74.0, 76.0, 157.0, 198.0, 332.0, 538.0, 947.0, 1692.0, 2782.0, 4644.0, 8100.0, 13914.0, 23998.0, 40956.0, 68247.0, 111838.0, 173813.0, 253373.0, 344627.0, 746204.0, 3152187.0, 437716.0, 306834.0, 221567.0, 147686.0, 92643.0, 56294.0, 33071.0, 19357.0, 11237.0, 6463.0, 3842.0, 2372.0, 1365.0, 871.0, 502.0, 329.0, 180.0, 114.0, 85.0, 43.0, 25.0, 23.0, 10.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4501953125, -0.4362602233886719, -0.42232513427734375, -0.4083900451660156, -0.3944549560546875, -0.3805198669433594, -0.36658477783203125, -0.3526496887207031, -0.338714599609375, -0.3247795104980469, -0.31084442138671875, -0.2969093322753906, -0.2829742431640625, -0.2690391540527344, -0.25510406494140625, -0.24116897583007812, -0.22723388671875, -0.21329879760742188, -0.19936370849609375, -0.18542861938476562, -0.1714935302734375, -0.15755844116210938, -0.14362335205078125, -0.12968826293945312, -0.115753173828125, -0.10181808471679688, -0.08788299560546875, -0.07394790649414062, -0.0600128173828125, -0.046077728271484375, -0.03214263916015625, -0.018207550048828125, -0.0042724609375, 0.009662628173828125, 0.02359771728515625, 0.037532806396484375, 0.0514678955078125, 0.06540298461914062, 0.07933807373046875, 0.09327316284179688, 0.107208251953125, 0.12114334106445312, 0.13507843017578125, 0.14901351928710938, 0.1629486083984375, 0.17688369750976562, 0.19081878662109375, 0.20475387573242188, 0.21868896484375, 0.23262405395507812, 0.24655914306640625, 0.2604942321777344, 0.2744293212890625, 0.2883644104003906, 0.30229949951171875, 0.3162345886230469, 0.330169677734375, 0.3441047668457031, 0.35803985595703125, 0.3719749450683594, 0.3859100341796875, 0.3998451232910156, 0.41378021240234375, 0.4277153015136719, 0.441650390625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 3.0, 7.0, 9.0, 16.0, 12.0, 19.0, 22.0, 26.0, 39.0, 42.0, 35.0, 41.0, 50.0, 44.0, 68.0, 401.0, 679.0, 87.0, 55.0, 43.0, 48.0, 54.0, 42.0, 37.0, 23.0, 24.0, 21.0, 19.0, 12.0, 7.0, 9.0, 12.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.2890625, -5.1427001953125, -4.996337890625, -4.8499755859375, -4.70361328125, -4.5572509765625, -4.410888671875, -4.2645263671875, -4.1181640625, -3.9718017578125, -3.825439453125, -3.6790771484375, -3.53271484375, -3.3863525390625, -3.239990234375, -3.0936279296875, -2.947265625, -2.8009033203125, -2.654541015625, -2.5081787109375, -2.36181640625, -2.2154541015625, -2.069091796875, -1.9227294921875, -1.7763671875, -1.6300048828125, -1.483642578125, -1.3372802734375, -1.19091796875, -1.0445556640625, -0.898193359375, -0.7518310546875, -0.60546875, -0.4591064453125, -0.312744140625, -0.1663818359375, -0.02001953125, 0.1263427734375, 0.272705078125, 0.4190673828125, 0.5654296875, 0.7117919921875, 0.858154296875, 1.0045166015625, 1.15087890625, 1.2972412109375, 1.443603515625, 1.5899658203125, 1.736328125, 1.8826904296875, 2.029052734375, 2.1754150390625, 2.32177734375, 2.4681396484375, 2.614501953125, 2.7608642578125, 2.9072265625, 3.0535888671875, 3.199951171875, 3.3463134765625, 3.49267578125, 3.6390380859375, 3.785400390625, 3.9317626953125, 4.078125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 10.0, 26.0, 34.0, 43.0, 51.0, 128.0, 158.0, 254.0, 427.0, 635.0, 1070.0, 1695.0, 2587.0, 4182.0, 6272.0, 9824.0, 14857.0, 22938.0, 34182.0, 50778.0, 72272.0, 101193.0, 136559.0, 177555.0, 219154.0, 257421.0, 362831.0, 3100838.0, 542811.0, 263362.0, 227121.0, 185864.0, 145125.0, 108303.0, 78140.0, 54409.0, 37112.0, 24850.0, 16497.0, 10430.0, 7096.0, 4482.0, 2838.0, 1785.0, 1202.0, 726.0, 501.0, 306.0, 204.0, 112.0, 64.0, 51.0, 29.0, 16.0, 14.0, 4.0, 2.0, 7.0], "bins": [-0.25439453125, -0.2468242645263672, -0.23925399780273438, -0.23168373107910156, -0.22411346435546875, -0.21654319763183594, -0.20897293090820312, -0.2014026641845703, -0.1938323974609375, -0.1862621307373047, -0.17869186401367188, -0.17112159729003906, -0.16355133056640625, -0.15598106384277344, -0.14841079711914062, -0.1408405303955078, -0.133270263671875, -0.1256999969482422, -0.11812973022460938, -0.11055946350097656, -0.10298919677734375, -0.09541893005371094, -0.08784866333007812, -0.08027839660644531, -0.0727081298828125, -0.06513786315917969, -0.057567596435546875, -0.04999732971191406, -0.04242706298828125, -0.03485679626464844, -0.027286529541015625, -0.019716262817382812, -0.01214599609375, -0.0045757293701171875, 0.002994537353515625, 0.010564804077148438, 0.01813507080078125, 0.025705337524414062, 0.033275604248046875, 0.04084587097167969, 0.0484161376953125, 0.05598640441894531, 0.06355667114257812, 0.07112693786621094, 0.07869720458984375, 0.08626747131347656, 0.09383773803710938, 0.10140800476074219, 0.108978271484375, 0.11654853820800781, 0.12411880493164062, 0.13168907165527344, 0.13925933837890625, 0.14682960510253906, 0.15439987182617188, 0.1619701385498047, 0.1695404052734375, 0.1771106719970703, 0.18468093872070312, 0.19225120544433594, 0.19982147216796875, 0.20739173889160156, 0.21496200561523438, 0.2225322723388672, 0.2301025390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 1.0, 6.0, 0.0, 2.0, 7.0, 6.0, 5.0, 6.0, 7.0, 8.0, 10.0, 12.0, 23.0, 16.0, 21.0, 25.0, 38.0, 32.0, 30.0, 37.0, 35.0, 29.0, 34.0, 25.0, 67.0, 638.0, 417.0, 47.0, 45.0, 43.0, 40.0, 34.0, 44.0, 34.0, 23.0, 22.0, 25.0, 24.0, 16.0, 16.0, 19.0, 12.0, 11.0, 11.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.07421875, -2.97125244140625, -2.8682861328125, -2.76531982421875, -2.662353515625, -2.55938720703125, -2.4564208984375, -2.35345458984375, -2.25048828125, -2.14752197265625, -2.0445556640625, -1.94158935546875, -1.838623046875, -1.73565673828125, -1.6326904296875, -1.52972412109375, -1.4267578125, -1.32379150390625, -1.2208251953125, -1.11785888671875, -1.014892578125, -0.91192626953125, -0.8089599609375, -0.70599365234375, -0.60302734375, -0.50006103515625, -0.3970947265625, -0.29412841796875, -0.191162109375, -0.08819580078125, 0.0147705078125, 0.11773681640625, 0.220703125, 0.32366943359375, 0.4266357421875, 0.52960205078125, 0.632568359375, 0.73553466796875, 0.8385009765625, 0.94146728515625, 1.04443359375, 1.14739990234375, 1.2503662109375, 1.35333251953125, 1.456298828125, 1.55926513671875, 1.6622314453125, 1.76519775390625, 1.8681640625, 1.97113037109375, 2.0740966796875, 2.17706298828125, 2.280029296875, 2.38299560546875, 2.4859619140625, 2.58892822265625, 2.69189453125, 2.79486083984375, 2.8978271484375, 3.00079345703125, 3.103759765625, 3.20672607421875, 3.3096923828125, 3.41265869140625, 3.515625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 15.0, 11.0, 17.0, 19.0, 38.0, 48.0, 66.0, 89.0, 146.0, 203.0, 322.0, 508.0, 760.0, 1191.0, 1810.0, 3161.0, 5645.0, 11448.0, 26853.0, 64964.0, 148574.0, 5670502.0, 206264.0, 82563.0, 34731.0, 14719.0, 6885.0, 3741.0, 2136.0, 1329.0, 806.0, 573.0, 405.0, 254.0, 178.0, 136.0, 103.0, 63.0, 53.0, 36.0, 32.0, 12.0, 7.0, 9.0, 8.0, 4.0], "bins": [-1.732421875, -1.688720703125, -1.64501953125, -1.601318359375, -1.5576171875, -1.513916015625, -1.47021484375, -1.426513671875, -1.3828125, -1.339111328125, -1.29541015625, -1.251708984375, -1.2080078125, -1.164306640625, -1.12060546875, -1.076904296875, -1.033203125, -0.989501953125, -0.94580078125, -0.902099609375, -0.8583984375, -0.814697265625, -0.77099609375, -0.727294921875, -0.68359375, -0.639892578125, -0.59619140625, -0.552490234375, -0.5087890625, -0.465087890625, -0.42138671875, -0.377685546875, -0.333984375, -0.290283203125, -0.24658203125, -0.202880859375, -0.1591796875, -0.115478515625, -0.07177734375, -0.028076171875, 0.015625, 0.059326171875, 0.10302734375, 0.146728515625, 0.1904296875, 0.234130859375, 0.27783203125, 0.321533203125, 0.365234375, 0.408935546875, 0.45263671875, 0.496337890625, 0.5400390625, 0.583740234375, 0.62744140625, 0.671142578125, 0.71484375, 0.758544921875, 0.80224609375, 0.845947265625, 0.8896484375, 0.933349609375, 0.97705078125, 1.020751953125, 1.064453125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 10.0, 4.0, 7.0, 7.0, 9.0, 16.0, 8.0, 17.0, 17.0, 23.0, 27.0, 26.0, 29.0, 45.0, 31.0, 38.0, 40.0, 33.0, 33.0, 42.0, 218.0, 863.0, 52.0, 40.0, 43.0, 42.0, 34.0, 29.0, 37.0, 27.0, 24.0, 28.0, 15.0, 21.0, 14.0, 8.0, 16.0, 11.0, 8.0, 11.0, 7.0, 5.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.935546875, -3.81341552734375, -3.6912841796875, -3.56915283203125, -3.447021484375, -3.32489013671875, -3.2027587890625, -3.08062744140625, -2.95849609375, -2.83636474609375, -2.7142333984375, -2.59210205078125, -2.469970703125, -2.34783935546875, -2.2257080078125, -2.10357666015625, -1.9814453125, -1.85931396484375, -1.7371826171875, -1.61505126953125, -1.492919921875, -1.37078857421875, -1.2486572265625, -1.12652587890625, -1.00439453125, -0.88226318359375, -0.7601318359375, -0.63800048828125, -0.515869140625, -0.39373779296875, -0.2716064453125, -0.14947509765625, -0.02734375, 0.09478759765625, 0.2169189453125, 0.33905029296875, 0.461181640625, 0.58331298828125, 0.7054443359375, 0.82757568359375, 0.94970703125, 1.07183837890625, 1.1939697265625, 1.31610107421875, 1.438232421875, 1.56036376953125, 1.6824951171875, 1.80462646484375, 1.9267578125, 2.04888916015625, 2.1710205078125, 2.29315185546875, 2.415283203125, 2.53741455078125, 2.6595458984375, 2.78167724609375, 2.90380859375, 3.02593994140625, 3.1480712890625, 3.27020263671875, 3.392333984375, 3.51446533203125, 3.6365966796875, 3.75872802734375, 3.880859375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 13.0, 34.0, 104.0, 328.0, 334.0, 108.0, 48.0, 18.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.41218566894531, -35.604400634765625, -34.79661178588867, -33.988826751708984, -33.18103790283203, -32.373252868652344, -31.565465927124023, -30.757678985595703, -29.949892044067383, -29.142105102539062, -28.334318161010742, -27.526531219482422, -26.718746185302734, -25.91095733642578, -25.103172302246094, -24.295385360717773, -23.487598419189453, -22.679811477661133, -21.872024536132812, -21.064237594604492, -20.256450653076172, -19.448665618896484, -18.640878677368164, -17.833091735839844, -17.025304794311523, -16.217517852783203, -15.409730911254883, -14.601944923400879, -13.794157981872559, -12.986371040344238, -12.178585052490234, -11.370798110961914, -10.563011169433594, -9.755224227905273, -8.947437286376953, -8.13965129852295, -7.331864356994629, -6.524077415466309, -5.7162909507751465, -4.908504486083984, -4.100717544555664, -3.292930841445923, -2.4851441383361816, -1.6773574352264404, -0.8695707321166992, -0.061783790588378906, 0.7460026741027832, 1.5537891387939453, 2.3615760803222656, 3.169362783432007, 3.977149486541748, 4.78493595123291, 5.5927228927612305, 6.400509834289551, 7.208296298980713, 8.016082763671875, 8.823869705200195, 9.631656646728516, 10.439443588256836, 11.24722957611084, 12.05501651763916, 12.86280345916748, 13.670589447021484, 14.478376388549805, 15.286163330078125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 10.0, 7.0, 6.0, 6.0, 6.0, 12.0, 12.0, 14.0, 16.0, 22.0, 43.0, 40.0, 49.0, 57.0, 67.0, 78.0, 84.0, 68.0, 88.0, 53.0, 52.0, 39.0, 32.0, 21.0, 18.0, 11.0, 20.0, 10.0, 8.0, 7.0, 7.0, 7.0, 3.0, 4.0, 4.0, 4.0, 5.0, 0.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.251605987548828, -13.782289505004883, -13.312973022460938, -12.843656539916992, -12.374340057373047, -11.905023574829102, -11.435707092285156, -10.966389656066895, -10.49707317352295, -10.027756690979004, -9.558440208435059, -9.089123725891113, -8.619807243347168, -8.150489807128906, -7.681173801422119, -7.211856842041016, -6.7425408363342285, -6.273224353790283, -5.803907871246338, -5.334590911865234, -4.865274429321289, -4.395957946777344, -3.9266414642333984, -3.457324743270874, -2.9880082607269287, -2.5186917781829834, -2.049375057220459, -1.5800585746765137, -1.1107419729232788, -0.641425371170044, -0.17210888862609863, 0.2972078323364258, 0.7665243148803711, 1.235840916633606, 1.7051575183868408, 2.174474000930786, 2.6437907218933105, 3.113107204437256, 3.582423686981201, 4.051740646362305, 4.52105712890625, 4.990373611450195, 5.459690093994141, 5.929006576538086, 6.3983235359191895, 6.867640018463135, 7.33695650100708, 7.806273460388184, 8.275588989257812, 8.744905471801758, 9.214221954345703, 9.683538436889648, 10.152854919433594, 10.622171401977539, 11.091487884521484, 11.560805320739746, 12.030121803283691, 12.499438285827637, 12.968754768371582, 13.438071250915527, 13.907387733459473, 14.376705169677734, 14.84602165222168, 15.315338134765625, 15.78465461730957]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 6.0, 12.0, 19.0, 21.0, 29.0, 56.0, 62.0, 92.0, 142.0, 225.0, 341.0, 478.0, 826.0, 1234.0, 2213.0, 3964.0, 7835.0, 17718.0, 63481.0, 3856706.0, 176892.0, 32268.0, 13443.0, 6490.0, 3608.0, 2149.0, 1361.0, 829.0, 582.0, 370.0, 263.0, 171.0, 117.0, 87.0, 55.0, 55.0, 26.0, 23.0, 10.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.08830547332763672, -0.08560752868652344, -0.08290958404541016, -0.08021163940429688, -0.0775136947631836, -0.07481575012207031, -0.07211780548095703, -0.06941986083984375, -0.06672191619873047, -0.06402397155761719, -0.061326026916503906, -0.058628082275390625, -0.055930137634277344, -0.05323219299316406, -0.05053424835205078, -0.0478363037109375, -0.04513835906982422, -0.04244041442871094, -0.039742469787597656, -0.037044525146484375, -0.034346580505371094, -0.03164863586425781, -0.02895069122314453, -0.02625274658203125, -0.02355480194091797, -0.020856857299804688, -0.018158912658691406, -0.015460968017578125, -0.012763023376464844, -0.010065078735351562, -0.007367134094238281, -0.004669189453125, -0.0019712448120117188, 0.0007266998291015625, 0.0034246444702148438, 0.006122589111328125, 0.008820533752441406, 0.011518478393554688, 0.014216423034667969, 0.01691436767578125, 0.01961231231689453, 0.022310256958007812, 0.025008201599121094, 0.027706146240234375, 0.030404090881347656, 0.03310203552246094, 0.03579998016357422, 0.0384979248046875, 0.04119586944580078, 0.04389381408691406, 0.046591758728027344, 0.049289703369140625, 0.051987648010253906, 0.05468559265136719, 0.05738353729248047, 0.06008148193359375, 0.06277942657470703, 0.06547737121582031, 0.0681753158569336, 0.07087326049804688, 0.07357120513916016, 0.07626914978027344, 0.07896709442138672, 0.0816650390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 7.0, 7.0, 8.0, 15.0, 25.0, 71.0, 625.0, 53.0, 24.0, 16.0, 19.0, 13.0, 5.0, 6.0, 10.0, 8.0, 8.0, 10.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.03814697265625, -0.036913394927978516, -0.03567981719970703, -0.03444623947143555, -0.03321266174316406, -0.03197908401489258, -0.030745506286621094, -0.02951192855834961, -0.028278350830078125, -0.02704477310180664, -0.025811195373535156, -0.024577617645263672, -0.023344039916992188, -0.022110462188720703, -0.02087688446044922, -0.019643306732177734, -0.01840972900390625, -0.017176151275634766, -0.01594257354736328, -0.014708995819091797, -0.013475418090820312, -0.012241840362548828, -0.011008262634277344, -0.00977468490600586, -0.008541107177734375, -0.007307529449462891, -0.006073951721191406, -0.004840373992919922, -0.0036067962646484375, -0.002373218536376953, -0.0011396408081054688, 9.393692016601562e-05, 0.0013275146484375, 0.0025610923767089844, 0.0037946701049804688, 0.005028247833251953, 0.0062618255615234375, 0.007495403289794922, 0.008728981018066406, 0.00996255874633789, 0.011196136474609375, 0.01242971420288086, 0.013663291931152344, 0.014896869659423828, 0.016130447387695312, 0.017364025115966797, 0.01859760284423828, 0.019831180572509766, 0.02106475830078125, 0.022298336029052734, 0.02353191375732422, 0.024765491485595703, 0.025999069213867188, 0.027232646942138672, 0.028466224670410156, 0.02969980239868164, 0.030933380126953125, 0.03216695785522461, 0.033400535583496094, 0.03463411331176758, 0.03586769104003906, 0.03710126876831055, 0.03833484649658203, 0.039568424224853516, 0.040802001953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 11.0, 12.0, 19.0, 33.0, 38.0, 72.0, 144.0, 242.0, 531.0, 1165.0, 3071.0, 9362.0, 38293.0, 242813.0, 3460789.0, 369240.0, 50637.0, 11694.0, 3598.0, 1390.0, 557.0, 245.0, 128.0, 80.0, 27.0, 15.0, 10.0, 13.0, 11.0, 12.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11187744140625, -0.1084442138671875, -0.105010986328125, -0.1015777587890625, -0.09814453125, -0.0947113037109375, -0.091278076171875, -0.0878448486328125, -0.08441162109375, -0.0809783935546875, -0.077545166015625, -0.0741119384765625, -0.0706787109375, -0.0672454833984375, -0.063812255859375, -0.0603790283203125, -0.05694580078125, -0.0535125732421875, -0.050079345703125, -0.0466461181640625, -0.043212890625, -0.0397796630859375, -0.036346435546875, -0.0329132080078125, -0.02947998046875, -0.0260467529296875, -0.022613525390625, -0.0191802978515625, -0.0157470703125, -0.0123138427734375, -0.008880615234375, -0.0054473876953125, -0.00201416015625, 0.0014190673828125, 0.004852294921875, 0.0082855224609375, 0.01171875, 0.0151519775390625, 0.018585205078125, 0.0220184326171875, 0.02545166015625, 0.0288848876953125, 0.032318115234375, 0.0357513427734375, 0.0391845703125, 0.0426177978515625, 0.046051025390625, 0.0494842529296875, 0.05291748046875, 0.0563507080078125, 0.059783935546875, 0.0632171630859375, 0.066650390625, 0.0700836181640625, 0.073516845703125, 0.0769500732421875, 0.08038330078125, 0.0838165283203125, 0.087249755859375, 0.0906829833984375, 0.0941162109375, 0.0975494384765625, 0.100982666015625, 0.1044158935546875, 0.10784912109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 7.0, 13.0, 14.0, 25.0, 22.0, 44.0, 68.0, 86.0, 103.0, 183.0, 344.0, 1196.0, 1008.0, 336.0, 186.0, 112.0, 84.0, 56.0, 30.0, 36.0, 25.0, 10.0, 10.0, 10.0, 6.0, 4.0, 8.0, 11.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047637939453125, -0.046235084533691406, -0.04483222961425781, -0.04342937469482422, -0.042026519775390625, -0.04062366485595703, -0.03922080993652344, -0.037817955017089844, -0.03641510009765625, -0.035012245178222656, -0.03360939025878906, -0.03220653533935547, -0.030803680419921875, -0.02940082550048828, -0.027997970581054688, -0.026595115661621094, -0.0251922607421875, -0.023789405822753906, -0.022386550903320312, -0.02098369598388672, -0.019580841064453125, -0.01817798614501953, -0.016775131225585938, -0.015372276306152344, -0.01396942138671875, -0.012566566467285156, -0.011163711547851562, -0.009760856628417969, -0.008358001708984375, -0.006955146789550781, -0.0055522918701171875, -0.004149436950683594, -0.00274658203125, -0.0013437271118164062, 5.91278076171875e-05, 0.0014619827270507812, 0.002864837646484375, 0.004267692565917969, 0.0056705474853515625, 0.007073402404785156, 0.00847625732421875, 0.009879112243652344, 0.011281967163085938, 0.012684822082519531, 0.014087677001953125, 0.015490531921386719, 0.016893386840820312, 0.018296241760253906, 0.0196990966796875, 0.021101951599121094, 0.022504806518554688, 0.02390766143798828, 0.025310516357421875, 0.02671337127685547, 0.028116226196289062, 0.029519081115722656, 0.03092193603515625, 0.032324790954589844, 0.03372764587402344, 0.03513050079345703, 0.036533355712890625, 0.03793621063232422, 0.03933906555175781, 0.040741920471191406, 0.042144775390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 10.0, 57.0, 535.0, 369.0, 32.0, 2.0, 3.0], "bins": [-1.8639609813690186, -1.8328315019607544, -1.8017021417617798, -1.7705726623535156, -1.7394431829452515, -1.7083138227462769, -1.6771843433380127, -1.6460548639297485, -1.614925503730774, -1.5837960243225098, -1.5526666641235352, -1.521537184715271, -1.4904077053070068, -1.4592783451080322, -1.428148865699768, -1.397019386291504, -1.3658900260925293, -1.3347605466842651, -1.3036311864852905, -1.2725017070770264, -1.2413722276687622, -1.2102428674697876, -1.1791133880615234, -1.1479839086532593, -1.1168544292449951, -1.085724949836731, -1.0545955896377563, -1.0234661102294922, -0.9923366904258728, -0.9612072706222534, -0.9300777912139893, -0.8989483714103699, -0.8678189516067505, -0.8366895318031311, -0.8055600523948669, -0.7744306325912476, -0.7433012127876282, -0.7121717929840088, -0.6810423135757446, -0.6499128937721252, -0.6187834143638611, -0.5876539945602417, -0.5565245151519775, -0.5253950953483582, -0.49426567554473877, -0.463136225938797, -0.4320067763328552, -0.40087735652923584, -0.36974790692329407, -0.3386184573173523, -0.3074890375137329, -0.27635958790779114, -0.24523015320301056, -0.21410071849822998, -0.1829712688922882, -0.15184183418750763, -0.12071239948272705, -0.08958296477794647, -0.0584535226225853, -0.02732408046722412, 0.0038053542375564575, 0.034934788942337036, 0.06606423854827881, 0.09719367325305939, 0.12832310795783997]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 4.0, 9.0, 10.0, 6.0, 16.0, 15.0, 19.0, 24.0, 31.0, 48.0, 48.0, 58.0, 57.0, 56.0, 80.0, 59.0, 49.0, 66.0, 73.0, 42.0, 42.0, 45.0, 33.0, 27.0, 16.0, 17.0, 11.0, 8.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2086063027381897, -0.20205935835838318, -0.19551241397857666, -0.18896546959877014, -0.18241852521896362, -0.1758715808391571, -0.1693246215581894, -0.16277767717838287, -0.15623073279857635, -0.14968378841876984, -0.14313684403896332, -0.1365898996591568, -0.1300429403781891, -0.12349600344896317, -0.11694905161857605, -0.11040210723876953, -0.10385516285896301, -0.0973082184791565, -0.09076127409934998, -0.08421432226896286, -0.07766737788915634, -0.07112043350934982, -0.06457348167896271, -0.05802653729915619, -0.05147959291934967, -0.04493264853954315, -0.038385700434446335, -0.03183875232934952, -0.025291807949543, -0.01874486356973648, -0.012197915464639664, -0.005650967359542847, 0.0008959770202636719, 0.00744292326271534, 0.013989869505167007, 0.020536815747618675, 0.027083761990070343, 0.03363070636987686, 0.04017765447497368, 0.046724602580070496, 0.053271546959877014, 0.05981849133968353, 0.06636543571949005, 0.07291238754987717, 0.07945933192968369, 0.0860062763094902, 0.09255322813987732, 0.09910017251968384, 0.10564711689949036, 0.11219406127929688, 0.1187410056591034, 0.1252879500389099, 0.13183489441871643, 0.13838183879852295, 0.14492879807949066, 0.15147574245929718, 0.1580226868391037, 0.16456963121891022, 0.17111657559871674, 0.17766351997852325, 0.18421047925949097, 0.19075742363929749, 0.197304368019104, 0.20385131239891052, 0.21039825677871704]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 8.0, 17.0, 15.0, 21.0, 33.0, 33.0, 53.0, 81.0, 99.0, 155.0, 202.0, 299.0, 415.0, 544.0, 856.0, 1250.0, 1794.0, 2794.0, 4289.0, 7003.0, 11750.0, 21306.0, 47291.0, 757957.0, 120513.0, 29185.0, 15517.0, 9000.0, 5392.0, 3550.0, 2229.0, 1503.0, 1019.0, 673.0, 500.0, 345.0, 239.0, 173.0, 134.0, 96.0, 70.0, 46.0, 32.0, 24.0, 13.0, 12.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.141357421875, -0.1370391845703125, -0.132720947265625, -0.1284027099609375, -0.12408447265625, -0.1197662353515625, -0.115447998046875, -0.1111297607421875, -0.1068115234375, -0.1024932861328125, -0.098175048828125, -0.0938568115234375, -0.08953857421875, -0.0852203369140625, -0.080902099609375, -0.0765838623046875, -0.072265625, -0.0679473876953125, -0.063629150390625, -0.0593109130859375, -0.05499267578125, -0.0506744384765625, -0.046356201171875, -0.0420379638671875, -0.0377197265625, -0.0334014892578125, -0.029083251953125, -0.0247650146484375, -0.02044677734375, -0.0161285400390625, -0.011810302734375, -0.0074920654296875, -0.003173828125, 0.0011444091796875, 0.005462646484375, 0.0097808837890625, 0.01409912109375, 0.0184173583984375, 0.022735595703125, 0.0270538330078125, 0.0313720703125, 0.0356903076171875, 0.040008544921875, 0.0443267822265625, 0.04864501953125, 0.0529632568359375, 0.057281494140625, 0.0615997314453125, 0.06591796875, 0.0702362060546875, 0.074554443359375, 0.0788726806640625, 0.08319091796875, 0.0875091552734375, 0.091827392578125, 0.0961456298828125, 0.1004638671875, 0.1047821044921875, 0.109100341796875, 0.1134185791015625, 0.11773681640625, 0.1220550537109375, 0.126373291015625, 0.1306915283203125, 0.135009765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 9.0, 10.0, 8.0, 8.0, 13.0, 29.0, 135.0, 526.0, 79.0, 33.0, 13.0, 13.0, 17.0, 13.0, 7.0, 7.0, 8.0, 10.0, 9.0, 4.0, 5.0, 2.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.04266357421875, -0.04140472412109375, -0.0401458740234375, -0.03888702392578125, -0.037628173828125, -0.03636932373046875, -0.0351104736328125, -0.03385162353515625, -0.0325927734375, -0.03133392333984375, -0.0300750732421875, -0.02881622314453125, -0.027557373046875, -0.02629852294921875, -0.0250396728515625, -0.02378082275390625, -0.02252197265625, -0.02126312255859375, -0.0200042724609375, -0.01874542236328125, -0.017486572265625, -0.01622772216796875, -0.0149688720703125, -0.01371002197265625, -0.012451171875, -0.01119232177734375, -0.0099334716796875, -0.00867462158203125, -0.007415771484375, -0.00615692138671875, -0.0048980712890625, -0.00363922119140625, -0.00238037109375, -0.00112152099609375, 0.0001373291015625, 0.00139617919921875, 0.002655029296875, 0.00391387939453125, 0.0051727294921875, 0.00643157958984375, 0.0076904296875, 0.00894927978515625, 0.0102081298828125, 0.01146697998046875, 0.012725830078125, 0.01398468017578125, 0.0152435302734375, 0.01650238037109375, 0.01776123046875, 0.01902008056640625, 0.0202789306640625, 0.02153778076171875, 0.022796630859375, 0.02405548095703125, 0.0253143310546875, 0.02657318115234375, 0.02783203125, 0.02909088134765625, 0.0303497314453125, 0.03160858154296875, 0.032867431640625, 0.03412628173828125, 0.0353851318359375, 0.03664398193359375, 0.03790283203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 8.0, 9.0, 8.0, 13.0, 9.0, 14.0, 42.0, 22.0, 23.0, 49.0, 62.0, 77.0, 91.0, 130.0, 177.0, 247.0, 386.0, 691.0, 1184.0, 2406.0, 4812.0, 10690.0, 25601.0, 69280.0, 226484.0, 441341.0, 171113.0, 54733.0, 20944.0, 8867.0, 4038.0, 2065.0, 1043.0, 614.0, 368.0, 209.0, 170.0, 123.0, 89.0, 68.0, 63.0, 35.0, 34.0, 27.0, 24.0, 15.0, 13.0, 11.0, 6.0, 6.0, 8.0, 4.0, 6.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.08685302734375, -0.08417129516601562, -0.08148956298828125, -0.07880783081054688, -0.0761260986328125, -0.07344436645507812, -0.07076263427734375, -0.06808090209960938, -0.065399169921875, -0.06271743774414062, -0.06003570556640625, -0.057353973388671875, -0.0546722412109375, -0.051990509033203125, -0.04930877685546875, -0.046627044677734375, -0.0439453125, -0.041263580322265625, -0.03858184814453125, -0.035900115966796875, -0.0332183837890625, -0.030536651611328125, -0.02785491943359375, -0.025173187255859375, -0.022491455078125, -0.019809722900390625, -0.01712799072265625, -0.014446258544921875, -0.0117645263671875, -0.009082794189453125, -0.00640106201171875, -0.003719329833984375, -0.00103759765625, 0.001644134521484375, 0.00432586669921875, 0.007007598876953125, 0.0096893310546875, 0.012371063232421875, 0.01505279541015625, 0.017734527587890625, 0.020416259765625, 0.023097991943359375, 0.02577972412109375, 0.028461456298828125, 0.0311431884765625, 0.033824920654296875, 0.03650665283203125, 0.039188385009765625, 0.0418701171875, 0.044551849365234375, 0.04723358154296875, 0.049915313720703125, 0.0525970458984375, 0.055278778076171875, 0.05796051025390625, 0.060642242431640625, 0.063323974609375, 0.06600570678710938, 0.06868743896484375, 0.07136917114257812, 0.0740509033203125, 0.07673263549804688, 0.07941436767578125, 0.08209609985351562, 0.08477783203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 4.0, 3.0, 7.0, 8.0, 13.0, 6.0, 16.0, 9.0, 21.0, 7.0, 24.0, 12.0, 16.0, 32.0, 30.0, 39.0, 39.0, 38.0, 36.0, 42.0, 38.0, 32.0, 42.0, 49.0, 41.0, 37.0, 44.0, 31.0, 27.0, 31.0, 35.0, 21.0, 25.0, 22.0, 24.0, 19.0, 14.0, 13.0, 10.0, 11.0, 10.0, 4.0, 3.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.145263671875, -0.1407623291015625, -0.136260986328125, -0.1317596435546875, -0.12725830078125, -0.1227569580078125, -0.118255615234375, -0.1137542724609375, -0.1092529296875, -0.1047515869140625, -0.100250244140625, -0.0957489013671875, -0.09124755859375, -0.0867462158203125, -0.082244873046875, -0.0777435302734375, -0.0732421875, -0.0687408447265625, -0.064239501953125, -0.0597381591796875, -0.05523681640625, -0.0507354736328125, -0.046234130859375, -0.0417327880859375, -0.0372314453125, -0.0327301025390625, -0.028228759765625, -0.0237274169921875, -0.01922607421875, -0.0147247314453125, -0.010223388671875, -0.0057220458984375, -0.001220703125, 0.0032806396484375, 0.007781982421875, 0.0122833251953125, 0.01678466796875, 0.0212860107421875, 0.025787353515625, 0.0302886962890625, 0.0347900390625, 0.0392913818359375, 0.043792724609375, 0.0482940673828125, 0.05279541015625, 0.0572967529296875, 0.061798095703125, 0.0662994384765625, 0.07080078125, 0.0753021240234375, 0.079803466796875, 0.0843048095703125, 0.08880615234375, 0.0933074951171875, 0.097808837890625, 0.1023101806640625, 0.1068115234375, 0.1113128662109375, 0.115814208984375, 0.1203155517578125, 0.12481689453125, 0.1293182373046875, 0.133819580078125, 0.1383209228515625, 0.142822265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 9.0, 7.0, 16.0, 21.0, 25.0, 40.0, 82.0, 99.0, 169.0, 281.0, 516.0, 1037.0, 2171.0, 5937.0, 22193.0, 227525.0, 720928.0, 50998.0, 10278.0, 3256.0, 1376.0, 666.0, 352.0, 205.0, 131.0, 74.0, 59.0, 33.0, 17.0, 9.0, 14.0, 6.0, 9.0, 3.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11407470703125, -0.11017131805419922, -0.10626792907714844, -0.10236454010009766, -0.09846115112304688, -0.0945577621459961, -0.09065437316894531, -0.08675098419189453, -0.08284759521484375, -0.07894420623779297, -0.07504081726074219, -0.0711374282836914, -0.06723403930664062, -0.06333065032958984, -0.05942726135253906, -0.05552387237548828, -0.0516204833984375, -0.04771709442138672, -0.04381370544433594, -0.039910316467285156, -0.036006927490234375, -0.032103538513183594, -0.028200149536132812, -0.02429676055908203, -0.02039337158203125, -0.01648998260498047, -0.012586593627929688, -0.008683204650878906, -0.004779815673828125, -0.0008764266967773438, 0.0030269622802734375, 0.006930351257324219, 0.010833740234375, 0.014737129211425781, 0.018640518188476562, 0.022543907165527344, 0.026447296142578125, 0.030350685119628906, 0.03425407409667969, 0.03815746307373047, 0.04206085205078125, 0.04596424102783203, 0.04986763000488281, 0.053771018981933594, 0.057674407958984375, 0.061577796936035156, 0.06548118591308594, 0.06938457489013672, 0.0732879638671875, 0.07719135284423828, 0.08109474182128906, 0.08499813079833984, 0.08890151977539062, 0.0928049087524414, 0.09670829772949219, 0.10061168670654297, 0.10451507568359375, 0.10841846466064453, 0.11232185363769531, 0.1162252426147461, 0.12012863159179688, 0.12403202056884766, 0.12793540954589844, 0.13183879852294922, 0.1357421875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 11.0, 8.0, 6.0, 3.0, 9.0, 13.0, 18.0, 20.0, 25.0, 29.0, 55.0, 62.0, 69.0, 65.0, 94.0, 82.0, 75.0, 73.0, 58.0, 41.0, 38.0, 32.0, 24.0, 23.0, 16.0, 12.0, 10.0, 5.0, 2.0, 7.0, 3.0, 5.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8650970458984375e-05, -5.698949098587036e-05, -5.532801151275635e-05, -5.3666532039642334e-05, -5.200505256652832e-05, -5.034357309341431e-05, -4.868209362030029e-05, -4.702061414718628e-05, -4.5359134674072266e-05, -4.369765520095825e-05, -4.203617572784424e-05, -4.0374696254730225e-05, -3.871321678161621e-05, -3.70517373085022e-05, -3.5390257835388184e-05, -3.372877836227417e-05, -3.2067298889160156e-05, -3.0405819416046143e-05, -2.874433994293213e-05, -2.7082860469818115e-05, -2.54213809967041e-05, -2.3759901523590088e-05, -2.2098422050476074e-05, -2.043694257736206e-05, -1.8775463104248047e-05, -1.7113983631134033e-05, -1.545250415802002e-05, -1.3791024684906006e-05, -1.2129545211791992e-05, -1.0468065738677979e-05, -8.806586265563965e-06, -7.145106792449951e-06, -5.4836273193359375e-06, -3.822147846221924e-06, -2.16066837310791e-06, -4.991888999938965e-07, 1.1622905731201172e-06, 2.823770046234131e-06, 4.4852495193481445e-06, 6.146728992462158e-06, 7.808208465576172e-06, 9.469687938690186e-06, 1.11311674118042e-05, 1.2792646884918213e-05, 1.4454126358032227e-05, 1.611560583114624e-05, 1.7777085304260254e-05, 1.9438564777374268e-05, 2.110004425048828e-05, 2.2761523723602295e-05, 2.442300319671631e-05, 2.6084482669830322e-05, 2.7745962142944336e-05, 2.940744161605835e-05, 3.106892108917236e-05, 3.273040056228638e-05, 3.439188003540039e-05, 3.6053359508514404e-05, 3.771483898162842e-05, 3.937631845474243e-05, 4.1037797927856445e-05, 4.269927740097046e-05, 4.436075687408447e-05, 4.6022236347198486e-05, 4.76837158203125e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 7.0, 9.0, 9.0, 10.0, 29.0, 45.0, 82.0, 147.0, 322.0, 682.0, 1812.0, 5587.0, 25895.0, 280323.0, 664394.0, 55260.0, 9562.0, 2650.0, 950.0, 373.0, 177.0, 84.0, 47.0, 33.0, 24.0, 10.0, 5.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10882568359375, -0.10522079467773438, -0.10161590576171875, -0.09801101684570312, -0.0944061279296875, -0.09080123901367188, -0.08719635009765625, -0.08359146118164062, -0.079986572265625, -0.07638168334960938, -0.07277679443359375, -0.06917190551757812, -0.0655670166015625, -0.061962127685546875, -0.05835723876953125, -0.054752349853515625, -0.0511474609375, -0.047542572021484375, -0.04393768310546875, -0.040332794189453125, -0.0367279052734375, -0.033123016357421875, -0.02951812744140625, -0.025913238525390625, -0.022308349609375, -0.018703460693359375, -0.01509857177734375, -0.011493682861328125, -0.0078887939453125, -0.004283905029296875, -0.00067901611328125, 0.002925872802734375, 0.00653076171875, 0.010135650634765625, 0.01374053955078125, 0.017345428466796875, 0.0209503173828125, 0.024555206298828125, 0.02816009521484375, 0.031764984130859375, 0.035369873046875, 0.038974761962890625, 0.04257965087890625, 0.046184539794921875, 0.0497894287109375, 0.053394317626953125, 0.05699920654296875, 0.060604095458984375, 0.064208984375, 0.06781387329101562, 0.07141876220703125, 0.07502365112304688, 0.0786285400390625, 0.08223342895507812, 0.08583831787109375, 0.08944320678710938, 0.093048095703125, 0.09665298461914062, 0.10025787353515625, 0.10386276245117188, 0.1074676513671875, 0.11107254028320312, 0.11467742919921875, 0.11828231811523438, 0.12188720703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 7.0, 8.0, 11.0, 22.0, 23.0, 22.0, 31.0, 48.0, 57.0, 68.0, 98.0, 106.0, 87.0, 79.0, 69.0, 49.0, 61.0, 27.0, 23.0, 15.0, 18.0, 13.0, 17.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.09228515625, -0.08977413177490234, -0.08726310729980469, -0.08475208282470703, -0.08224105834960938, -0.07973003387451172, -0.07721900939941406, -0.0747079849243164, -0.07219696044921875, -0.0696859359741211, -0.06717491149902344, -0.06466388702392578, -0.062152862548828125, -0.05964183807373047, -0.05713081359863281, -0.054619789123535156, -0.0521087646484375, -0.049597740173339844, -0.04708671569824219, -0.04457569122314453, -0.042064666748046875, -0.03955364227294922, -0.03704261779785156, -0.034531593322753906, -0.03202056884765625, -0.029509544372558594, -0.026998519897460938, -0.02448749542236328, -0.021976470947265625, -0.01946544647216797, -0.016954421997070312, -0.014443397521972656, -0.011932373046875, -0.009421348571777344, -0.0069103240966796875, -0.004399299621582031, -0.001888275146484375, 0.0006227493286132812, 0.0031337738037109375, 0.005644798278808594, 0.00815582275390625, 0.010666847229003906, 0.013177871704101562, 0.01568889617919922, 0.018199920654296875, 0.02071094512939453, 0.023221969604492188, 0.025732994079589844, 0.0282440185546875, 0.030755043029785156, 0.03326606750488281, 0.03577709197998047, 0.038288116455078125, 0.04079914093017578, 0.04331016540527344, 0.045821189880371094, 0.04833221435546875, 0.050843238830566406, 0.05335426330566406, 0.05586528778076172, 0.058376312255859375, 0.06088733673095703, 0.06339836120605469, 0.06590938568115234, 0.06842041015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 9.0, 20.0, 35.0, 83.0, 199.0, 359.0, 170.0, 68.0, 21.0, 15.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.176950216293335, -2.1257588863372803, -2.0745675563812256, -2.023376226425171, -1.9721850156784058, -1.920993685722351, -1.869802474975586, -1.8186111450195312, -1.7674198150634766, -1.7162284851074219, -1.6650371551513672, -1.613845944404602, -1.5626546144485474, -1.5114632844924927, -1.4602720737457275, -1.4090807437896729, -1.3578894138336182, -1.3066980838775635, -1.2555067539215088, -1.2043155431747437, -1.153124213218689, -1.1019328832626343, -1.0507416725158691, -0.9995503425598145, -0.9483590126037598, -0.8971676826477051, -0.8459764122962952, -0.7947851419448853, -0.7435938119888306, -0.6924024820327759, -0.641211211681366, -0.590019941329956, -0.5388286113739014, -0.48763731122016907, -0.43644601106643677, -0.38525471091270447, -0.33406341075897217, -0.28287211060523987, -0.23168081045150757, -0.18048951029777527, -0.12929821014404297, -0.07810690999031067, -0.02691560983657837, 0.02427569031715393, 0.07546699047088623, 0.12665829062461853, 0.17784959077835083, 0.22904089093208313, 0.28023219108581543, 0.33142349123954773, 0.38261479139328003, 0.43380609154701233, 0.48499739170074463, 0.5361887216567993, 0.5873799920082092, 0.6385712623596191, 0.6897625923156738, 0.7409539222717285, 0.7921451926231384, 0.8433364629745483, 0.894527792930603, 0.9457191228866577, 0.9969103932380676, 1.0481016635894775, 1.0992929935455322]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 7.0, 10.0, 7.0, 13.0, 23.0, 55.0, 88.0, 142.0, 159.0, 170.0, 129.0, 67.0, 40.0, 24.0, 14.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.485454559326172, -3.3795089721679688, -3.2735631465911865, -3.1676173210144043, -3.061671733856201, -2.955726146697998, -2.849780321121216, -2.7438344955444336, -2.6378889083862305, -2.5319433212280273, -2.425997495651245, -2.320051670074463, -2.2141060829162598, -2.1081604957580566, -2.0022146701812744, -1.8962689638137817, -1.790323257446289, -1.6843775510787964, -1.5784318447113037, -1.472486138343811, -1.3665404319763184, -1.2605947256088257, -1.154649019241333, -1.0487033128738403, -0.9427576065063477, -0.836811900138855, -0.7308661937713623, -0.6249204874038696, -0.518974781036377, -0.4130290746688843, -0.3070833683013916, -0.20113766193389893, -0.09519219398498535, 0.010753512382507324, 0.11669921875, 0.22264492511749268, 0.32859063148498535, 0.434536337852478, 0.5404820442199707, 0.6464277505874634, 0.752373456954956, 0.8583191633224487, 0.9642648696899414, 1.070210576057434, 1.1761562824249268, 1.2821019887924194, 1.388047695159912, 1.4939934015274048, 1.5999391078948975, 1.7058848142623901, 1.8118305206298828, 1.9177762269973755, 2.023721933364868, 2.1296677589416504, 2.2356133460998535, 2.3415589332580566, 2.447504758834839, 2.553450584411621, 2.659396171569824, 2.7653417587280273, 2.8712875843048096, 2.977233409881592, 3.083178997039795, 3.189124584197998, 3.2950704097747803]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 11.0, 7.0, 15.0, 20.0, 32.0, 46.0, 78.0, 99.0, 123.0, 215.0, 290.0, 459.0, 729.0, 1203.0, 1826.0, 3190.0, 5875.0, 12420.0, 32878.0, 192161.0, 3790938.0, 94763.0, 28164.0, 12440.0, 6511.0, 3680.0, 2134.0, 1377.0, 895.0, 555.0, 343.0, 230.0, 186.0, 126.0, 76.0, 61.0, 31.0, 27.0, 22.0, 19.0, 12.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23974609375, -0.2325592041015625, -0.225372314453125, -0.2181854248046875, -0.21099853515625, -0.2038116455078125, -0.196624755859375, -0.1894378662109375, -0.1822509765625, -0.1750640869140625, -0.167877197265625, -0.1606903076171875, -0.15350341796875, -0.1463165283203125, -0.139129638671875, -0.1319427490234375, -0.124755859375, -0.1175689697265625, -0.110382080078125, -0.1031951904296875, -0.09600830078125, -0.0888214111328125, -0.081634521484375, -0.0744476318359375, -0.0672607421875, -0.0600738525390625, -0.052886962890625, -0.0457000732421875, -0.03851318359375, -0.0313262939453125, -0.024139404296875, -0.0169525146484375, -0.009765625, -0.0025787353515625, 0.004608154296875, 0.0117950439453125, 0.01898193359375, 0.0261688232421875, 0.033355712890625, 0.0405426025390625, 0.0477294921875, 0.0549163818359375, 0.062103271484375, 0.0692901611328125, 0.07647705078125, 0.0836639404296875, 0.090850830078125, 0.0980377197265625, 0.105224609375, 0.1124114990234375, 0.119598388671875, 0.1267852783203125, 0.13397216796875, 0.1411590576171875, 0.148345947265625, 0.1555328369140625, 0.1627197265625, 0.1699066162109375, 0.177093505859375, 0.1842803955078125, 0.19146728515625, 0.1986541748046875, 0.205841064453125, 0.2130279541015625, 0.22021484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 6.0, 5.0, 6.0, 13.0, 12.0, 25.0, 49.0, 135.0, 250.0, 199.0, 100.0, 37.0, 24.0, 13.0, 11.0, 9.0, 15.0, 10.0, 8.0, 9.0, 7.0, 6.0, 2.0, 4.0, 5.0, 1.0, 3.0, 6.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0305938720703125, -0.029616117477416992, -0.028638362884521484, -0.027660608291625977, -0.02668285369873047, -0.02570509910583496, -0.024727344512939453, -0.023749589920043945, -0.022771835327148438, -0.02179408073425293, -0.020816326141357422, -0.019838571548461914, -0.018860816955566406, -0.0178830623626709, -0.01690530776977539, -0.015927553176879883, -0.014949798583984375, -0.013972043991088867, -0.01299428939819336, -0.012016534805297852, -0.011038780212402344, -0.010061025619506836, -0.009083271026611328, -0.00810551643371582, -0.0071277618408203125, -0.006150007247924805, -0.005172252655029297, -0.004194498062133789, -0.0032167434692382812, -0.0022389888763427734, -0.0012612342834472656, -0.0002834796905517578, 0.00069427490234375, 0.0016720294952392578, 0.0026497840881347656, 0.0036275386810302734, 0.004605293273925781, 0.005583047866821289, 0.006560802459716797, 0.007538557052612305, 0.008516311645507812, 0.00949406623840332, 0.010471820831298828, 0.011449575424194336, 0.012427330017089844, 0.013405084609985352, 0.01438283920288086, 0.015360593795776367, 0.016338348388671875, 0.017316102981567383, 0.01829385757446289, 0.0192716121673584, 0.020249366760253906, 0.021227121353149414, 0.022204875946044922, 0.02318263053894043, 0.024160385131835938, 0.025138139724731445, 0.026115894317626953, 0.02709364891052246, 0.02807140350341797, 0.029049158096313477, 0.030026912689208984, 0.031004667282104492, 0.031982421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 8.0, 8.0, 9.0, 8.0, 22.0, 22.0, 44.0, 87.0, 116.0, 209.0, 342.0, 810.0, 1753.0, 4985.0, 17375.0, 80310.0, 851710.0, 3061767.0, 136708.0, 26245.0, 7277.0, 2416.0, 976.0, 457.0, 242.0, 135.0, 77.0, 42.0, 29.0, 35.0, 15.0, 11.0, 8.0, 10.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.2548828125, -0.24802017211914062, -0.24115753173828125, -0.23429489135742188, -0.2274322509765625, -0.22056961059570312, -0.21370697021484375, -0.20684432983398438, -0.199981689453125, -0.19311904907226562, -0.18625640869140625, -0.17939376831054688, -0.1725311279296875, -0.16566848754882812, -0.15880584716796875, -0.15194320678710938, -0.14508056640625, -0.13821792602539062, -0.13135528564453125, -0.12449264526367188, -0.1176300048828125, -0.11076736450195312, -0.10390472412109375, -0.09704208374023438, -0.090179443359375, -0.08331680297851562, -0.07645416259765625, -0.06959152221679688, -0.0627288818359375, -0.055866241455078125, -0.04900360107421875, -0.042140960693359375, -0.0352783203125, -0.028415679931640625, -0.02155303955078125, -0.014690399169921875, -0.0078277587890625, -0.000965118408203125, 0.00589752197265625, 0.012760162353515625, 0.019622802734375, 0.026485443115234375, 0.03334808349609375, 0.040210723876953125, 0.0470733642578125, 0.053936004638671875, 0.06079864501953125, 0.06766128540039062, 0.07452392578125, 0.08138656616210938, 0.08824920654296875, 0.09511184692382812, 0.1019744873046875, 0.10883712768554688, 0.11569976806640625, 0.12256240844726562, 0.129425048828125, 0.13628768920898438, 0.14315032958984375, 0.15001296997070312, 0.1568756103515625, 0.16373825073242188, 0.17060089111328125, 0.17746353149414062, 0.184326171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 7.0, 15.0, 10.0, 18.0, 30.0, 41.0, 64.0, 102.0, 162.0, 273.0, 516.0, 1638.0, 477.0, 227.0, 153.0, 84.0, 63.0, 47.0, 32.0, 25.0, 18.0, 14.0, 11.0, 8.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0], "bins": [-0.05621337890625, -0.05491924285888672, -0.05362510681152344, -0.052330970764160156, -0.051036834716796875, -0.049742698669433594, -0.04844856262207031, -0.04715442657470703, -0.04586029052734375, -0.04456615447998047, -0.04327201843261719, -0.041977882385253906, -0.040683746337890625, -0.039389610290527344, -0.03809547424316406, -0.03680133819580078, -0.0355072021484375, -0.03421306610107422, -0.03291893005371094, -0.031624794006347656, -0.030330657958984375, -0.029036521911621094, -0.027742385864257812, -0.02644824981689453, -0.02515411376953125, -0.02385997772216797, -0.022565841674804688, -0.021271705627441406, -0.019977569580078125, -0.018683433532714844, -0.017389297485351562, -0.01609516143798828, -0.014801025390625, -0.013506889343261719, -0.012212753295898438, -0.010918617248535156, -0.009624481201171875, -0.008330345153808594, -0.0070362091064453125, -0.005742073059082031, -0.00444793701171875, -0.0031538009643554688, -0.0018596649169921875, -0.0005655288696289062, 0.000728607177734375, 0.0020227432250976562, 0.0033168792724609375, 0.004611015319824219, 0.0059051513671875, 0.007199287414550781, 0.008493423461914062, 0.009787559509277344, 0.011081695556640625, 0.012375831604003906, 0.013669967651367188, 0.014964103698730469, 0.01625823974609375, 0.01755237579345703, 0.018846511840820312, 0.020140647888183594, 0.021434783935546875, 0.022728919982910156, 0.024023056030273438, 0.02531719207763672, 0.026611328125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 11.0, 141.0, 624.0, 200.0, 16.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2949503660202026, -1.2683104276657104, -1.2416704893112183, -1.215030550956726, -1.1883904933929443, -1.1617505550384521, -1.13511061668396, -1.1084706783294678, -1.0818307399749756, -1.0551908016204834, -1.0285508632659912, -1.001910924911499, -0.9752709269523621, -0.9486309289932251, -0.9219909906387329, -0.8953510522842407, -0.8687111139297485, -0.8420711755752563, -0.8154311776161194, -0.7887912392616272, -0.762151300907135, -0.735511302947998, -0.7088713645935059, -0.6822314262390137, -0.6555914282798767, -0.6289514899253845, -0.6023114919662476, -0.5756715536117554, -0.5490316152572632, -0.522391676902771, -0.49575167894363403, -0.46911174058914185, -0.44247180223464966, -0.4158318340778351, -0.3891918957233429, -0.3625519275665283, -0.33591198921203613, -0.30927202105522156, -0.282632052898407, -0.2559921145439148, -0.2293521612882614, -0.20271220803260803, -0.17607225477695465, -0.14943230152130127, -0.12279234081506729, -0.09615238010883331, -0.06951242685317993, -0.04287247359752655, -0.01623252034187317, 0.010407434776425362, 0.03704738989472389, 0.06368734687566757, 0.09032730013132095, 0.11696726083755493, 0.1436072140932083, 0.1702471673488617, 0.19688712060451508, 0.22352707386016846, 0.25016704201698303, 0.2768069803714752, 0.3034469485282898, 0.330086886882782, 0.35672685503959656, 0.38336682319641113, 0.4100067615509033]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 4.0, 7.0, 12.0, 4.0, 7.0, 16.0, 18.0, 17.0, 26.0, 35.0, 39.0, 52.0, 48.0, 48.0, 72.0, 67.0, 48.0, 62.0, 71.0, 56.0, 49.0, 45.0, 39.0, 31.0, 25.0, 20.0, 16.0, 15.0, 7.0, 12.0, 9.0, 6.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.17127442359924316, -0.166089728474617, -0.16090503334999084, -0.15572033822536469, -0.15053564310073853, -0.14535094797611237, -0.1401662528514862, -0.13498154282569885, -0.1297968626022339, -0.12461216747760773, -0.11942747235298157, -0.11424277722835541, -0.10905808210372925, -0.10387338697910309, -0.09868868440389633, -0.09350398927927017, -0.08831928670406342, -0.08313459157943726, -0.0779498964548111, -0.07276520133018494, -0.06758050620555878, -0.06239580735564232, -0.05721110850572586, -0.0520264133810997, -0.04684171825647354, -0.04165702313184738, -0.03647232800722122, -0.031287629157304764, -0.026102934032678604, -0.020918238908052444, -0.015733541920781136, -0.010548844933509827, -0.005364149808883667, -0.0001794537529349327, 0.005005242303013802, 0.010189938358962536, 0.01537463441491127, 0.02055932953953743, 0.02574402652680874, 0.030928723514080048, 0.03611341863870621, 0.04129811376333237, 0.04648280888795853, 0.051667507737874985, 0.056852202862501144, 0.062036897987127304, 0.06722159683704376, 0.07240629196166992, 0.07759098708629608, 0.08277568221092224, 0.0879603773355484, 0.09314507246017456, 0.09832976758480072, 0.10351446270942688, 0.10869916528463364, 0.1138838604092598, 0.11906855553388596, 0.12425325065851212, 0.12943795323371887, 0.13462264835834503, 0.1398073434829712, 0.14499203860759735, 0.1501767337322235, 0.15536142885684967, 0.16054612398147583]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 11.0, 9.0, 14.0, 23.0, 27.0, 37.0, 51.0, 89.0, 134.0, 159.0, 267.0, 437.0, 652.0, 1058.0, 1749.0, 3187.0, 5884.0, 11906.0, 25736.0, 82492.0, 715463.0, 138337.0, 31322.0, 13885.0, 6799.0, 3549.0, 1977.0, 1156.0, 695.0, 506.0, 307.0, 197.0, 126.0, 87.0, 65.0, 44.0, 26.0, 22.0, 14.0, 14.0, 9.0, 13.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.177734375, -0.1722850799560547, -0.16683578491210938, -0.16138648986816406, -0.15593719482421875, -0.15048789978027344, -0.14503860473632812, -0.1395893096923828, -0.1341400146484375, -0.1286907196044922, -0.12324142456054688, -0.11779212951660156, -0.11234283447265625, -0.10689353942871094, -0.10144424438476562, -0.09599494934082031, -0.090545654296875, -0.08509635925292969, -0.07964706420898438, -0.07419776916503906, -0.06874847412109375, -0.06329917907714844, -0.057849884033203125, -0.05240058898925781, -0.0469512939453125, -0.04150199890136719, -0.036052703857421875, -0.030603408813476562, -0.02515411376953125, -0.019704818725585938, -0.014255523681640625, -0.008806228637695312, -0.00335693359375, 0.0020923614501953125, 0.007541656494140625, 0.012990951538085938, 0.01844024658203125, 0.023889541625976562, 0.029338836669921875, 0.03478813171386719, 0.0402374267578125, 0.04568672180175781, 0.051136016845703125, 0.05658531188964844, 0.06203460693359375, 0.06748390197753906, 0.07293319702148438, 0.07838249206542969, 0.083831787109375, 0.08928108215332031, 0.09473037719726562, 0.10017967224121094, 0.10562896728515625, 0.11107826232910156, 0.11652755737304688, 0.12197685241699219, 0.1274261474609375, 0.1328754425048828, 0.13832473754882812, 0.14377403259277344, 0.14922332763671875, 0.15467262268066406, 0.16012191772460938, 0.1655712127685547, 0.1710205078125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 5.0, 12.0, 15.0, 28.0, 57.0, 140.0, 225.0, 202.0, 111.0, 47.0, 16.0, 24.0, 17.0, 8.0, 9.0, 8.0, 11.0, 5.0, 5.0, 6.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.034210205078125, -0.03318166732788086, -0.03215312957763672, -0.031124591827392578, -0.030096054077148438, -0.029067516326904297, -0.028038978576660156, -0.027010440826416016, -0.025981903076171875, -0.024953365325927734, -0.023924827575683594, -0.022896289825439453, -0.021867752075195312, -0.020839214324951172, -0.01981067657470703, -0.01878213882446289, -0.01775360107421875, -0.01672506332397461, -0.01569652557373047, -0.014667987823486328, -0.013639450073242188, -0.012610912322998047, -0.011582374572753906, -0.010553836822509766, -0.009525299072265625, -0.008496761322021484, -0.007468223571777344, -0.006439685821533203, -0.0054111480712890625, -0.004382610321044922, -0.0033540725708007812, -0.0023255348205566406, -0.0012969970703125, -0.0002684593200683594, 0.0007600784301757812, 0.0017886161804199219, 0.0028171539306640625, 0.003845691680908203, 0.004874229431152344, 0.005902767181396484, 0.006931304931640625, 0.007959842681884766, 0.008988380432128906, 0.010016918182373047, 0.011045455932617188, 0.012073993682861328, 0.013102531433105469, 0.01413106918334961, 0.01515960693359375, 0.01618814468383789, 0.01721668243408203, 0.018245220184326172, 0.019273757934570312, 0.020302295684814453, 0.021330833435058594, 0.022359371185302734, 0.023387908935546875, 0.024416446685791016, 0.025444984436035156, 0.026473522186279297, 0.027502059936523438, 0.028530597686767578, 0.02955913543701172, 0.03058767318725586, 0.0316162109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 8.0, 7.0, 16.0, 18.0, 24.0, 52.0, 64.0, 112.0, 165.0, 310.0, 515.0, 1258.0, 3138.0, 10724.0, 52344.0, 403979.0, 489905.0, 65732.0, 13155.0, 3937.0, 1520.0, 673.0, 340.0, 200.0, 124.0, 62.0, 53.0, 34.0, 17.0, 15.0, 18.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.15625, -0.15121841430664062, -0.14618682861328125, -0.14115524291992188, -0.1361236572265625, -0.13109207153320312, -0.12606048583984375, -0.12102890014648438, -0.115997314453125, -0.11096572875976562, -0.10593414306640625, -0.10090255737304688, -0.0958709716796875, -0.09083938598632812, -0.08580780029296875, -0.08077621459960938, -0.07574462890625, -0.07071304321289062, -0.06568145751953125, -0.060649871826171875, -0.0556182861328125, -0.050586700439453125, -0.04555511474609375, -0.040523529052734375, -0.035491943359375, -0.030460357666015625, -0.02542877197265625, -0.020397186279296875, -0.0153656005859375, -0.010334014892578125, -0.00530242919921875, -0.000270843505859375, 0.0047607421875, 0.009792327880859375, 0.01482391357421875, 0.019855499267578125, 0.0248870849609375, 0.029918670654296875, 0.03495025634765625, 0.039981842041015625, 0.045013427734375, 0.050045013427734375, 0.05507659912109375, 0.060108184814453125, 0.0651397705078125, 0.07017135620117188, 0.07520294189453125, 0.08023452758789062, 0.08526611328125, 0.09029769897460938, 0.09532928466796875, 0.10036087036132812, 0.1053924560546875, 0.11042404174804688, 0.11545562744140625, 0.12048721313476562, 0.125518798828125, 0.13055038452148438, 0.13558197021484375, 0.14061355590820312, 0.1456451416015625, 0.15067672729492188, 0.15570831298828125, 0.16073989868164062, 0.165771484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 10.0, 6.0, 14.0, 17.0, 20.0, 20.0, 24.0, 36.0, 39.0, 38.0, 32.0, 48.0, 42.0, 39.0, 43.0, 45.0, 59.0, 44.0, 60.0, 49.0, 47.0, 37.0, 34.0, 36.0, 27.0, 25.0, 17.0, 18.0, 14.0, 12.0, 4.0, 8.0, 10.0, 8.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11163330078125, -0.10821056365966797, -0.10478782653808594, -0.1013650894165039, -0.09794235229492188, -0.09451961517333984, -0.09109687805175781, -0.08767414093017578, -0.08425140380859375, -0.08082866668701172, -0.07740592956542969, -0.07398319244384766, -0.07056045532226562, -0.0671377182006836, -0.06371498107910156, -0.06029224395751953, -0.0568695068359375, -0.05344676971435547, -0.05002403259277344, -0.046601295471191406, -0.043178558349609375, -0.039755821228027344, -0.03633308410644531, -0.03291034698486328, -0.02948760986328125, -0.02606487274169922, -0.022642135620117188, -0.019219398498535156, -0.015796661376953125, -0.012373924255371094, -0.008951187133789062, -0.005528450012207031, -0.002105712890625, 0.0013170242309570312, 0.0047397613525390625, 0.008162498474121094, 0.011585235595703125, 0.015007972717285156, 0.018430709838867188, 0.02185344696044922, 0.02527618408203125, 0.02869892120361328, 0.03212165832519531, 0.035544395446777344, 0.038967132568359375, 0.042389869689941406, 0.04581260681152344, 0.04923534393310547, 0.0526580810546875, 0.05608081817626953, 0.05950355529785156, 0.0629262924194336, 0.06634902954101562, 0.06977176666259766, 0.07319450378417969, 0.07661724090576172, 0.08003997802734375, 0.08346271514892578, 0.08688545227050781, 0.09030818939208984, 0.09373092651367188, 0.0971536636352539, 0.10057640075683594, 0.10399913787841797, 0.107421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 7.0, 12.0, 16.0, 27.0, 30.0, 40.0, 60.0, 98.0, 175.0, 258.0, 429.0, 701.0, 1372.0, 2951.0, 7060.0, 21647.0, 89480.0, 467805.0, 362794.0, 65291.0, 16871.0, 5879.0, 2571.0, 1278.0, 675.0, 340.0, 212.0, 146.0, 94.0, 55.0, 44.0, 39.0, 26.0, 9.0, 13.0, 15.0, 10.0, 7.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10400390625, -0.10063838958740234, -0.09727287292480469, -0.09390735626220703, -0.09054183959960938, -0.08717632293701172, -0.08381080627441406, -0.0804452896118164, -0.07707977294921875, -0.0737142562866211, -0.07034873962402344, -0.06698322296142578, -0.06361770629882812, -0.06025218963623047, -0.05688667297363281, -0.053521156311035156, -0.0501556396484375, -0.046790122985839844, -0.04342460632324219, -0.04005908966064453, -0.036693572998046875, -0.03332805633544922, -0.029962539672851562, -0.026597023010253906, -0.02323150634765625, -0.019865989685058594, -0.016500473022460938, -0.013134956359863281, -0.009769439697265625, -0.006403923034667969, -0.0030384063720703125, 0.00032711029052734375, 0.003692626953125, 0.007058143615722656, 0.010423660278320312, 0.013789176940917969, 0.017154693603515625, 0.02052021026611328, 0.023885726928710938, 0.027251243591308594, 0.03061676025390625, 0.033982276916503906, 0.03734779357910156, 0.04071331024169922, 0.044078826904296875, 0.04744434356689453, 0.05080986022949219, 0.054175376892089844, 0.0575408935546875, 0.060906410217285156, 0.06427192687988281, 0.06763744354248047, 0.07100296020507812, 0.07436847686767578, 0.07773399353027344, 0.0810995101928711, 0.08446502685546875, 0.0878305435180664, 0.09119606018066406, 0.09456157684326172, 0.09792709350585938, 0.10129261016845703, 0.10465812683105469, 0.10802364349365234, 0.11138916015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 8.0, 3.0, 7.0, 16.0, 17.0, 22.0, 39.0, 36.0, 44.0, 62.0, 58.0, 97.0, 109.0, 109.0, 83.0, 59.0, 49.0, 45.0, 25.0, 31.0, 17.0, 12.0, 13.0, 8.0, 6.0, 2.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.888410568237305e-05, -9.611900895833969e-05, -9.335391223430634e-05, -9.058881551027298e-05, -8.782371878623962e-05, -8.505862206220627e-05, -8.229352533817291e-05, -7.952842861413956e-05, -7.67633318901062e-05, -7.399823516607285e-05, -7.123313844203949e-05, -6.846804171800613e-05, -6.570294499397278e-05, -6.293784826993942e-05, -6.017275154590607e-05, -5.740765482187271e-05, -5.4642558097839355e-05, -5.1877461373806e-05, -4.9112364649772644e-05, -4.634726792573929e-05, -4.358217120170593e-05, -4.081707447767258e-05, -3.805197775363922e-05, -3.5286881029605865e-05, -3.252178430557251e-05, -2.9756687581539154e-05, -2.69915908575058e-05, -2.4226494133472443e-05, -2.1461397409439087e-05, -1.869630068540573e-05, -1.5931203961372375e-05, -1.316610723733902e-05, -1.0401010513305664e-05, -7.635913789272308e-06, -4.870817065238953e-06, -2.105720341205597e-06, 6.593763828277588e-07, 3.4244731068611145e-06, 6.18956983089447e-06, 8.954666554927826e-06, 1.1719763278961182e-05, 1.4484860002994537e-05, 1.7249956727027893e-05, 2.001505345106125e-05, 2.2780150175094604e-05, 2.554524689912796e-05, 2.8310343623161316e-05, 3.107544034719467e-05, 3.384053707122803e-05, 3.660563379526138e-05, 3.937073051929474e-05, 4.2135827243328094e-05, 4.490092396736145e-05, 4.7666020691394806e-05, 5.043111741542816e-05, 5.319621413946152e-05, 5.596131086349487e-05, 5.872640758752823e-05, 6.149150431156158e-05, 6.425660103559494e-05, 6.70216977596283e-05, 6.978679448366165e-05, 7.255189120769501e-05, 7.531698793172836e-05, 7.808208465576172e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 8.0, 4.0, 14.0, 21.0, 24.0, 40.0, 61.0, 126.0, 248.0, 482.0, 1096.0, 3208.0, 12294.0, 67906.0, 504814.0, 392469.0, 50945.0, 10006.0, 2761.0, 1014.0, 463.0, 227.0, 135.0, 65.0, 33.0, 27.0, 20.0, 20.0, 11.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12320137023925781, -0.11908340454101562, -0.11496543884277344, -0.11084747314453125, -0.10672950744628906, -0.10261154174804688, -0.09849357604980469, -0.0943756103515625, -0.09025764465332031, -0.08613967895507812, -0.08202171325683594, -0.07790374755859375, -0.07378578186035156, -0.06966781616210938, -0.06554985046386719, -0.061431884765625, -0.05731391906738281, -0.053195953369140625, -0.04907798767089844, -0.04496002197265625, -0.04084205627441406, -0.036724090576171875, -0.03260612487792969, -0.0284881591796875, -0.024370193481445312, -0.020252227783203125, -0.016134262084960938, -0.01201629638671875, -0.007898330688476562, -0.003780364990234375, 0.0003376007080078125, 0.00445556640625, 0.008573532104492188, 0.012691497802734375, 0.016809463500976562, 0.02092742919921875, 0.025045394897460938, 0.029163360595703125, 0.03328132629394531, 0.0373992919921875, 0.04151725769042969, 0.045635223388671875, 0.04975318908691406, 0.05387115478515625, 0.05798912048339844, 0.062107086181640625, 0.06622505187988281, 0.070343017578125, 0.07446098327636719, 0.07857894897460938, 0.08269691467285156, 0.08681488037109375, 0.09093284606933594, 0.09505081176757812, 0.09916877746582031, 0.1032867431640625, 0.10740470886230469, 0.11152267456054688, 0.11564064025878906, 0.11975860595703125, 0.12387657165527344, 0.12799453735351562, 0.1321125030517578, 0.13623046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 11.0, 15.0, 18.0, 23.0, 43.0, 55.0, 73.0, 94.0, 99.0, 105.0, 103.0, 84.0, 83.0, 54.0, 38.0, 30.0, 16.0, 13.0, 15.0, 8.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09326171875, -0.09038448333740234, -0.08750724792480469, -0.08463001251220703, -0.08175277709960938, -0.07887554168701172, -0.07599830627441406, -0.0731210708618164, -0.07024383544921875, -0.0673666000366211, -0.06448936462402344, -0.06161212921142578, -0.058734893798828125, -0.05585765838623047, -0.05298042297363281, -0.050103187561035156, -0.0472259521484375, -0.044348716735839844, -0.04147148132324219, -0.03859424591064453, -0.035717010498046875, -0.03283977508544922, -0.029962539672851562, -0.027085304260253906, -0.02420806884765625, -0.021330833435058594, -0.018453598022460938, -0.015576362609863281, -0.012699127197265625, -0.009821891784667969, -0.0069446563720703125, -0.004067420959472656, -0.001190185546875, 0.0016870498657226562, 0.0045642852783203125, 0.007441520690917969, 0.010318756103515625, 0.013195991516113281, 0.016073226928710938, 0.018950462341308594, 0.02182769775390625, 0.024704933166503906, 0.027582168579101562, 0.03045940399169922, 0.033336639404296875, 0.03621387481689453, 0.03909111022949219, 0.041968345642089844, 0.0448455810546875, 0.047722816467285156, 0.05060005187988281, 0.05347728729248047, 0.056354522705078125, 0.05923175811767578, 0.06210899353027344, 0.0649862289428711, 0.06786346435546875, 0.0707406997680664, 0.07361793518066406, 0.07649517059326172, 0.07937240600585938, 0.08224964141845703, 0.08512687683105469, 0.08800411224365234, 0.09088134765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 20.0, 108.0, 412.0, 347.0, 80.0, 17.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5367259979248047, -3.4658761024475098, -3.395026206970215, -3.324176549911499, -3.253326654434204, -3.182476758956909, -3.1116268634796143, -3.0407772064208984, -2.9699273109436035, -2.8990774154663086, -2.8282275199890137, -2.757377862930298, -2.686527967453003, -2.615678071975708, -2.544828176498413, -2.4739785194396973, -2.4031286239624023, -2.3322787284851074, -2.2614288330078125, -2.1905791759490967, -2.1197292804718018, -2.048879384994507, -1.978029489517212, -1.9071797132492065, -1.836329698562622, -1.7654798030853271, -1.6946300268173218, -1.6237801313400269, -1.5529303550720215, -1.4820804595947266, -1.4112305641174316, -1.3403807878494263, -1.269531011581421, -1.198681116104126, -1.1278313398361206, -1.0569814443588257, -0.9861316680908203, -0.9152817726135254, -0.8444319367408752, -0.7735821008682251, -0.702732264995575, -0.6318824291229248, -0.5610325932502747, -0.4901827275753021, -0.419332891702652, -0.34848305583000183, -0.2776331901550293, -0.20678335428237915, -0.135933518409729, -0.06508367508649826, 0.005766168236732483, 0.07661601901054382, 0.14746585488319397, 0.21831569075584412, 0.28916555643081665, 0.3600153923034668, 0.43086522817611694, 0.5017150640487671, 0.5725648999214172, 0.6434147357940674, 0.7142646312713623, 0.7851144075393677, 0.8559643030166626, 0.9268141388893127, 0.9976639747619629]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 8.0, 5.0, 13.0, 13.0, 23.0, 36.0, 40.0, 56.0, 66.0, 57.0, 79.0, 84.0, 83.0, 86.0, 68.0, 51.0, 55.0, 32.0, 42.0, 29.0, 17.0, 9.0, 7.0, 4.0, 10.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0924714803695679, -1.0593444108963013, -1.0262172222137451, -0.9930901527404785, -0.9599630832672119, -0.9268360137939453, -0.8937088847160339, -0.8605817556381226, -0.827454686164856, -0.7943276166915894, -0.761200487613678, -0.7280733585357666, -0.6949462890625, -0.6618192195892334, -0.628692090511322, -0.5955649614334106, -0.562437891960144, -0.5293108224868774, -0.49618369340896606, -0.4630565941333771, -0.4299294948577881, -0.3968023955821991, -0.3636752963066101, -0.3305481970310211, -0.29742109775543213, -0.26429399847984314, -0.23116689920425415, -0.19803979992866516, -0.16491270065307617, -0.13178560137748718, -0.0986585021018982, -0.0655314028263092, -0.032404184341430664, 0.0007229149341583252, 0.033850014209747314, 0.0669771134853363, 0.10010421276092529, 0.13323131203651428, 0.16635841131210327, 0.19948551058769226, 0.23261260986328125, 0.26573970913887024, 0.29886680841445923, 0.3319939076900482, 0.3651210069656372, 0.3982481062412262, 0.4313752055168152, 0.4645023047924042, 0.49762940406799316, 0.5307564735412598, 0.5638836026191711, 0.5970107316970825, 0.6301378011703491, 0.6632648706436157, 0.6963919997215271, 0.7295191287994385, 0.7626461982727051, 0.7957732677459717, 0.8289003968238831, 0.8620275259017944, 0.895154595375061, 0.9282816648483276, 0.961408793926239, 0.9945359230041504, 1.027662992477417]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 11.0, 11.0, 12.0, 22.0, 38.0, 31.0, 45.0, 50.0, 72.0, 95.0, 120.0, 179.0, 260.0, 389.0, 538.0, 861.0, 1256.0, 2239.0, 4141.0, 9333.0, 27546.0, 164477.0, 3822519.0, 113353.0, 24616.0, 9377.0, 4681.0, 2622.0, 1555.0, 1042.0, 718.0, 474.0, 401.0, 295.0, 213.0, 163.0, 133.0, 97.0, 68.0, 56.0, 47.0, 24.0, 29.0, 13.0, 9.0, 8.0, 9.0, 4.0, 4.0, 7.0, 1.0, 1.0, 1.0], "bins": [-0.320556640625, -0.3109703063964844, -0.30138397216796875, -0.2917976379394531, -0.2822113037109375, -0.2726249694824219, -0.26303863525390625, -0.2534523010253906, -0.243865966796875, -0.23427963256835938, -0.22469329833984375, -0.21510696411132812, -0.2055206298828125, -0.19593429565429688, -0.18634796142578125, -0.17676162719726562, -0.16717529296875, -0.15758895874023438, -0.14800262451171875, -0.13841629028320312, -0.1288299560546875, -0.11924362182617188, -0.10965728759765625, -0.10007095336914062, -0.090484619140625, -0.08089828491210938, -0.07131195068359375, -0.061725616455078125, -0.0521392822265625, -0.042552947998046875, -0.03296661376953125, -0.023380279541015625, -0.0137939453125, -0.004207611083984375, 0.00537872314453125, 0.014965057373046875, 0.0245513916015625, 0.034137725830078125, 0.04372406005859375, 0.053310394287109375, 0.062896728515625, 0.07248306274414062, 0.08206939697265625, 0.09165573120117188, 0.1012420654296875, 0.11082839965820312, 0.12041473388671875, 0.13000106811523438, 0.13958740234375, 0.14917373657226562, 0.15876007080078125, 0.16834640502929688, 0.1779327392578125, 0.18751907348632812, 0.19710540771484375, 0.20669174194335938, 0.216278076171875, 0.22586441040039062, 0.23545074462890625, 0.24503707885742188, 0.2546234130859375, 0.2642097473144531, 0.27379608154296875, 0.2833824157714844, 0.29296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 7.0, 7.0, 14.0, 6.0, 31.0, 31.0, 61.0, 118.0, 180.0, 190.0, 133.0, 53.0, 35.0, 23.0, 21.0, 13.0, 15.0, 5.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.035552978515625, -0.03455018997192383, -0.033547401428222656, -0.032544612884521484, -0.03154182434082031, -0.03053903579711914, -0.02953624725341797, -0.028533458709716797, -0.027530670166015625, -0.026527881622314453, -0.02552509307861328, -0.02452230453491211, -0.023519515991210938, -0.022516727447509766, -0.021513938903808594, -0.020511150360107422, -0.01950836181640625, -0.018505573272705078, -0.017502784729003906, -0.016499996185302734, -0.015497207641601562, -0.01449441909790039, -0.013491630554199219, -0.012488842010498047, -0.011486053466796875, -0.010483264923095703, -0.009480476379394531, -0.00847768783569336, -0.0074748992919921875, -0.006472110748291016, -0.005469322204589844, -0.004466533660888672, -0.0034637451171875, -0.002460956573486328, -0.0014581680297851562, -0.0004553794860839844, 0.0005474090576171875, 0.0015501976013183594, 0.0025529861450195312, 0.003555774688720703, 0.004558563232421875, 0.005561351776123047, 0.006564140319824219, 0.007566928863525391, 0.008569717407226562, 0.009572505950927734, 0.010575294494628906, 0.011578083038330078, 0.01258087158203125, 0.013583660125732422, 0.014586448669433594, 0.015589237213134766, 0.016592025756835938, 0.01759481430053711, 0.01859760284423828, 0.019600391387939453, 0.020603179931640625, 0.021605968475341797, 0.02260875701904297, 0.02361154556274414, 0.024614334106445312, 0.025617122650146484, 0.026619911193847656, 0.027622699737548828, 0.02862548828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 9.0, 8.0, 13.0, 28.0, 29.0, 66.0, 112.0, 233.0, 577.0, 1940.0, 7906.0, 49632.0, 3357609.0, 738592.0, 29744.0, 5466.0, 1452.0, 476.0, 160.0, 76.0, 56.0, 24.0, 17.0, 10.0, 14.0, 9.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.430908203125, -0.4173927307128906, -0.40387725830078125, -0.3903617858886719, -0.3768463134765625, -0.3633308410644531, -0.34981536865234375, -0.3362998962402344, -0.322784423828125, -0.3092689514160156, -0.29575347900390625, -0.2822380065917969, -0.2687225341796875, -0.2552070617675781, -0.24169158935546875, -0.22817611694335938, -0.21466064453125, -0.20114517211914062, -0.18762969970703125, -0.17411422729492188, -0.1605987548828125, -0.14708328247070312, -0.13356781005859375, -0.12005233764648438, -0.106536865234375, -0.09302139282226562, -0.07950592041015625, -0.06599044799804688, -0.0524749755859375, -0.038959503173828125, -0.02544403076171875, -0.011928558349609375, 0.0015869140625, 0.015102386474609375, 0.02861785888671875, 0.042133331298828125, 0.0556488037109375, 0.06916427612304688, 0.08267974853515625, 0.09619522094726562, 0.109710693359375, 0.12322616577148438, 0.13674163818359375, 0.15025711059570312, 0.1637725830078125, 0.17728805541992188, 0.19080352783203125, 0.20431900024414062, 0.21783447265625, 0.23134994506835938, 0.24486541748046875, 0.2583808898925781, 0.2718963623046875, 0.2854118347167969, 0.29892730712890625, 0.3124427795410156, 0.325958251953125, 0.3394737243652344, 0.35298919677734375, 0.3665046691894531, 0.3800201416015625, 0.3935356140136719, 0.40705108642578125, 0.4205665588378906, 0.43408203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 2.0, 12.0, 9.0, 10.0, 13.0, 33.0, 34.0, 85.0, 150.0, 290.0, 791.0, 1674.0, 445.0, 187.0, 122.0, 64.0, 42.0, 38.0, 14.0, 11.0, 10.0, 6.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056732177734375, -0.055023193359375, -0.053314208984375, -0.051605224609375, -0.049896240234375, -0.048187255859375, -0.046478271484375, -0.044769287109375, -0.043060302734375, -0.041351318359375, -0.039642333984375, -0.037933349609375, -0.036224365234375, -0.034515380859375, -0.032806396484375, -0.031097412109375, -0.029388427734375, -0.027679443359375, -0.025970458984375, -0.024261474609375, -0.022552490234375, -0.020843505859375, -0.019134521484375, -0.017425537109375, -0.015716552734375, -0.014007568359375, -0.012298583984375, -0.010589599609375, -0.008880615234375, -0.007171630859375, -0.005462646484375, -0.003753662109375, -0.002044677734375, -0.000335693359375, 0.001373291015625, 0.003082275390625, 0.004791259765625, 0.006500244140625, 0.008209228515625, 0.009918212890625, 0.011627197265625, 0.013336181640625, 0.015045166015625, 0.016754150390625, 0.018463134765625, 0.020172119140625, 0.021881103515625, 0.023590087890625, 0.025299072265625, 0.027008056640625, 0.028717041015625, 0.030426025390625, 0.032135009765625, 0.033843994140625, 0.035552978515625, 0.037261962890625, 0.038970947265625, 0.040679931640625, 0.042388916015625, 0.044097900390625, 0.045806884765625, 0.047515869140625, 0.049224853515625, 0.050933837890625, 0.052642822265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 78.0, 292.0, 428.0, 147.0, 34.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7982879877090454, -0.7749184966087341, -0.7515490055084229, -0.7281795144081116, -0.7048100233078003, -0.681440532207489, -0.6580710411071777, -0.6347014904022217, -0.6113320589065552, -0.5879625678062439, -0.5645930767059326, -0.5412235856056213, -0.5178540945053101, -0.4944846034049988, -0.4711150825023651, -0.44774559140205383, -0.42437607049942017, -0.4010065793991089, -0.3776370882987976, -0.35426759719848633, -0.33089810609817505, -0.30752861499786377, -0.2841590940952301, -0.2607896029949188, -0.23742011189460754, -0.21405062079429626, -0.19068112969398499, -0.1673116236925125, -0.14394213259220123, -0.12057264149188995, -0.09720313549041748, -0.0738336443901062, -0.05046415328979492, -0.027094658464193344, -0.0037251636385917664, 0.01964433491230011, 0.04301382601261139, 0.06638331711292267, 0.08975282311439514, 0.11312231421470642, 0.1364918053150177, 0.15986129641532898, 0.18323078751564026, 0.20660029351711273, 0.229969784617424, 0.2533392906188965, 0.27670878171920776, 0.30007827281951904, 0.3234477639198303, 0.3468172550201416, 0.3701867461204529, 0.39355623722076416, 0.41692572832107544, 0.4402952194213867, 0.4636647403240204, 0.48703423142433167, 0.5104037523269653, 0.5337732434272766, 0.5571427345275879, 0.5805122256278992, 0.6038817167282104, 0.6272512078285217, 0.650620698928833, 0.6739902496337891, 0.6973596811294556]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 5.0, 4.0, 10.0, 8.0, 6.0, 16.0, 22.0, 34.0, 28.0, 29.0, 49.0, 42.0, 54.0, 47.0, 61.0, 81.0, 64.0, 58.0, 49.0, 53.0, 43.0, 41.0, 38.0, 31.0, 28.0, 18.0, 24.0, 12.0, 9.0, 5.0, 9.0, 6.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21475166082382202, -0.20842906832695007, -0.20210649073123932, -0.19578389823436737, -0.18946130573749542, -0.18313872814178467, -0.17681613564491272, -0.17049354314804077, -0.16417095065116882, -0.15784835815429688, -0.15152578055858612, -0.14520318806171417, -0.13888059556484222, -0.13255801796913147, -0.12623542547225952, -0.11991283297538757, -0.11359025537967682, -0.10726767033338547, -0.10094507783651352, -0.09462249279022217, -0.08829990029335022, -0.08197731524705887, -0.07565473020076752, -0.06933213770389557, -0.06300955265760422, -0.05668696388602257, -0.05036437511444092, -0.04404179006814957, -0.03771920129656792, -0.03139661252498627, -0.025074027478694916, -0.018751438707113266, -0.012428849935531616, -0.006106262095272541, 0.00021632574498653412, 0.006538912653923035, 0.012861501425504684, 0.019184090197086334, 0.025506675243377686, 0.031829264014959335, 0.038151852786540985, 0.044474441558122635, 0.050797030329704285, 0.057119615375995636, 0.06344220042228699, 0.06976479291915894, 0.07608737796545029, 0.08240996301174164, 0.08873255550861359, 0.09505514055490494, 0.10137773305177689, 0.10770031809806824, 0.11402291059494019, 0.12034549564123154, 0.1266680806875229, 0.13299067318439484, 0.1393132507801056, 0.14563584327697754, 0.1519584208726883, 0.15828101336956024, 0.1646036058664322, 0.17092618346214294, 0.1772487759590149, 0.18357136845588684, 0.1898939609527588]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 9.0, 17.0, 18.0, 24.0, 39.0, 46.0, 72.0, 111.0, 151.0, 225.0, 306.0, 451.0, 625.0, 1060.0, 1847.0, 2994.0, 5332.0, 10952.0, 26557.0, 93547.0, 530602.0, 282144.0, 53951.0, 18332.0, 8249.0, 4372.0, 2468.0, 1391.0, 860.0, 573.0, 371.0, 244.0, 193.0, 115.0, 79.0, 59.0, 42.0, 21.0, 20.0, 16.0, 9.0, 9.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.1832599639892578, -0.17731094360351562, -0.17136192321777344, -0.16541290283203125, -0.15946388244628906, -0.15351486206054688, -0.1475658416748047, -0.1416168212890625, -0.1356678009033203, -0.12971878051757812, -0.12376976013183594, -0.11782073974609375, -0.11187171936035156, -0.10592269897460938, -0.09997367858886719, -0.094024658203125, -0.08807563781738281, -0.08212661743164062, -0.07617759704589844, -0.07022857666015625, -0.06427955627441406, -0.058330535888671875, -0.05238151550292969, -0.0464324951171875, -0.04048347473144531, -0.034534454345703125, -0.028585433959960938, -0.02263641357421875, -0.016687393188476562, -0.010738372802734375, -0.0047893524169921875, 0.00115966796875, 0.0071086883544921875, 0.013057708740234375, 0.019006729125976562, 0.02495574951171875, 0.030904769897460938, 0.036853790283203125, 0.04280281066894531, 0.0487518310546875, 0.05470085144042969, 0.060649871826171875, 0.06659889221191406, 0.07254791259765625, 0.07849693298339844, 0.08444595336914062, 0.09039497375488281, 0.096343994140625, 0.10229301452636719, 0.10824203491210938, 0.11419105529785156, 0.12014007568359375, 0.12608909606933594, 0.13203811645507812, 0.1379871368408203, 0.1439361572265625, 0.1498851776123047, 0.15583419799804688, 0.16178321838378906, 0.16773223876953125, 0.17368125915527344, 0.17963027954101562, 0.1855792999267578, 0.1915283203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 17.0, 23.0, 37.0, 54.0, 89.0, 114.0, 154.0, 148.0, 110.0, 82.0, 33.0, 23.0, 22.0, 11.0, 9.0, 6.0, 5.0, 11.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.032257080078125, -0.031311988830566406, -0.030366897583007812, -0.02942180633544922, -0.028476715087890625, -0.02753162384033203, -0.026586532592773438, -0.025641441345214844, -0.02469635009765625, -0.023751258850097656, -0.022806167602539062, -0.02186107635498047, -0.020915985107421875, -0.01997089385986328, -0.019025802612304688, -0.018080711364746094, -0.0171356201171875, -0.016190528869628906, -0.015245437622070312, -0.014300346374511719, -0.013355255126953125, -0.012410163879394531, -0.011465072631835938, -0.010519981384277344, -0.00957489013671875, -0.008629798889160156, -0.0076847076416015625, -0.006739616394042969, -0.005794525146484375, -0.004849433898925781, -0.0039043426513671875, -0.0029592514038085938, -0.00201416015625, -0.0010690689086914062, -0.0001239776611328125, 0.0008211135864257812, 0.001766204833984375, 0.0027112960815429688, 0.0036563873291015625, 0.004601478576660156, 0.00554656982421875, 0.006491661071777344, 0.0074367523193359375, 0.008381843566894531, 0.009326934814453125, 0.010272026062011719, 0.011217117309570312, 0.012162208557128906, 0.0131072998046875, 0.014052391052246094, 0.014997482299804688, 0.01594257354736328, 0.016887664794921875, 0.01783275604248047, 0.018777847290039062, 0.019722938537597656, 0.02066802978515625, 0.021613121032714844, 0.022558212280273438, 0.02350330352783203, 0.024448394775390625, 0.02539348602294922, 0.026338577270507812, 0.027283668518066406, 0.028228759765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 12.0, 16.0, 11.0, 19.0, 24.0, 34.0, 44.0, 57.0, 108.0, 133.0, 202.0, 282.0, 539.0, 871.0, 1788.0, 4441.0, 15222.0, 69168.0, 396143.0, 449173.0, 82881.0, 17853.0, 5047.0, 1907.0, 967.0, 525.0, 357.0, 229.0, 138.0, 86.0, 73.0, 53.0, 30.0, 26.0, 17.0, 15.0, 11.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.2255859375, -0.21875953674316406, -0.21193313598632812, -0.2051067352294922, -0.19828033447265625, -0.1914539337158203, -0.18462753295898438, -0.17780113220214844, -0.1709747314453125, -0.16414833068847656, -0.15732192993164062, -0.1504955291748047, -0.14366912841796875, -0.1368427276611328, -0.13001632690429688, -0.12318992614746094, -0.116363525390625, -0.10953712463378906, -0.10271072387695312, -0.09588432312011719, -0.08905792236328125, -0.08223152160644531, -0.07540512084960938, -0.06857872009277344, -0.0617523193359375, -0.05492591857910156, -0.048099517822265625, -0.04127311706542969, -0.03444671630859375, -0.027620315551757812, -0.020793914794921875, -0.013967514038085938, -0.00714111328125, -0.0003147125244140625, 0.006511688232421875, 0.013338088989257812, 0.02016448974609375, 0.026990890502929688, 0.033817291259765625, 0.04064369201660156, 0.0474700927734375, 0.05429649353027344, 0.061122894287109375, 0.06794929504394531, 0.07477569580078125, 0.08160209655761719, 0.08842849731445312, 0.09525489807128906, 0.102081298828125, 0.10890769958496094, 0.11573410034179688, 0.12256050109863281, 0.12938690185546875, 0.1362133026123047, 0.14303970336914062, 0.14986610412597656, 0.1566925048828125, 0.16351890563964844, 0.17034530639648438, 0.1771717071533203, 0.18399810791015625, 0.1908245086669922, 0.19765090942382812, 0.20447731018066406, 0.2113037109375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 11.0, 6.0, 9.0, 10.0, 9.0, 12.0, 14.0, 26.0, 31.0, 27.0, 42.0, 26.0, 32.0, 44.0, 42.0, 41.0, 51.0, 46.0, 48.0, 56.0, 42.0, 38.0, 39.0, 41.0, 30.0, 36.0, 24.0, 24.0, 24.0, 16.0, 21.0, 21.0, 14.0, 4.0, 5.0, 4.0, 8.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.10711669921875, -0.10392379760742188, -0.10073089599609375, -0.09753799438476562, -0.0943450927734375, -0.09115219116210938, -0.08795928955078125, -0.08476638793945312, -0.081573486328125, -0.07838058471679688, -0.07518768310546875, -0.07199478149414062, -0.0688018798828125, -0.06560897827148438, -0.06241607666015625, -0.059223175048828125, -0.0560302734375, -0.052837371826171875, -0.04964447021484375, -0.046451568603515625, -0.0432586669921875, -0.040065765380859375, -0.03687286376953125, -0.033679962158203125, -0.030487060546875, -0.027294158935546875, -0.02410125732421875, -0.020908355712890625, -0.0177154541015625, -0.014522552490234375, -0.01132965087890625, -0.008136749267578125, -0.00494384765625, -0.001750946044921875, 0.00144195556640625, 0.004634857177734375, 0.0078277587890625, 0.011020660400390625, 0.01421356201171875, 0.017406463623046875, 0.020599365234375, 0.023792266845703125, 0.02698516845703125, 0.030178070068359375, 0.0333709716796875, 0.036563873291015625, 0.03975677490234375, 0.042949676513671875, 0.046142578125, 0.049335479736328125, 0.05252838134765625, 0.055721282958984375, 0.0589141845703125, 0.062107086181640625, 0.06529998779296875, 0.06849288940429688, 0.071685791015625, 0.07487869262695312, 0.07807159423828125, 0.08126449584960938, 0.0844573974609375, 0.08765029907226562, 0.09084320068359375, 0.09403610229492188, 0.09722900390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 22.0, 31.0, 48.0, 86.0, 194.0, 387.0, 791.0, 1989.0, 5207.0, 16401.0, 68536.0, 376114.0, 460088.0, 87900.0, 20506.0, 6221.0, 2192.0, 965.0, 447.0, 198.0, 94.0, 51.0, 33.0, 21.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1617431640625, -0.15749549865722656, -0.15324783325195312, -0.1490001678466797, -0.14475250244140625, -0.1405048370361328, -0.13625717163085938, -0.13200950622558594, -0.1277618408203125, -0.12351417541503906, -0.11926651000976562, -0.11501884460449219, -0.11077117919921875, -0.10652351379394531, -0.10227584838867188, -0.09802818298339844, -0.093780517578125, -0.08953285217285156, -0.08528518676757812, -0.08103752136230469, -0.07678985595703125, -0.07254219055175781, -0.06829452514648438, -0.06404685974121094, -0.0597991943359375, -0.05555152893066406, -0.051303863525390625, -0.04705619812011719, -0.04280853271484375, -0.03856086730957031, -0.034313201904296875, -0.030065536499023438, -0.02581787109375, -0.021570205688476562, -0.017322540283203125, -0.013074874877929688, -0.00882720947265625, -0.0045795440673828125, -0.000331878662109375, 0.0039157867431640625, 0.0081634521484375, 0.012411117553710938, 0.016658782958984375, 0.020906448364257812, 0.02515411376953125, 0.029401779174804688, 0.033649444580078125, 0.03789710998535156, 0.042144775390625, 0.04639244079589844, 0.050640106201171875, 0.05488777160644531, 0.05913543701171875, 0.06338310241699219, 0.06763076782226562, 0.07187843322753906, 0.0761260986328125, 0.08037376403808594, 0.08462142944335938, 0.08886909484863281, 0.09311676025390625, 0.09736442565917969, 0.10161209106445312, 0.10585975646972656, 0.110107421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 6.0, 14.0, 14.0, 39.0, 41.0, 71.0, 73.0, 112.0, 124.0, 133.0, 106.0, 99.0, 54.0, 39.0, 20.0, 21.0, 15.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.910894393920898e-05, -8.44104215502739e-05, -7.97118991613388e-05, -7.501337677240372e-05, -7.031485438346863e-05, -6.561633199453354e-05, -6.091780960559845e-05, -5.621928721666336e-05, -5.152076482772827e-05, -4.682224243879318e-05, -4.212372004985809e-05, -3.7425197660923004e-05, -3.2726675271987915e-05, -2.8028152883052826e-05, -2.3329630494117737e-05, -1.8631108105182648e-05, -1.3932585716247559e-05, -9.23406332731247e-06, -4.53554093837738e-06, 1.6298145055770874e-07, 4.861503839492798e-06, 9.560026228427887e-06, 1.4258548617362976e-05, 1.8957071006298065e-05, 2.3655593395233154e-05, 2.8354115784168243e-05, 3.305263817310333e-05, 3.775116056203842e-05, 4.244968295097351e-05, 4.71482053399086e-05, 5.184672772884369e-05, 5.654525011777878e-05, 6.124377250671387e-05, 6.594229489564896e-05, 7.064081728458405e-05, 7.533933967351913e-05, 8.003786206245422e-05, 8.473638445138931e-05, 8.94349068403244e-05, 9.413342922925949e-05, 9.883195161819458e-05, 0.00010353047400712967, 0.00010822899639606476, 0.00011292751878499985, 0.00011762604117393494, 0.00012232456356287003, 0.00012702308595180511, 0.0001317216083407402, 0.0001364201307296753, 0.00014111865311861038, 0.00014581717550754547, 0.00015051569789648056, 0.00015521422028541565, 0.00015991274267435074, 0.00016461126506328583, 0.00016930978745222092, 0.000174008309841156, 0.0001787068322300911, 0.00018340535461902618, 0.00018810387700796127, 0.00019280239939689636, 0.00019750092178583145, 0.00020219944417476654, 0.00020689796656370163, 0.00021159648895263672]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 10.0, 13.0, 10.0, 24.0, 26.0, 29.0, 63.0, 74.0, 133.0, 210.0, 372.0, 700.0, 1440.0, 3681.0, 12932.0, 64555.0, 425564.0, 448440.0, 69321.0, 13692.0, 3954.0, 1535.0, 698.0, 368.0, 207.0, 166.0, 92.0, 75.0, 44.0, 30.0, 24.0, 18.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14453125, -0.1401538848876953, -0.13577651977539062, -0.13139915466308594, -0.12702178955078125, -0.12264442443847656, -0.11826705932617188, -0.11388969421386719, -0.1095123291015625, -0.10513496398925781, -0.10075759887695312, -0.09638023376464844, -0.09200286865234375, -0.08762550354003906, -0.08324813842773438, -0.07887077331542969, -0.074493408203125, -0.07011604309082031, -0.06573867797851562, -0.06136131286621094, -0.05698394775390625, -0.05260658264160156, -0.048229217529296875, -0.04385185241699219, -0.0394744873046875, -0.03509712219238281, -0.030719757080078125, -0.026342391967773438, -0.02196502685546875, -0.017587661743164062, -0.013210296630859375, -0.008832931518554688, -0.00445556640625, -7.82012939453125e-05, 0.004299163818359375, 0.008676528930664062, 0.01305389404296875, 0.017431259155273438, 0.021808624267578125, 0.026185989379882812, 0.0305633544921875, 0.03494071960449219, 0.039318084716796875, 0.04369544982910156, 0.04807281494140625, 0.05245018005371094, 0.056827545166015625, 0.06120491027832031, 0.065582275390625, 0.06995964050292969, 0.07433700561523438, 0.07871437072753906, 0.08309173583984375, 0.08746910095214844, 0.09184646606445312, 0.09622383117675781, 0.1006011962890625, 0.10497856140136719, 0.10935592651367188, 0.11373329162597656, 0.11811065673828125, 0.12248802185058594, 0.12686538696289062, 0.1312427520751953, 0.1356201171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 21.0, 17.0, 24.0, 27.0, 38.0, 56.0, 37.0, 54.0, 70.0, 81.0, 84.0, 75.0, 72.0, 46.0, 56.0, 37.0, 33.0, 25.0, 25.0, 24.0, 15.0, 13.0, 11.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06024169921875, -0.058437347412109375, -0.05663299560546875, -0.054828643798828125, -0.0530242919921875, -0.051219940185546875, -0.04941558837890625, -0.047611236572265625, -0.045806884765625, -0.044002532958984375, -0.04219818115234375, -0.040393829345703125, -0.0385894775390625, -0.036785125732421875, -0.03498077392578125, -0.033176422119140625, -0.0313720703125, -0.029567718505859375, -0.02776336669921875, -0.025959014892578125, -0.0241546630859375, -0.022350311279296875, -0.02054595947265625, -0.018741607666015625, -0.016937255859375, -0.015132904052734375, -0.01332855224609375, -0.011524200439453125, -0.0097198486328125, -0.007915496826171875, -0.00611114501953125, -0.004306793212890625, -0.00250244140625, -0.000698089599609375, 0.00110626220703125, 0.002910614013671875, 0.0047149658203125, 0.006519317626953125, 0.00832366943359375, 0.010128021240234375, 0.011932373046875, 0.013736724853515625, 0.01554107666015625, 0.017345428466796875, 0.0191497802734375, 0.020954132080078125, 0.02275848388671875, 0.024562835693359375, 0.0263671875, 0.028171539306640625, 0.02997589111328125, 0.031780242919921875, 0.0335845947265625, 0.035388946533203125, 0.03719329833984375, 0.038997650146484375, 0.040802001953125, 0.042606353759765625, 0.04441070556640625, 0.046215057373046875, 0.0480194091796875, 0.049823760986328125, 0.05162811279296875, 0.053432464599609375, 0.05523681640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 27.0, 298.0, 552.0, 106.0, 19.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-8.200643539428711, -8.054935455322266, -7.90922737121582, -7.763519763946533, -7.617811679840088, -7.472103595733643, -7.326395511627197, -7.180687427520752, -7.034979820251465, -6.8892717361450195, -6.743563652038574, -6.597856044769287, -6.452147960662842, -6.3064398765563965, -6.160731792449951, -6.015023708343506, -5.8693156242370605, -5.723607540130615, -5.57789945602417, -5.432191848754883, -5.2864837646484375, -5.140775680541992, -4.995067596435547, -4.849359512329102, -4.703651428222656, -4.557943344116211, -4.412235260009766, -4.2665276527404785, -4.120819568634033, -3.975111484527588, -3.8294034004211426, -3.6836953163146973, -3.537987470626831, -3.3922793865203857, -3.2465715408325195, -3.100863456726074, -2.955155372619629, -2.8094475269317627, -2.6637394428253174, -2.518031597137451, -2.372323513031006, -2.2266154289245605, -2.0809075832366943, -1.935199499130249, -1.7894915342330933, -1.6437835693359375, -1.4980754852294922, -1.3523675203323364, -1.2066595554351807, -1.060951590538025, -0.9152435660362244, -0.7695355415344238, -0.6238275766372681, -0.4781196117401123, -0.33241158723831177, -0.18670356273651123, -0.04099559783935547, 0.10471239686012268, 0.25042039155960083, 0.396128386259079, 0.5418363809585571, 0.6875443458557129, 0.8332523703575134, 0.978960394859314, 1.1246683597564697]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 13.0, 14.0, 11.0, 17.0, 20.0, 27.0, 24.0, 32.0, 25.0, 51.0, 39.0, 39.0, 45.0, 61.0, 56.0, 64.0, 68.0, 68.0, 44.0, 52.0, 36.0, 40.0, 43.0, 28.0, 15.0, 20.0, 17.0, 10.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0532615184783936, -1.0233211517333984, -0.9933809041976929, -0.9634405374526978, -0.9335002303123474, -0.9035599231719971, -0.873619556427002, -0.8436792492866516, -0.8137389421463013, -0.7837986350059509, -0.7538583278656006, -0.7239179611206055, -0.6939776539802551, -0.6640373468399048, -0.6340969800949097, -0.6041566729545593, -0.574216365814209, -0.5442760586738586, -0.5143357515335083, -0.4843953847885132, -0.45445507764816284, -0.4245147705078125, -0.39457443356513977, -0.36463409662246704, -0.3346937894821167, -0.30475348234176636, -0.27481314539909363, -0.2448728233575821, -0.21493250131607056, -0.18499217927455902, -0.15505185723304749, -0.12511153519153595, -0.09517121315002441, -0.06523089110851288, -0.03529056906700134, -0.005350247025489807, 0.02459007501602173, 0.054530397057533264, 0.0844707190990448, 0.11441104114055634, 0.14435136318206787, 0.1742916852235794, 0.20423200726509094, 0.23417232930660248, 0.264112651348114, 0.29405295848846436, 0.3239932954311371, 0.3539336323738098, 0.38387393951416016, 0.4138142466545105, 0.4437545835971832, 0.47369492053985596, 0.5036352276802063, 0.5335755348205566, 0.5635159015655518, 0.5934562087059021, 0.6233965158462524, 0.6533368229866028, 0.6832771301269531, 0.7132174968719482, 0.7431578040122986, 0.7730981111526489, 0.803038477897644, 0.8329787850379944, 0.8629190921783447]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 6.0, 16.0, 6.0, 15.0, 36.0, 54.0, 113.0, 181.0, 418.0, 936.0, 3151.0, 20553.0, 3764105.0, 387663.0, 12908.0, 2506.0, 865.0, 369.0, 143.0, 90.0, 45.0, 27.0, 18.0, 13.0, 10.0, 8.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.599090576171875, -0.57904052734375, -0.558990478515625, -0.5389404296875, -0.518890380859375, -0.49884033203125, -0.478790283203125, -0.458740234375, -0.438690185546875, -0.41864013671875, -0.398590087890625, -0.3785400390625, -0.358489990234375, -0.33843994140625, -0.318389892578125, -0.29833984375, -0.278289794921875, -0.25823974609375, -0.238189697265625, -0.2181396484375, -0.198089599609375, -0.17803955078125, -0.157989501953125, -0.137939453125, -0.117889404296875, -0.09783935546875, -0.077789306640625, -0.0577392578125, -0.037689208984375, -0.01763916015625, 0.002410888671875, 0.0224609375, 0.042510986328125, 0.06256103515625, 0.082611083984375, 0.1026611328125, 0.122711181640625, 0.14276123046875, 0.162811279296875, 0.182861328125, 0.202911376953125, 0.22296142578125, 0.243011474609375, 0.2630615234375, 0.283111572265625, 0.30316162109375, 0.323211669921875, 0.34326171875, 0.363311767578125, 0.38336181640625, 0.403411865234375, 0.4234619140625, 0.443511962890625, 0.46356201171875, 0.483612060546875, 0.503662109375, 0.523712158203125, 0.54376220703125, 0.563812255859375, 0.5838623046875, 0.603912353515625, 0.62396240234375, 0.644012451171875, 0.6640625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 6.0, 4.0, 6.0, 10.0, 19.0, 29.0, 54.0, 63.0, 94.0, 93.0, 108.0, 136.0, 102.0, 71.0, 50.0, 38.0, 35.0, 13.0, 11.0, 11.0, 7.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.037872314453125, -0.03679084777832031, -0.035709381103515625, -0.03462791442871094, -0.03354644775390625, -0.03246498107910156, -0.031383514404296875, -0.030302047729492188, -0.0292205810546875, -0.028139114379882812, -0.027057647705078125, -0.025976181030273438, -0.02489471435546875, -0.023813247680664062, -0.022731781005859375, -0.021650314331054688, -0.02056884765625, -0.019487380981445312, -0.018405914306640625, -0.017324447631835938, -0.01624298095703125, -0.015161514282226562, -0.014080047607421875, -0.012998580932617188, -0.0119171142578125, -0.010835647583007812, -0.009754180908203125, -0.008672714233398438, -0.00759124755859375, -0.0065097808837890625, -0.005428314208984375, -0.0043468475341796875, -0.003265380859375, -0.0021839141845703125, -0.001102447509765625, -2.09808349609375e-05, 0.00106048583984375, 0.0021419525146484375, 0.003223419189453125, 0.0043048858642578125, 0.0053863525390625, 0.0064678192138671875, 0.007549285888671875, 0.008630752563476562, 0.00971221923828125, 0.010793685913085938, 0.011875152587890625, 0.012956619262695312, 0.0140380859375, 0.015119552612304688, 0.016201019287109375, 0.017282485961914062, 0.01836395263671875, 0.019445419311523438, 0.020526885986328125, 0.021608352661132812, 0.0226898193359375, 0.023771286010742188, 0.024852752685546875, 0.025934219360351562, 0.02701568603515625, 0.028097152709960938, 0.029178619384765625, 0.030260086059570312, 0.031341552734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 14.0, 22.0, 25.0, 27.0, 54.0, 80.0, 130.0, 205.0, 393.0, 755.0, 1607.0, 3707.0, 10875.0, 39205.0, 240530.0, 3372493.0, 443820.0, 57885.0, 14063.0, 4634.0, 1856.0, 862.0, 424.0, 222.0, 132.0, 83.0, 49.0, 38.0, 16.0, 17.0, 4.0, 11.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2379150390625, -0.2306232452392578, -0.22333145141601562, -0.21603965759277344, -0.20874786376953125, -0.20145606994628906, -0.19416427612304688, -0.1868724822998047, -0.1795806884765625, -0.1722888946533203, -0.16499710083007812, -0.15770530700683594, -0.15041351318359375, -0.14312171936035156, -0.13582992553710938, -0.1285381317138672, -0.121246337890625, -0.11395454406738281, -0.10666275024414062, -0.09937095642089844, -0.09207916259765625, -0.08478736877441406, -0.07749557495117188, -0.07020378112792969, -0.0629119873046875, -0.05562019348144531, -0.048328399658203125, -0.04103660583496094, -0.03374481201171875, -0.026453018188476562, -0.019161224365234375, -0.011869430541992188, -0.00457763671875, 0.0027141571044921875, 0.010005950927734375, 0.017297744750976562, 0.02458953857421875, 0.03188133239746094, 0.039173126220703125, 0.04646492004394531, 0.0537567138671875, 0.06104850769042969, 0.06834030151367188, 0.07563209533691406, 0.08292388916015625, 0.09021568298339844, 0.09750747680664062, 0.10479927062988281, 0.112091064453125, 0.11938285827636719, 0.12667465209960938, 0.13396644592285156, 0.14125823974609375, 0.14855003356933594, 0.15584182739257812, 0.1631336212158203, 0.1704254150390625, 0.1777172088623047, 0.18500900268554688, 0.19230079650878906, 0.19959259033203125, 0.20688438415527344, 0.21417617797851562, 0.2214679718017578, 0.228759765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 16.0, 23.0, 20.0, 38.0, 39.0, 56.0, 95.0, 148.0, 241.0, 446.0, 1410.0, 668.0, 284.0, 170.0, 109.0, 79.0, 59.0, 30.0, 27.0, 16.0, 19.0, 9.0, 4.0, 9.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046295166015625, -0.04488182067871094, -0.043468475341796875, -0.04205513000488281, -0.04064178466796875, -0.03922843933105469, -0.037815093994140625, -0.03640174865722656, -0.0349884033203125, -0.03357505798339844, -0.032161712646484375, -0.030748367309570312, -0.02933502197265625, -0.027921676635742188, -0.026508331298828125, -0.025094985961914062, -0.023681640625, -0.022268295288085938, -0.020854949951171875, -0.019441604614257812, -0.01802825927734375, -0.016614913940429688, -0.015201568603515625, -0.013788223266601562, -0.0123748779296875, -0.010961532592773438, -0.009548187255859375, -0.008134841918945312, -0.00672149658203125, -0.0053081512451171875, -0.003894805908203125, -0.0024814605712890625, -0.001068115234375, 0.0003452301025390625, 0.001758575439453125, 0.0031719207763671875, 0.00458526611328125, 0.0059986114501953125, 0.007411956787109375, 0.008825302124023438, 0.0102386474609375, 0.011651992797851562, 0.013065338134765625, 0.014478683471679688, 0.01589202880859375, 0.017305374145507812, 0.018718719482421875, 0.020132064819335938, 0.02154541015625, 0.022958755493164062, 0.024372100830078125, 0.025785446166992188, 0.02719879150390625, 0.028612136840820312, 0.030025482177734375, 0.03143882751464844, 0.0328521728515625, 0.03426551818847656, 0.035678863525390625, 0.03709220886230469, 0.03850555419921875, 0.03991889953613281, 0.041332244873046875, 0.04274559020996094, 0.044158935546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 30.0, 129.0, 364.0, 360.0, 97.0, 22.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22499901056289673, -0.19673500955104828, -0.16847100853919983, -0.14020700752735138, -0.11194300651550293, -0.08367900550365448, -0.05541500449180603, -0.02715100347995758, 0.0011129975318908691, 0.02937699854373932, 0.05764099955558777, 0.08590500056743622, 0.11416900157928467, 0.14243300259113312, 0.17069700360298157, 0.19896100461483002, 0.22722500562667847, 0.2554889917373657, 0.28375300765037537, 0.312017023563385, 0.34028100967407227, 0.3685449957847595, 0.39680901169776917, 0.4250730276107788, 0.45333701372146606, 0.4816009998321533, 0.5098650455474854, 0.5381290316581726, 0.5663930177688599, 0.5946570038795471, 0.6229209899902344, 0.6511850357055664, 0.6794490814208984, 0.7077130675315857, 0.735977053642273, 0.764241099357605, 0.7925050854682922, 0.8207690715789795, 0.8490331172943115, 0.8772971034049988, 0.905561089515686, 0.9338250756263733, 0.9620890617370605, 0.9903531074523926, 1.0186171531677246, 1.046881079673767, 1.0751451253890991, 1.1034090518951416, 1.1316730976104736, 1.1599371433258057, 1.1882010698318481, 1.2164651155471802, 1.2447290420532227, 1.2729930877685547, 1.3012571334838867, 1.3295210599899292, 1.3577851057052612, 1.3860491514205933, 1.4143130779266357, 1.4425771236419678, 1.4708411693572998, 1.4991050958633423, 1.5273691415786743, 1.5556330680847168, 1.5838971138000488]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 8.0, 5.0, 3.0, 11.0, 8.0, 12.0, 11.0, 13.0, 18.0, 24.0, 22.0, 31.0, 27.0, 29.0, 22.0, 27.0, 20.0, 37.0, 41.0, 37.0, 44.0, 37.0, 37.0, 46.0, 38.0, 28.0, 27.0, 39.0, 37.0, 35.0, 35.0, 20.0, 29.0, 14.0, 20.0, 7.0, 16.0, 11.0, 13.0, 9.0, 8.0, 10.0, 3.0, 8.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0], "bins": [-0.15151524543762207, -0.14729519188404083, -0.1430751383304596, -0.13885506987571716, -0.13463501632213593, -0.1304149627685547, -0.12619490921497345, -0.12197485566139221, -0.11775479465723038, -0.11353474110364914, -0.1093146800994873, -0.10509462654590607, -0.10087457299232483, -0.096654511988163, -0.09243445843458176, -0.08821439743041992, -0.08399434387683868, -0.07977429032325745, -0.07555422931909561, -0.07133417576551437, -0.06711411476135254, -0.0628940612077713, -0.058674007654190063, -0.05445395037531853, -0.05023389309644699, -0.046013835817575455, -0.04179377853870392, -0.03757372498512268, -0.033353667706251144, -0.029133610427379608, -0.02491355501115322, -0.020693499594926834, -0.016473442316055298, -0.012253385968506336, -0.008033329620957375, -0.003813273273408413, 0.0004067830741405487, 0.004626840353012085, 0.008846895769238472, 0.013066951185464859, 0.017287008464336395, 0.02150706574320793, 0.02572712115943432, 0.029947176575660706, 0.03416723385453224, 0.03838729113340378, 0.042607344686985016, 0.04682740196585655, 0.05104745924472809, 0.055267516523599625, 0.05948757380247116, 0.0637076273560524, 0.06792768836021423, 0.07214774191379547, 0.07636779546737671, 0.08058784902095795, 0.08480791002511978, 0.08902796357870102, 0.09324802458286285, 0.09746807813644409, 0.10168813169002533, 0.10590819269418716, 0.1101282462477684, 0.11434830725193024, 0.11856836080551147]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 7.0, 11.0, 16.0, 31.0, 36.0, 57.0, 91.0, 130.0, 218.0, 367.0, 554.0, 879.0, 1590.0, 3077.0, 6710.0, 17541.0, 57486.0, 226031.0, 486401.0, 175280.0, 45331.0, 14361.0, 5961.0, 2745.0, 1397.0, 859.0, 502.0, 266.0, 206.0, 137.0, 85.0, 45.0, 44.0, 27.0, 19.0, 10.0, 9.0, 10.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.185302734375, -0.17975616455078125, -0.1742095947265625, -0.16866302490234375, -0.163116455078125, -0.15756988525390625, -0.1520233154296875, -0.14647674560546875, -0.14093017578125, -0.13538360595703125, -0.1298370361328125, -0.12429046630859375, -0.118743896484375, -0.11319732666015625, -0.1076507568359375, -0.10210418701171875, -0.0965576171875, -0.09101104736328125, -0.0854644775390625, -0.07991790771484375, -0.074371337890625, -0.06882476806640625, -0.0632781982421875, -0.05773162841796875, -0.05218505859375, -0.04663848876953125, -0.0410919189453125, -0.03554534912109375, -0.029998779296875, -0.02445220947265625, -0.0189056396484375, -0.01335906982421875, -0.0078125, -0.00226593017578125, 0.0032806396484375, 0.00882720947265625, 0.014373779296875, 0.01992034912109375, 0.0254669189453125, 0.03101348876953125, 0.03656005859375, 0.04210662841796875, 0.0476531982421875, 0.05319976806640625, 0.058746337890625, 0.06429290771484375, 0.0698394775390625, 0.07538604736328125, 0.0809326171875, 0.08647918701171875, 0.0920257568359375, 0.09757232666015625, 0.103118896484375, 0.10866546630859375, 0.1142120361328125, 0.11975860595703125, 0.12530517578125, 0.13085174560546875, 0.1363983154296875, 0.14194488525390625, 0.147491455078125, 0.15303802490234375, 0.1585845947265625, 0.16413116455078125, 0.169677734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 22.0, 28.0, 37.0, 62.0, 70.0, 77.0, 110.0, 125.0, 106.0, 86.0, 73.0, 61.0, 30.0, 24.0, 12.0, 12.0, 8.0, 10.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.037628173828125, -0.03650665283203125, -0.0353851318359375, -0.03426361083984375, -0.03314208984375, -0.03202056884765625, -0.0308990478515625, -0.02977752685546875, -0.028656005859375, -0.02753448486328125, -0.0264129638671875, -0.02529144287109375, -0.024169921875, -0.02304840087890625, -0.0219268798828125, -0.02080535888671875, -0.019683837890625, -0.01856231689453125, -0.0174407958984375, -0.01631927490234375, -0.01519775390625, -0.01407623291015625, -0.0129547119140625, -0.01183319091796875, -0.010711669921875, -0.00959014892578125, -0.0084686279296875, -0.00734710693359375, -0.0062255859375, -0.00510406494140625, -0.0039825439453125, -0.00286102294921875, -0.001739501953125, -0.00061798095703125, 0.0005035400390625, 0.00162506103515625, 0.00274658203125, 0.00386810302734375, 0.0049896240234375, 0.00611114501953125, 0.007232666015625, 0.00835418701171875, 0.0094757080078125, 0.01059722900390625, 0.01171875, 0.01284027099609375, 0.0139617919921875, 0.01508331298828125, 0.016204833984375, 0.01732635498046875, 0.0184478759765625, 0.01956939697265625, 0.02069091796875, 0.02181243896484375, 0.0229339599609375, 0.02405548095703125, 0.025177001953125, 0.02629852294921875, 0.0274200439453125, 0.02854156494140625, 0.0296630859375, 0.03078460693359375, 0.0319061279296875, 0.03302764892578125, 0.034149169921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 9.0, 13.0, 16.0, 18.0, 26.0, 34.0, 44.0, 51.0, 98.0, 107.0, 175.0, 284.0, 446.0, 746.0, 1282.0, 2934.0, 9996.0, 47997.0, 246228.0, 540906.0, 155586.0, 29620.0, 6634.0, 2348.0, 1126.0, 585.0, 397.0, 276.0, 158.0, 101.0, 82.0, 58.0, 40.0, 35.0, 22.0, 22.0, 14.0, 11.0, 6.0, 3.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2142333984375, -0.20740127563476562, -0.20056915283203125, -0.19373703002929688, -0.1869049072265625, -0.18007278442382812, -0.17324066162109375, -0.16640853881835938, -0.159576416015625, -0.15274429321289062, -0.14591217041015625, -0.13908004760742188, -0.1322479248046875, -0.12541580200195312, -0.11858367919921875, -0.11175155639648438, -0.10491943359375, -0.09808731079101562, -0.09125518798828125, -0.08442306518554688, -0.0775909423828125, -0.07075881958007812, -0.06392669677734375, -0.057094573974609375, -0.050262451171875, -0.043430328369140625, -0.03659820556640625, -0.029766082763671875, -0.0229339599609375, -0.016101837158203125, -0.00926971435546875, -0.002437591552734375, 0.00439453125, 0.011226654052734375, 0.01805877685546875, 0.024890899658203125, 0.0317230224609375, 0.038555145263671875, 0.04538726806640625, 0.052219390869140625, 0.059051513671875, 0.06588363647460938, 0.07271575927734375, 0.07954788208007812, 0.0863800048828125, 0.09321212768554688, 0.10004425048828125, 0.10687637329101562, 0.11370849609375, 0.12054061889648438, 0.12737274169921875, 0.13420486450195312, 0.1410369873046875, 0.14786911010742188, 0.15470123291015625, 0.16153335571289062, 0.168365478515625, 0.17519760131835938, 0.18202972412109375, 0.18886184692382812, 0.1956939697265625, 0.20252609252929688, 0.20935821533203125, 0.21619033813476562, 0.2230224609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 6.0, 8.0, 3.0, 12.0, 10.0, 7.0, 22.0, 17.0, 16.0, 22.0, 25.0, 16.0, 29.0, 33.0, 31.0, 35.0, 32.0, 42.0, 38.0, 29.0, 39.0, 44.0, 37.0, 30.0, 43.0, 35.0, 42.0, 30.0, 30.0, 27.0, 20.0, 26.0, 23.0, 16.0, 21.0, 15.0, 8.0, 9.0, 16.0, 9.0, 6.0, 12.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.10137939453125, -0.09840583801269531, -0.09543228149414062, -0.09245872497558594, -0.08948516845703125, -0.08651161193847656, -0.08353805541992188, -0.08056449890136719, -0.0775909423828125, -0.07461738586425781, -0.07164382934570312, -0.06867027282714844, -0.06569671630859375, -0.06272315979003906, -0.059749603271484375, -0.05677604675292969, -0.053802490234375, -0.05082893371582031, -0.047855377197265625, -0.04488182067871094, -0.04190826416015625, -0.03893470764160156, -0.035961151123046875, -0.03298759460449219, -0.0300140380859375, -0.027040481567382812, -0.024066925048828125, -0.021093368530273438, -0.01811981201171875, -0.015146255493164062, -0.012172698974609375, -0.009199142456054688, -0.0062255859375, -0.0032520294189453125, -0.000278472900390625, 0.0026950836181640625, 0.00566864013671875, 0.008642196655273438, 0.011615753173828125, 0.014589309692382812, 0.0175628662109375, 0.020536422729492188, 0.023509979248046875, 0.026483535766601562, 0.02945709228515625, 0.03243064880371094, 0.035404205322265625, 0.03837776184082031, 0.041351318359375, 0.04432487487792969, 0.047298431396484375, 0.05027198791503906, 0.05324554443359375, 0.05621910095214844, 0.059192657470703125, 0.06216621398925781, 0.0651397705078125, 0.06811332702636719, 0.07108688354492188, 0.07406044006347656, 0.07703399658203125, 0.08000755310058594, 0.08298110961914062, 0.08595466613769531, 0.08892822265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 7.0, 3.0, 7.0, 13.0, 10.0, 12.0, 14.0, 37.0, 39.0, 69.0, 78.0, 115.0, 222.0, 338.0, 549.0, 1020.0, 1670.0, 2970.0, 5656.0, 11077.0, 22892.0, 52021.0, 125354.0, 305151.0, 298688.0, 123479.0, 51271.0, 22500.0, 10630.0, 5501.0, 2953.0, 1663.0, 977.0, 591.0, 360.0, 220.0, 128.0, 92.0, 51.0, 37.0, 23.0, 28.0, 16.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0733642578125, -0.07114028930664062, -0.06891632080078125, -0.06669235229492188, -0.0644683837890625, -0.062244415283203125, -0.06002044677734375, -0.057796478271484375, -0.055572509765625, -0.053348541259765625, -0.05112457275390625, -0.048900604248046875, -0.0466766357421875, -0.044452667236328125, -0.04222869873046875, -0.040004730224609375, -0.03778076171875, -0.035556793212890625, -0.03333282470703125, -0.031108856201171875, -0.0288848876953125, -0.026660919189453125, -0.02443695068359375, -0.022212982177734375, -0.019989013671875, -0.017765045166015625, -0.01554107666015625, -0.013317108154296875, -0.0110931396484375, -0.008869171142578125, -0.00664520263671875, -0.004421234130859375, -0.002197265625, 2.6702880859375e-05, 0.00225067138671875, 0.004474639892578125, 0.0066986083984375, 0.008922576904296875, 0.01114654541015625, 0.013370513916015625, 0.015594482421875, 0.017818450927734375, 0.02004241943359375, 0.022266387939453125, 0.0244903564453125, 0.026714324951171875, 0.02893829345703125, 0.031162261962890625, 0.03338623046875, 0.035610198974609375, 0.03783416748046875, 0.040058135986328125, 0.0422821044921875, 0.044506072998046875, 0.04673004150390625, 0.048954010009765625, 0.051177978515625, 0.053401947021484375, 0.05562591552734375, 0.057849884033203125, 0.0600738525390625, 0.062297821044921875, 0.06452178955078125, 0.06674575805664062, 0.0689697265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 16.0, 25.0, 39.0, 40.0, 75.0, 93.0, 142.0, 121.0, 122.0, 86.0, 72.0, 39.0, 33.0, 20.0, 15.0, 9.0, 9.0, 10.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001405477523803711, -0.00013645924627780914, -0.0001323707401752472, -0.00012828223407268524, -0.0001241937279701233, -0.00012010522186756134, -0.00011601671576499939, -0.00011192820966243744, -0.00010783970355987549, -0.00010375119745731354, -9.966269135475159e-05, -9.557418525218964e-05, -9.148567914962769e-05, -8.739717304706573e-05, -8.330866694450378e-05, -7.922016084194183e-05, -7.513165473937988e-05, -7.104314863681793e-05, -6.695464253425598e-05, -6.286613643169403e-05, -5.877763032913208e-05, -5.468912422657013e-05, -5.060061812400818e-05, -4.651211202144623e-05, -4.242360591888428e-05, -3.833509981632233e-05, -3.4246593713760376e-05, -3.0158087611198425e-05, -2.6069581508636475e-05, -2.1981075406074524e-05, -1.7892569303512573e-05, -1.3804063200950623e-05, -9.715557098388672e-06, -5.627050995826721e-06, -1.5385448932647705e-06, 2.54996120929718e-06, 6.638467311859131e-06, 1.0726973414421082e-05, 1.4815479516983032e-05, 1.8903985619544983e-05, 2.2992491722106934e-05, 2.7080997824668884e-05, 3.1169503927230835e-05, 3.5258010029792786e-05, 3.9346516132354736e-05, 4.343502223491669e-05, 4.752352833747864e-05, 5.161203444004059e-05, 5.570054054260254e-05, 5.978904664516449e-05, 6.387755274772644e-05, 6.796605885028839e-05, 7.205456495285034e-05, 7.614307105541229e-05, 8.023157715797424e-05, 8.43200832605362e-05, 8.840858936309814e-05, 9.24970954656601e-05, 9.658560156822205e-05, 0.000100674107670784, 0.00010476261377334595, 0.0001088511198759079, 0.00011293962597846985, 0.0001170281320810318, 0.00012111663818359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 9.0, 6.0, 11.0, 14.0, 14.0, 27.0, 27.0, 52.0, 64.0, 90.0, 131.0, 210.0, 409.0, 756.0, 1747.0, 5332.0, 24662.0, 161029.0, 666289.0, 155394.0, 23429.0, 5418.0, 1704.0, 720.0, 373.0, 203.0, 144.0, 80.0, 66.0, 39.0, 27.0, 21.0, 15.0, 12.0, 11.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.16552734375, -0.16072845458984375, -0.1559295654296875, -0.15113067626953125, -0.146331787109375, -0.14153289794921875, -0.1367340087890625, -0.13193511962890625, -0.12713623046875, -0.12233734130859375, -0.1175384521484375, -0.11273956298828125, -0.107940673828125, -0.10314178466796875, -0.0983428955078125, -0.09354400634765625, -0.0887451171875, -0.08394622802734375, -0.0791473388671875, -0.07434844970703125, -0.069549560546875, -0.06475067138671875, -0.0599517822265625, -0.05515289306640625, -0.05035400390625, -0.04555511474609375, -0.0407562255859375, -0.03595733642578125, -0.031158447265625, -0.02635955810546875, -0.0215606689453125, -0.01676177978515625, -0.011962890625, -0.00716400146484375, -0.0023651123046875, 0.00243377685546875, 0.007232666015625, 0.01203155517578125, 0.0168304443359375, 0.02162933349609375, 0.02642822265625, 0.03122711181640625, 0.0360260009765625, 0.04082489013671875, 0.045623779296875, 0.05042266845703125, 0.0552215576171875, 0.06002044677734375, 0.0648193359375, 0.06961822509765625, 0.0744171142578125, 0.07921600341796875, 0.084014892578125, 0.08881378173828125, 0.0936126708984375, 0.09841156005859375, 0.10321044921875, 0.10800933837890625, 0.1128082275390625, 0.11760711669921875, 0.122406005859375, 0.12720489501953125, 0.1320037841796875, 0.13680267333984375, 0.1416015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 10.0, 11.0, 11.0, 8.0, 17.0, 13.0, 28.0, 26.0, 27.0, 28.0, 36.0, 53.0, 52.0, 51.0, 54.0, 60.0, 60.0, 57.0, 48.0, 53.0, 38.0, 42.0, 46.0, 20.0, 25.0, 18.0, 17.0, 11.0, 13.0, 4.0, 6.0, 8.0, 3.0, 7.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.056032657623291016, -0.05432605743408203, -0.05261945724487305, -0.05091285705566406, -0.04920625686645508, -0.047499656677246094, -0.04579305648803711, -0.044086456298828125, -0.04237985610961914, -0.040673255920410156, -0.03896665573120117, -0.03726005554199219, -0.0355534553527832, -0.03384685516357422, -0.032140254974365234, -0.03043365478515625, -0.028727054595947266, -0.02702045440673828, -0.025313854217529297, -0.023607254028320312, -0.021900653839111328, -0.020194053649902344, -0.01848745346069336, -0.016780853271484375, -0.01507425308227539, -0.013367652893066406, -0.011661052703857422, -0.009954452514648438, -0.008247852325439453, -0.006541252136230469, -0.004834651947021484, -0.0031280517578125, -0.0014214515686035156, 0.00028514862060546875, 0.001991748809814453, 0.0036983489990234375, 0.005404949188232422, 0.007111549377441406, 0.00881814956665039, 0.010524749755859375, 0.01223134994506836, 0.013937950134277344, 0.015644550323486328, 0.017351150512695312, 0.019057750701904297, 0.02076435089111328, 0.022470951080322266, 0.02417755126953125, 0.025884151458740234, 0.02759075164794922, 0.029297351837158203, 0.031003952026367188, 0.03271055221557617, 0.034417152404785156, 0.03612375259399414, 0.037830352783203125, 0.03953695297241211, 0.041243553161621094, 0.04295015335083008, 0.04465675354003906, 0.04636335372924805, 0.04806995391845703, 0.049776554107666016, 0.051483154296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 11.0, 4.0, 22.0, 29.0, 45.0, 67.0, 94.0, 114.0, 113.0, 124.0, 110.0, 85.0, 73.0, 45.0, 33.0, 10.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8793714642524719, -0.8468703627586365, -0.814369261264801, -0.7818682193756104, -0.7493671178817749, -0.7168660163879395, -0.684364914894104, -0.6518638134002686, -0.6193627119064331, -0.5868616104125977, -0.5543605089187622, -0.5218594074249268, -0.4893583655357361, -0.45685726404190063, -0.4243561625480652, -0.39185506105422974, -0.35935401916503906, -0.3268529176712036, -0.29435184597969055, -0.2618507444858551, -0.22934965789318085, -0.1968485713005066, -0.16434746980667114, -0.1318463832139969, -0.09934529662132263, -0.06684421002864838, -0.034343115985393524, -0.0018420219421386719, 0.030659064650535583, 0.06316015124320984, 0.09566125273704529, 0.12816233932971954, 0.16066348552703857, 0.19316457211971283, 0.22566565871238708, 0.25816676020622253, 0.2906678318977356, 0.32316893339157104, 0.3556700348854065, 0.38817113637924194, 0.420672208070755, 0.45317330956459045, 0.4856743812561035, 0.518175482749939, 0.5506765842437744, 0.5831776857376099, 0.6156787872314453, 0.648179829120636, 0.6806809306144714, 0.7131820321083069, 0.7456831336021423, 0.778184175491333, 0.8106852769851685, 0.8431863784790039, 0.8756874799728394, 0.9081885814666748, 0.9406896829605103, 0.9731907844543457, 1.0056918859481812, 1.0381929874420166, 1.070694088935852, 1.1031951904296875, 1.1356961727142334, 1.1681972742080688, 1.2006983757019043]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 10.0, 6.0, 7.0, 11.0, 10.0, 11.0, 12.0, 18.0, 27.0, 21.0, 35.0, 32.0, 38.0, 40.0, 30.0, 37.0, 45.0, 47.0, 32.0, 38.0, 39.0, 43.0, 37.0, 43.0, 42.0, 35.0, 29.0, 30.0, 34.0, 19.0, 20.0, 18.0, 24.0, 14.0, 10.0, 9.0, 8.0, 8.0, 10.0, 7.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.718808114528656, -0.6959636807441711, -0.6731192469596863, -0.6502747535705566, -0.6274303197860718, -0.6045858860015869, -0.581741452217102, -0.5588970184326172, -0.5360525846481323, -0.5132081508636475, -0.4903636872768402, -0.46751925349235535, -0.4446747899055481, -0.42183035612106323, -0.39898592233657837, -0.3761414885520935, -0.35329699516296387, -0.330452561378479, -0.30760809779167175, -0.2847636640071869, -0.26191920042037964, -0.23907476663589478, -0.2162303328514099, -0.19338588416576385, -0.1705414354801178, -0.14769698679447174, -0.12485254555940628, -0.10200810432434082, -0.07916365563869476, -0.056319206953048706, -0.03347477316856384, -0.010630324482917786, 0.012214183807373047, 0.035058628767728806, 0.057903073728084564, 0.08074751496315002, 0.10359196364879608, 0.12643641233444214, 0.149280846118927, 0.17212529480457306, 0.19496974349021912, 0.21781419217586517, 0.24065864086151123, 0.2635030746459961, 0.28634750843048096, 0.3091919720172882, 0.33203640580177307, 0.3548808693885803, 0.3777253031730652, 0.40056973695755005, 0.4234142005443573, 0.44625863432884216, 0.4691030979156494, 0.4919475317001343, 0.5147919654846191, 0.537636399269104, 0.5604808330535889, 0.5833252668380737, 0.6061697006225586, 0.6290141344070435, 0.6518586277961731, 0.674703061580658, 0.6975474953651428, 0.7203919291496277, 0.7432364225387573]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 9.0, 10.0, 14.0, 17.0, 20.0, 38.0, 52.0, 74.0, 122.0, 217.0, 378.0, 802.0, 1699.0, 4520.0, 15582.0, 93727.0, 3703711.0, 327284.0, 32702.0, 8066.0, 2792.0, 1147.0, 507.0, 273.0, 192.0, 102.0, 61.0, 49.0, 28.0, 23.0, 13.0, 14.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.296142578125, -0.28807830810546875, -0.2800140380859375, -0.27194976806640625, -0.263885498046875, -0.25582122802734375, -0.2477569580078125, -0.23969268798828125, -0.23162841796875, -0.22356414794921875, -0.2154998779296875, -0.20743560791015625, -0.199371337890625, -0.19130706787109375, -0.1832427978515625, -0.17517852783203125, -0.1671142578125, -0.15904998779296875, -0.1509857177734375, -0.14292144775390625, -0.134857177734375, -0.12679290771484375, -0.1187286376953125, -0.11066436767578125, -0.10260009765625, -0.09453582763671875, -0.0864715576171875, -0.07840728759765625, -0.070343017578125, -0.06227874755859375, -0.0542144775390625, -0.04615020751953125, -0.0380859375, -0.03002166748046875, -0.0219573974609375, -0.01389312744140625, -0.005828857421875, 0.00223541259765625, 0.0102996826171875, 0.01836395263671875, 0.02642822265625, 0.03449249267578125, 0.0425567626953125, 0.05062103271484375, 0.058685302734375, 0.06674957275390625, 0.0748138427734375, 0.08287811279296875, 0.0909423828125, 0.09900665283203125, 0.1070709228515625, 0.11513519287109375, 0.123199462890625, 0.13126373291015625, 0.1393280029296875, 0.14739227294921875, 0.15545654296875, 0.16352081298828125, 0.1715850830078125, 0.17964935302734375, 0.187713623046875, 0.19577789306640625, 0.2038421630859375, 0.21190643310546875, 0.219970703125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 18.0, 15.0, 25.0, 28.0, 40.0, 68.0, 77.0, 93.0, 104.0, 109.0, 84.0, 82.0, 69.0, 54.0, 32.0, 30.0, 14.0, 16.0, 9.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0457763671875, -0.04447507858276367, -0.043173789978027344, -0.041872501373291016, -0.04057121276855469, -0.03926992416381836, -0.03796863555908203, -0.0366673469543457, -0.035366058349609375, -0.03406476974487305, -0.03276348114013672, -0.03146219253540039, -0.030160903930664062, -0.028859615325927734, -0.027558326721191406, -0.026257038116455078, -0.02495574951171875, -0.023654460906982422, -0.022353172302246094, -0.021051883697509766, -0.019750595092773438, -0.01844930648803711, -0.01714801788330078, -0.015846729278564453, -0.014545440673828125, -0.013244152069091797, -0.011942863464355469, -0.01064157485961914, -0.009340286254882812, -0.008038997650146484, -0.006737709045410156, -0.005436420440673828, -0.0041351318359375, -0.002833843231201172, -0.0015325546264648438, -0.00023126602172851562, 0.0010700225830078125, 0.0023713111877441406, 0.0036725997924804688, 0.004973888397216797, 0.006275177001953125, 0.007576465606689453, 0.008877754211425781, 0.01017904281616211, 0.011480331420898438, 0.012781620025634766, 0.014082908630371094, 0.015384197235107422, 0.01668548583984375, 0.017986774444580078, 0.019288063049316406, 0.020589351654052734, 0.021890640258789062, 0.02319192886352539, 0.02449321746826172, 0.025794506072998047, 0.027095794677734375, 0.028397083282470703, 0.02969837188720703, 0.03099966049194336, 0.03230094909667969, 0.033602237701416016, 0.034903526306152344, 0.03620481491088867, 0.037506103515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 16.0, 9.0, 26.0, 44.0, 76.0, 155.0, 217.0, 425.0, 930.0, 2924.0, 15152.0, 263752.0, 3827282.0, 71845.0, 7895.0, 2003.0, 759.0, 356.0, 158.0, 110.0, 52.0, 36.0, 15.0, 10.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.431884765625, -0.41965484619140625, -0.4074249267578125, -0.39519500732421875, -0.382965087890625, -0.37073516845703125, -0.3585052490234375, -0.34627532958984375, -0.33404541015625, -0.32181549072265625, -0.3095855712890625, -0.29735565185546875, -0.285125732421875, -0.27289581298828125, -0.2606658935546875, -0.24843597412109375, -0.2362060546875, -0.22397613525390625, -0.2117462158203125, -0.19951629638671875, -0.187286376953125, -0.17505645751953125, -0.1628265380859375, -0.15059661865234375, -0.13836669921875, -0.12613677978515625, -0.1139068603515625, -0.10167694091796875, -0.089447021484375, -0.07721710205078125, -0.0649871826171875, -0.05275726318359375, -0.04052734375, -0.02829742431640625, -0.0160675048828125, -0.00383758544921875, 0.008392333984375, 0.02062225341796875, 0.0328521728515625, 0.04508209228515625, 0.05731201171875, 0.06954193115234375, 0.0817718505859375, 0.09400177001953125, 0.106231689453125, 0.11846160888671875, 0.1306915283203125, 0.14292144775390625, 0.1551513671875, 0.16738128662109375, 0.1796112060546875, 0.19184112548828125, 0.204071044921875, 0.21630096435546875, 0.2285308837890625, 0.24076080322265625, 0.25299072265625, 0.26522064208984375, 0.2774505615234375, 0.28968048095703125, 0.301910400390625, 0.31414031982421875, 0.3263702392578125, 0.33860015869140625, 0.350830078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 20.0, 23.0, 39.0, 63.0, 161.0, 395.0, 2133.0, 763.0, 243.0, 92.0, 48.0, 32.0, 13.0, 12.0, 10.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10516357421875, -0.10230064392089844, -0.09943771362304688, -0.09657478332519531, -0.09371185302734375, -0.09084892272949219, -0.08798599243164062, -0.08512306213378906, -0.0822601318359375, -0.07939720153808594, -0.07653427124023438, -0.07367134094238281, -0.07080841064453125, -0.06794548034667969, -0.06508255004882812, -0.06221961975097656, -0.059356689453125, -0.05649375915527344, -0.053630828857421875, -0.05076789855957031, -0.04790496826171875, -0.04504203796386719, -0.042179107666015625, -0.03931617736816406, -0.0364532470703125, -0.03359031677246094, -0.030727386474609375, -0.027864456176757812, -0.02500152587890625, -0.022138595581054688, -0.019275665283203125, -0.016412734985351562, -0.0135498046875, -0.010686874389648438, -0.007823944091796875, -0.0049610137939453125, -0.00209808349609375, 0.0007648468017578125, 0.003627777099609375, 0.0064907073974609375, 0.0093536376953125, 0.012216567993164062, 0.015079498291015625, 0.017942428588867188, 0.02080535888671875, 0.023668289184570312, 0.026531219482421875, 0.029394149780273438, 0.032257080078125, 0.03512001037597656, 0.037982940673828125, 0.04084587097167969, 0.04370880126953125, 0.04657173156738281, 0.049434661865234375, 0.05229759216308594, 0.0551605224609375, 0.05802345275878906, 0.060886383056640625, 0.06374931335449219, 0.06661224365234375, 0.06947517395019531, 0.07233810424804688, 0.07520103454589844, 0.07806396484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 11.0, 37.0, 92.0, 169.0, 229.0, 221.0, 121.0, 61.0, 38.0, 15.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3411327600479126, -0.3228967785835266, -0.30466076731681824, -0.28642478585243225, -0.26818880438804626, -0.24995280802249908, -0.2317168116569519, -0.21348083019256592, -0.19524483382701874, -0.17700883746147156, -0.15877285599708557, -0.1405368596315384, -0.12230087071657181, -0.10406488180160522, -0.08582888543605804, -0.06759290397167206, -0.04935690760612488, -0.031120916828513145, -0.012884926050901413, 0.005351066589355469, 0.023587055504322052, 0.041823044419288635, 0.060059040784835815, 0.0782950222492218, 0.09653101861476898, 0.11476700752973557, 0.13300299644470215, 0.15123899281024933, 0.1694749891757965, 0.1877109706401825, 0.20594696700572968, 0.22418294847011566, 0.24241894483566284, 0.26065492630004883, 0.2788909375667572, 0.2971269190311432, 0.3153629004955292, 0.33359891176223755, 0.35183489322662354, 0.3700708746910095, 0.3883068561553955, 0.4065428376197815, 0.42477884888648987, 0.44301483035087585, 0.46125081181526184, 0.4794868230819702, 0.4977228045463562, 0.5159587860107422, 0.534194827079773, 0.5524308085441589, 0.5706667900085449, 0.5889028310775757, 0.6071388125419617, 0.6253747940063477, 0.6436107754707336, 0.6618467569351196, 0.6800827383995056, 0.6983187198638916, 0.7165547013282776, 0.7347906827926636, 0.7530267238616943, 0.7712627053260803, 0.7894986867904663, 0.8077346682548523, 0.8259706497192383]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 11.0, 16.0, 9.0, 15.0, 24.0, 33.0, 25.0, 44.0, 40.0, 50.0, 41.0, 51.0, 56.0, 44.0, 52.0, 52.0, 44.0, 63.0, 40.0, 44.0, 30.0, 41.0, 35.0, 25.0, 14.0, 9.0, 15.0, 12.0, 9.0, 6.0, 8.0, 8.0, 4.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2592989206314087, -0.25250810384750366, -0.24571727216243744, -0.2389264553785324, -0.23213563859462738, -0.22534480690956116, -0.21855399012565613, -0.2117631733417511, -0.20497235655784607, -0.19818153977394104, -0.19139070808887482, -0.1845998913049698, -0.17780907452106476, -0.17101824283599854, -0.1642274260520935, -0.15743660926818848, -0.15064577758312225, -0.14385496079921722, -0.137064129114151, -0.13027331233024597, -0.12348249554634094, -0.11669167131185532, -0.10990084707736969, -0.10311003029346466, -0.09631920605897903, -0.08952838182449341, -0.08273756504058838, -0.07594674080610275, -0.06915591657161713, -0.0623650997877121, -0.05557427555322647, -0.04878345504403114, -0.041992634534835815, -0.03520181402564049, -0.02841099165380001, -0.021620169281959534, -0.014829348772764206, -0.008038528263568878, -0.001247704029083252, 0.005543116480112076, 0.012333936989307404, 0.01912475749850273, 0.02591557987034321, 0.032706402242183685, 0.03949722275137901, 0.04628804326057434, 0.05307886749505997, 0.059869688004255295, 0.06666050851345062, 0.07345133274793625, 0.08024214953184128, 0.0870329737663269, 0.09382379055023193, 0.10061461478471756, 0.10740543901920319, 0.11419625580310822, 0.12098708003759384, 0.12777790427207947, 0.1345687210559845, 0.14135953783988953, 0.14815036952495575, 0.15494118630886078, 0.161732017993927, 0.16852283477783203, 0.17531365156173706]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 11.0, 22.0, 23.0, 20.0, 46.0, 66.0, 92.0, 145.0, 206.0, 332.0, 528.0, 885.0, 1593.0, 3105.0, 6296.0, 13997.0, 34419.0, 85967.0, 218216.0, 362537.0, 190423.0, 75520.0, 29742.0, 12626.0, 5467.0, 2586.0, 1496.0, 799.0, 513.0, 269.0, 206.0, 138.0, 82.0, 58.0, 43.0, 17.0, 21.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10967636108398438, -0.10607147216796875, -0.10246658325195312, -0.0988616943359375, -0.09525680541992188, -0.09165191650390625, -0.08804702758789062, -0.084442138671875, -0.08083724975585938, -0.07723236083984375, -0.07362747192382812, -0.0700225830078125, -0.06641769409179688, -0.06281280517578125, -0.059207916259765625, -0.05560302734375, -0.051998138427734375, -0.04839324951171875, -0.044788360595703125, -0.0411834716796875, -0.037578582763671875, -0.03397369384765625, -0.030368804931640625, -0.026763916015625, -0.023159027099609375, -0.01955413818359375, -0.015949249267578125, -0.0123443603515625, -0.008739471435546875, -0.00513458251953125, -0.001529693603515625, 0.0020751953125, 0.005680084228515625, 0.00928497314453125, 0.012889862060546875, 0.0164947509765625, 0.020099639892578125, 0.02370452880859375, 0.027309417724609375, 0.030914306640625, 0.034519195556640625, 0.03812408447265625, 0.041728973388671875, 0.0453338623046875, 0.048938751220703125, 0.05254364013671875, 0.056148529052734375, 0.05975341796875, 0.06335830688476562, 0.06696319580078125, 0.07056808471679688, 0.0741729736328125, 0.07777786254882812, 0.08138275146484375, 0.08498764038085938, 0.088592529296875, 0.09219741821289062, 0.09580230712890625, 0.09940719604492188, 0.1030120849609375, 0.10661697387695312, 0.11022186279296875, 0.11382675170898438, 0.117431640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 9.0, 13.0, 14.0, 26.0, 24.0, 38.0, 57.0, 53.0, 75.0, 76.0, 103.0, 85.0, 74.0, 78.0, 71.0, 48.0, 43.0, 24.0, 21.0, 21.0, 15.0, 11.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.043609619140625, -0.0424041748046875, -0.04119873046875, -0.0399932861328125, -0.038787841796875, -0.0375823974609375, -0.036376953125, -0.0351715087890625, -0.033966064453125, -0.0327606201171875, -0.03155517578125, -0.0303497314453125, -0.029144287109375, -0.0279388427734375, -0.0267333984375, -0.0255279541015625, -0.024322509765625, -0.0231170654296875, -0.02191162109375, -0.0207061767578125, -0.019500732421875, -0.0182952880859375, -0.01708984375, -0.0158843994140625, -0.014678955078125, -0.0134735107421875, -0.01226806640625, -0.0110626220703125, -0.009857177734375, -0.0086517333984375, -0.0074462890625, -0.0062408447265625, -0.005035400390625, -0.0038299560546875, -0.00262451171875, -0.0014190673828125, -0.000213623046875, 0.0009918212890625, 0.002197265625, 0.0034027099609375, 0.004608154296875, 0.0058135986328125, 0.00701904296875, 0.0082244873046875, 0.009429931640625, 0.0106353759765625, 0.0118408203125, 0.0130462646484375, 0.014251708984375, 0.0154571533203125, 0.01666259765625, 0.0178680419921875, 0.019073486328125, 0.0202789306640625, 0.021484375, 0.0226898193359375, 0.023895263671875, 0.0251007080078125, 0.02630615234375, 0.0275115966796875, 0.028717041015625, 0.0299224853515625, 0.0311279296875, 0.0323333740234375, 0.033538818359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 18.0, 13.0, 25.0, 27.0, 39.0, 69.0, 69.0, 132.0, 150.0, 218.0, 298.0, 499.0, 673.0, 1309.0, 2363.0, 6076.0, 21413.0, 84487.0, 303347.0, 428648.0, 144201.0, 36717.0, 9867.0, 3461.0, 1662.0, 905.0, 565.0, 351.0, 247.0, 165.0, 142.0, 97.0, 87.0, 55.0, 36.0, 26.0, 20.0, 12.0, 9.0, 9.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1451416015625, -0.1404895782470703, -0.13583755493164062, -0.13118553161621094, -0.12653350830078125, -0.12188148498535156, -0.11722946166992188, -0.11257743835449219, -0.1079254150390625, -0.10327339172363281, -0.09862136840820312, -0.09396934509277344, -0.08931732177734375, -0.08466529846191406, -0.08001327514648438, -0.07536125183105469, -0.070709228515625, -0.06605720520019531, -0.061405181884765625, -0.05675315856933594, -0.05210113525390625, -0.04744911193847656, -0.042797088623046875, -0.03814506530761719, -0.0334930419921875, -0.028841018676757812, -0.024188995361328125, -0.019536972045898438, -0.01488494873046875, -0.010232925415039062, -0.005580902099609375, -0.0009288787841796875, 0.00372314453125, 0.008375167846679688, 0.013027191162109375, 0.017679214477539062, 0.02233123779296875, 0.026983261108398438, 0.031635284423828125, 0.03628730773925781, 0.0409393310546875, 0.04559135437011719, 0.050243377685546875, 0.05489540100097656, 0.05954742431640625, 0.06419944763183594, 0.06885147094726562, 0.07350349426269531, 0.078155517578125, 0.08280754089355469, 0.08745956420898438, 0.09211158752441406, 0.09676361083984375, 0.10141563415527344, 0.10606765747070312, 0.11071968078613281, 0.1153717041015625, 0.12002372741699219, 0.12467575073242188, 0.12932777404785156, 0.13397979736328125, 0.13863182067871094, 0.14328384399414062, 0.1479358673095703, 0.152587890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 4.0, 9.0, 14.0, 8.0, 22.0, 20.0, 21.0, 25.0, 34.0, 35.0, 29.0, 49.0, 56.0, 39.0, 63.0, 50.0, 57.0, 53.0, 56.0, 45.0, 56.0, 38.0, 40.0, 40.0, 35.0, 25.0, 28.0, 13.0, 9.0, 13.0, 3.0, 5.0, 1.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12359619140625, -0.11875438690185547, -0.11391258239746094, -0.1090707778930664, -0.10422897338867188, -0.09938716888427734, -0.09454536437988281, -0.08970355987548828, -0.08486175537109375, -0.08001995086669922, -0.07517814636230469, -0.07033634185791016, -0.06549453735351562, -0.060652732849121094, -0.05581092834472656, -0.05096912384033203, -0.0461273193359375, -0.04128551483154297, -0.03644371032714844, -0.031601905822753906, -0.026760101318359375, -0.021918296813964844, -0.017076492309570312, -0.012234687805175781, -0.00739288330078125, -0.0025510787963867188, 0.0022907257080078125, 0.007132530212402344, 0.011974334716796875, 0.016816139221191406, 0.021657943725585938, 0.02649974822998047, 0.031341552734375, 0.03618335723876953, 0.04102516174316406, 0.045866966247558594, 0.050708770751953125, 0.055550575256347656, 0.06039237976074219, 0.06523418426513672, 0.07007598876953125, 0.07491779327392578, 0.07975959777832031, 0.08460140228271484, 0.08944320678710938, 0.0942850112915039, 0.09912681579589844, 0.10396862030029297, 0.1088104248046875, 0.11365222930908203, 0.11849403381347656, 0.1233358383178711, 0.12817764282226562, 0.13301944732666016, 0.1378612518310547, 0.14270305633544922, 0.14754486083984375, 0.15238666534423828, 0.1572284698486328, 0.16207027435302734, 0.16691207885742188, 0.1717538833618164, 0.17659568786621094, 0.18143749237060547, 0.186279296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 1.0, 6.0, 4.0, 4.0, 6.0, 15.0, 14.0, 14.0, 23.0, 26.0, 63.0, 80.0, 151.0, 251.0, 364.0, 754.0, 1491.0, 3141.0, 7808.0, 24558.0, 110963.0, 606658.0, 231165.0, 40834.0, 11613.0, 4329.0, 1984.0, 951.0, 501.0, 296.0, 162.0, 115.0, 58.0, 38.0, 22.0, 29.0, 19.0, 8.0, 5.0, 6.0, 7.0, 4.0, 1.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.12445068359375, -0.12086296081542969, -0.11727523803710938, -0.11368751525878906, -0.11009979248046875, -0.10651206970214844, -0.10292434692382812, -0.09933662414550781, -0.0957489013671875, -0.09216117858886719, -0.08857345581054688, -0.08498573303222656, -0.08139801025390625, -0.07781028747558594, -0.07422256469726562, -0.07063484191894531, -0.067047119140625, -0.06345939636230469, -0.059871673583984375, -0.05628395080566406, -0.05269622802734375, -0.04910850524902344, -0.045520782470703125, -0.04193305969238281, -0.0383453369140625, -0.03475761413574219, -0.031169891357421875, -0.027582168579101562, -0.02399444580078125, -0.020406723022460938, -0.016819000244140625, -0.013231277465820312, -0.0096435546875, -0.0060558319091796875, -0.002468109130859375, 0.0011196136474609375, 0.00470733642578125, 0.008295059204101562, 0.011882781982421875, 0.015470504760742188, 0.0190582275390625, 0.022645950317382812, 0.026233673095703125, 0.029821395874023438, 0.03340911865234375, 0.03699684143066406, 0.040584564208984375, 0.04417228698730469, 0.047760009765625, 0.05134773254394531, 0.054935455322265625, 0.05852317810058594, 0.06211090087890625, 0.06569862365722656, 0.06928634643554688, 0.07287406921386719, 0.0764617919921875, 0.08004951477050781, 0.08363723754882812, 0.08722496032714844, 0.09081268310546875, 0.09440040588378906, 0.09798812866210938, 0.10157585144042969, 0.10516357421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 11.0, 7.0, 34.0, 41.0, 75.0, 89.0, 108.0, 114.0, 115.0, 120.0, 85.0, 68.0, 47.0, 42.0, 18.0, 14.0, 8.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011515617370605469, -0.00011092238128185272, -0.00010668858885765076, -0.00010245479643344879, -9.822100400924683e-05, -9.398721158504486e-05, -8.97534191608429e-05, -8.551962673664093e-05, -8.128583431243896e-05, -7.7052041888237e-05, -7.281824946403503e-05, -6.858445703983307e-05, -6.43506646156311e-05, -6.011687219142914e-05, -5.588307976722717e-05, -5.164928734302521e-05, -4.741549491882324e-05, -4.318170249462128e-05, -3.894791007041931e-05, -3.4714117646217346e-05, -3.048032522201538e-05, -2.6246532797813416e-05, -2.201274037361145e-05, -1.7778947949409485e-05, -1.354515552520752e-05, -9.311363101005554e-06, -5.077570676803589e-06, -8.437782526016235e-07, 3.390014171600342e-06, 7.623806595802307e-06, 1.1857599020004272e-05, 1.6091391444206238e-05, 2.0325183868408203e-05, 2.455897629261017e-05, 2.8792768716812134e-05, 3.30265611410141e-05, 3.7260353565216064e-05, 4.149414598941803e-05, 4.5727938413619995e-05, 4.996173083782196e-05, 5.4195523262023926e-05, 5.842931568622589e-05, 6.266310811042786e-05, 6.689690053462982e-05, 7.113069295883179e-05, 7.536448538303375e-05, 7.959827780723572e-05, 8.383207023143768e-05, 8.806586265563965e-05, 9.229965507984161e-05, 9.653344750404358e-05, 0.00010076723992824554, 0.00010500103235244751, 0.00010923482477664948, 0.00011346861720085144, 0.0001177024096250534, 0.00012193620204925537, 0.00012616999447345734, 0.0001304037868976593, 0.00013463757932186127, 0.00013887137174606323, 0.0001431051641702652, 0.00014733895659446716, 0.00015157274901866913, 0.0001558065414428711]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 7.0, 16.0, 27.0, 28.0, 29.0, 44.0, 85.0, 155.0, 375.0, 829.0, 2699.0, 12215.0, 146771.0, 824204.0, 51361.0, 6765.0, 1681.0, 618.0, 284.0, 120.0, 66.0, 46.0, 46.0, 25.0, 13.0, 13.0, 10.0, 8.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2039794921875, -0.19746780395507812, -0.19095611572265625, -0.18444442749023438, -0.1779327392578125, -0.17142105102539062, -0.16490936279296875, -0.15839767456054688, -0.151885986328125, -0.14537429809570312, -0.13886260986328125, -0.13235092163085938, -0.1258392333984375, -0.11932754516601562, -0.11281585693359375, -0.10630416870117188, -0.09979248046875, -0.09328079223632812, -0.08676910400390625, -0.08025741577148438, -0.0737457275390625, -0.06723403930664062, -0.06072235107421875, -0.054210662841796875, -0.047698974609375, -0.041187286376953125, -0.03467559814453125, -0.028163909912109375, -0.0216522216796875, -0.015140533447265625, -0.00862884521484375, -0.002117156982421875, 0.00439453125, 0.010906219482421875, 0.01741790771484375, 0.023929595947265625, 0.0304412841796875, 0.036952972412109375, 0.04346466064453125, 0.049976348876953125, 0.056488037109375, 0.06299972534179688, 0.06951141357421875, 0.07602310180664062, 0.0825347900390625, 0.08904647827148438, 0.09555816650390625, 0.10206985473632812, 0.10858154296875, 0.11509323120117188, 0.12160491943359375, 0.12811660766601562, 0.1346282958984375, 0.14113998413085938, 0.14765167236328125, 0.15416336059570312, 0.160675048828125, 0.16718673706054688, 0.17369842529296875, 0.18021011352539062, 0.1867218017578125, 0.19323348999023438, 0.19974517822265625, 0.20625686645507812, 0.2127685546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 5.0, 12.0, 12.0, 25.0, 34.0, 34.0, 67.0, 90.0, 130.0, 131.0, 135.0, 107.0, 59.0, 44.0, 36.0, 21.0, 7.0, 12.0, 6.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.10321044921875, -0.09993457794189453, -0.09665870666503906, -0.0933828353881836, -0.09010696411132812, -0.08683109283447266, -0.08355522155761719, -0.08027935028076172, -0.07700347900390625, -0.07372760772705078, -0.07045173645019531, -0.06717586517333984, -0.06389999389648438, -0.060624122619628906, -0.05734825134277344, -0.05407238006591797, -0.0507965087890625, -0.04752063751220703, -0.04424476623535156, -0.040968894958496094, -0.037693023681640625, -0.034417152404785156, -0.031141281127929688, -0.02786540985107422, -0.02458953857421875, -0.02131366729736328, -0.018037796020507812, -0.014761924743652344, -0.011486053466796875, -0.008210182189941406, -0.0049343109130859375, -0.0016584396362304688, 0.001617431640625, 0.004893302917480469, 0.008169174194335938, 0.011445045471191406, 0.014720916748046875, 0.017996788024902344, 0.021272659301757812, 0.02454853057861328, 0.02782440185546875, 0.03110027313232422, 0.03437614440917969, 0.037652015686035156, 0.040927886962890625, 0.044203758239746094, 0.04747962951660156, 0.05075550079345703, 0.0540313720703125, 0.05730724334716797, 0.06058311462402344, 0.0638589859008789, 0.06713485717773438, 0.07041072845458984, 0.07368659973144531, 0.07696247100830078, 0.08023834228515625, 0.08351421356201172, 0.08679008483886719, 0.09006595611572266, 0.09334182739257812, 0.0966176986694336, 0.09989356994628906, 0.10316944122314453, 0.1064453125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 18.0, 27.0, 75.0, 127.0, 199.0, 208.0, 160.0, 97.0, 49.0, 23.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9106699228286743, -1.8620346784591675, -1.8133994340896606, -1.7647641897201538, -1.716128945350647, -1.6674937009811401, -1.6188585758209229, -1.570223331451416, -1.5215880870819092, -1.4729528427124023, -1.4243175983428955, -1.3756823539733887, -1.3270471096038818, -1.278411865234375, -1.2297766208648682, -1.1811413764953613, -1.1325061321258545, -1.0838708877563477, -1.0352356433868408, -0.986600399017334, -0.9379651546478271, -0.8893299102783203, -0.8406947255134583, -0.7920594811439514, -0.7434242367744446, -0.6947889924049377, -0.6461537480354309, -0.5975185632705688, -0.548883318901062, -0.5002480745315552, -0.45161283016204834, -0.4029775857925415, -0.3543424606323242, -0.3057072162628174, -0.25707197189331055, -0.2084367573261261, -0.15980151295661926, -0.11116626858711243, -0.06253105401992798, -0.013895809650421143, 0.03473943471908569, 0.08337467163801193, 0.13200990855693817, 0.1806451380252838, 0.22928038239479065, 0.2779156267642975, 0.32655084133148193, 0.37518608570098877, 0.4238213300704956, 0.47245657444000244, 0.5210918188095093, 0.5697270631790161, 0.618362307548523, 0.6669975519180298, 0.7156327366828918, 0.7642679810523987, 0.8129032254219055, 0.8615384697914124, 0.9101737141609192, 0.9588088989257812, 1.007444143295288, 1.056079387664795, 1.1047146320343018, 1.1533498764038086, 1.2019851207733154]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 13.0, 14.0, 17.0, 11.0, 24.0, 19.0, 32.0, 37.0, 29.0, 32.0, 45.0, 39.0, 47.0, 46.0, 52.0, 57.0, 38.0, 43.0, 41.0, 38.0, 46.0, 38.0, 37.0, 27.0, 46.0, 22.0, 15.0, 17.0, 14.0, 8.0, 10.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9258089065551758, -0.9006794095039368, -0.8755499720573425, -0.8504204750061035, -0.8252910375595093, -0.8001615405082703, -0.7750320434570312, -0.749902606010437, -0.724773108959198, -0.699643611907959, -0.6745141744613647, -0.6493846774101257, -0.6242551803588867, -0.5991257429122925, -0.5739962458610535, -0.5488667488098145, -0.5237373113632202, -0.4986078441143036, -0.47347837686538696, -0.44834887981414795, -0.4232194125652313, -0.3980899453163147, -0.3729604482650757, -0.34783098101615906, -0.32270151376724243, -0.2975720465183258, -0.2724425792694092, -0.24731308221817017, -0.22218361496925354, -0.19705414772033691, -0.1719246655702591, -0.14679518342018127, -0.12166571617126465, -0.09653624147176743, -0.0714067667722702, -0.04627729207277298, -0.021147817373275757, 0.003981649875640869, 0.02911113202571869, 0.05424061417579651, 0.07937008142471313, 0.10449955612421036, 0.12962903082370758, 0.1547585129737854, 0.17988798022270203, 0.20501744747161865, 0.23014692962169647, 0.2552764117717743, 0.2804058790206909, 0.30553534626960754, 0.33066481351852417, 0.3557943105697632, 0.3809237778186798, 0.40605324506759644, 0.43118274211883545, 0.4563122093677521, 0.4814416766166687, 0.5065711736679077, 0.531700611114502, 0.556830108165741, 0.58195960521698, 0.6070890426635742, 0.6322185397148132, 0.6573480367660522, 0.6824774742126465]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 6.0, 7.0, 8.0, 11.0, 26.0, 39.0, 53.0, 97.0, 161.0, 309.0, 587.0, 1577.0, 3993.0, 14117.0, 79294.0, 3603167.0, 438963.0, 38321.0, 8571.0, 2857.0, 1085.0, 452.0, 254.0, 132.0, 70.0, 50.0, 27.0, 15.0, 13.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.24850845336914062, -0.24115753173828125, -0.23380661010742188, -0.2264556884765625, -0.21910476684570312, -0.21175384521484375, -0.20440292358398438, -0.197052001953125, -0.18970108032226562, -0.18235015869140625, -0.17499923706054688, -0.1676483154296875, -0.16029739379882812, -0.15294647216796875, -0.14559555053710938, -0.13824462890625, -0.13089370727539062, -0.12354278564453125, -0.11619186401367188, -0.1088409423828125, -0.10149002075195312, -0.09413909912109375, -0.08678817749023438, -0.079437255859375, -0.07208633422851562, -0.06473541259765625, -0.057384490966796875, -0.0500335693359375, -0.042682647705078125, -0.03533172607421875, -0.027980804443359375, -0.0206298828125, -0.013278961181640625, -0.00592803955078125, 0.001422882080078125, 0.0087738037109375, 0.016124725341796875, 0.02347564697265625, 0.030826568603515625, 0.038177490234375, 0.045528411865234375, 0.05287933349609375, 0.060230255126953125, 0.0675811767578125, 0.07493209838867188, 0.08228302001953125, 0.08963394165039062, 0.09698486328125, 0.10433578491210938, 0.11168670654296875, 0.11903762817382812, 0.1263885498046875, 0.13373947143554688, 0.14109039306640625, 0.14844131469726562, 0.155792236328125, 0.16314315795898438, 0.17049407958984375, 0.17784500122070312, 0.1851959228515625, 0.19254684448242188, 0.19989776611328125, 0.20724868774414062, 0.214599609375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 10.0, 18.0, 17.0, 34.0, 35.0, 43.0, 67.0, 71.0, 92.0, 92.0, 78.0, 84.0, 77.0, 69.0, 57.0, 26.0, 28.0, 28.0, 16.0, 14.0, 7.0, 8.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04473876953125, -0.04346609115600586, -0.04219341278076172, -0.04092073440551758, -0.03964805603027344, -0.0383753776550293, -0.037102699279785156, -0.035830020904541016, -0.034557342529296875, -0.033284664154052734, -0.032011985778808594, -0.030739307403564453, -0.029466629028320312, -0.028193950653076172, -0.02692127227783203, -0.02564859390258789, -0.02437591552734375, -0.02310323715209961, -0.02183055877685547, -0.020557880401611328, -0.019285202026367188, -0.018012523651123047, -0.016739845275878906, -0.015467166900634766, -0.014194488525390625, -0.012921810150146484, -0.011649131774902344, -0.010376453399658203, -0.009103775024414062, -0.007831096649169922, -0.006558418273925781, -0.005285739898681641, -0.0040130615234375, -0.0027403831481933594, -0.0014677047729492188, -0.00019502639770507812, 0.0010776519775390625, 0.002350330352783203, 0.0036230087280273438, 0.004895687103271484, 0.006168365478515625, 0.007441043853759766, 0.008713722229003906, 0.009986400604248047, 0.011259078979492188, 0.012531757354736328, 0.013804435729980469, 0.01507711410522461, 0.01634979248046875, 0.01762247085571289, 0.01889514923095703, 0.020167827606201172, 0.021440505981445312, 0.022713184356689453, 0.023985862731933594, 0.025258541107177734, 0.026531219482421875, 0.027803897857666016, 0.029076576232910156, 0.030349254608154297, 0.03162193298339844, 0.03289461135864258, 0.03416728973388672, 0.03543996810913086, 0.036712646484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 11.0, 23.0, 26.0, 42.0, 43.0, 69.0, 71.0, 106.0, 165.0, 317.0, 1582.0, 26623.0, 4075476.0, 86201.0, 2524.0, 407.0, 169.0, 113.0, 78.0, 63.0, 54.0, 31.0, 31.0, 21.0, 19.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6405258178710938, -0.6208953857421875, -0.6012649536132812, -0.581634521484375, -0.5620040893554688, -0.5423736572265625, -0.5227432250976562, -0.50311279296875, -0.48348236083984375, -0.4638519287109375, -0.44422149658203125, -0.424591064453125, -0.40496063232421875, -0.3853302001953125, -0.36569976806640625, -0.3460693359375, -0.32643890380859375, -0.3068084716796875, -0.28717803955078125, -0.267547607421875, -0.24791717529296875, -0.2282867431640625, -0.20865631103515625, -0.18902587890625, -0.16939544677734375, -0.1497650146484375, -0.13013458251953125, -0.110504150390625, -0.09087371826171875, -0.0712432861328125, -0.05161285400390625, -0.031982421875, -0.01235198974609375, 0.0072784423828125, 0.02690887451171875, 0.046539306640625, 0.06616973876953125, 0.0858001708984375, 0.10543060302734375, 0.12506103515625, 0.14469146728515625, 0.1643218994140625, 0.18395233154296875, 0.203582763671875, 0.22321319580078125, 0.2428436279296875, 0.26247406005859375, 0.2821044921875, 0.30173492431640625, 0.3213653564453125, 0.34099578857421875, 0.360626220703125, 0.38025665283203125, 0.3998870849609375, 0.41951751708984375, 0.43914794921875, 0.45877838134765625, 0.4784088134765625, 0.49803924560546875, 0.517669677734375, 0.5373001098632812, 0.5569305419921875, 0.5765609741210938, 0.59619140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 17.0, 22.0, 51.0, 203.0, 1061.0, 2354.0, 253.0, 69.0, 26.0, 13.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16015625, -0.1553192138671875, -0.150482177734375, -0.1456451416015625, -0.14080810546875, -0.1359710693359375, -0.131134033203125, -0.1262969970703125, -0.1214599609375, -0.1166229248046875, -0.111785888671875, -0.1069488525390625, -0.10211181640625, -0.0972747802734375, -0.092437744140625, -0.0876007080078125, -0.082763671875, -0.0779266357421875, -0.073089599609375, -0.0682525634765625, -0.06341552734375, -0.0585784912109375, -0.053741455078125, -0.0489044189453125, -0.0440673828125, -0.0392303466796875, -0.034393310546875, -0.0295562744140625, -0.02471923828125, -0.0198822021484375, -0.015045166015625, -0.0102081298828125, -0.00537109375, -0.0005340576171875, 0.004302978515625, 0.0091400146484375, 0.01397705078125, 0.0188140869140625, 0.023651123046875, 0.0284881591796875, 0.0333251953125, 0.0381622314453125, 0.042999267578125, 0.0478363037109375, 0.05267333984375, 0.0575103759765625, 0.062347412109375, 0.0671844482421875, 0.072021484375, 0.0768585205078125, 0.081695556640625, 0.0865325927734375, 0.09136962890625, 0.0962066650390625, 0.101043701171875, 0.1058807373046875, 0.1107177734375, 0.1155548095703125, 0.120391845703125, 0.1252288818359375, 0.13006591796875, 0.1349029541015625, 0.139739990234375, 0.1445770263671875, 0.1494140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 7.0, 5.0, 9.0, 7.0, 15.0, 36.0, 38.0, 51.0, 63.0, 79.0, 93.0, 97.0, 115.0, 84.0, 82.0, 73.0, 51.0, 29.0, 21.0, 16.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34344029426574707, -0.3346615433692932, -0.32588279247283936, -0.3171040415763855, -0.30832529067993164, -0.2995465099811554, -0.29076775908470154, -0.2819890081882477, -0.2732102572917938, -0.26443150639533997, -0.2556527554988861, -0.24687398970127106, -0.2380952388048172, -0.22931648790836334, -0.2205377221107483, -0.21175897121429443, -0.20298022031784058, -0.19420146942138672, -0.18542271852493286, -0.1766439527273178, -0.16786520183086395, -0.1590864509344101, -0.15030768513679504, -0.1415289342403412, -0.13275018334388733, -0.12397143244743347, -0.11519267410039902, -0.10641391575336456, -0.0976351648569107, -0.08885641396045685, -0.0800776556134224, -0.07129889726638794, -0.06252017617225647, -0.053741421550512314, -0.04496266692876816, -0.036183912307024, -0.027405157685279846, -0.01862640306353569, -0.009847648441791534, -0.0010688938200473785, 0.007709860801696777, 0.016488615423440933, 0.02526737004518509, 0.034046124666929245, 0.0428248792886734, 0.05160363391041756, 0.06038238853216171, 0.06916114687919617, 0.07793989777565002, 0.08671864867210388, 0.09549740701913834, 0.10427616536617279, 0.11305491626262665, 0.1218336671590805, 0.13061243295669556, 0.13939118385314941, 0.14816993474960327, 0.15694868564605713, 0.165727436542511, 0.17450620234012604, 0.1832849532365799, 0.19206370413303375, 0.2008424699306488, 0.20962122082710266, 0.21839997172355652]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 2.0, 5.0, 6.0, 7.0, 6.0, 9.0, 8.0, 17.0, 13.0, 17.0, 27.0, 18.0, 28.0, 22.0, 27.0, 26.0, 22.0, 26.0, 33.0, 32.0, 34.0, 43.0, 39.0, 41.0, 36.0, 40.0, 34.0, 33.0, 38.0, 29.0, 27.0, 25.0, 32.0, 27.0, 25.0, 22.0, 16.0, 17.0, 9.0, 13.0, 8.0, 14.0, 9.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.17114514112472534, -0.1658613532781601, -0.16057755053043365, -0.1552937626838684, -0.15000995993614197, -0.14472617208957672, -0.13944238424301147, -0.13415858149528503, -0.1288747936487198, -0.12359099835157394, -0.1183072030544281, -0.11302341520786285, -0.10773961991071701, -0.10245582461357117, -0.09717203676700592, -0.09188824146986008, -0.08660444617271423, -0.08132065087556839, -0.07603685557842255, -0.0707530677318573, -0.06546927243471146, -0.06018547713756561, -0.05490168556571007, -0.04961789399385452, -0.04433409869670868, -0.039050303399562836, -0.03376651182770729, -0.028482718393206596, -0.023198924958705902, -0.017915131524205208, -0.012631338089704514, -0.0073475465178489685, -0.002063751220703125, 0.0032200422137975693, 0.008503835648298264, 0.013787629082798958, 0.019071422517299652, 0.024355215951800346, 0.02963900938630104, 0.034922800958156586, 0.04020659625530243, 0.04549039155244827, 0.05077418312430382, 0.05605797469615936, 0.061341769993305206, 0.06662556529045105, 0.0719093531370163, 0.07719314843416214, 0.08247694373130798, 0.08776073902845383, 0.09304453432559967, 0.09832832217216492, 0.10361211746931076, 0.1088959127664566, 0.11417970061302185, 0.1194634959101677, 0.12474729120731354, 0.13003107905387878, 0.13531488180160522, 0.14059866964817047, 0.14588245749473572, 0.15116626024246216, 0.1564500480890274, 0.16173383593559265, 0.1670176386833191]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 6.0, 13.0, 11.0, 25.0, 30.0, 53.0, 89.0, 109.0, 187.0, 334.0, 541.0, 987.0, 1828.0, 3894.0, 8759.0, 20331.0, 52134.0, 139513.0, 329290.0, 295668.0, 118040.0, 44327.0, 17857.0, 7245.0, 3410.0, 1659.0, 887.0, 512.0, 300.0, 166.0, 119.0, 77.0, 49.0, 42.0, 19.0, 13.0, 6.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1207275390625, -0.11705970764160156, -0.11339187622070312, -0.10972404479980469, -0.10605621337890625, -0.10238838195800781, -0.09872055053710938, -0.09505271911621094, -0.0913848876953125, -0.08771705627441406, -0.08404922485351562, -0.08038139343261719, -0.07671356201171875, -0.07304573059082031, -0.06937789916992188, -0.06571006774902344, -0.062042236328125, -0.05837440490722656, -0.054706573486328125, -0.05103874206542969, -0.04737091064453125, -0.04370307922363281, -0.040035247802734375, -0.03636741638183594, -0.0326995849609375, -0.029031753540039062, -0.025363922119140625, -0.021696090698242188, -0.01802825927734375, -0.014360427856445312, -0.010692596435546875, -0.0070247650146484375, -0.00335693359375, 0.0003108978271484375, 0.003978729248046875, 0.0076465606689453125, 0.01131439208984375, 0.014982223510742188, 0.018650054931640625, 0.022317886352539062, 0.0259857177734375, 0.029653549194335938, 0.033321380615234375, 0.03698921203613281, 0.04065704345703125, 0.04432487487792969, 0.047992706298828125, 0.05166053771972656, 0.055328369140625, 0.05899620056152344, 0.06266403198242188, 0.06633186340332031, 0.06999969482421875, 0.07366752624511719, 0.07733535766601562, 0.08100318908691406, 0.0846710205078125, 0.08833885192871094, 0.09200668334960938, 0.09567451477050781, 0.09934234619140625, 0.10301017761230469, 0.10667800903320312, 0.11034584045410156, 0.114013671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 5.0, 14.0, 12.0, 27.0, 22.0, 35.0, 47.0, 47.0, 66.0, 64.0, 74.0, 82.0, 75.0, 78.0, 76.0, 52.0, 52.0, 41.0, 31.0, 29.0, 23.0, 11.0, 5.0, 9.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04656982421875, -0.045342445373535156, -0.04411506652832031, -0.04288768768310547, -0.041660308837890625, -0.04043292999267578, -0.03920555114746094, -0.037978172302246094, -0.03675079345703125, -0.035523414611816406, -0.03429603576660156, -0.03306865692138672, -0.031841278076171875, -0.03061389923095703, -0.029386520385742188, -0.028159141540527344, -0.0269317626953125, -0.025704383850097656, -0.024477005004882812, -0.02324962615966797, -0.022022247314453125, -0.02079486846923828, -0.019567489624023438, -0.018340110778808594, -0.01711273193359375, -0.015885353088378906, -0.014657974243164062, -0.013430595397949219, -0.012203216552734375, -0.010975837707519531, -0.009748458862304688, -0.008521080017089844, -0.007293701171875, -0.006066322326660156, -0.0048389434814453125, -0.0036115646362304688, -0.002384185791015625, -0.0011568069458007812, 7.05718994140625e-05, 0.0012979507446289062, 0.00252532958984375, 0.0037527084350585938, 0.0049800872802734375, 0.006207466125488281, 0.007434844970703125, 0.008662223815917969, 0.009889602661132812, 0.011116981506347656, 0.0123443603515625, 0.013571739196777344, 0.014799118041992188, 0.01602649688720703, 0.017253875732421875, 0.01848125457763672, 0.019708633422851562, 0.020936012268066406, 0.02216339111328125, 0.023390769958496094, 0.024618148803710938, 0.02584552764892578, 0.027072906494140625, 0.02830028533935547, 0.029527664184570312, 0.030755043029785156, 0.031982421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 10.0, 11.0, 21.0, 36.0, 26.0, 58.0, 65.0, 81.0, 125.0, 159.0, 259.0, 338.0, 589.0, 972.0, 1928.0, 4523.0, 13870.0, 52380.0, 217088.0, 499220.0, 190198.0, 45792.0, 12294.0, 4083.0, 1663.0, 978.0, 556.0, 348.0, 239.0, 168.0, 120.0, 90.0, 47.0, 57.0, 33.0, 27.0, 21.0, 18.0, 17.0, 7.0, 7.0, 2.0, 2.0, 7.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.134765625, -0.1301898956298828, -0.12561416625976562, -0.12103843688964844, -0.11646270751953125, -0.11188697814941406, -0.10731124877929688, -0.10273551940917969, -0.0981597900390625, -0.09358406066894531, -0.08900833129882812, -0.08443260192871094, -0.07985687255859375, -0.07528114318847656, -0.07070541381835938, -0.06612968444824219, -0.061553955078125, -0.05697822570800781, -0.052402496337890625, -0.04782676696777344, -0.04325103759765625, -0.03867530822753906, -0.034099578857421875, -0.029523849487304688, -0.0249481201171875, -0.020372390747070312, -0.015796661376953125, -0.011220932006835938, -0.00664520263671875, -0.0020694732666015625, 0.002506256103515625, 0.0070819854736328125, 0.01165771484375, 0.016233444213867188, 0.020809173583984375, 0.025384902954101562, 0.02996063232421875, 0.03453636169433594, 0.039112091064453125, 0.04368782043457031, 0.0482635498046875, 0.05283927917480469, 0.057415008544921875, 0.06199073791503906, 0.06656646728515625, 0.07114219665527344, 0.07571792602539062, 0.08029365539550781, 0.084869384765625, 0.08944511413574219, 0.09402084350585938, 0.09859657287597656, 0.10317230224609375, 0.10774803161621094, 0.11232376098632812, 0.11689949035644531, 0.1214752197265625, 0.1260509490966797, 0.13062667846679688, 0.13520240783691406, 0.13977813720703125, 0.14435386657714844, 0.14892959594726562, 0.1535053253173828, 0.1580810546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 9.0, 8.0, 11.0, 11.0, 12.0, 14.0, 13.0, 29.0, 28.0, 29.0, 31.0, 32.0, 38.0, 36.0, 53.0, 40.0, 59.0, 43.0, 51.0, 54.0, 48.0, 37.0, 39.0, 39.0, 35.0, 35.0, 25.0, 25.0, 24.0, 18.0, 14.0, 15.0, 6.0, 13.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.12151718139648438, -0.11766815185546875, -0.11381912231445312, -0.1099700927734375, -0.10612106323242188, -0.10227203369140625, -0.09842300415039062, -0.094573974609375, -0.09072494506835938, -0.08687591552734375, -0.08302688598632812, -0.0791778564453125, -0.07532882690429688, -0.07147979736328125, -0.06763076782226562, -0.06378173828125, -0.059932708740234375, -0.05608367919921875, -0.052234649658203125, -0.0483856201171875, -0.044536590576171875, -0.04068756103515625, -0.036838531494140625, -0.032989501953125, -0.029140472412109375, -0.02529144287109375, -0.021442413330078125, -0.0175933837890625, -0.013744354248046875, -0.00989532470703125, -0.006046295166015625, -0.002197265625, 0.001651763916015625, 0.00550079345703125, 0.009349822998046875, 0.0131988525390625, 0.017047882080078125, 0.02089691162109375, 0.024745941162109375, 0.028594970703125, 0.032444000244140625, 0.03629302978515625, 0.040142059326171875, 0.0439910888671875, 0.047840118408203125, 0.05168914794921875, 0.055538177490234375, 0.05938720703125, 0.06323623657226562, 0.06708526611328125, 0.07093429565429688, 0.0747833251953125, 0.07863235473632812, 0.08248138427734375, 0.08633041381835938, 0.090179443359375, 0.09402847290039062, 0.09787750244140625, 0.10172653198242188, 0.1055755615234375, 0.10942459106445312, 0.11327362060546875, 0.11712265014648438, 0.1209716796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 16.0, 6.0, 27.0, 27.0, 42.0, 60.0, 73.0, 109.0, 169.0, 297.0, 411.0, 673.0, 1139.0, 2110.0, 3923.0, 8364.0, 19753.0, 55256.0, 186416.0, 454682.0, 212678.0, 62063.0, 21623.0, 8991.0, 4207.0, 2154.0, 1201.0, 719.0, 448.0, 294.0, 179.0, 127.0, 101.0, 54.0, 45.0, 36.0, 18.0, 12.0, 10.0, 10.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.054429054260253906, -0.05252265930175781, -0.05061626434326172, -0.048709869384765625, -0.04680347442626953, -0.04489707946777344, -0.042990684509277344, -0.04108428955078125, -0.039177894592285156, -0.03727149963378906, -0.03536510467529297, -0.033458709716796875, -0.03155231475830078, -0.029645919799804688, -0.027739524841308594, -0.0258331298828125, -0.023926734924316406, -0.022020339965820312, -0.02011394500732422, -0.018207550048828125, -0.01630115509033203, -0.014394760131835938, -0.012488365173339844, -0.01058197021484375, -0.008675575256347656, -0.0067691802978515625, -0.004862785339355469, -0.002956390380859375, -0.0010499954223632812, 0.0008563995361328125, 0.0027627944946289062, 0.004669189453125, 0.006575584411621094, 0.008481979370117188, 0.010388374328613281, 0.012294769287109375, 0.014201164245605469, 0.016107559204101562, 0.018013954162597656, 0.01992034912109375, 0.021826744079589844, 0.023733139038085938, 0.02563953399658203, 0.027545928955078125, 0.02945232391357422, 0.03135871887207031, 0.033265113830566406, 0.0351715087890625, 0.037077903747558594, 0.03898429870605469, 0.04089069366455078, 0.042797088623046875, 0.04470348358154297, 0.04660987854003906, 0.048516273498535156, 0.05042266845703125, 0.052329063415527344, 0.05423545837402344, 0.05614185333251953, 0.058048248291015625, 0.05995464324951172, 0.06186103820800781, 0.0637674331665039, 0.065673828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 5.0, 7.0, 13.0, 18.0, 26.0, 38.0, 49.0, 80.0, 114.0, 113.0, 140.0, 102.0, 77.0, 71.0, 38.0, 34.0, 21.0, 22.0, 12.0, 7.0, 7.0, 6.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010770559310913086, -0.00010359007865190506, -9.947456419467926e-05, -9.535904973745346e-05, -9.124353528022766e-05, -8.712802082300186e-05, -8.301250636577606e-05, -7.889699190855026e-05, -7.478147745132446e-05, -7.066596299409866e-05, -6.655044853687286e-05, -6.243493407964706e-05, -5.8319419622421265e-05, -5.4203905165195465e-05, -5.0088390707969666e-05, -4.5972876250743866e-05, -4.1857361793518066e-05, -3.774184733629227e-05, -3.362633287906647e-05, -2.9510818421840668e-05, -2.5395303964614868e-05, -2.127978950738907e-05, -1.716427505016327e-05, -1.304876059293747e-05, -8.93324613571167e-06, -4.81773167848587e-06, -7.022172212600708e-07, 3.4132972359657288e-06, 7.528811693191528e-06, 1.1644326150417328e-05, 1.5759840607643127e-05, 1.9875355064868927e-05, 2.3990869522094727e-05, 2.8106383979320526e-05, 3.2221898436546326e-05, 3.6337412893772125e-05, 4.0452927350997925e-05, 4.4568441808223724e-05, 4.8683956265449524e-05, 5.2799470722675323e-05, 5.691498517990112e-05, 6.103049963712692e-05, 6.514601409435272e-05, 6.926152855157852e-05, 7.337704300880432e-05, 7.749255746603012e-05, 8.160807192325592e-05, 8.572358638048172e-05, 8.983910083770752e-05, 9.395461529493332e-05, 9.807012975215912e-05, 0.00010218564420938492, 0.00010630115866661072, 0.00011041667312383652, 0.00011453218758106232, 0.00011864770203828812, 0.00012276321649551392, 0.00012687873095273972, 0.00013099424540996552, 0.00013510975986719131, 0.00013922527432441711, 0.00014334078878164291, 0.0001474563032388687, 0.0001515718176960945, 0.0001556873321533203]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 9.0, 9.0, 13.0, 11.0, 37.0, 48.0, 83.0, 124.0, 229.0, 484.0, 1042.0, 2800.0, 10484.0, 62625.0, 559626.0, 360335.0, 39175.0, 7376.0, 2283.0, 856.0, 382.0, 191.0, 110.0, 66.0, 51.0, 35.0, 18.0, 15.0, 7.0, 9.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1295166015625, -0.1260976791381836, -0.12267875671386719, -0.11925983428955078, -0.11584091186523438, -0.11242198944091797, -0.10900306701660156, -0.10558414459228516, -0.10216522216796875, -0.09874629974365234, -0.09532737731933594, -0.09190845489501953, -0.08848953247070312, -0.08507061004638672, -0.08165168762207031, -0.0782327651977539, -0.0748138427734375, -0.0713949203491211, -0.06797599792480469, -0.06455707550048828, -0.061138153076171875, -0.05771923065185547, -0.05430030822753906, -0.050881385803222656, -0.04746246337890625, -0.044043540954589844, -0.04062461853027344, -0.03720569610595703, -0.033786773681640625, -0.03036785125732422, -0.026948928833007812, -0.023530006408691406, -0.020111083984375, -0.016692161560058594, -0.013273239135742188, -0.009854316711425781, -0.006435394287109375, -0.0030164718627929688, 0.0004024505615234375, 0.0038213729858398438, 0.00724029541015625, 0.010659217834472656, 0.014078140258789062, 0.01749706268310547, 0.020915985107421875, 0.02433490753173828, 0.027753829956054688, 0.031172752380371094, 0.0345916748046875, 0.038010597229003906, 0.04142951965332031, 0.04484844207763672, 0.048267364501953125, 0.05168628692626953, 0.05510520935058594, 0.058524131774902344, 0.06194305419921875, 0.06536197662353516, 0.06878089904785156, 0.07219982147216797, 0.07561874389648438, 0.07903766632080078, 0.08245658874511719, 0.0858755111694336, 0.08929443359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 10.0, 16.0, 19.0, 35.0, 47.0, 54.0, 64.0, 96.0, 87.0, 98.0, 100.0, 83.0, 72.0, 48.0, 38.0, 32.0, 17.0, 19.0, 13.0, 9.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.08116817474365234, -0.07920646667480469, -0.07724475860595703, -0.07528305053710938, -0.07332134246826172, -0.07135963439941406, -0.0693979263305664, -0.06743621826171875, -0.0654745101928711, -0.06351280212402344, -0.06155109405517578, -0.059589385986328125, -0.05762767791748047, -0.05566596984863281, -0.053704261779785156, -0.0517425537109375, -0.049780845642089844, -0.04781913757324219, -0.04585742950439453, -0.043895721435546875, -0.04193401336669922, -0.03997230529785156, -0.038010597229003906, -0.03604888916015625, -0.034087181091308594, -0.03212547302246094, -0.03016376495361328, -0.028202056884765625, -0.02624034881591797, -0.024278640747070312, -0.022316932678222656, -0.020355224609375, -0.018393516540527344, -0.016431808471679688, -0.014470100402832031, -0.012508392333984375, -0.010546684265136719, -0.008584976196289062, -0.006623268127441406, -0.00466156005859375, -0.0026998519897460938, -0.0007381439208984375, 0.0012235641479492188, 0.003185272216796875, 0.005146980285644531, 0.0071086883544921875, 0.009070396423339844, 0.0110321044921875, 0.012993812561035156, 0.014955520629882812, 0.01691722869873047, 0.018878936767578125, 0.02084064483642578, 0.022802352905273438, 0.024764060974121094, 0.02672576904296875, 0.028687477111816406, 0.030649185180664062, 0.03261089324951172, 0.034572601318359375, 0.03653430938720703, 0.03849601745605469, 0.040457725524902344, 0.04241943359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 8.0, 13.0, 36.0, 80.0, 197.0, 253.0, 219.0, 117.0, 55.0, 21.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.112252712249756, -3.05542254447937, -2.9985921382904053, -2.9417619705200195, -2.8849315643310547, -2.828101396560669, -2.771271228790283, -2.7144408226013184, -2.6576106548309326, -2.600780487060547, -2.543950080871582, -2.4871199131011963, -2.4302897453308105, -2.3734593391418457, -2.31662917137146, -2.259798765182495, -2.2029685974121094, -2.1461384296417236, -2.089308023452759, -2.032477855682373, -1.9756475687026978, -1.9188172817230225, -1.8619871139526367, -1.8051568269729614, -1.7483265399932861, -1.6914962530136108, -1.6346659660339355, -1.5778357982635498, -1.5210055112838745, -1.4641752243041992, -1.4073450565338135, -1.3505147695541382, -1.293684482574463, -1.2368541955947876, -1.1800239086151123, -1.1231937408447266, -1.0663634538650513, -1.009533166885376, -0.9527029395103455, -0.8958727121353149, -0.8390423655509949, -0.7822121381759644, -0.7253818511962891, -0.6685515642166138, -0.6117213368415833, -0.5548911094665527, -0.49806082248687744, -0.44123056530952454, -0.38440030813217163, -0.3275700509548187, -0.2707397937774658, -0.21390953660011292, -0.15707927942276, -0.1002490222454071, -0.0434187650680542, 0.013411492109298706, 0.07024174928665161, 0.12707200646400452, 0.18390226364135742, 0.24073252081871033, 0.29756277799606323, 0.35439303517341614, 0.41122329235076904, 0.46805354952812195, 0.5248838067054749]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 11.0, 7.0, 5.0, 14.0, 9.0, 19.0, 17.0, 21.0, 32.0, 19.0, 28.0, 27.0, 37.0, 49.0, 43.0, 48.0, 40.0, 30.0, 57.0, 50.0, 39.0, 43.0, 58.0, 39.0, 35.0, 34.0, 20.0, 23.0, 20.0, 19.0, 24.0, 15.0, 15.0, 12.0, 9.0, 9.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7116256952285767, -0.6907700896263123, -0.6699144840240479, -0.6490589380264282, -0.6282033324241638, -0.6073477268218994, -0.586492121219635, -0.5656365156173706, -0.544780969619751, -0.5239253640174866, -0.5030697584152222, -0.48221418261528015, -0.46135860681533813, -0.44050300121307373, -0.4196473956108093, -0.3987917900085449, -0.3779361844062805, -0.3570805788040161, -0.3362250030040741, -0.3153693974018097, -0.2945138216018677, -0.27365821599960327, -0.25280261039733887, -0.23194701969623566, -0.21109142899513245, -0.19023583829402924, -0.16938024759292603, -0.14852464199066162, -0.1276690512895584, -0.1068134605884552, -0.0859578549861908, -0.06510226428508759, -0.044246673583984375, -0.023391079157590866, -0.002535484731197357, 0.01832011342048645, 0.03917570412158966, 0.06003129482269287, 0.08088690042495728, 0.10174249112606049, 0.1225980818271637, 0.1434536725282669, 0.16430926322937012, 0.18516486883163452, 0.20602045953273773, 0.22687605023384094, 0.24773165583610535, 0.26858723163604736, 0.28944283723831177, 0.31029844284057617, 0.3311540186405182, 0.3520096242427826, 0.3728652000427246, 0.393720805644989, 0.4145764112472534, 0.4354320168495178, 0.45628759264945984, 0.47714319825172424, 0.49799877405166626, 0.5188543796539307, 0.5397099852561951, 0.5605655908584595, 0.5814211368560791, 0.6022767424583435, 0.6231323480606079]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 8.0, 8.0, 6.0, 12.0, 22.0, 26.0, 51.0, 69.0, 127.0, 207.0, 352.0, 747.0, 1337.0, 2595.0, 5686.0, 14541.0, 47094.0, 239130.0, 3378767.0, 404520.0, 65627.0, 19384.0, 7345.0, 3102.0, 1502.0, 926.0, 449.0, 250.0, 141.0, 89.0, 53.0, 35.0, 22.0, 15.0, 17.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1741943359375, -0.16956329345703125, -0.1649322509765625, -0.16030120849609375, -0.155670166015625, -0.15103912353515625, -0.1464080810546875, -0.14177703857421875, -0.13714599609375, -0.13251495361328125, -0.1278839111328125, -0.12325286865234375, -0.118621826171875, -0.11399078369140625, -0.1093597412109375, -0.10472869873046875, -0.10009765625, -0.09546661376953125, -0.0908355712890625, -0.08620452880859375, -0.081573486328125, -0.07694244384765625, -0.0723114013671875, -0.06768035888671875, -0.06304931640625, -0.05841827392578125, -0.0537872314453125, -0.04915618896484375, -0.044525146484375, -0.03989410400390625, -0.0352630615234375, -0.03063201904296875, -0.0260009765625, -0.02136993408203125, -0.0167388916015625, -0.01210784912109375, -0.007476806640625, -0.00284576416015625, 0.0017852783203125, 0.00641632080078125, 0.01104736328125, 0.01567840576171875, 0.0203094482421875, 0.02494049072265625, 0.029571533203125, 0.03420257568359375, 0.0388336181640625, 0.04346466064453125, 0.048095703125, 0.05272674560546875, 0.0573577880859375, 0.06198883056640625, 0.066619873046875, 0.07125091552734375, 0.0758819580078125, 0.08051300048828125, 0.08514404296875, 0.08977508544921875, 0.0944061279296875, 0.09903717041015625, 0.103668212890625, 0.10829925537109375, 0.1129302978515625, 0.11756134033203125, 0.1221923828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 20.0, 5.0, 18.0, 31.0, 34.0, 44.0, 55.0, 57.0, 68.0, 80.0, 80.0, 75.0, 80.0, 67.0, 51.0, 51.0, 40.0, 42.0, 26.0, 28.0, 14.0, 12.0, 4.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046875, -0.04561281204223633, -0.044350624084472656, -0.043088436126708984, -0.04182624816894531, -0.04056406021118164, -0.03930187225341797, -0.0380396842956543, -0.036777496337890625, -0.03551530838012695, -0.03425312042236328, -0.03299093246459961, -0.03172874450683594, -0.030466556549072266, -0.029204368591308594, -0.027942180633544922, -0.02667999267578125, -0.025417804718017578, -0.024155616760253906, -0.022893428802490234, -0.021631240844726562, -0.02036905288696289, -0.01910686492919922, -0.017844676971435547, -0.016582489013671875, -0.015320301055908203, -0.014058113098144531, -0.01279592514038086, -0.011533737182617188, -0.010271549224853516, -0.009009361267089844, -0.007747173309326172, -0.0064849853515625, -0.005222797393798828, -0.003960609436035156, -0.0026984214782714844, -0.0014362335205078125, -0.00017404556274414062, 0.0010881423950195312, 0.002350330352783203, 0.003612518310546875, 0.004874706268310547, 0.006136894226074219, 0.007399082183837891, 0.008661270141601562, 0.009923458099365234, 0.011185646057128906, 0.012447834014892578, 0.01371002197265625, 0.014972209930419922, 0.016234397888183594, 0.017496585845947266, 0.018758773803710938, 0.02002096176147461, 0.02128314971923828, 0.022545337677001953, 0.023807525634765625, 0.025069713592529297, 0.02633190155029297, 0.02759408950805664, 0.028856277465820312, 0.030118465423583984, 0.031380653381347656, 0.03264284133911133, 0.033905029296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 11.0, 17.0, 28.0, 36.0, 46.0, 93.0, 128.0, 356.0, 1110.0, 4919.0, 42590.0, 2083802.0, 2011751.0, 42292.0, 4992.0, 1168.0, 428.0, 192.0, 97.0, 68.0, 38.0, 34.0, 28.0, 11.0, 14.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.277099609375, -0.2675437927246094, -0.25798797607421875, -0.24843215942382812, -0.2388763427734375, -0.22932052612304688, -0.21976470947265625, -0.21020889282226562, -0.200653076171875, -0.19109725952148438, -0.18154144287109375, -0.17198562622070312, -0.1624298095703125, -0.15287399291992188, -0.14331817626953125, -0.13376235961914062, -0.12420654296875, -0.11465072631835938, -0.10509490966796875, -0.09553909301757812, -0.0859832763671875, -0.07642745971679688, -0.06687164306640625, -0.057315826416015625, -0.047760009765625, -0.038204193115234375, -0.02864837646484375, -0.019092559814453125, -0.0095367431640625, 1.9073486328125e-05, 0.00957489013671875, 0.019130706787109375, 0.0286865234375, 0.038242340087890625, 0.04779815673828125, 0.057353973388671875, 0.0669097900390625, 0.07646560668945312, 0.08602142333984375, 0.09557723999023438, 0.105133056640625, 0.11468887329101562, 0.12424468994140625, 0.13380050659179688, 0.1433563232421875, 0.15291213989257812, 0.16246795654296875, 0.17202377319335938, 0.18157958984375, 0.19113540649414062, 0.20069122314453125, 0.21024703979492188, 0.2198028564453125, 0.22935867309570312, 0.23891448974609375, 0.24847030639648438, 0.258026123046875, 0.2675819396972656, 0.27713775634765625, 0.2866935729980469, 0.2962493896484375, 0.3058052062988281, 0.31536102294921875, 0.3249168395996094, 0.33447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 8.0, 19.0, 36.0, 42.0, 73.0, 142.0, 310.0, 818.0, 1534.0, 544.0, 231.0, 129.0, 80.0, 37.0, 22.0, 17.0, 8.0, 5.0, 0.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0654296875, -0.06235504150390625, -0.0592803955078125, -0.05620574951171875, -0.053131103515625, -0.05005645751953125, -0.0469818115234375, -0.04390716552734375, -0.04083251953125, -0.03775787353515625, -0.0346832275390625, -0.03160858154296875, -0.028533935546875, -0.02545928955078125, -0.0223846435546875, -0.01930999755859375, -0.0162353515625, -0.01316070556640625, -0.0100860595703125, -0.00701141357421875, -0.003936767578125, -0.00086212158203125, 0.0022125244140625, 0.00528717041015625, 0.00836181640625, 0.01143646240234375, 0.0145111083984375, 0.01758575439453125, 0.020660400390625, 0.02373504638671875, 0.0268096923828125, 0.02988433837890625, 0.032958984375, 0.03603363037109375, 0.0391082763671875, 0.04218292236328125, 0.045257568359375, 0.04833221435546875, 0.0514068603515625, 0.05448150634765625, 0.05755615234375, 0.06063079833984375, 0.0637054443359375, 0.06678009033203125, 0.069854736328125, 0.07292938232421875, 0.0760040283203125, 0.07907867431640625, 0.0821533203125, 0.08522796630859375, 0.0883026123046875, 0.09137725830078125, 0.094451904296875, 0.09752655029296875, 0.1006011962890625, 0.10367584228515625, 0.10675048828125, 0.10982513427734375, 0.1128997802734375, 0.11597442626953125, 0.119049072265625, 0.12212371826171875, 0.1251983642578125, 0.12827301025390625, 0.13134765625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 10.0, 39.0, 63.0, 138.0, 178.0, 199.0, 152.0, 91.0, 62.0, 31.0, 13.0, 10.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32728344202041626, -0.30531027913093567, -0.2833371162414551, -0.2613639235496521, -0.2393907606601715, -0.21741759777069092, -0.19544441998004913, -0.17347124218940735, -0.15149807929992676, -0.12952491641044617, -0.10755173861980438, -0.0855785682797432, -0.063605397939682, -0.04163222759962082, -0.01965905725955963, 0.0023141205310821533, 0.024287283420562744, 0.04626045376062393, 0.06823362410068512, 0.09020679444074631, 0.1121799647808075, 0.13415312767028809, 0.15612630546092987, 0.17809948325157166, 0.20007264614105225, 0.22204580903053284, 0.24401898682117462, 0.2659921646118164, 0.287965327501297, 0.3099384903907776, 0.33191168308258057, 0.35388484597206116, 0.3758580684661865, 0.3978312313556671, 0.4198043942451477, 0.4417775869369507, 0.4637507498264313, 0.48572391271591187, 0.5076971054077148, 0.529670238494873, 0.551643431186676, 0.573616623878479, 0.5955897569656372, 0.6175629496574402, 0.6395361423492432, 0.6615092754364014, 0.6834824681282043, 0.7054556608200073, 0.7274287939071655, 0.7494019865989685, 0.7713751196861267, 0.7933483123779297, 0.8153214454650879, 0.8372946381568909, 0.8592678308486938, 0.881240963935852, 0.903214156627655, 0.925187349319458, 0.9471604824066162, 0.9691336750984192, 0.9911068677902222, 1.0130800008773804, 1.0350531339645386, 1.0570263862609863, 1.0789995193481445]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 2.0, 6.0, 6.0, 9.0, 16.0, 14.0, 15.0, 17.0, 22.0, 27.0, 18.0, 25.0, 26.0, 33.0, 30.0, 35.0, 38.0, 41.0, 42.0, 48.0, 47.0, 44.0, 36.0, 41.0, 38.0, 42.0, 26.0, 31.0, 29.0, 21.0, 26.0, 18.0, 24.0, 20.0, 16.0, 12.0, 11.0, 7.0, 6.0, 8.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24209856986999512, -0.23471969366073608, -0.22734081745147705, -0.21996194124221802, -0.21258306503295898, -0.20520418882369995, -0.19782531261444092, -0.19044643640518188, -0.18306756019592285, -0.17568868398666382, -0.16830980777740479, -0.16093093156814575, -0.15355205535888672, -0.14617317914962769, -0.13879430294036865, -0.13141542673110962, -0.12403655052185059, -0.11665767431259155, -0.10927879810333252, -0.10189992189407349, -0.09452104568481445, -0.08714216947555542, -0.07976329326629639, -0.07238441705703735, -0.06500554084777832, -0.05762666463851929, -0.050247788429260254, -0.04286891222000122, -0.03549003601074219, -0.028111159801483154, -0.02073228359222412, -0.013353407382965088, -0.005974531173706055, 0.0014043450355529785, 0.008783221244812012, 0.016162097454071045, 0.023540973663330078, 0.03091984987258911, 0.038298726081848145, 0.04567760229110718, 0.05305647850036621, 0.060435354709625244, 0.06781423091888428, 0.07519310712814331, 0.08257198333740234, 0.08995085954666138, 0.09732973575592041, 0.10470861196517944, 0.11208748817443848, 0.11946636438369751, 0.12684524059295654, 0.13422411680221558, 0.1416029930114746, 0.14898186922073364, 0.15636074542999268, 0.1637396216392517, 0.17111849784851074, 0.17849737405776978, 0.1858762502670288, 0.19325512647628784, 0.20063400268554688, 0.2080128788948059, 0.21539175510406494, 0.22277063131332397, 0.230149507522583]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 9.0, 13.0, 12.0, 21.0, 27.0, 66.0, 72.0, 105.0, 178.0, 320.0, 539.0, 1030.0, 2084.0, 4542.0, 10220.0, 24735.0, 63744.0, 187852.0, 458092.0, 187035.0, 63875.0, 24845.0, 10232.0, 4461.0, 2110.0, 1014.0, 532.0, 318.0, 172.0, 107.0, 71.0, 47.0, 30.0, 17.0, 13.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.138916015625, -0.13436126708984375, -0.1298065185546875, -0.12525177001953125, -0.120697021484375, -0.11614227294921875, -0.1115875244140625, -0.10703277587890625, -0.10247802734375, -0.09792327880859375, -0.0933685302734375, -0.08881378173828125, -0.084259033203125, -0.07970428466796875, -0.0751495361328125, -0.07059478759765625, -0.0660400390625, -0.06148529052734375, -0.0569305419921875, -0.05237579345703125, -0.047821044921875, -0.04326629638671875, -0.0387115478515625, -0.03415679931640625, -0.02960205078125, -0.02504730224609375, -0.0204925537109375, -0.01593780517578125, -0.011383056640625, -0.00682830810546875, -0.0022735595703125, 0.00228118896484375, 0.0068359375, 0.01139068603515625, 0.0159454345703125, 0.02050018310546875, 0.025054931640625, 0.02960968017578125, 0.0341644287109375, 0.03871917724609375, 0.04327392578125, 0.04782867431640625, 0.0523834228515625, 0.05693817138671875, 0.061492919921875, 0.06604766845703125, 0.0706024169921875, 0.07515716552734375, 0.0797119140625, 0.08426666259765625, 0.0888214111328125, 0.09337615966796875, 0.097930908203125, 0.10248565673828125, 0.1070404052734375, 0.11159515380859375, 0.11614990234375, 0.12070465087890625, 0.1252593994140625, 0.12981414794921875, 0.134368896484375, 0.13892364501953125, 0.1434783935546875, 0.14803314208984375, 0.152587890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 11.0, 14.0, 17.0, 20.0, 33.0, 51.0, 54.0, 54.0, 65.0, 70.0, 64.0, 70.0, 74.0, 65.0, 61.0, 65.0, 47.0, 30.0, 37.0, 38.0, 16.0, 9.0, 10.0, 8.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042266845703125, -0.041043758392333984, -0.03982067108154297, -0.03859758377075195, -0.03737449645996094, -0.03615140914916992, -0.034928321838378906, -0.03370523452758789, -0.032482147216796875, -0.03125905990600586, -0.030035972595214844, -0.028812885284423828, -0.027589797973632812, -0.026366710662841797, -0.02514362335205078, -0.023920536041259766, -0.02269744873046875, -0.021474361419677734, -0.02025127410888672, -0.019028186798095703, -0.017805099487304688, -0.016582012176513672, -0.015358924865722656, -0.01413583755493164, -0.012912750244140625, -0.01168966293334961, -0.010466575622558594, -0.009243488311767578, -0.008020401000976562, -0.006797313690185547, -0.005574226379394531, -0.004351139068603516, -0.0031280517578125, -0.0019049644470214844, -0.0006818771362304688, 0.0005412101745605469, 0.0017642974853515625, 0.002987384796142578, 0.004210472106933594, 0.005433559417724609, 0.006656646728515625, 0.00787973403930664, 0.009102821350097656, 0.010325908660888672, 0.011548995971679688, 0.012772083282470703, 0.013995170593261719, 0.015218257904052734, 0.01644134521484375, 0.017664432525634766, 0.01888751983642578, 0.020110607147216797, 0.021333694458007812, 0.022556781768798828, 0.023779869079589844, 0.02500295639038086, 0.026226043701171875, 0.02744913101196289, 0.028672218322753906, 0.029895305633544922, 0.031118392944335938, 0.03234148025512695, 0.03356456756591797, 0.034787654876708984, 0.0360107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 3.0, 7.0, 7.0, 12.0, 7.0, 15.0, 12.0, 27.0, 43.0, 42.0, 71.0, 88.0, 123.0, 150.0, 231.0, 391.0, 606.0, 1113.0, 2129.0, 4798.0, 11976.0, 33691.0, 104004.0, 380730.0, 358053.0, 97417.0, 31796.0, 11407.0, 4560.0, 2157.0, 1124.0, 594.0, 355.0, 256.0, 164.0, 111.0, 78.0, 48.0, 39.0, 31.0, 31.0, 22.0, 6.0, 6.0, 8.0, 6.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.13232421875, -0.12818527221679688, -0.12404632568359375, -0.11990737915039062, -0.1157684326171875, -0.11162948608398438, -0.10749053955078125, -0.10335159301757812, -0.099212646484375, -0.09507369995117188, -0.09093475341796875, -0.08679580688476562, -0.0826568603515625, -0.07851791381835938, -0.07437896728515625, -0.07024002075195312, -0.06610107421875, -0.061962127685546875, -0.05782318115234375, -0.053684234619140625, -0.0495452880859375, -0.045406341552734375, -0.04126739501953125, -0.037128448486328125, -0.032989501953125, -0.028850555419921875, -0.02471160888671875, -0.020572662353515625, -0.0164337158203125, -0.012294769287109375, -0.00815582275390625, -0.004016876220703125, 0.0001220703125, 0.004261016845703125, 0.00839996337890625, 0.012538909912109375, 0.0166778564453125, 0.020816802978515625, 0.02495574951171875, 0.029094696044921875, 0.033233642578125, 0.037372589111328125, 0.04151153564453125, 0.045650482177734375, 0.0497894287109375, 0.053928375244140625, 0.05806732177734375, 0.062206268310546875, 0.06634521484375, 0.07048416137695312, 0.07462310791015625, 0.07876205444335938, 0.0829010009765625, 0.08703994750976562, 0.09117889404296875, 0.09531784057617188, 0.099456787109375, 0.10359573364257812, 0.10773468017578125, 0.11187362670898438, 0.1160125732421875, 0.12015151977539062, 0.12429046630859375, 0.12842941284179688, 0.132568359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 2.0, 8.0, 12.0, 12.0, 7.0, 11.0, 15.0, 23.0, 19.0, 16.0, 29.0, 27.0, 22.0, 35.0, 38.0, 41.0, 35.0, 37.0, 45.0, 41.0, 33.0, 38.0, 36.0, 54.0, 39.0, 27.0, 32.0, 38.0, 29.0, 25.0, 21.0, 25.0, 26.0, 18.0, 22.0, 10.0, 6.0, 8.0, 11.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1204833984375, -0.1167898178100586, -0.11309623718261719, -0.10940265655517578, -0.10570907592773438, -0.10201549530029297, -0.09832191467285156, -0.09462833404541016, -0.09093475341796875, -0.08724117279052734, -0.08354759216308594, -0.07985401153564453, -0.07616043090820312, -0.07246685028076172, -0.06877326965332031, -0.0650796890258789, -0.0613861083984375, -0.057692527770996094, -0.05399894714355469, -0.05030536651611328, -0.046611785888671875, -0.04291820526123047, -0.03922462463378906, -0.035531044006347656, -0.03183746337890625, -0.028143882751464844, -0.024450302124023438, -0.02075672149658203, -0.017063140869140625, -0.013369560241699219, -0.009675979614257812, -0.005982398986816406, -0.002288818359375, 0.0014047622680664062, 0.0050983428955078125, 0.008791923522949219, 0.012485504150390625, 0.01617908477783203, 0.019872665405273438, 0.023566246032714844, 0.02725982666015625, 0.030953407287597656, 0.03464698791503906, 0.03834056854248047, 0.042034149169921875, 0.04572772979736328, 0.04942131042480469, 0.053114891052246094, 0.0568084716796875, 0.060502052307128906, 0.06419563293457031, 0.06788921356201172, 0.07158279418945312, 0.07527637481689453, 0.07896995544433594, 0.08266353607177734, 0.08635711669921875, 0.09005069732666016, 0.09374427795410156, 0.09743785858154297, 0.10113143920898438, 0.10482501983642578, 0.10851860046386719, 0.1122121810913086, 0.11590576171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 7.0, 9.0, 9.0, 11.0, 16.0, 17.0, 29.0, 42.0, 69.0, 85.0, 168.0, 300.0, 666.0, 1674.0, 5629.0, 31113.0, 542668.0, 431165.0, 26760.0, 5168.0, 1536.0, 640.0, 275.0, 154.0, 105.0, 51.0, 41.0, 23.0, 17.0, 16.0, 17.0, 12.0, 7.0, 8.0, 8.0, 6.0, 7.0, 2.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2080078125, -0.20129013061523438, -0.19457244873046875, -0.18785476684570312, -0.1811370849609375, -0.17441940307617188, -0.16770172119140625, -0.16098403930664062, -0.154266357421875, -0.14754867553710938, -0.14083099365234375, -0.13411331176757812, -0.1273956298828125, -0.12067794799804688, -0.11396026611328125, -0.10724258422851562, -0.10052490234375, -0.09380722045898438, -0.08708953857421875, -0.08037185668945312, -0.0736541748046875, -0.06693649291992188, -0.06021881103515625, -0.053501129150390625, -0.046783447265625, -0.040065765380859375, -0.03334808349609375, -0.026630401611328125, -0.0199127197265625, -0.013195037841796875, -0.00647735595703125, 0.000240325927734375, 0.0069580078125, 0.013675689697265625, 0.02039337158203125, 0.027111053466796875, 0.0338287353515625, 0.040546417236328125, 0.04726409912109375, 0.053981781005859375, 0.060699462890625, 0.06741714477539062, 0.07413482666015625, 0.08085250854492188, 0.0875701904296875, 0.09428787231445312, 0.10100555419921875, 0.10772323608398438, 0.11444091796875, 0.12115859985351562, 0.12787628173828125, 0.13459396362304688, 0.1413116455078125, 0.14802932739257812, 0.15474700927734375, 0.16146469116210938, 0.168182373046875, 0.17490005493164062, 0.18161773681640625, 0.18833541870117188, 0.1950531005859375, 0.20177078247070312, 0.20848846435546875, 0.21520614624023438, 0.221923828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 12.0, 7.0, 14.0, 16.0, 27.0, 35.0, 66.0, 74.0, 98.0, 104.0, 119.0, 87.0, 86.0, 80.0, 65.0, 34.0, 23.0, 13.0, 13.0, 11.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001437664031982422, -0.0001403680071234703, -0.00013696961104869843, -0.00013357121497392654, -0.00013017281889915466, -0.00012677442282438278, -0.0001233760267496109, -0.00011997763067483902, -0.00011657923460006714, -0.00011318083852529526, -0.00010978244245052338, -0.0001063840463757515, -0.00010298565030097961, -9.958725422620773e-05, -9.618885815143585e-05, -9.279046207666397e-05, -8.939206600189209e-05, -8.599366992712021e-05, -8.259527385234833e-05, -7.919687777757645e-05, -7.579848170280457e-05, -7.240008562803268e-05, -6.90016895532608e-05, -6.560329347848892e-05, -6.220489740371704e-05, -5.880650132894516e-05, -5.540810525417328e-05, -5.20097091794014e-05, -4.8611313104629517e-05, -4.5212917029857635e-05, -4.1814520955085754e-05, -3.841612488031387e-05, -3.501772880554199e-05, -3.161933273077011e-05, -2.822093665599823e-05, -2.482254058122635e-05, -2.1424144506454468e-05, -1.8025748431682587e-05, -1.4627352356910706e-05, -1.1228956282138824e-05, -7.830560207366943e-06, -4.432164132595062e-06, -1.0337680578231812e-06, 2.3646280169487e-06, 5.763024091720581e-06, 9.161420166492462e-06, 1.2559816241264343e-05, 1.5958212316036224e-05, 1.9356608390808105e-05, 2.2755004465579987e-05, 2.6153400540351868e-05, 2.955179661512375e-05, 3.295019268989563e-05, 3.634858876466751e-05, 3.974698483943939e-05, 4.314538091421127e-05, 4.6543776988983154e-05, 4.9942173063755035e-05, 5.3340569138526917e-05, 5.67389652132988e-05, 6.013736128807068e-05, 6.353575736284256e-05, 6.693415343761444e-05, 7.033254951238632e-05, 7.37309455871582e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 11.0, 8.0, 19.0, 29.0, 57.0, 98.0, 202.0, 381.0, 943.0, 3329.0, 20007.0, 451521.0, 544148.0, 22283.0, 3655.0, 991.0, 367.0, 214.0, 105.0, 69.0, 37.0, 26.0, 13.0, 6.0, 9.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.27734375, -0.2702369689941406, -0.26313018798828125, -0.2560234069824219, -0.2489166259765625, -0.24180984497070312, -0.23470306396484375, -0.22759628295898438, -0.220489501953125, -0.21338272094726562, -0.20627593994140625, -0.19916915893554688, -0.1920623779296875, -0.18495559692382812, -0.17784881591796875, -0.17074203491210938, -0.16363525390625, -0.15652847290039062, -0.14942169189453125, -0.14231491088867188, -0.1352081298828125, -0.12810134887695312, -0.12099456787109375, -0.11388778686523438, -0.106781005859375, -0.09967422485351562, -0.09256744384765625, -0.08546066284179688, -0.0783538818359375, -0.07124710083007812, -0.06414031982421875, -0.057033538818359375, -0.0499267578125, -0.042819976806640625, -0.03571319580078125, -0.028606414794921875, -0.0214996337890625, -0.014392852783203125, -0.00728607177734375, -0.000179290771484375, 0.006927490234375, 0.014034271240234375, 0.02114105224609375, 0.028247833251953125, 0.0353546142578125, 0.042461395263671875, 0.04956817626953125, 0.056674957275390625, 0.06378173828125, 0.07088851928710938, 0.07799530029296875, 0.08510208129882812, 0.0922088623046875, 0.09931564331054688, 0.10642242431640625, 0.11352920532226562, 0.120635986328125, 0.12774276733398438, 0.13484954833984375, 0.14195632934570312, 0.1490631103515625, 0.15616989135742188, 0.16327667236328125, 0.17038345336914062, 0.177490234375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 12.0, 14.0, 22.0, 30.0, 39.0, 58.0, 114.0, 132.0, 143.0, 120.0, 101.0, 54.0, 43.0, 26.0, 20.0, 21.0, 10.0, 5.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111328125, -0.1080942153930664, -0.10486030578613281, -0.10162639617919922, -0.09839248657226562, -0.09515857696533203, -0.09192466735839844, -0.08869075775146484, -0.08545684814453125, -0.08222293853759766, -0.07898902893066406, -0.07575511932373047, -0.07252120971679688, -0.06928730010986328, -0.06605339050292969, -0.0628194808959961, -0.0595855712890625, -0.056351661682128906, -0.05311775207519531, -0.04988384246826172, -0.046649932861328125, -0.04341602325439453, -0.04018211364746094, -0.036948204040527344, -0.03371429443359375, -0.030480384826660156, -0.027246475219726562, -0.02401256561279297, -0.020778656005859375, -0.01754474639892578, -0.014310836791992188, -0.011076927185058594, -0.007843017578125, -0.004609107971191406, -0.0013751983642578125, 0.0018587112426757812, 0.005092620849609375, 0.008326530456542969, 0.011560440063476562, 0.014794349670410156, 0.01802825927734375, 0.021262168884277344, 0.024496078491210938, 0.02772998809814453, 0.030963897705078125, 0.03419780731201172, 0.03743171691894531, 0.040665626525878906, 0.0438995361328125, 0.047133445739746094, 0.05036735534667969, 0.05360126495361328, 0.056835174560546875, 0.06006908416748047, 0.06330299377441406, 0.06653690338134766, 0.06977081298828125, 0.07300472259521484, 0.07623863220214844, 0.07947254180908203, 0.08270645141601562, 0.08594036102294922, 0.08917427062988281, 0.0924081802368164, 0.09564208984375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 8.0, 27.0, 67.0, 116.0, 182.0, 231.0, 199.0, 111.0, 47.0, 13.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8055821657180786, -0.7406996488571167, -0.6758171319961548, -0.6109346747398376, -0.5460521578788757, -0.4811696410179138, -0.4162871539592743, -0.35140466690063477, -0.28652215003967285, -0.22163964807987213, -0.1567571461200714, -0.09187464416027069, -0.02699214220046997, 0.03789037466049194, 0.10277286171913147, 0.167655348777771, 0.2325378656387329, 0.2974203824996948, 0.36230286955833435, 0.4271853566169739, 0.4920678734779358, 0.5569503903388977, 0.6218328475952148, 0.6867153644561768, 0.7515978813171387, 0.8164803981781006, 0.8813629150390625, 0.9462453722953796, 1.0111279487609863, 1.0760104656219482, 1.1408928632736206, 1.2057753801345825, 1.270658016204834, 1.335540533065796, 1.4004230499267578, 1.4653055667877197, 1.5301880836486816, 1.5950706005096436, 1.659952998161316, 1.7248355150222778, 1.7897180318832397, 1.8546005487442017, 1.9194830656051636, 1.9843655824661255, 2.049247980117798, 2.1141304969787598, 2.1790130138397217, 2.2438955307006836, 2.3087780475616455, 2.3736605644226074, 2.4385430812835693, 2.5034255981445312, 2.568308115005493, 2.633190631866455, 2.698073148727417, 2.762955665588379, 2.8278379440307617, 2.8927204608917236, 2.9576029777526855, 3.0224854946136475, 3.0873680114746094, 3.1522505283355713, 3.217133045196533, 3.282015323638916, 3.346898078918457]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 2.0, 5.0, 5.0, 8.0, 16.0, 10.0, 13.0, 21.0, 13.0, 30.0, 20.0, 28.0, 29.0, 30.0, 35.0, 44.0, 35.0, 37.0, 40.0, 39.0, 46.0, 45.0, 37.0, 36.0, 41.0, 32.0, 41.0, 28.0, 26.0, 31.0, 33.0, 26.0, 17.0, 17.0, 9.0, 11.0, 12.0, 7.0, 10.0, 10.0, 5.0, 5.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6402153372764587, -0.6184554100036621, -0.5966954231262207, -0.5749354958534241, -0.5531755685806274, -0.531415581703186, -0.5096556544303894, -0.4878957271575928, -0.46613577008247375, -0.44437581300735474, -0.4226158857345581, -0.4008559286594391, -0.37909597158432007, -0.35733604431152344, -0.3355760872364044, -0.3138161301612854, -0.29205620288848877, -0.27029624581336975, -0.24853631854057312, -0.2267763614654541, -0.20501641929149628, -0.18325647711753845, -0.16149652004241943, -0.1397365778684616, -0.11797663569450378, -0.09621669352054596, -0.07445674389600754, -0.052696794271469116, -0.03093685209751129, -0.009176909923553467, 0.012583047151565552, 0.034342989325523376, 0.0561029314994812, 0.07786287367343903, 0.09962282329797745, 0.12138277292251587, 0.1431427150964737, 0.16490265727043152, 0.18666261434555054, 0.20842255651950836, 0.2301824986934662, 0.2519424557685852, 0.27370238304138184, 0.29546234011650085, 0.3172222971916199, 0.3389822244644165, 0.3607421815395355, 0.38250213861465454, 0.40426206588745117, 0.4260220229625702, 0.4477819502353668, 0.46954190731048584, 0.49130183458328247, 0.5130617618560791, 0.5348217487335205, 0.5565816760063171, 0.5783416032791138, 0.6001015305519104, 0.6218615174293518, 0.6436214447021484, 0.6653813719749451, 0.6871412992477417, 0.7089012861251831, 0.7306612133979797, 0.7524212002754211]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 10.0, 19.0, 12.0, 21.0, 39.0, 53.0, 69.0, 111.0, 206.0, 324.0, 524.0, 966.0, 1621.0, 3155.0, 6933.0, 16965.0, 48291.0, 214491.0, 3338205.0, 445559.0, 75160.0, 23413.0, 9199.0, 4163.0, 2066.0, 1086.0, 630.0, 382.0, 204.0, 139.0, 105.0, 57.0, 29.0, 23.0, 15.0, 15.0, 5.0, 3.0, 6.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1337890625, -0.1295642852783203, -0.12533950805664062, -0.12111473083496094, -0.11688995361328125, -0.11266517639160156, -0.10844039916992188, -0.10421562194824219, -0.0999908447265625, -0.09576606750488281, -0.09154129028320312, -0.08731651306152344, -0.08309173583984375, -0.07886695861816406, -0.07464218139648438, -0.07041740417480469, -0.066192626953125, -0.06196784973144531, -0.057743072509765625, -0.05351829528808594, -0.04929351806640625, -0.04506874084472656, -0.040843963623046875, -0.03661918640136719, -0.0323944091796875, -0.028169631958007812, -0.023944854736328125, -0.019720077514648438, -0.01549530029296875, -0.011270523071289062, -0.007045745849609375, -0.0028209686279296875, 0.00140380859375, 0.0056285858154296875, 0.009853363037109375, 0.014078140258789062, 0.01830291748046875, 0.022527694702148438, 0.026752471923828125, 0.030977249145507812, 0.0352020263671875, 0.03942680358886719, 0.043651580810546875, 0.04787635803222656, 0.05210113525390625, 0.05632591247558594, 0.060550689697265625, 0.06477546691894531, 0.069000244140625, 0.07322502136230469, 0.07744979858398438, 0.08167457580566406, 0.08589935302734375, 0.09012413024902344, 0.09434890747070312, 0.09857368469238281, 0.1027984619140625, 0.10702323913574219, 0.11124801635742188, 0.11547279357910156, 0.11969757080078125, 0.12392234802246094, 0.12814712524414062, 0.1323719024658203, 0.1365966796875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 7.0, 10.0, 6.0, 17.0, 29.0, 24.0, 33.0, 41.0, 67.0, 58.0, 62.0, 66.0, 68.0, 77.0, 60.0, 65.0, 59.0, 46.0, 35.0, 37.0, 36.0, 16.0, 20.0, 14.0, 9.0, 8.0, 10.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.042999267578125, -0.04183626174926758, -0.040673255920410156, -0.039510250091552734, -0.03834724426269531, -0.03718423843383789, -0.03602123260498047, -0.03485822677612305, -0.033695220947265625, -0.0325322151184082, -0.03136920928955078, -0.03020620346069336, -0.029043197631835938, -0.027880191802978516, -0.026717185974121094, -0.025554180145263672, -0.02439117431640625, -0.023228168487548828, -0.022065162658691406, -0.020902156829833984, -0.019739151000976562, -0.01857614517211914, -0.01741313934326172, -0.016250133514404297, -0.015087127685546875, -0.013924121856689453, -0.012761116027832031, -0.01159811019897461, -0.010435104370117188, -0.009272098541259766, -0.008109092712402344, -0.006946086883544922, -0.0057830810546875, -0.004620075225830078, -0.0034570693969726562, -0.0022940635681152344, -0.0011310577392578125, 3.1948089599609375e-05, 0.0011949539184570312, 0.002357959747314453, 0.003520965576171875, 0.004683971405029297, 0.005846977233886719, 0.007009983062744141, 0.008172988891601562, 0.009335994720458984, 0.010499000549316406, 0.011662006378173828, 0.01282501220703125, 0.013988018035888672, 0.015151023864746094, 0.016314029693603516, 0.017477035522460938, 0.01864004135131836, 0.01980304718017578, 0.020966053009033203, 0.022129058837890625, 0.023292064666748047, 0.02445507049560547, 0.02561807632446289, 0.026781082153320312, 0.027944087982177734, 0.029107093811035156, 0.030270099639892578, 0.03143310546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 20.0, 18.0, 24.0, 70.0, 98.0, 182.0, 340.0, 758.0, 2502.0, 12598.0, 134676.0, 3839737.0, 183336.0, 15424.0, 2850.0, 859.0, 344.0, 176.0, 100.0, 61.0, 42.0, 21.0, 16.0, 6.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34228515625, -0.3302955627441406, -0.31830596923828125, -0.3063163757324219, -0.2943267822265625, -0.2823371887207031, -0.27034759521484375, -0.2583580017089844, -0.246368408203125, -0.23437881469726562, -0.22238922119140625, -0.21039962768554688, -0.1984100341796875, -0.18642044067382812, -0.17443084716796875, -0.16244125366210938, -0.15045166015625, -0.13846206665039062, -0.12647247314453125, -0.11448287963867188, -0.1024932861328125, -0.09050369262695312, -0.07851409912109375, -0.06652450561523438, -0.054534912109375, -0.042545318603515625, -0.03055572509765625, -0.018566131591796875, -0.0065765380859375, 0.005413055419921875, 0.01740264892578125, 0.029392242431640625, 0.0413818359375, 0.053371429443359375, 0.06536102294921875, 0.07735061645507812, 0.0893402099609375, 0.10132980346679688, 0.11331939697265625, 0.12530899047851562, 0.137298583984375, 0.14928817749023438, 0.16127777099609375, 0.17326736450195312, 0.1852569580078125, 0.19724655151367188, 0.20923614501953125, 0.22122573852539062, 0.23321533203125, 0.24520492553710938, 0.25719451904296875, 0.2691841125488281, 0.2811737060546875, 0.2931632995605469, 0.30515289306640625, 0.3171424865722656, 0.329132080078125, 0.3411216735839844, 0.35311126708984375, 0.3651008605957031, 0.3770904541015625, 0.3890800476074219, 0.40106964111328125, 0.4130592346191406, 0.425048828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 12.0, 26.0, 45.0, 90.0, 176.0, 479.0, 2147.0, 673.0, 206.0, 93.0, 46.0, 41.0, 18.0, 11.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1339111328125, -0.12967681884765625, -0.1254425048828125, -0.12120819091796875, -0.116973876953125, -0.11273956298828125, -0.1085052490234375, -0.10427093505859375, -0.10003662109375, -0.09580230712890625, -0.0915679931640625, -0.08733367919921875, -0.083099365234375, -0.07886505126953125, -0.0746307373046875, -0.07039642333984375, -0.066162109375, -0.06192779541015625, -0.0576934814453125, -0.05345916748046875, -0.049224853515625, -0.04499053955078125, -0.0407562255859375, -0.03652191162109375, -0.03228759765625, -0.02805328369140625, -0.0238189697265625, -0.01958465576171875, -0.015350341796875, -0.01111602783203125, -0.0068817138671875, -0.00264739990234375, 0.0015869140625, 0.00582122802734375, 0.0100555419921875, 0.01428985595703125, 0.018524169921875, 0.02275848388671875, 0.0269927978515625, 0.03122711181640625, 0.03546142578125, 0.03969573974609375, 0.0439300537109375, 0.04816436767578125, 0.052398681640625, 0.05663299560546875, 0.0608673095703125, 0.06510162353515625, 0.0693359375, 0.07357025146484375, 0.0778045654296875, 0.08203887939453125, 0.086273193359375, 0.09050750732421875, 0.0947418212890625, 0.09897613525390625, 0.10321044921875, 0.10744476318359375, 0.1116790771484375, 0.11591339111328125, 0.120147705078125, 0.12438201904296875, 0.1286163330078125, 0.13285064697265625, 0.1370849609375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 12.0, 15.0, 38.0, 111.0, 182.0, 193.0, 174.0, 131.0, 95.0, 32.0, 15.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.087468147277832, -1.0614737272262573, -1.0354794263839722, -1.0094850063323975, -0.9834907054901123, -0.9574962854385376, -0.9315019249916077, -0.9055075645446777, -0.8795132040977478, -0.8535188436508179, -0.8275244832038879, -0.801530122756958, -0.7755357027053833, -0.7495414018630981, -0.7235469818115234, -0.6975526213645935, -0.6715582609176636, -0.6455639004707336, -0.6195695400238037, -0.5935751795768738, -0.5675808191299438, -0.5415863990783691, -0.5155920386314392, -0.4895976781845093, -0.46360331773757935, -0.4376089572906494, -0.4116145968437195, -0.38562020659446716, -0.35962584614753723, -0.3336314857006073, -0.307637095451355, -0.28164273500442505, -0.25564831495285034, -0.2296539545059204, -0.20365957915782928, -0.17766520380973816, -0.15167084336280823, -0.1256764829158783, -0.09968210756778717, -0.07368773221969604, -0.04769337177276611, -0.021699003875255585, 0.004295364022254944, 0.030289731919765472, 0.056284099817276, 0.08227846026420593, 0.10827283561229706, 0.13426721096038818, 0.16026157140731812, 0.18625593185424805, 0.21225030720233917, 0.2382446825504303, 0.26423904299736023, 0.29023340344429016, 0.3162277936935425, 0.3422221541404724, 0.36821651458740234, 0.3942108750343323, 0.4202052354812622, 0.4461996257305145, 0.47219398617744446, 0.4981883466243744, 0.5241827368736267, 0.5501770973205566, 0.5761714577674866]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 2.0, 6.0, 7.0, 3.0, 9.0, 17.0, 12.0, 15.0, 19.0, 20.0, 18.0, 25.0, 23.0, 34.0, 35.0, 33.0, 40.0, 41.0, 51.0, 39.0, 43.0, 45.0, 43.0, 47.0, 46.0, 41.0, 36.0, 29.0, 35.0, 27.0, 24.0, 26.0, 24.0, 10.0, 13.0, 10.0, 10.0, 6.0, 12.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27648842334747314, -0.2680753469467163, -0.2596622407436371, -0.25124916434288025, -0.24283607304096222, -0.2344229817390442, -0.22600989043712616, -0.21759679913520813, -0.2091837227344513, -0.20077063143253326, -0.19235754013061523, -0.1839444637298584, -0.17553137242794037, -0.16711828112602234, -0.1587051898241043, -0.15029209852218628, -0.14187900722026825, -0.13346591591835022, -0.1250528246164322, -0.11663974076509476, -0.10822665691375732, -0.0998135656118393, -0.09140047430992126, -0.08298738300800323, -0.0745742991566658, -0.06616120785474777, -0.05774812400341034, -0.04933503270149231, -0.04092194512486458, -0.03250885754823685, -0.024095766246318817, -0.015682678669691086, -0.0072695910930633545, 0.0011434974148869514, 0.009556585922837257, 0.017969675362110138, 0.02638276293873787, 0.0347958505153656, 0.04320894181728363, 0.05162202939391136, 0.06003511697053909, 0.06844820827245712, 0.07686129212379456, 0.08527438342571259, 0.09368747472763062, 0.10210055857896805, 0.11051364988088608, 0.11892673373222351, 0.12733982503414154, 0.13575291633605957, 0.1441660076379776, 0.15257909893989563, 0.16099217534065247, 0.1694052666425705, 0.17781835794448853, 0.18623144924640656, 0.19464454054832458, 0.20305763185024261, 0.21147072315216064, 0.21988379955291748, 0.2282968908548355, 0.23670998215675354, 0.24512307345867157, 0.2535361647605896, 0.26194924116134644]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 8.0, 18.0, 21.0, 20.0, 31.0, 57.0, 74.0, 138.0, 239.0, 371.0, 638.0, 1190.0, 2225.0, 4603.0, 9302.0, 19341.0, 40595.0, 86654.0, 198468.0, 345980.0, 183042.0, 81202.0, 38546.0, 17866.0, 8744.0, 4361.0, 2150.0, 1106.0, 595.0, 369.0, 218.0, 130.0, 75.0, 57.0, 40.0, 25.0, 17.0, 16.0, 10.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.11972618103027344, -0.11579513549804688, -0.11186408996582031, -0.10793304443359375, -0.10400199890136719, -0.10007095336914062, -0.09613990783691406, -0.0922088623046875, -0.08827781677246094, -0.08434677124023438, -0.08041572570800781, -0.07648468017578125, -0.07255363464355469, -0.06862258911132812, -0.06469154357910156, -0.060760498046875, -0.05682945251464844, -0.052898406982421875, -0.04896736145019531, -0.04503631591796875, -0.04110527038574219, -0.037174224853515625, -0.03324317932128906, -0.0293121337890625, -0.025381088256835938, -0.021450042724609375, -0.017518997192382812, -0.01358795166015625, -0.009656906127929688, -0.005725860595703125, -0.0017948150634765625, 0.00213623046875, 0.0060672760009765625, 0.009998321533203125, 0.013929367065429688, 0.01786041259765625, 0.021791458129882812, 0.025722503662109375, 0.029653549194335938, 0.0335845947265625, 0.03751564025878906, 0.041446685791015625, 0.04537773132324219, 0.04930877685546875, 0.05323982238769531, 0.057170867919921875, 0.06110191345214844, 0.065032958984375, 0.06896400451660156, 0.07289505004882812, 0.07682609558105469, 0.08075714111328125, 0.08468818664550781, 0.08861923217773438, 0.09255027770996094, 0.0964813232421875, 0.10041236877441406, 0.10434341430664062, 0.10827445983886719, 0.11220550537109375, 0.11613655090332031, 0.12006759643554688, 0.12399864196777344, 0.1279296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 12.0, 9.0, 14.0, 18.0, 23.0, 28.0, 35.0, 57.0, 56.0, 46.0, 71.0, 75.0, 63.0, 65.0, 62.0, 71.0, 54.0, 51.0, 42.0, 31.0, 24.0, 19.0, 21.0, 11.0, 8.0, 11.0, 7.0, 7.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.049407958984375, -0.04809999465942383, -0.046792030334472656, -0.045484066009521484, -0.04417610168457031, -0.04286813735961914, -0.04156017303466797, -0.0402522087097168, -0.038944244384765625, -0.03763628005981445, -0.03632831573486328, -0.03502035140991211, -0.03371238708496094, -0.032404422760009766, -0.031096458435058594, -0.029788494110107422, -0.02848052978515625, -0.027172565460205078, -0.025864601135253906, -0.024556636810302734, -0.023248672485351562, -0.02194070816040039, -0.02063274383544922, -0.019324779510498047, -0.018016815185546875, -0.016708850860595703, -0.015400886535644531, -0.01409292221069336, -0.012784957885742188, -0.011476993560791016, -0.010169029235839844, -0.008861064910888672, -0.0075531005859375, -0.006245136260986328, -0.004937171936035156, -0.0036292076110839844, -0.0023212432861328125, -0.0010132789611816406, 0.00029468536376953125, 0.0016026496887207031, 0.002910614013671875, 0.004218578338623047, 0.005526542663574219, 0.006834506988525391, 0.008142471313476562, 0.009450435638427734, 0.010758399963378906, 0.012066364288330078, 0.01337432861328125, 0.014682292938232422, 0.015990257263183594, 0.017298221588134766, 0.018606185913085938, 0.01991415023803711, 0.02122211456298828, 0.022530078887939453, 0.023838043212890625, 0.025146007537841797, 0.02645397186279297, 0.02776193618774414, 0.029069900512695312, 0.030377864837646484, 0.031685829162597656, 0.03299379348754883, 0.0343017578125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 5.0, 19.0, 13.0, 17.0, 33.0, 50.0, 82.0, 109.0, 158.0, 250.0, 334.0, 575.0, 941.0, 1956.0, 5060.0, 16475.0, 72638.0, 435067.0, 419621.0, 69772.0, 16071.0, 4773.0, 1933.0, 987.0, 527.0, 329.0, 228.0, 161.0, 104.0, 72.0, 52.0, 38.0, 31.0, 20.0, 7.0, 8.0, 12.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.190673828125, -0.1836090087890625, -0.176544189453125, -0.1694793701171875, -0.16241455078125, -0.1553497314453125, -0.148284912109375, -0.1412200927734375, -0.1341552734375, -0.1270904541015625, -0.120025634765625, -0.1129608154296875, -0.10589599609375, -0.0988311767578125, -0.091766357421875, -0.0847015380859375, -0.07763671875, -0.0705718994140625, -0.063507080078125, -0.0564422607421875, -0.04937744140625, -0.0423126220703125, -0.035247802734375, -0.0281829833984375, -0.0211181640625, -0.0140533447265625, -0.006988525390625, 7.62939453125e-05, 0.00714111328125, 0.0142059326171875, 0.021270751953125, 0.0283355712890625, 0.035400390625, 0.0424652099609375, 0.049530029296875, 0.0565948486328125, 0.06365966796875, 0.0707244873046875, 0.077789306640625, 0.0848541259765625, 0.0919189453125, 0.0989837646484375, 0.106048583984375, 0.1131134033203125, 0.12017822265625, 0.1272430419921875, 0.134307861328125, 0.1413726806640625, 0.1484375, 0.1555023193359375, 0.162567138671875, 0.1696319580078125, 0.17669677734375, 0.1837615966796875, 0.190826416015625, 0.1978912353515625, 0.2049560546875, 0.2120208740234375, 0.219085693359375, 0.2261505126953125, 0.23321533203125, 0.2402801513671875, 0.247344970703125, 0.2544097900390625, 0.261474609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 7.0, 6.0, 13.0, 8.0, 10.0, 23.0, 19.0, 27.0, 37.0, 47.0, 34.0, 48.0, 33.0, 46.0, 60.0, 48.0, 60.0, 54.0, 53.0, 44.0, 48.0, 42.0, 35.0, 37.0, 34.0, 27.0, 17.0, 20.0, 22.0, 11.0, 9.0, 4.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17236328125, -0.16698646545410156, -0.16160964965820312, -0.1562328338623047, -0.15085601806640625, -0.1454792022705078, -0.14010238647460938, -0.13472557067871094, -0.1293487548828125, -0.12397193908691406, -0.11859512329101562, -0.11321830749511719, -0.10784149169921875, -0.10246467590332031, -0.09708786010742188, -0.09171104431152344, -0.086334228515625, -0.08095741271972656, -0.07558059692382812, -0.07020378112792969, -0.06482696533203125, -0.05945014953613281, -0.054073333740234375, -0.04869651794433594, -0.0433197021484375, -0.03794288635253906, -0.032566070556640625, -0.027189254760742188, -0.02181243896484375, -0.016435623168945312, -0.011058807373046875, -0.0056819915771484375, -0.00030517578125, 0.0050716400146484375, 0.010448455810546875, 0.015825271606445312, 0.02120208740234375, 0.026578903198242188, 0.031955718994140625, 0.03733253479003906, 0.0427093505859375, 0.04808616638183594, 0.053462982177734375, 0.05883979797363281, 0.06421661376953125, 0.06959342956542969, 0.07497024536132812, 0.08034706115722656, 0.085723876953125, 0.09110069274902344, 0.09647750854492188, 0.10185432434082031, 0.10723114013671875, 0.11260795593261719, 0.11798477172851562, 0.12336158752441406, 0.1287384033203125, 0.13411521911621094, 0.13949203491210938, 0.1448688507080078, 0.15024566650390625, 0.1556224822998047, 0.16099929809570312, 0.16637611389160156, 0.1717529296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 11.0, 24.0, 22.0, 26.0, 30.0, 50.0, 79.0, 92.0, 176.0, 232.0, 386.0, 711.0, 1326.0, 2755.0, 7295.0, 33275.0, 372390.0, 570177.0, 44252.0, 8760.0, 3063.0, 1392.0, 773.0, 416.0, 250.0, 163.0, 110.0, 88.0, 63.0, 33.0, 31.0, 22.0, 11.0, 14.0, 12.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 5.0], "bins": [-0.255126953125, -0.2482452392578125, -0.241363525390625, -0.2344818115234375, -0.22760009765625, -0.2207183837890625, -0.213836669921875, -0.2069549560546875, -0.2000732421875, -0.1931915283203125, -0.186309814453125, -0.1794281005859375, -0.17254638671875, -0.1656646728515625, -0.158782958984375, -0.1519012451171875, -0.14501953125, -0.1381378173828125, -0.131256103515625, -0.1243743896484375, -0.11749267578125, -0.1106109619140625, -0.103729248046875, -0.0968475341796875, -0.0899658203125, -0.0830841064453125, -0.076202392578125, -0.0693206787109375, -0.06243896484375, -0.0555572509765625, -0.048675537109375, -0.0417938232421875, -0.034912109375, -0.0280303955078125, -0.021148681640625, -0.0142669677734375, -0.00738525390625, -0.0005035400390625, 0.006378173828125, 0.0132598876953125, 0.0201416015625, 0.0270233154296875, 0.033905029296875, 0.0407867431640625, 0.04766845703125, 0.0545501708984375, 0.061431884765625, 0.0683135986328125, 0.0751953125, 0.0820770263671875, 0.088958740234375, 0.0958404541015625, 0.10272216796875, 0.1096038818359375, 0.116485595703125, 0.1233673095703125, 0.1302490234375, 0.1371307373046875, 0.144012451171875, 0.1508941650390625, 0.15777587890625, 0.1646575927734375, 0.171539306640625, 0.1784210205078125, 0.185302734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 5.0, 12.0, 16.0, 15.0, 27.0, 36.0, 54.0, 61.0, 76.0, 90.0, 78.0, 85.0, 82.0, 87.0, 56.0, 55.0, 34.0, 29.0, 22.0, 17.0, 16.0, 11.0, 5.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010609626770019531, -0.00010310392826795578, -0.00010011158883571625, -9.711924940347672e-05, -9.412690997123718e-05, -9.113457053899765e-05, -8.814223110675812e-05, -8.514989167451859e-05, -8.215755224227905e-05, -7.916521281003952e-05, -7.617287337779999e-05, -7.318053394556046e-05, -7.018819451332092e-05, -6.719585508108139e-05, -6.420351564884186e-05, -6.121117621660233e-05, -5.821883678436279e-05, -5.522649735212326e-05, -5.223415791988373e-05, -4.9241818487644196e-05, -4.624947905540466e-05, -4.325713962316513e-05, -4.02648001909256e-05, -3.7272460758686066e-05, -3.428012132644653e-05, -3.1287781894207e-05, -2.8295442461967468e-05, -2.5303103029727936e-05, -2.2310763597488403e-05, -1.931842416524887e-05, -1.632608473300934e-05, -1.3333745300769806e-05, -1.0341405868530273e-05, -7.349066436290741e-06, -4.3567270040512085e-06, -1.364387571811676e-06, 1.6279518604278564e-06, 4.620291292667389e-06, 7.612630724906921e-06, 1.0604970157146454e-05, 1.3597309589385986e-05, 1.658964902162552e-05, 1.958198845386505e-05, 2.2574327886104584e-05, 2.5566667318344116e-05, 2.855900675058365e-05, 3.155134618282318e-05, 3.4543685615062714e-05, 3.7536025047302246e-05, 4.052836447954178e-05, 4.352070391178131e-05, 4.6513043344020844e-05, 4.9505382776260376e-05, 5.249772220849991e-05, 5.549006164073944e-05, 5.8482401072978973e-05, 6.14747405052185e-05, 6.446707993745804e-05, 6.745941936969757e-05, 7.04517588019371e-05, 7.344409823417664e-05, 7.643643766641617e-05, 7.94287770986557e-05, 8.242111653089523e-05, 8.541345596313477e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 7.0, 4.0, 12.0, 27.0, 24.0, 50.0, 74.0, 99.0, 183.0, 397.0, 711.0, 1585.0, 3829.0, 15446.0, 152458.0, 789589.0, 68657.0, 9905.0, 2857.0, 1268.0, 611.0, 296.0, 185.0, 99.0, 51.0, 31.0, 19.0, 10.0, 14.0, 3.0, 8.0, 8.0, 3.0, 10.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.22265625, -0.21555519104003906, -0.20845413208007812, -0.2013530731201172, -0.19425201416015625, -0.1871509552001953, -0.18004989624023438, -0.17294883728027344, -0.1658477783203125, -0.15874671936035156, -0.15164566040039062, -0.1445446014404297, -0.13744354248046875, -0.1303424835205078, -0.12324142456054688, -0.11614036560058594, -0.109039306640625, -0.10193824768066406, -0.09483718872070312, -0.08773612976074219, -0.08063507080078125, -0.07353401184082031, -0.06643295288085938, -0.05933189392089844, -0.0522308349609375, -0.04512977600097656, -0.038028717041015625, -0.030927658081054688, -0.02382659912109375, -0.016725540161132812, -0.009624481201171875, -0.0025234222412109375, 0.00457763671875, 0.011678695678710938, 0.018779754638671875, 0.025880813598632812, 0.03298187255859375, 0.04008293151855469, 0.047183990478515625, 0.05428504943847656, 0.0613861083984375, 0.06848716735839844, 0.07558822631835938, 0.08268928527832031, 0.08979034423828125, 0.09689140319824219, 0.10399246215820312, 0.11109352111816406, 0.118194580078125, 0.12529563903808594, 0.13239669799804688, 0.1394977569580078, 0.14659881591796875, 0.1536998748779297, 0.16080093383789062, 0.16790199279785156, 0.1750030517578125, 0.18210411071777344, 0.18920516967773438, 0.1963062286376953, 0.20340728759765625, 0.2105083465576172, 0.21760940551757812, 0.22471046447753906, 0.2318115234375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 6.0, 10.0, 24.0, 17.0, 36.0, 51.0, 55.0, 86.0, 133.0, 134.0, 120.0, 81.0, 71.0, 36.0, 36.0, 28.0, 16.0, 8.0, 7.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.1353759765625, -0.13167572021484375, -0.1279754638671875, -0.12427520751953125, -0.120574951171875, -0.11687469482421875, -0.1131744384765625, -0.10947418212890625, -0.10577392578125, -0.10207366943359375, -0.0983734130859375, -0.09467315673828125, -0.090972900390625, -0.08727264404296875, -0.0835723876953125, -0.07987213134765625, -0.076171875, -0.07247161865234375, -0.0687713623046875, -0.06507110595703125, -0.061370849609375, -0.05767059326171875, -0.0539703369140625, -0.05027008056640625, -0.04656982421875, -0.04286956787109375, -0.0391693115234375, -0.03546905517578125, -0.031768798828125, -0.02806854248046875, -0.0243682861328125, -0.02066802978515625, -0.0169677734375, -0.01326751708984375, -0.0095672607421875, -0.00586700439453125, -0.002166748046875, 0.00153350830078125, 0.0052337646484375, 0.00893402099609375, 0.01263427734375, 0.01633453369140625, 0.0200347900390625, 0.02373504638671875, 0.027435302734375, 0.03113555908203125, 0.0348358154296875, 0.03853607177734375, 0.042236328125, 0.04593658447265625, 0.0496368408203125, 0.05333709716796875, 0.057037353515625, 0.06073760986328125, 0.0644378662109375, 0.06813812255859375, 0.07183837890625, 0.07553863525390625, 0.0792388916015625, 0.08293914794921875, 0.086639404296875, 0.09033966064453125, 0.0940399169921875, 0.09774017333984375, 0.1014404296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 13.0, 37.0, 92.0, 156.0, 235.0, 179.0, 152.0, 84.0, 21.0, 15.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.650705099105835, -2.5721492767333984, -2.493593692779541, -2.4150378704071045, -2.336482048034668, -2.2579262256622314, -2.179370403289795, -2.1008148193359375, -2.022258996963501, -1.9437031745910645, -1.8651474714279175, -1.7865917682647705, -1.708035945892334, -1.6294801235198975, -1.5509244203567505, -1.4723687171936035, -1.393812894821167, -1.3152570724487305, -1.2367013692855835, -1.1581456661224365, -1.07958984375, -1.0010340213775635, -0.9224783182144165, -0.8439225554466248, -0.765366792678833, -0.6868110299110413, -0.6082552671432495, -0.5296995043754578, -0.451143741607666, -0.37258797883987427, -0.2940322160720825, -0.21547645330429077, -0.13692092895507812, -0.05836516618728638, 0.02019059658050537, 0.09874635934829712, 0.17730212211608887, 0.2558578848838806, 0.33441364765167236, 0.4129694104194641, 0.49152517318725586, 0.5700809359550476, 0.6486366987228394, 0.7271924614906311, 0.8057482242584229, 0.8843039870262146, 0.9628597497940063, 1.0414154529571533, 1.1199712753295898, 1.1985270977020264, 1.2770828008651733, 1.3556385040283203, 1.4341943264007568, 1.5127501487731934, 1.5913058519363403, 1.6698615550994873, 1.7484173774719238, 1.8269731998443604, 1.9055289030075073, 1.9840846061706543, 2.062640428543091, 2.1411962509155273, 2.2197518348693848, 2.2983076572418213, 2.376863479614258]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 7.0, 2.0, 6.0, 10.0, 11.0, 22.0, 16.0, 28.0, 21.0, 26.0, 34.0, 29.0, 41.0, 47.0, 35.0, 40.0, 47.0, 49.0, 41.0, 40.0, 51.0, 49.0, 50.0, 33.0, 45.0, 29.0, 36.0, 29.0, 22.0, 13.0, 13.0, 17.0, 11.0, 7.0, 7.0, 6.0, 4.0, 1.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.0180760622024536, -0.9890245795249939, -0.959973156452179, -0.9309216737747192, -0.9018701910972595, -0.8728187680244446, -0.8437672853469849, -0.8147158622741699, -0.7856643795967102, -0.7566128969192505, -0.7275614738464355, -0.6985099911689758, -0.6694585084915161, -0.6404070854187012, -0.6113556027412415, -0.5823041200637817, -0.5532526969909668, -0.5242012143135071, -0.49514976143836975, -0.4660983085632324, -0.4370468556880951, -0.40799540281295776, -0.37894392013549805, -0.3498924672603607, -0.3208409547805786, -0.2917895019054413, -0.26273801922798157, -0.23368656635284424, -0.2046351134777069, -0.1755836457014084, -0.14653217792510986, -0.11748072504997253, -0.0884292721748352, -0.05937781184911728, -0.030326347798109055, -0.00127488374710083, 0.027776576578617096, 0.05682803690433502, 0.08587950468063354, 0.11493095755577087, 0.1439824253320694, 0.17303389310836792, 0.20208534598350525, 0.23113681375980377, 0.2601882815361023, 0.2892397344112396, 0.31829118728637695, 0.34734266996383667, 0.376394122838974, 0.40544557571411133, 0.43449705839157104, 0.4635485112667084, 0.4925999641418457, 0.5216514468193054, 0.5507029294967651, 0.5797543525695801, 0.6088058352470398, 0.6378573179244995, 0.6669087409973145, 0.6959602236747742, 0.7250117063522339, 0.7540631294250488, 0.7831146121025085, 0.8121660947799683, 0.8412175178527832]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 13.0, 19.0, 27.0, 41.0, 88.0, 143.0, 202.0, 351.0, 688.0, 1379.0, 3029.0, 6920.0, 17618.0, 53196.0, 238167.0, 3291157.0, 462896.0, 78160.0, 23842.0, 8990.0, 3849.0, 1757.0, 808.0, 398.0, 226.0, 125.0, 75.0, 43.0, 25.0, 16.0, 15.0, 2.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.18155288696289062, -0.17646026611328125, -0.17136764526367188, -0.1662750244140625, -0.16118240356445312, -0.15608978271484375, -0.15099716186523438, -0.145904541015625, -0.14081192016601562, -0.13571929931640625, -0.13062667846679688, -0.1255340576171875, -0.12044143676757812, -0.11534881591796875, -0.11025619506835938, -0.10516357421875, -0.10007095336914062, -0.09497833251953125, -0.08988571166992188, -0.0847930908203125, -0.07970046997070312, -0.07460784912109375, -0.06951522827148438, -0.064422607421875, -0.059329986572265625, -0.05423736572265625, -0.049144744873046875, -0.0440521240234375, -0.038959503173828125, -0.03386688232421875, -0.028774261474609375, -0.023681640625, -0.018589019775390625, -0.01349639892578125, -0.008403778076171875, -0.0033111572265625, 0.001781463623046875, 0.00687408447265625, 0.011966705322265625, 0.017059326171875, 0.022151947021484375, 0.02724456787109375, 0.032337188720703125, 0.0374298095703125, 0.042522430419921875, 0.04761505126953125, 0.052707672119140625, 0.05780029296875, 0.06289291381835938, 0.06798553466796875, 0.07307815551757812, 0.0781707763671875, 0.08326339721679688, 0.08835601806640625, 0.09344863891601562, 0.098541259765625, 0.10363388061523438, 0.10872650146484375, 0.11381912231445312, 0.1189117431640625, 0.12400436401367188, 0.12909698486328125, 0.13418960571289062, 0.1392822265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 4.0, 10.0, 10.0, 15.0, 17.0, 31.0, 27.0, 39.0, 37.0, 62.0, 47.0, 49.0, 56.0, 66.0, 61.0, 66.0, 43.0, 55.0, 54.0, 41.0, 55.0, 26.0, 38.0, 17.0, 12.0, 9.0, 11.0, 8.0, 10.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.051544189453125, -0.05026388168334961, -0.04898357391357422, -0.04770326614379883, -0.04642295837402344, -0.04514265060424805, -0.043862342834472656, -0.042582035064697266, -0.041301727294921875, -0.040021419525146484, -0.038741111755371094, -0.0374608039855957, -0.03618049621582031, -0.03490018844604492, -0.03361988067626953, -0.03233957290649414, -0.03105926513671875, -0.02977895736694336, -0.02849864959716797, -0.027218341827392578, -0.025938034057617188, -0.024657726287841797, -0.023377418518066406, -0.022097110748291016, -0.020816802978515625, -0.019536495208740234, -0.018256187438964844, -0.016975879669189453, -0.015695571899414062, -0.014415264129638672, -0.013134956359863281, -0.01185464859008789, -0.0105743408203125, -0.00929403305053711, -0.008013725280761719, -0.006733417510986328, -0.0054531097412109375, -0.004172801971435547, -0.0028924942016601562, -0.0016121864318847656, -0.000331878662109375, 0.0009484291076660156, 0.0022287368774414062, 0.003509044647216797, 0.0047893524169921875, 0.006069660186767578, 0.007349967956542969, 0.00863027572631836, 0.00991058349609375, 0.01119089126586914, 0.012471199035644531, 0.013751506805419922, 0.015031814575195312, 0.016312122344970703, 0.017592430114746094, 0.018872737884521484, 0.020153045654296875, 0.021433353424072266, 0.022713661193847656, 0.023993968963623047, 0.025274276733398438, 0.026554584503173828, 0.02783489227294922, 0.02911520004272461, 0.0303955078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 14.0, 15.0, 41.0, 72.0, 104.0, 199.0, 400.0, 912.0, 2294.0, 6373.0, 22200.0, 110823.0, 2087009.0, 1825137.0, 106565.0, 21823.0, 6213.0, 2277.0, 919.0, 406.0, 216.0, 98.0, 56.0, 42.0, 24.0, 13.0, 10.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1717548370361328, -0.16394424438476562, -0.15613365173339844, -0.14832305908203125, -0.14051246643066406, -0.13270187377929688, -0.12489128112792969, -0.1170806884765625, -0.10927009582519531, -0.10145950317382812, -0.09364891052246094, -0.08583831787109375, -0.07802772521972656, -0.07021713256835938, -0.06240653991699219, -0.054595947265625, -0.04678535461425781, -0.038974761962890625, -0.031164169311523438, -0.02335357666015625, -0.015542984008789062, -0.007732391357421875, 7.82012939453125e-05, 0.0078887939453125, 0.015699386596679688, 0.023509979248046875, 0.03132057189941406, 0.03913116455078125, 0.04694175720214844, 0.054752349853515625, 0.06256294250488281, 0.07037353515625, 0.07818412780761719, 0.08599472045898438, 0.09380531311035156, 0.10161590576171875, 0.10942649841308594, 0.11723709106445312, 0.1250476837158203, 0.1328582763671875, 0.1406688690185547, 0.14847946166992188, 0.15629005432128906, 0.16410064697265625, 0.17191123962402344, 0.17972183227539062, 0.1875324249267578, 0.195343017578125, 0.2031536102294922, 0.21096420288085938, 0.21877479553222656, 0.22658538818359375, 0.23439598083496094, 0.24220657348632812, 0.2500171661376953, 0.2578277587890625, 0.2656383514404297, 0.2734489440917969, 0.28125953674316406, 0.28907012939453125, 0.29688072204589844, 0.3046913146972656, 0.3125019073486328, 0.3203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 7.0, 14.0, 5.0, 11.0, 28.0, 33.0, 41.0, 81.0, 118.0, 176.0, 329.0, 797.0, 1306.0, 484.0, 226.0, 132.0, 88.0, 59.0, 46.0, 27.0, 19.0, 6.0, 11.0, 8.0, 2.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1082763671875, -0.10511589050292969, -0.10195541381835938, -0.09879493713378906, -0.09563446044921875, -0.09247398376464844, -0.08931350708007812, -0.08615303039550781, -0.0829925537109375, -0.07983207702636719, -0.07667160034179688, -0.07351112365722656, -0.07035064697265625, -0.06719017028808594, -0.06402969360351562, -0.06086921691894531, -0.057708740234375, -0.05454826354980469, -0.051387786865234375, -0.04822731018066406, -0.04506683349609375, -0.04190635681152344, -0.038745880126953125, -0.03558540344238281, -0.0324249267578125, -0.029264450073242188, -0.026103973388671875, -0.022943496704101562, -0.01978302001953125, -0.016622543334960938, -0.013462066650390625, -0.010301589965820312, -0.00714111328125, -0.0039806365966796875, -0.000820159912109375, 0.0023403167724609375, 0.00550079345703125, 0.008661270141601562, 0.011821746826171875, 0.014982223510742188, 0.0181427001953125, 0.021303176879882812, 0.024463653564453125, 0.027624130249023438, 0.03078460693359375, 0.03394508361816406, 0.037105560302734375, 0.04026603698730469, 0.043426513671875, 0.04658699035644531, 0.049747467041015625, 0.05290794372558594, 0.05606842041015625, 0.05922889709472656, 0.062389373779296875, 0.06554985046386719, 0.0687103271484375, 0.07187080383300781, 0.07503128051757812, 0.07819175720214844, 0.08135223388671875, 0.08451271057128906, 0.08767318725585938, 0.09083366394042969, 0.093994140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 9.0, 16.0, 36.0, 34.0, 44.0, 51.0, 85.0, 73.0, 95.0, 84.0, 90.0, 87.0, 73.0, 58.0, 36.0, 34.0, 21.0, 17.0, 6.0, 10.0, 9.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5481261014938354, -0.5349147915840149, -0.5217034816741943, -0.5084922313690186, -0.4952808916568756, -0.48206961154937744, -0.4688583016395569, -0.45564699172973633, -0.44243568181991577, -0.4292243719100952, -0.41601309180259705, -0.4028017818927765, -0.38959047198295593, -0.37637919187545776, -0.3631678819656372, -0.34995657205581665, -0.3367452919483185, -0.3235339820384979, -0.31032270193099976, -0.2971113920211792, -0.28390008211135864, -0.2706887722015381, -0.2574774920940399, -0.24426618218421936, -0.23105488717556, -0.21784359216690063, -0.20463228225708008, -0.19142098724842072, -0.17820969223976135, -0.1649983823299408, -0.15178708732128143, -0.13857579231262207, -0.1253644824028015, -0.11215317994356155, -0.0989418774843216, -0.08573058247566223, -0.07251928001642227, -0.05930797755718231, -0.04609668254852295, -0.03288538008928299, -0.01967407763004303, -0.006462777033448219, 0.006748523563146591, 0.019959822297096252, 0.03317112475633621, 0.04638242721557617, 0.059593722224235535, 0.0728050246834755, 0.08601632714271545, 0.09922762960195541, 0.11243893206119537, 0.12565022706985474, 0.1388615369796753, 0.15207283198833466, 0.16528412699699402, 0.17849543690681458, 0.19170673191547394, 0.2049180269241333, 0.21812933683395386, 0.23134063184261322, 0.24455192685127258, 0.25776323676109314, 0.2709745168685913, 0.28418582677841187, 0.2973971366882324]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 5.0, 9.0, 8.0, 15.0, 14.0, 18.0, 21.0, 20.0, 29.0, 26.0, 29.0, 30.0, 27.0, 35.0, 39.0, 43.0, 39.0, 38.0, 44.0, 53.0, 38.0, 48.0, 40.0, 41.0, 37.0, 35.0, 31.0, 30.0, 20.0, 24.0, 20.0, 12.0, 11.0, 5.0, 9.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30163830518722534, -0.2916310131549835, -0.2816237509250641, -0.27161645889282227, -0.26160919666290283, -0.251601904630661, -0.24159462749958038, -0.23158735036849976, -0.22158005833625793, -0.2115727812051773, -0.20156550407409668, -0.19155821204185486, -0.18155093491077423, -0.1715436577796936, -0.16153638064861298, -0.15152910351753235, -0.14152182638645172, -0.1315145492553711, -0.12150726467370987, -0.11149998754262924, -0.10149270296096802, -0.09148542582988739, -0.08147814869880676, -0.07147086411714554, -0.06146358698606491, -0.051456306129693985, -0.04144902527332306, -0.03144174814224243, -0.021434467285871506, -0.01142718642950058, -0.0014199092984199524, 0.008587375283241272, 0.0185946524143219, 0.028601933270692825, 0.03860921412706375, 0.04861649125814438, 0.058623772114515305, 0.06863105297088623, 0.07863833010196686, 0.08864561468362808, 0.09865289181470871, 0.10866016894578934, 0.11866745352745056, 0.1286747306585312, 0.13868200778961182, 0.14868929982185364, 0.15869656205177307, 0.1687038540840149, 0.17871113121509552, 0.18871840834617615, 0.19872568547725677, 0.2087329626083374, 0.21874025464057922, 0.22874753177165985, 0.23875480890274048, 0.2487621009349823, 0.25876936316490173, 0.26877665519714355, 0.278783917427063, 0.2887912094593048, 0.29879847168922424, 0.30880576372146606, 0.3188130259513855, 0.3288203179836273, 0.33882761001586914]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 5.0, 8.0, 8.0, 17.0, 19.0, 20.0, 47.0, 63.0, 97.0, 167.0, 231.0, 381.0, 582.0, 957.0, 1660.0, 2938.0, 5442.0, 10077.0, 19069.0, 36501.0, 71443.0, 263273.0, 441162.0, 97006.0, 45560.0, 24110.0, 12322.0, 6738.0, 3639.0, 2019.0, 1145.0, 701.0, 382.0, 255.0, 156.0, 102.0, 83.0, 55.0, 46.0, 21.0, 13.0, 16.0, 5.0, 6.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.13720703125, -0.13294219970703125, -0.1286773681640625, -0.12441253662109375, -0.120147705078125, -0.11588287353515625, -0.1116180419921875, -0.10735321044921875, -0.10308837890625, -0.09882354736328125, -0.0945587158203125, -0.09029388427734375, -0.086029052734375, -0.08176422119140625, -0.0774993896484375, -0.07323455810546875, -0.0689697265625, -0.06470489501953125, -0.0604400634765625, -0.05617523193359375, -0.051910400390625, -0.04764556884765625, -0.0433807373046875, -0.03911590576171875, -0.03485107421875, -0.03058624267578125, -0.0263214111328125, -0.02205657958984375, -0.017791748046875, -0.01352691650390625, -0.0092620849609375, -0.00499725341796875, -0.000732421875, 0.00353240966796875, 0.0077972412109375, 0.01206207275390625, 0.016326904296875, 0.02059173583984375, 0.0248565673828125, 0.02912139892578125, 0.03338623046875, 0.03765106201171875, 0.0419158935546875, 0.04618072509765625, 0.050445556640625, 0.05471038818359375, 0.0589752197265625, 0.06324005126953125, 0.0675048828125, 0.07176971435546875, 0.0760345458984375, 0.08029937744140625, 0.084564208984375, 0.08882904052734375, 0.0930938720703125, 0.09735870361328125, 0.10162353515625, 0.10588836669921875, 0.1101531982421875, 0.11441802978515625, 0.118682861328125, 0.12294769287109375, 0.1272125244140625, 0.13147735595703125, 0.1357421875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 6.0, 8.0, 10.0, 16.0, 12.0, 20.0, 27.0, 38.0, 47.0, 51.0, 44.0, 50.0, 58.0, 48.0, 53.0, 65.0, 54.0, 55.0, 37.0, 50.0, 41.0, 43.0, 33.0, 25.0, 22.0, 18.0, 9.0, 8.0, 5.0, 10.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043670654296875, -0.042452335357666016, -0.04123401641845703, -0.04001569747924805, -0.03879737854003906, -0.03757905960083008, -0.036360740661621094, -0.03514242172241211, -0.033924102783203125, -0.03270578384399414, -0.031487464904785156, -0.030269145965576172, -0.029050827026367188, -0.027832508087158203, -0.02661418914794922, -0.025395870208740234, -0.02417755126953125, -0.022959232330322266, -0.02174091339111328, -0.020522594451904297, -0.019304275512695312, -0.018085956573486328, -0.016867637634277344, -0.01564931869506836, -0.014430999755859375, -0.01321268081665039, -0.011994361877441406, -0.010776042938232422, -0.009557723999023438, -0.008339405059814453, -0.007121086120605469, -0.005902767181396484, -0.0046844482421875, -0.0034661293029785156, -0.0022478103637695312, -0.0010294914245605469, 0.0001888275146484375, 0.0014071464538574219, 0.0026254653930664062, 0.0038437843322753906, 0.005062103271484375, 0.006280422210693359, 0.007498741149902344, 0.008717060089111328, 0.009935379028320312, 0.011153697967529297, 0.012372016906738281, 0.013590335845947266, 0.01480865478515625, 0.016026973724365234, 0.01724529266357422, 0.018463611602783203, 0.019681930541992188, 0.020900249481201172, 0.022118568420410156, 0.02333688735961914, 0.024555206298828125, 0.02577352523803711, 0.026991844177246094, 0.028210163116455078, 0.029428482055664062, 0.030646800994873047, 0.03186511993408203, 0.033083438873291016, 0.0343017578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 2.0, 8.0, 11.0, 23.0, 11.0, 21.0, 43.0, 43.0, 63.0, 78.0, 92.0, 134.0, 215.0, 296.0, 387.0, 721.0, 1314.0, 3015.0, 8874.0, 32460.0, 130690.0, 707645.0, 118520.0, 29604.0, 8010.0, 2852.0, 1304.0, 675.0, 446.0, 282.0, 183.0, 141.0, 123.0, 65.0, 45.0, 33.0, 28.0, 32.0, 15.0, 8.0, 11.0, 7.0, 5.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2335205078125, -0.22674560546875, -0.219970703125, -0.21319580078125, -0.2064208984375, -0.19964599609375, -0.19287109375, -0.18609619140625, -0.1793212890625, -0.17254638671875, -0.165771484375, -0.15899658203125, -0.1522216796875, -0.14544677734375, -0.138671875, -0.13189697265625, -0.1251220703125, -0.11834716796875, -0.111572265625, -0.10479736328125, -0.0980224609375, -0.09124755859375, -0.08447265625, -0.07769775390625, -0.0709228515625, -0.06414794921875, -0.057373046875, -0.05059814453125, -0.0438232421875, -0.03704833984375, -0.0302734375, -0.02349853515625, -0.0167236328125, -0.00994873046875, -0.003173828125, 0.00360107421875, 0.0103759765625, 0.01715087890625, 0.02392578125, 0.03070068359375, 0.0374755859375, 0.04425048828125, 0.051025390625, 0.05780029296875, 0.0645751953125, 0.07135009765625, 0.078125, 0.08489990234375, 0.0916748046875, 0.09844970703125, 0.105224609375, 0.11199951171875, 0.1187744140625, 0.12554931640625, 0.13232421875, 0.13909912109375, 0.1458740234375, 0.15264892578125, 0.159423828125, 0.16619873046875, 0.1729736328125, 0.17974853515625, 0.1865234375, 0.19329833984375, 0.2000732421875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 6.0, 7.0, 10.0, 9.0, 12.0, 14.0, 16.0, 19.0, 22.0, 16.0, 29.0, 26.0, 38.0, 39.0, 44.0, 43.0, 45.0, 38.0, 47.0, 43.0, 47.0, 49.0, 40.0, 43.0, 39.0, 25.0, 35.0, 22.0, 34.0, 20.0, 12.0, 20.0, 14.0, 16.0, 17.0, 6.0, 11.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1383056640625, -0.1337127685546875, -0.129119873046875, -0.1245269775390625, -0.11993408203125, -0.1153411865234375, -0.110748291015625, -0.1061553955078125, -0.1015625, -0.0969696044921875, -0.092376708984375, -0.0877838134765625, -0.08319091796875, -0.0785980224609375, -0.074005126953125, -0.0694122314453125, -0.0648193359375, -0.0602264404296875, -0.055633544921875, -0.0510406494140625, -0.04644775390625, -0.0418548583984375, -0.037261962890625, -0.0326690673828125, -0.028076171875, -0.0234832763671875, -0.018890380859375, -0.0142974853515625, -0.00970458984375, -0.0051116943359375, -0.000518798828125, 0.0040740966796875, 0.0086669921875, 0.0132598876953125, 0.017852783203125, 0.0224456787109375, 0.02703857421875, 0.0316314697265625, 0.036224365234375, 0.0408172607421875, 0.04541015625, 0.0500030517578125, 0.054595947265625, 0.0591888427734375, 0.06378173828125, 0.0683746337890625, 0.072967529296875, 0.0775604248046875, 0.0821533203125, 0.0867462158203125, 0.091339111328125, 0.0959320068359375, 0.10052490234375, 0.1051177978515625, 0.109710693359375, 0.1143035888671875, 0.118896484375, 0.1234893798828125, 0.128082275390625, 0.1326751708984375, 0.13726806640625, 0.1418609619140625, 0.146453857421875, 0.1510467529296875, 0.1556396484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 19.0, 23.0, 35.0, 68.0, 107.0, 170.0, 379.0, 821.0, 2426.0, 8693.0, 36307.0, 331351.0, 608313.0, 44649.0, 10447.0, 2853.0, 978.0, 407.0, 221.0, 113.0, 76.0, 33.0, 24.0, 11.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19873046875, -0.1921215057373047, -0.18551254272460938, -0.17890357971191406, -0.17229461669921875, -0.16568565368652344, -0.15907669067382812, -0.1524677276611328, -0.1458587646484375, -0.1392498016357422, -0.13264083862304688, -0.12603187561035156, -0.11942291259765625, -0.11281394958496094, -0.10620498657226562, -0.09959602355957031, -0.092987060546875, -0.08637809753417969, -0.07976913452148438, -0.07316017150878906, -0.06655120849609375, -0.05994224548339844, -0.053333282470703125, -0.04672431945800781, -0.0401153564453125, -0.03350639343261719, -0.026897430419921875, -0.020288467407226562, -0.01367950439453125, -0.0070705413818359375, -0.000461578369140625, 0.0061473846435546875, 0.01275634765625, 0.019365310668945312, 0.025974273681640625, 0.03258323669433594, 0.03919219970703125, 0.04580116271972656, 0.052410125732421875, 0.05901908874511719, 0.0656280517578125, 0.07223701477050781, 0.07884597778320312, 0.08545494079589844, 0.09206390380859375, 0.09867286682128906, 0.10528182983398438, 0.11189079284667969, 0.118499755859375, 0.1251087188720703, 0.13171768188476562, 0.13832664489746094, 0.14493560791015625, 0.15154457092285156, 0.15815353393554688, 0.1647624969482422, 0.1713714599609375, 0.1779804229736328, 0.18458938598632812, 0.19119834899902344, 0.19780731201171875, 0.20441627502441406, 0.21102523803710938, 0.2176342010498047, 0.2242431640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 13.0, 13.0, 22.0, 42.0, 67.0, 128.0, 159.0, 164.0, 158.0, 98.0, 48.0, 30.0, 16.0, 9.0, 12.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00022530555725097656, -0.00021995045244693756, -0.00021459534764289856, -0.00020924024283885956, -0.00020388513803482056, -0.00019853003323078156, -0.00019317492842674255, -0.00018781982362270355, -0.00018246471881866455, -0.00017710961401462555, -0.00017175450921058655, -0.00016639940440654755, -0.00016104429960250854, -0.00015568919479846954, -0.00015033408999443054, -0.00014497898519039154, -0.00013962388038635254, -0.00013426877558231354, -0.00012891367077827454, -0.00012355856597423553, -0.00011820346117019653, -0.00011284835636615753, -0.00010749325156211853, -0.00010213814675807953, -9.678304195404053e-05, -9.142793715000153e-05, -8.607283234596252e-05, -8.071772754192352e-05, -7.536262273788452e-05, -7.000751793384552e-05, -6.465241312980652e-05, -5.929730832576752e-05, -5.3942203521728516e-05, -4.8587098717689514e-05, -4.323199391365051e-05, -3.787688910961151e-05, -3.252178430557251e-05, -2.7166679501533508e-05, -2.1811574697494507e-05, -1.6456469893455505e-05, -1.1101365089416504e-05, -5.7462602853775024e-06, -3.91155481338501e-07, 4.9639493227005005e-06, 1.0319054126739502e-05, 1.5674158930778503e-05, 2.1029263734817505e-05, 2.6384368538856506e-05, 3.173947334289551e-05, 3.709457814693451e-05, 4.244968295097351e-05, 4.780478775501251e-05, 5.3159892559051514e-05, 5.8514997363090515e-05, 6.387010216712952e-05, 6.922520697116852e-05, 7.458031177520752e-05, 7.993541657924652e-05, 8.529052138328552e-05, 9.064562618732452e-05, 9.600073099136353e-05, 0.00010135583579540253, 0.00010671094059944153, 0.00011206604540348053, 0.00011742115020751953]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 10.0, 9.0, 21.0, 27.0, 56.0, 80.0, 125.0, 192.0, 362.0, 797.0, 1862.0, 6788.0, 30783.0, 281300.0, 670446.0, 42277.0, 9081.0, 2407.0, 862.0, 449.0, 244.0, 132.0, 73.0, 59.0, 43.0, 21.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1820068359375, -0.17552947998046875, -0.1690521240234375, -0.16257476806640625, -0.156097412109375, -0.14962005615234375, -0.1431427001953125, -0.13666534423828125, -0.13018798828125, -0.12371063232421875, -0.1172332763671875, -0.11075592041015625, -0.104278564453125, -0.09780120849609375, -0.0913238525390625, -0.08484649658203125, -0.078369140625, -0.07189178466796875, -0.0654144287109375, -0.05893707275390625, -0.052459716796875, -0.04598236083984375, -0.0395050048828125, -0.03302764892578125, -0.02655029296875, -0.02007293701171875, -0.0135955810546875, -0.00711822509765625, -0.000640869140625, 0.00583648681640625, 0.0123138427734375, 0.01879119873046875, 0.0252685546875, 0.03174591064453125, 0.0382232666015625, 0.04470062255859375, 0.051177978515625, 0.05765533447265625, 0.0641326904296875, 0.07061004638671875, 0.07708740234375, 0.08356475830078125, 0.0900421142578125, 0.09651947021484375, 0.102996826171875, 0.10947418212890625, 0.1159515380859375, 0.12242889404296875, 0.12890625, 0.13538360595703125, 0.1418609619140625, 0.14833831787109375, 0.154815673828125, 0.16129302978515625, 0.1677703857421875, 0.17424774169921875, 0.18072509765625, 0.18720245361328125, 0.1936798095703125, 0.20015716552734375, 0.206634521484375, 0.21311187744140625, 0.2195892333984375, 0.22606658935546875, 0.2325439453125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 12.0, 17.0, 10.0, 20.0, 27.0, 22.0, 57.0, 92.0, 195.0, 182.0, 114.0, 38.0, 40.0, 26.0, 18.0, 18.0, 17.0, 11.0, 10.0, 5.0, 6.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09185028076171875, -0.0887908935546875, -0.08573150634765625, -0.082672119140625, -0.07961273193359375, -0.0765533447265625, -0.07349395751953125, -0.0704345703125, -0.06737518310546875, -0.0643157958984375, -0.06125640869140625, -0.058197021484375, -0.05513763427734375, -0.0520782470703125, -0.04901885986328125, -0.04595947265625, -0.04290008544921875, -0.0398406982421875, -0.03678131103515625, -0.033721923828125, -0.03066253662109375, -0.0276031494140625, -0.02454376220703125, -0.021484375, -0.01842498779296875, -0.0153656005859375, -0.01230621337890625, -0.009246826171875, -0.00618743896484375, -0.0031280517578125, -6.866455078125e-05, 0.00299072265625, 0.00605010986328125, 0.0091094970703125, 0.01216888427734375, 0.015228271484375, 0.01828765869140625, 0.0213470458984375, 0.02440643310546875, 0.0274658203125, 0.03052520751953125, 0.0335845947265625, 0.03664398193359375, 0.039703369140625, 0.04276275634765625, 0.0458221435546875, 0.04888153076171875, 0.05194091796875, 0.05500030517578125, 0.0580596923828125, 0.06111907958984375, 0.064178466796875, 0.06723785400390625, 0.0702972412109375, 0.07335662841796875, 0.076416015625, 0.07947540283203125, 0.0825347900390625, 0.08559417724609375, 0.088653564453125, 0.09171295166015625, 0.0947723388671875, 0.09783172607421875, 0.10089111328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 17.0, 35.0, 45.0, 84.0, 139.0, 163.0, 140.0, 117.0, 98.0, 76.0, 37.0, 19.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.417062520980835, -1.3601893186569214, -1.3033161163330078, -1.2464427947998047, -1.1895695924758911, -1.1326963901519775, -1.075823187828064, -1.0189499855041504, -0.9620767831802368, -0.9052035808563232, -0.8483303189277649, -0.7914571166038513, -0.7345839142799377, -0.6777106523513794, -0.6208374500274658, -0.5639642477035522, -0.5070909857749939, -0.45021775364875793, -0.39334455132484436, -0.3364713191986084, -0.2795981168746948, -0.22272488474845886, -0.1658516526222229, -0.10897845029830933, -0.052105218172073364, 0.004768002778291702, 0.06164122372865677, 0.11851444840431213, 0.1753876656293869, 0.23226088285446167, 0.28913411498069763, 0.3460073173046112, 0.40288054943084717, 0.45975378155708313, 0.5166270136833191, 0.5735002160072327, 0.6303734183311462, 0.6872466802597046, 0.7441198825836182, 0.8009930849075317, 0.8578662872314453, 0.9147394895553589, 0.9716127514839172, 1.0284860134124756, 1.0853592157363892, 1.1422324180603027, 1.1991056203842163, 1.2559788227081299, 1.312852144241333, 1.3697253465652466, 1.4265985488891602, 1.4834718704223633, 1.5403450727462769, 1.5972182750701904, 1.654091477394104, 1.7109646797180176, 1.7678378820419312, 1.8247110843658447, 1.8815842866897583, 1.9384574890136719, 1.995330810546875, 2.052203893661499, 2.109077215194702, 2.165950298309326, 2.2228236198425293]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 7.0, 11.0, 10.0, 11.0, 27.0, 23.0, 27.0, 30.0, 25.0, 45.0, 31.0, 35.0, 36.0, 44.0, 40.0, 38.0, 37.0, 53.0, 51.0, 52.0, 39.0, 47.0, 41.0, 32.0, 28.0, 18.0, 29.0, 25.0, 21.0, 11.0, 12.0, 10.0, 7.0, 11.0, 7.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8936876654624939, -0.8686922192573547, -0.8436967730522156, -0.8187013268470764, -0.7937058806419373, -0.7687104344367981, -0.7437149286270142, -0.718719482421875, -0.6937240362167358, -0.6687285900115967, -0.6437331438064575, -0.6187376976013184, -0.5937422513961792, -0.56874680519104, -0.5437513589859009, -0.5187559127807617, -0.49376046657562256, -0.4687650203704834, -0.44376957416534424, -0.4187741279602051, -0.3937786817550659, -0.36878323554992676, -0.3437877595424652, -0.31879231333732605, -0.2937968671321869, -0.26880142092704773, -0.24380597472190857, -0.21881051361560822, -0.19381506741046906, -0.1688196212053299, -0.14382416009902954, -0.11882871389389038, -0.09383320808410645, -0.06883776187896729, -0.04384230822324753, -0.01884685456752777, 0.006148591637611389, 0.03114403784275055, 0.0561394989490509, 0.08113494515419006, 0.10613039135932922, 0.13112583756446838, 0.15612128376960754, 0.1811167448759079, 0.20611219108104706, 0.23110763728618622, 0.2561030983924866, 0.28109854459762573, 0.3060939908027649, 0.33108943700790405, 0.3560848832130432, 0.3810803294181824, 0.40607577562332153, 0.4310712218284607, 0.45606669783592224, 0.4810621440410614, 0.506057620048523, 0.5310530662536621, 0.5560485124588013, 0.5810439586639404, 0.6060394048690796, 0.6310348510742188, 0.6560302972793579, 0.6810257434844971, 0.7060211896896362]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 2.0, 5.0, 9.0, 11.0, 7.0, 17.0, 27.0, 27.0, 32.0, 64.0, 127.0, 184.0, 257.0, 480.0, 783.0, 1508.0, 3165.0, 7007.0, 18147.0, 57604.0, 289214.0, 3419962.0, 303468.0, 59293.0, 18680.0, 7262.0, 3273.0, 1562.0, 837.0, 444.0, 307.0, 179.0, 107.0, 75.0, 39.0, 29.0, 8.0, 15.0, 12.0, 8.0, 17.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1827392578125, -0.17711830139160156, -0.17149734497070312, -0.1658763885498047, -0.16025543212890625, -0.1546344757080078, -0.14901351928710938, -0.14339256286621094, -0.1377716064453125, -0.13215065002441406, -0.12652969360351562, -0.12090873718261719, -0.11528778076171875, -0.10966682434082031, -0.10404586791992188, -0.09842491149902344, -0.092803955078125, -0.08718299865722656, -0.08156204223632812, -0.07594108581542969, -0.07032012939453125, -0.06469917297363281, -0.059078216552734375, -0.05345726013183594, -0.0478363037109375, -0.04221534729003906, -0.036594390869140625, -0.030973434448242188, -0.02535247802734375, -0.019731521606445312, -0.014110565185546875, -0.008489608764648438, -0.00286865234375, 0.0027523040771484375, 0.008373260498046875, 0.013994216918945312, 0.01961517333984375, 0.025236129760742188, 0.030857086181640625, 0.03647804260253906, 0.0420989990234375, 0.04771995544433594, 0.053340911865234375, 0.05896186828613281, 0.06458282470703125, 0.07020378112792969, 0.07582473754882812, 0.08144569396972656, 0.087066650390625, 0.09268760681152344, 0.09830856323242188, 0.10392951965332031, 0.10955047607421875, 0.11517143249511719, 0.12079238891601562, 0.12641334533691406, 0.1320343017578125, 0.13765525817871094, 0.14327621459960938, 0.1488971710205078, 0.15451812744140625, 0.1601390838623047, 0.16576004028320312, 0.17138099670410156, 0.177001953125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 11.0, 5.0, 10.0, 6.0, 12.0, 20.0, 23.0, 25.0, 33.0, 35.0, 38.0, 40.0, 44.0, 40.0, 47.0, 53.0, 69.0, 61.0, 58.0, 49.0, 39.0, 49.0, 39.0, 26.0, 31.0, 25.0, 20.0, 26.0, 14.0, 10.0, 13.0, 8.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.041839599609375, -0.04063224792480469, -0.039424896240234375, -0.03821754455566406, -0.03701019287109375, -0.03580284118652344, -0.034595489501953125, -0.03338813781738281, -0.0321807861328125, -0.030973434448242188, -0.029766082763671875, -0.028558731079101562, -0.02735137939453125, -0.026144027709960938, -0.024936676025390625, -0.023729324340820312, -0.02252197265625, -0.021314620971679688, -0.020107269287109375, -0.018899917602539062, -0.01769256591796875, -0.016485214233398438, -0.015277862548828125, -0.014070510864257812, -0.0128631591796875, -0.011655807495117188, -0.010448455810546875, -0.009241104125976562, -0.00803375244140625, -0.0068264007568359375, -0.005619049072265625, -0.0044116973876953125, -0.003204345703125, -0.0019969940185546875, -0.000789642333984375, 0.0004177093505859375, 0.00162506103515625, 0.0028324127197265625, 0.004039764404296875, 0.0052471160888671875, 0.0064544677734375, 0.0076618194580078125, 0.008869171142578125, 0.010076522827148438, 0.01128387451171875, 0.012491226196289062, 0.013698577880859375, 0.014905929565429688, 0.01611328125, 0.017320632934570312, 0.018527984619140625, 0.019735336303710938, 0.02094268798828125, 0.022150039672851562, 0.023357391357421875, 0.024564743041992188, 0.0257720947265625, 0.026979446411132812, 0.028186798095703125, 0.029394149780273438, 0.03060150146484375, 0.03180885314941406, 0.033016204833984375, 0.03422355651855469, 0.035430908203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 11.0, 7.0, 17.0, 8.0, 16.0, 32.0, 51.0, 57.0, 85.0, 158.0, 326.0, 817.0, 2711.0, 10255.0, 57201.0, 1220156.0, 2812440.0, 72805.0, 12235.0, 3073.0, 939.0, 380.0, 154.0, 94.0, 54.0, 44.0, 33.0, 27.0, 17.0, 15.0, 11.0, 9.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3038673400878906, -0.29303741455078125, -0.2822074890136719, -0.2713775634765625, -0.2605476379394531, -0.24971771240234375, -0.23888778686523438, -0.228057861328125, -0.21722793579101562, -0.20639801025390625, -0.19556808471679688, -0.1847381591796875, -0.17390823364257812, -0.16307830810546875, -0.15224838256835938, -0.14141845703125, -0.13058853149414062, -0.11975860595703125, -0.10892868041992188, -0.0980987548828125, -0.08726882934570312, -0.07643890380859375, -0.06560897827148438, -0.054779052734375, -0.043949127197265625, -0.03311920166015625, -0.022289276123046875, -0.0114593505859375, -0.000629425048828125, 0.01020050048828125, 0.021030426025390625, 0.0318603515625, 0.042690277099609375, 0.05352020263671875, 0.06435012817382812, 0.0751800537109375, 0.08600997924804688, 0.09683990478515625, 0.10766983032226562, 0.118499755859375, 0.12932968139648438, 0.14015960693359375, 0.15098953247070312, 0.1618194580078125, 0.17264938354492188, 0.18347930908203125, 0.19430923461914062, 0.20513916015625, 0.21596908569335938, 0.22679901123046875, 0.23762893676757812, 0.2484588623046875, 0.2592887878417969, 0.27011871337890625, 0.2809486389160156, 0.291778564453125, 0.3026084899902344, 0.31343841552734375, 0.3242683410644531, 0.3350982666015625, 0.3459281921386719, 0.35675811767578125, 0.3675880432128906, 0.37841796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 11.0, 16.0, 16.0, 34.0, 50.0, 102.0, 183.0, 393.0, 1771.0, 921.0, 268.0, 123.0, 71.0, 50.0, 24.0, 11.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08837890625, -0.08413124084472656, -0.07988357543945312, -0.07563591003417969, -0.07138824462890625, -0.06714057922363281, -0.06289291381835938, -0.05864524841308594, -0.0543975830078125, -0.05014991760253906, -0.045902252197265625, -0.04165458679199219, -0.03740692138671875, -0.03315925598144531, -0.028911590576171875, -0.024663925170898438, -0.020416259765625, -0.016168594360351562, -0.011920928955078125, -0.0076732635498046875, -0.00342559814453125, 0.0008220672607421875, 0.005069732666015625, 0.009317398071289062, 0.0135650634765625, 0.017812728881835938, 0.022060394287109375, 0.026308059692382812, 0.03055572509765625, 0.03480339050292969, 0.039051055908203125, 0.04329872131347656, 0.04754638671875, 0.05179405212402344, 0.056041717529296875, 0.06028938293457031, 0.06453704833984375, 0.06878471374511719, 0.07303237915039062, 0.07728004455566406, 0.0815277099609375, 0.08577537536621094, 0.09002304077148438, 0.09427070617675781, 0.09851837158203125, 0.10276603698730469, 0.10701370239257812, 0.11126136779785156, 0.115509033203125, 0.11975669860839844, 0.12400436401367188, 0.1282520294189453, 0.13249969482421875, 0.1367473602294922, 0.14099502563476562, 0.14524269104003906, 0.1494903564453125, 0.15373802185058594, 0.15798568725585938, 0.1622333526611328, 0.16648101806640625, 0.1707286834716797, 0.17497634887695312, 0.17922401428222656, 0.1834716796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 18.0, 33.0, 77.0, 141.0, 203.0, 221.0, 151.0, 95.0, 36.0, 17.0, 4.0, 6.0, 3.0, 2.0], "bins": [-1.8768258094787598, -1.8426988124847412, -1.808571696281433, -1.7744446992874146, -1.740317702293396, -1.706190586090088, -1.6720635890960693, -1.6379365921020508, -1.6038095951080322, -1.5696825981140137, -1.5355554819107056, -1.501428484916687, -1.4673014879226685, -1.4331743717193604, -1.3990473747253418, -1.3649203777313232, -1.3307932615280151, -1.2966662645339966, -1.2625391483306885, -1.22841215133667, -1.1942851543426514, -1.1601581573486328, -1.1260310411453247, -1.0919040441513062, -1.057776927947998, -1.0236499309539795, -0.9895228743553162, -0.9553958177566528, -0.9212688207626343, -0.887141764163971, -0.8530147075653076, -0.8188877105712891, -0.7847608327865601, -0.7506337761878967, -0.7165067791938782, -0.6823797225952148, -0.6482527256011963, -0.614125669002533, -0.5799986124038696, -0.5458716154098511, -0.5117445588111877, -0.4776175320148468, -0.44349050521850586, -0.40936344861984253, -0.3752364218235016, -0.34110939502716064, -0.3069823384284973, -0.27285531163215637, -0.23872828483581543, -0.2046012580394745, -0.17047421634197235, -0.13634717464447021, -0.10222014784812927, -0.06809312105178833, -0.033966079354286194, 0.00016096234321594238, 0.034287989139556885, 0.06841502338647842, 0.10254205763339996, 0.1366690993309021, 0.17079612612724304, 0.20492315292358398, 0.23905019462108612, 0.27317723631858826, 0.3073042631149292]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 12.0, 9.0, 7.0, 22.0, 11.0, 19.0, 24.0, 25.0, 26.0, 35.0, 42.0, 46.0, 46.0, 27.0, 51.0, 43.0, 49.0, 44.0, 45.0, 36.0, 42.0, 42.0, 43.0, 30.0, 35.0, 25.0, 22.0, 22.0, 17.0, 16.0, 19.0, 8.0, 11.0, 5.0, 12.0, 5.0, 5.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3190132975578308, -0.30939653515815735, -0.2997797727584839, -0.29016298055648804, -0.2805462181568146, -0.2709294557571411, -0.26131266355514526, -0.2516959011554718, -0.24207913875579834, -0.23246237635612488, -0.22284559905529022, -0.21322882175445557, -0.2036120593547821, -0.19399529695510864, -0.184378519654274, -0.17476174235343933, -0.16514497995376587, -0.1555282175540924, -0.14591144025325775, -0.1362946629524231, -0.12667790055274963, -0.11706113070249557, -0.10744436085224152, -0.09782759100198746, -0.0882108211517334, -0.07859405130147934, -0.06897728145122528, -0.05936051160097122, -0.04974374175071716, -0.040126971900463104, -0.030510202050209045, -0.020893432199954987, -0.011276662349700928, -0.001659892499446869, 0.00795687735080719, 0.01757364720106125, 0.027190417051315308, 0.036807186901569366, 0.046423956751823425, 0.056040726602077484, 0.06565749645233154, 0.0752742663025856, 0.08489103615283966, 0.09450780600309372, 0.10412457585334778, 0.11374134570360184, 0.1233581155538559, 0.13297489285469055, 0.142591655254364, 0.15220841765403748, 0.16182519495487213, 0.1714419722557068, 0.18105873465538025, 0.1906754970550537, 0.20029227435588837, 0.20990905165672302, 0.21952581405639648, 0.22914257645606995, 0.2387593537569046, 0.24837613105773926, 0.2579928934574127, 0.2676096558570862, 0.27722644805908203, 0.2868432104587555, 0.29645997285842896]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 6.0, 13.0, 14.0, 31.0, 50.0, 76.0, 145.0, 254.0, 530.0, 1158.0, 2788.0, 6994.0, 17001.0, 40310.0, 150754.0, 627994.0, 134541.0, 38434.0, 15974.0, 6581.0, 2691.0, 1107.0, 521.0, 256.0, 134.0, 70.0, 43.0, 28.0, 21.0, 12.0, 9.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1988525390625, -0.19368362426757812, -0.18851470947265625, -0.18334579467773438, -0.1781768798828125, -0.17300796508789062, -0.16783905029296875, -0.16267013549804688, -0.157501220703125, -0.15233230590820312, -0.14716339111328125, -0.14199447631835938, -0.1368255615234375, -0.13165664672851562, -0.12648773193359375, -0.12131881713867188, -0.11614990234375, -0.11098098754882812, -0.10581207275390625, -0.10064315795898438, -0.0954742431640625, -0.09030532836914062, -0.08513641357421875, -0.07996749877929688, -0.074798583984375, -0.06962966918945312, -0.06446075439453125, -0.059291839599609375, -0.0541229248046875, -0.048954010009765625, -0.04378509521484375, -0.038616180419921875, -0.033447265625, -0.028278350830078125, -0.02310943603515625, -0.017940521240234375, -0.0127716064453125, -0.007602691650390625, -0.00243377685546875, 0.002735137939453125, 0.007904052734375, 0.013072967529296875, 0.01824188232421875, 0.023410797119140625, 0.0285797119140625, 0.033748626708984375, 0.03891754150390625, 0.044086456298828125, 0.04925537109375, 0.054424285888671875, 0.05959320068359375, 0.06476211547851562, 0.0699310302734375, 0.07509994506835938, 0.08026885986328125, 0.08543777465820312, 0.090606689453125, 0.09577560424804688, 0.10094451904296875, 0.10611343383789062, 0.1112823486328125, 0.11645126342773438, 0.12162017822265625, 0.12678909301757812, 0.1319580078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 9.0, 5.0, 15.0, 11.0, 17.0, 25.0, 23.0, 23.0, 49.0, 44.0, 47.0, 52.0, 54.0, 59.0, 76.0, 67.0, 63.0, 49.0, 53.0, 49.0, 35.0, 42.0, 34.0, 22.0, 26.0, 11.0, 12.0, 8.0, 5.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0599365234375, -0.05839204788208008, -0.056847572326660156, -0.055303096771240234, -0.05375862121582031, -0.05221414566040039, -0.05066967010498047, -0.04912519454956055, -0.047580718994140625, -0.0460362434387207, -0.04449176788330078, -0.04294729232788086, -0.04140281677246094, -0.039858341217041016, -0.038313865661621094, -0.03676939010620117, -0.03522491455078125, -0.03368043899536133, -0.032135963439941406, -0.030591487884521484, -0.029047012329101562, -0.02750253677368164, -0.02595806121826172, -0.024413585662841797, -0.022869110107421875, -0.021324634552001953, -0.01978015899658203, -0.01823568344116211, -0.016691207885742188, -0.015146732330322266, -0.013602256774902344, -0.012057781219482422, -0.0105133056640625, -0.008968830108642578, -0.007424354553222656, -0.005879878997802734, -0.0043354034423828125, -0.0027909278869628906, -0.0012464523315429688, 0.0002980232238769531, 0.001842498779296875, 0.003386974334716797, 0.004931449890136719, 0.006475925445556641, 0.008020401000976562, 0.009564876556396484, 0.011109352111816406, 0.012653827667236328, 0.01419830322265625, 0.015742778778076172, 0.017287254333496094, 0.018831729888916016, 0.020376205444335938, 0.02192068099975586, 0.02346515655517578, 0.025009632110595703, 0.026554107666015625, 0.028098583221435547, 0.02964305877685547, 0.03118753433227539, 0.03273200988769531, 0.034276485443115234, 0.035820960998535156, 0.03736543655395508, 0.038909912109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 11.0, 9.0, 11.0, 11.0, 18.0, 26.0, 21.0, 46.0, 52.0, 79.0, 103.0, 141.0, 263.0, 355.0, 614.0, 1228.0, 2820.0, 6974.0, 16758.0, 39499.0, 148568.0, 687945.0, 87352.0, 31854.0, 13451.0, 5458.0, 2322.0, 1046.0, 524.0, 300.0, 205.0, 115.0, 99.0, 70.0, 53.0, 31.0, 23.0, 18.0, 12.0, 16.0, 17.0, 11.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.18212890625, -0.17650222778320312, -0.17087554931640625, -0.16524887084960938, -0.1596221923828125, -0.15399551391601562, -0.14836883544921875, -0.14274215698242188, -0.137115478515625, -0.13148880004882812, -0.12586212158203125, -0.12023544311523438, -0.1146087646484375, -0.10898208618164062, -0.10335540771484375, -0.09772872924804688, -0.09210205078125, -0.08647537231445312, -0.08084869384765625, -0.07522201538085938, -0.0695953369140625, -0.06396865844726562, -0.05834197998046875, -0.052715301513671875, -0.047088623046875, -0.041461944580078125, -0.03583526611328125, -0.030208587646484375, -0.0245819091796875, -0.018955230712890625, -0.01332855224609375, -0.007701873779296875, -0.0020751953125, 0.003551483154296875, 0.00917816162109375, 0.014804840087890625, 0.0204315185546875, 0.026058197021484375, 0.03168487548828125, 0.037311553955078125, 0.042938232421875, 0.048564910888671875, 0.05419158935546875, 0.059818267822265625, 0.0654449462890625, 0.07107162475585938, 0.07669830322265625, 0.08232498168945312, 0.08795166015625, 0.09357833862304688, 0.09920501708984375, 0.10483169555664062, 0.1104583740234375, 0.11608505249023438, 0.12171173095703125, 0.12733840942382812, 0.132965087890625, 0.13859176635742188, 0.14421844482421875, 0.14984512329101562, 0.1554718017578125, 0.16109848022460938, 0.16672515869140625, 0.17235183715820312, 0.177978515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 8.0, 9.0, 7.0, 17.0, 9.0, 15.0, 21.0, 18.0, 31.0, 35.0, 37.0, 35.0, 39.0, 37.0, 50.0, 52.0, 52.0, 58.0, 59.0, 49.0, 53.0, 47.0, 53.0, 36.0, 33.0, 20.0, 27.0, 16.0, 13.0, 10.0, 16.0, 10.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1966552734375, -0.19029808044433594, -0.18394088745117188, -0.1775836944580078, -0.17122650146484375, -0.1648693084716797, -0.15851211547851562, -0.15215492248535156, -0.1457977294921875, -0.13944053649902344, -0.13308334350585938, -0.1267261505126953, -0.12036895751953125, -0.11401176452636719, -0.10765457153320312, -0.10129737854003906, -0.094940185546875, -0.08858299255371094, -0.08222579956054688, -0.07586860656738281, -0.06951141357421875, -0.06315422058105469, -0.056797027587890625, -0.05043983459472656, -0.0440826416015625, -0.03772544860839844, -0.031368255615234375, -0.025011062622070312, -0.01865386962890625, -0.012296676635742188, -0.005939483642578125, 0.0004177093505859375, 0.00677490234375, 0.013132095336914062, 0.019489288330078125, 0.025846481323242188, 0.03220367431640625, 0.03856086730957031, 0.044918060302734375, 0.05127525329589844, 0.0576324462890625, 0.06398963928222656, 0.07034683227539062, 0.07670402526855469, 0.08306121826171875, 0.08941841125488281, 0.09577560424804688, 0.10213279724121094, 0.108489990234375, 0.11484718322753906, 0.12120437622070312, 0.1275615692138672, 0.13391876220703125, 0.1402759552001953, 0.14663314819335938, 0.15299034118652344, 0.1593475341796875, 0.16570472717285156, 0.17206192016601562, 0.1784191131591797, 0.18477630615234375, 0.1911334991455078, 0.19749069213867188, 0.20384788513183594, 0.210205078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 12.0, 19.0, 51.0, 104.0, 268.0, 1290.0, 11688.0, 843208.0, 184160.0, 6462.0, 902.0, 198.0, 83.0, 46.0, 25.0, 13.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345947265625, -0.3325843811035156, -0.31922149658203125, -0.3058586120605469, -0.2924957275390625, -0.2791328430175781, -0.26576995849609375, -0.2524070739746094, -0.239044189453125, -0.22568130493164062, -0.21231842041015625, -0.19895553588867188, -0.1855926513671875, -0.17222976684570312, -0.15886688232421875, -0.14550399780273438, -0.13214111328125, -0.11877822875976562, -0.10541534423828125, -0.09205245971679688, -0.0786895751953125, -0.06532669067382812, -0.05196380615234375, -0.038600921630859375, -0.025238037109375, -0.011875152587890625, 0.00148773193359375, 0.014850616455078125, 0.0282135009765625, 0.041576385498046875, 0.05493927001953125, 0.06830215454101562, 0.0816650390625, 0.09502792358398438, 0.10839080810546875, 0.12175369262695312, 0.1351165771484375, 0.14847946166992188, 0.16184234619140625, 0.17520523071289062, 0.188568115234375, 0.20193099975585938, 0.21529388427734375, 0.22865676879882812, 0.2420196533203125, 0.2553825378417969, 0.26874542236328125, 0.2821083068847656, 0.29547119140625, 0.3088340759277344, 0.32219696044921875, 0.3355598449707031, 0.3489227294921875, 0.3622856140136719, 0.37564849853515625, 0.3890113830566406, 0.402374267578125, 0.4157371520996094, 0.42910003662109375, 0.4424629211425781, 0.4558258056640625, 0.4691886901855469, 0.48255157470703125, 0.4959144592285156, 0.50927734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 8.0, 3.0, 11.0, 9.0, 15.0, 14.0, 19.0, 32.0, 26.0, 35.0, 44.0, 69.0, 71.0, 79.0, 76.0, 83.0, 60.0, 68.0, 61.0, 41.0, 25.0, 24.0, 26.0, 20.0, 10.0, 10.0, 12.0, 10.0, 8.0, 6.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.49826431274414e-05, -7.278937846422195e-05, -7.05961138010025e-05, -6.840284913778305e-05, -6.62095844745636e-05, -6.401631981134415e-05, -6.18230551481247e-05, -5.962979048490524e-05, -5.743652582168579e-05, -5.524326115846634e-05, -5.304999649524689e-05, -5.0856731832027435e-05, -4.8663467168807983e-05, -4.647020250558853e-05, -4.427693784236908e-05, -4.208367317914963e-05, -3.9890408515930176e-05, -3.7697143852710724e-05, -3.550387918949127e-05, -3.331061452627182e-05, -3.111734986305237e-05, -2.8924085199832916e-05, -2.6730820536613464e-05, -2.4537555873394012e-05, -2.234429121017456e-05, -2.015102654695511e-05, -1.7957761883735657e-05, -1.5764497220516205e-05, -1.3571232557296753e-05, -1.1377967894077301e-05, -9.184703230857849e-06, -6.991438567638397e-06, -4.798173904418945e-06, -2.6049092411994934e-06, -4.116445779800415e-07, 1.7816200852394104e-06, 3.974884748458862e-06, 6.168149411678314e-06, 8.361414074897766e-06, 1.0554678738117218e-05, 1.274794340133667e-05, 1.4941208064556122e-05, 1.7134472727775574e-05, 1.9327737390995026e-05, 2.1521002054214478e-05, 2.371426671743393e-05, 2.590753138065338e-05, 2.8100796043872833e-05, 3.0294060707092285e-05, 3.248732537031174e-05, 3.468059003353119e-05, 3.687385469675064e-05, 3.906711935997009e-05, 4.1260384023189545e-05, 4.3453648686408997e-05, 4.564691334962845e-05, 4.78401780128479e-05, 5.003344267606735e-05, 5.2226707339286804e-05, 5.4419972002506256e-05, 5.661323666572571e-05, 5.880650132894516e-05, 6.099976599216461e-05, 6.319303065538406e-05, 6.538629531860352e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 6.0, 2.0, 7.0, 10.0, 12.0, 11.0, 15.0, 20.0, 27.0, 54.0, 65.0, 103.0, 184.0, 322.0, 607.0, 1189.0, 2530.0, 6259.0, 17686.0, 63423.0, 676103.0, 223072.0, 37231.0, 11410.0, 4249.0, 1900.0, 871.0, 462.0, 289.0, 132.0, 99.0, 46.0, 44.0, 32.0, 10.0, 17.0, 17.0, 12.0, 9.0, 5.0, 7.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.139892578125, -0.13535118103027344, -0.13080978393554688, -0.1262683868408203, -0.12172698974609375, -0.11718559265136719, -0.11264419555664062, -0.10810279846191406, -0.1035614013671875, -0.09902000427246094, -0.09447860717773438, -0.08993721008300781, -0.08539581298828125, -0.08085441589355469, -0.07631301879882812, -0.07177162170410156, -0.067230224609375, -0.06268882751464844, -0.058147430419921875, -0.05360603332519531, -0.04906463623046875, -0.04452323913574219, -0.039981842041015625, -0.03544044494628906, -0.0308990478515625, -0.026357650756835938, -0.021816253662109375, -0.017274856567382812, -0.01273345947265625, -0.008192062377929688, -0.003650665283203125, 0.0008907318115234375, 0.00543212890625, 0.009973526000976562, 0.014514923095703125, 0.019056320190429688, 0.02359771728515625, 0.028139114379882812, 0.032680511474609375, 0.03722190856933594, 0.0417633056640625, 0.04630470275878906, 0.050846099853515625, 0.05538749694824219, 0.05992889404296875, 0.06447029113769531, 0.06901168823242188, 0.07355308532714844, 0.078094482421875, 0.08263587951660156, 0.08717727661132812, 0.09171867370605469, 0.09626007080078125, 0.10080146789550781, 0.10534286499023438, 0.10988426208496094, 0.1144256591796875, 0.11896705627441406, 0.12350845336914062, 0.1280498504638672, 0.13259124755859375, 0.1371326446533203, 0.14167404174804688, 0.14621543884277344, 0.1507568359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 6.0, 9.0, 5.0, 17.0, 21.0, 20.0, 39.0, 64.0, 134.0, 194.0, 177.0, 82.0, 49.0, 38.0, 31.0, 18.0, 11.0, 15.0, 6.0, 6.0, 8.0, 4.0, 4.0, 5.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1480712890625, -0.1440439224243164, -0.1400165557861328, -0.13598918914794922, -0.13196182250976562, -0.12793445587158203, -0.12390708923339844, -0.11987972259521484, -0.11585235595703125, -0.11182498931884766, -0.10779762268066406, -0.10377025604248047, -0.09974288940429688, -0.09571552276611328, -0.09168815612792969, -0.0876607894897461, -0.0836334228515625, -0.0796060562133789, -0.07557868957519531, -0.07155132293701172, -0.06752395629882812, -0.06349658966064453, -0.05946922302246094, -0.055441856384277344, -0.05141448974609375, -0.047387123107910156, -0.04335975646972656, -0.03933238983154297, -0.035305023193359375, -0.03127765655517578, -0.027250289916992188, -0.023222923278808594, -0.019195556640625, -0.015168190002441406, -0.011140823364257812, -0.007113456726074219, -0.003086090087890625, 0.0009412765502929688, 0.0049686431884765625, 0.008996009826660156, 0.01302337646484375, 0.017050743103027344, 0.021078109741210938, 0.02510547637939453, 0.029132843017578125, 0.03316020965576172, 0.03718757629394531, 0.041214942932128906, 0.0452423095703125, 0.049269676208496094, 0.05329704284667969, 0.05732440948486328, 0.061351776123046875, 0.06537914276123047, 0.06940650939941406, 0.07343387603759766, 0.07746124267578125, 0.08148860931396484, 0.08551597595214844, 0.08954334259033203, 0.09357070922851562, 0.09759807586669922, 0.10162544250488281, 0.1056528091430664, 0.10968017578125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 16.0, 34.0, 49.0, 74.0, 124.0, 156.0, 173.0, 118.0, 105.0, 66.0, 42.0, 17.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.253738522529602, -1.1973276138305664, -1.1409168243408203, -1.0845060348510742, -1.0280951261520386, -0.9716842770576477, -0.9152734279632568, -0.858862578868866, -0.8024517297744751, -0.7460408806800842, -0.6896300315856934, -0.6332191824913025, -0.5768083333969116, -0.5203974843025208, -0.4639866352081299, -0.407575786113739, -0.35116493701934814, -0.2947540879249573, -0.2383432388305664, -0.18193238973617554, -0.12552154064178467, -0.0691106915473938, -0.01269984245300293, 0.04371100664138794, 0.10012185573577881, 0.15653270483016968, 0.21294355392456055, 0.2693544030189514, 0.3257652521133423, 0.38217610120773315, 0.438586950302124, 0.4949977993965149, 0.5514085292816162, 0.6078193783760071, 0.664230227470398, 0.7206410765647888, 0.7770519256591797, 0.8334627747535706, 0.8898736238479614, 0.9462844729423523, 1.0026953220367432, 1.0591061115264893, 1.115517020225525, 1.1719279289245605, 1.2283387184143066, 1.2847495079040527, 1.3411604166030884, 1.397571325302124, 1.4539821147918701, 1.5103929042816162, 1.5668038129806519, 1.6232147216796875, 1.6796255111694336, 1.7360363006591797, 1.7924472093582153, 1.848858118057251, 1.905268907546997, 1.9616796970367432, 2.0180907249450684, 2.0745015144348145, 2.1309123039245605, 2.1873230934143066, 2.2437338829040527, 2.300144910812378, 2.356555700302124]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 10.0, 8.0, 10.0, 17.0, 17.0, 15.0, 10.0, 27.0, 23.0, 23.0, 27.0, 18.0, 31.0, 28.0, 36.0, 29.0, 35.0, 34.0, 44.0, 45.0, 44.0, 33.0, 42.0, 40.0, 30.0, 36.0, 25.0, 22.0, 27.0, 33.0, 27.0, 26.0, 23.0, 21.0, 15.0, 11.0, 8.0, 7.0, 9.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.861240029335022, -0.8364761471748352, -0.8117122054100037, -0.7869483232498169, -0.7621843814849854, -0.7374204993247986, -0.7126566171646118, -0.6878926753997803, -0.6631287932395935, -0.6383649110794067, -0.6136009693145752, -0.5888370871543884, -0.5640731453895569, -0.5393092632293701, -0.5145453214645386, -0.4897814393043518, -0.46501752734184265, -0.4402536153793335, -0.41548970341682434, -0.3907257914543152, -0.3659619092941284, -0.34119799733161926, -0.3164340853691101, -0.29167020320892334, -0.2669062614440918, -0.24214234948158264, -0.21737845242023468, -0.19261454045772552, -0.16785064339637756, -0.1430867314338684, -0.11832281947135925, -0.09355892241001129, -0.06879502534866333, -0.04403112083673477, -0.019267212599515915, 0.005496695637702942, 0.0302606001496315, 0.05502450466156006, 0.07978841662406921, 0.10455231368541718, 0.12931622564792633, 0.15408013761043549, 0.17884403467178345, 0.2036079466342926, 0.22837185859680176, 0.2531357407569885, 0.27789968252182007, 0.30266356468200684, 0.327427476644516, 0.35219138860702515, 0.3769553005695343, 0.40171921253204346, 0.4264830946922302, 0.4512470066547394, 0.47601091861724854, 0.5007748007774353, 0.5255387425422668, 0.5503026247024536, 0.5750665664672852, 0.5998304486274719, 0.6245943903923035, 0.6493582725524902, 0.6741222143173218, 0.6988860964775085, 0.7236499786376953]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 12.0, 14.0, 15.0, 23.0, 38.0, 55.0, 58.0, 83.0, 124.0, 166.0, 253.0, 372.0, 571.0, 887.0, 1378.0, 2283.0, 3768.0, 6685.0, 12171.0, 24038.0, 52566.0, 145241.0, 818752.0, 2779892.0, 212834.0, 68466.0, 29349.0, 14679.0, 7935.0, 4464.0, 2545.0, 1565.0, 1001.0, 616.0, 443.0, 276.0, 183.0, 137.0, 90.0, 59.0, 51.0, 36.0, 24.0, 24.0, 14.0, 10.0, 4.0, 9.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1453857421875, -0.14086341857910156, -0.13634109497070312, -0.1318187713623047, -0.12729644775390625, -0.12277412414550781, -0.11825180053710938, -0.11372947692871094, -0.1092071533203125, -0.10468482971191406, -0.10016250610351562, -0.09564018249511719, -0.09111785888671875, -0.08659553527832031, -0.08207321166992188, -0.07755088806152344, -0.073028564453125, -0.06850624084472656, -0.06398391723632812, -0.05946159362792969, -0.05493927001953125, -0.05041694641113281, -0.045894622802734375, -0.04137229919433594, -0.0368499755859375, -0.03232765197753906, -0.027805328369140625, -0.023283004760742188, -0.01876068115234375, -0.014238357543945312, -0.009716033935546875, -0.0051937103271484375, -0.00067138671875, 0.0038509368896484375, 0.008373260498046875, 0.012895584106445312, 0.01741790771484375, 0.021940231323242188, 0.026462554931640625, 0.030984878540039062, 0.0355072021484375, 0.04002952575683594, 0.044551849365234375, 0.04907417297363281, 0.05359649658203125, 0.05811882019042969, 0.06264114379882812, 0.06716346740722656, 0.071685791015625, 0.07620811462402344, 0.08073043823242188, 0.08525276184082031, 0.08977508544921875, 0.09429740905761719, 0.09881973266601562, 0.10334205627441406, 0.1078643798828125, 0.11238670349121094, 0.11690902709960938, 0.12143135070800781, 0.12595367431640625, 0.1304759979248047, 0.13499832153320312, 0.13952064514160156, 0.14404296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 8.0, 7.0, 13.0, 4.0, 18.0, 9.0, 24.0, 22.0, 27.0, 31.0, 40.0, 51.0, 56.0, 59.0, 63.0, 65.0, 50.0, 62.0, 52.0, 53.0, 55.0, 36.0, 29.0, 32.0, 30.0, 32.0, 14.0, 14.0, 16.0, 9.0, 7.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055755615234375, -0.054257869720458984, -0.05276012420654297, -0.05126237869262695, -0.04976463317871094, -0.04826688766479492, -0.046769142150878906, -0.04527139663696289, -0.043773651123046875, -0.04227590560913086, -0.040778160095214844, -0.03928041458129883, -0.03778266906738281, -0.0362849235534668, -0.03478717803955078, -0.033289432525634766, -0.03179168701171875, -0.030293941497802734, -0.02879619598388672, -0.027298450469970703, -0.025800704956054688, -0.024302959442138672, -0.022805213928222656, -0.02130746841430664, -0.019809722900390625, -0.01831197738647461, -0.016814231872558594, -0.015316486358642578, -0.013818740844726562, -0.012320995330810547, -0.010823249816894531, -0.009325504302978516, -0.0078277587890625, -0.006330013275146484, -0.004832267761230469, -0.003334522247314453, -0.0018367767333984375, -0.0003390312194824219, 0.0011587142944335938, 0.0026564598083496094, 0.004154205322265625, 0.005651950836181641, 0.007149696350097656, 0.008647441864013672, 0.010145187377929688, 0.011642932891845703, 0.013140678405761719, 0.014638423919677734, 0.01613616943359375, 0.017633914947509766, 0.01913166046142578, 0.020629405975341797, 0.022127151489257812, 0.023624897003173828, 0.025122642517089844, 0.02662038803100586, 0.028118133544921875, 0.02961587905883789, 0.031113624572753906, 0.03261137008666992, 0.03410911560058594, 0.03560686111450195, 0.03710460662841797, 0.038602352142333984, 0.04010009765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 5.0, 6.0, 10.0, 12.0, 15.0, 24.0, 31.0, 40.0, 66.0, 90.0, 142.0, 184.0, 307.0, 570.0, 1054.0, 2992.0, 12098.0, 92815.0, 3706367.0, 343068.0, 25731.0, 5185.0, 1585.0, 723.0, 407.0, 241.0, 154.0, 111.0, 80.0, 39.0, 33.0, 29.0, 20.0, 16.0, 12.0, 7.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5704803466796875, -0.553558349609375, -0.5366363525390625, -0.51971435546875, -0.5027923583984375, -0.485870361328125, -0.4689483642578125, -0.4520263671875, -0.4351043701171875, -0.418182373046875, -0.4012603759765625, -0.38433837890625, -0.3674163818359375, -0.350494384765625, -0.3335723876953125, -0.316650390625, -0.2997283935546875, -0.282806396484375, -0.2658843994140625, -0.24896240234375, -0.2320404052734375, -0.215118408203125, -0.1981964111328125, -0.1812744140625, -0.1643524169921875, -0.147430419921875, -0.1305084228515625, -0.11358642578125, -0.0966644287109375, -0.079742431640625, -0.0628204345703125, -0.0458984375, -0.0289764404296875, -0.012054443359375, 0.0048675537109375, 0.02178955078125, 0.0387115478515625, 0.055633544921875, 0.0725555419921875, 0.0894775390625, 0.1063995361328125, 0.123321533203125, 0.1402435302734375, 0.15716552734375, 0.1740875244140625, 0.191009521484375, 0.2079315185546875, 0.224853515625, 0.2417755126953125, 0.258697509765625, 0.2756195068359375, 0.29254150390625, 0.3094635009765625, 0.326385498046875, 0.3433074951171875, 0.3602294921875, 0.3771514892578125, 0.394073486328125, 0.4109954833984375, 0.42791748046875, 0.4448394775390625, 0.461761474609375, 0.4786834716796875, 0.49560546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 23.0, 29.0, 28.0, 88.0, 180.0, 486.0, 2338.0, 555.0, 168.0, 90.0, 34.0, 15.0, 15.0, 4.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.263671875, -0.2568206787109375, -0.249969482421875, -0.2431182861328125, -0.23626708984375, -0.2294158935546875, -0.222564697265625, -0.2157135009765625, -0.2088623046875, -0.2020111083984375, -0.195159912109375, -0.1883087158203125, -0.18145751953125, -0.1746063232421875, -0.167755126953125, -0.1609039306640625, -0.154052734375, -0.1472015380859375, -0.140350341796875, -0.1334991455078125, -0.12664794921875, -0.1197967529296875, -0.112945556640625, -0.1060943603515625, -0.0992431640625, -0.0923919677734375, -0.085540771484375, -0.0786895751953125, -0.07183837890625, -0.0649871826171875, -0.058135986328125, -0.0512847900390625, -0.04443359375, -0.0375823974609375, -0.030731201171875, -0.0238800048828125, -0.01702880859375, -0.0101776123046875, -0.003326416015625, 0.0035247802734375, 0.0103759765625, 0.0172271728515625, 0.024078369140625, 0.0309295654296875, 0.03778076171875, 0.0446319580078125, 0.051483154296875, 0.0583343505859375, 0.065185546875, 0.0720367431640625, 0.078887939453125, 0.0857391357421875, 0.09259033203125, 0.0994415283203125, 0.106292724609375, 0.1131439208984375, 0.1199951171875, 0.1268463134765625, 0.133697509765625, 0.1405487060546875, 0.14739990234375, 0.1542510986328125, 0.161102294921875, 0.1679534912109375, 0.1748046875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 7.0, 14.0, 35.0, 61.0, 115.0, 180.0, 204.0, 180.0, 93.0, 52.0, 38.0, 10.0, 11.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5477823615074158, -0.503001868724823, -0.45822134613990784, -0.41344085335731506, -0.3686603307723999, -0.32387983798980713, -0.27909934520721436, -0.2343188226222992, -0.18953832983970642, -0.14475782215595245, -0.09997732192277908, -0.05519682168960571, -0.010416314005851746, 0.03436419367790222, 0.079144686460495, 0.12392520904541016, 0.16870570182800293, 0.2134862095117569, 0.25826671719551086, 0.30304720997810364, 0.3478277325630188, 0.3926082253456116, 0.43738871812820435, 0.4821692407131195, 0.5269497632980347, 0.5717302560806274, 0.6165107488632202, 0.661291241645813, 0.7060717940330505, 0.7508522868156433, 0.7956327795982361, 0.8404133319854736, 0.8851937055587769, 0.9299741983413696, 0.9747546911239624, 1.0195351839065552, 1.064315676689148, 1.1090962886810303, 1.153876781463623, 1.1986572742462158, 1.2434377670288086, 1.2882182598114014, 1.3329987525939941, 1.377779245376587, 1.4225597381591797, 1.4673402309417725, 1.5121207237243652, 1.5569013357162476, 1.6016817092895508, 1.6464622020721436, 1.6912426948547363, 1.736023187637329, 1.7808036804199219, 1.8255841732025146, 1.8703646659851074, 1.9151452779769897, 1.9599257707595825, 2.004706382751465, 2.0494868755340576, 2.0942673683166504, 2.139047861099243, 2.183828353881836, 2.2286088466644287, 2.2733893394470215, 2.3181698322296143]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 12.0, 7.0, 9.0, 17.0, 15.0, 12.0, 20.0, 24.0, 15.0, 31.0, 25.0, 29.0, 33.0, 23.0, 27.0, 37.0, 28.0, 48.0, 39.0, 25.0, 35.0, 34.0, 40.0, 35.0, 36.0, 34.0, 24.0, 34.0, 26.0, 22.0, 19.0, 24.0, 27.0, 13.0, 12.0, 9.0, 15.0, 13.0, 3.0, 9.0, 6.0, 9.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3982389569282532, -0.3861745297908783, -0.3741101324558258, -0.3620457053184509, -0.34998130798339844, -0.33791688084602356, -0.3258524537086487, -0.3137880563735962, -0.3017236292362213, -0.28965920209884644, -0.27759480476379395, -0.26553037762641907, -0.2534659802913666, -0.2414015531539917, -0.22933714091777802, -0.21727272868156433, -0.20520831644535065, -0.19314390420913696, -0.18107949197292328, -0.1690150797367096, -0.15695065259933472, -0.14488624036312103, -0.13282182812690735, -0.12075740844011307, -0.10869299620389938, -0.0966285839676857, -0.08456416428089142, -0.07249975204467773, -0.06043533608317375, -0.04837092012166977, -0.036306507885456085, -0.024242088198661804, -0.01217767596244812, -0.00011326093226671219, 0.011951154097914696, 0.02401556819677353, 0.03607998415827751, 0.048144400119781494, 0.06020881235599518, 0.07227323204278946, 0.08433764427900314, 0.09640205651521683, 0.10846647620201111, 0.12053088843822479, 0.13259530067443848, 0.14465972781181335, 0.15672412514686584, 0.16878855228424072, 0.1808529645204544, 0.1929173767566681, 0.20498178899288177, 0.21704620122909546, 0.22911062836647034, 0.24117504060268402, 0.2532394528388977, 0.2653038799762726, 0.2773682773113251, 0.28943270444869995, 0.30149710178375244, 0.3135615289211273, 0.3256259262561798, 0.3376903533935547, 0.3497547507286072, 0.36181917786598206, 0.37388360500335693]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 15.0, 23.0, 36.0, 84.0, 111.0, 164.0, 354.0, 713.0, 1492.0, 3270.0, 7662.0, 18672.0, 47654.0, 119890.0, 351489.0, 315788.0, 108062.0, 43101.0, 17270.0, 6935.0, 2949.0, 1335.0, 664.0, 324.0, 214.0, 120.0, 60.0, 34.0, 20.0, 14.0, 10.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2236328125, -0.21723365783691406, -0.21083450317382812, -0.2044353485107422, -0.19803619384765625, -0.1916370391845703, -0.18523788452148438, -0.17883872985839844, -0.1724395751953125, -0.16604042053222656, -0.15964126586914062, -0.1532421112060547, -0.14684295654296875, -0.1404438018798828, -0.13404464721679688, -0.12764549255371094, -0.121246337890625, -0.11484718322753906, -0.10844802856445312, -0.10204887390136719, -0.09564971923828125, -0.08925056457519531, -0.08285140991210938, -0.07645225524902344, -0.0700531005859375, -0.06365394592285156, -0.057254791259765625, -0.05085563659667969, -0.04445648193359375, -0.03805732727050781, -0.031658172607421875, -0.025259017944335938, -0.01885986328125, -0.012460708618164062, -0.006061553955078125, 0.0003376007080078125, 0.00673675537109375, 0.013135910034179688, 0.019535064697265625, 0.025934219360351562, 0.0323333740234375, 0.03873252868652344, 0.045131683349609375, 0.05153083801269531, 0.05792999267578125, 0.06432914733886719, 0.07072830200195312, 0.07712745666503906, 0.083526611328125, 0.08992576599121094, 0.09632492065429688, 0.10272407531738281, 0.10912322998046875, 0.11552238464355469, 0.12192153930664062, 0.12832069396972656, 0.1347198486328125, 0.14111900329589844, 0.14751815795898438, 0.1539173126220703, 0.16031646728515625, 0.1667156219482422, 0.17311477661132812, 0.17951393127441406, 0.1859130859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 11.0, 8.0, 10.0, 13.0, 13.0, 15.0, 19.0, 23.0, 26.0, 27.0, 36.0, 41.0, 50.0, 44.0, 57.0, 50.0, 47.0, 51.0, 56.0, 49.0, 49.0, 41.0, 44.0, 37.0, 34.0, 30.0, 24.0, 16.0, 21.0, 18.0, 10.0, 10.0, 5.0, 8.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06494140625, -0.0631871223449707, -0.061432838439941406, -0.05967855453491211, -0.05792427062988281, -0.056169986724853516, -0.05441570281982422, -0.05266141891479492, -0.050907135009765625, -0.04915285110473633, -0.04739856719970703, -0.045644283294677734, -0.04388999938964844, -0.04213571548461914, -0.040381431579589844, -0.03862714767456055, -0.03687286376953125, -0.03511857986450195, -0.033364295959472656, -0.03161001205444336, -0.029855728149414062, -0.028101444244384766, -0.02634716033935547, -0.024592876434326172, -0.022838592529296875, -0.021084308624267578, -0.01933002471923828, -0.017575740814208984, -0.015821456909179688, -0.01406717300415039, -0.012312889099121094, -0.010558605194091797, -0.0088043212890625, -0.007050037384033203, -0.005295753479003906, -0.0035414695739746094, -0.0017871856689453125, -3.2901763916015625e-05, 0.0017213821411132812, 0.003475666046142578, 0.005229949951171875, 0.006984233856201172, 0.008738517761230469, 0.010492801666259766, 0.012247085571289062, 0.01400136947631836, 0.015755653381347656, 0.017509937286376953, 0.01926422119140625, 0.021018505096435547, 0.022772789001464844, 0.02452707290649414, 0.026281356811523438, 0.028035640716552734, 0.02978992462158203, 0.03154420852661133, 0.033298492431640625, 0.03505277633666992, 0.03680706024169922, 0.038561344146728516, 0.04031562805175781, 0.04206991195678711, 0.043824195861816406, 0.0455784797668457, 0.047332763671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 6.0, 15.0, 23.0, 30.0, 48.0, 66.0, 103.0, 167.0, 252.0, 408.0, 629.0, 1100.0, 2349.0, 7403.0, 36067.0, 220489.0, 651240.0, 102249.0, 17490.0, 4492.0, 1760.0, 837.0, 472.0, 278.0, 179.0, 136.0, 79.0, 46.0, 43.0, 26.0, 17.0, 16.0, 10.0, 9.0, 7.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.459716796875, -0.4470481872558594, -0.43437957763671875, -0.4217109680175781, -0.4090423583984375, -0.3963737487792969, -0.38370513916015625, -0.3710365295410156, -0.358367919921875, -0.3456993103027344, -0.33303070068359375, -0.3203620910644531, -0.3076934814453125, -0.2950248718261719, -0.28235626220703125, -0.2696876525878906, -0.25701904296875, -0.24435043334960938, -0.23168182373046875, -0.21901321411132812, -0.2063446044921875, -0.19367599487304688, -0.18100738525390625, -0.16833877563476562, -0.155670166015625, -0.14300155639648438, -0.13033294677734375, -0.11766433715820312, -0.1049957275390625, -0.09232711791992188, -0.07965850830078125, -0.06698989868164062, -0.0543212890625, -0.041652679443359375, -0.02898406982421875, -0.016315460205078125, -0.0036468505859375, 0.009021759033203125, 0.02169036865234375, 0.034358978271484375, 0.047027587890625, 0.059696197509765625, 0.07236480712890625, 0.08503341674804688, 0.0977020263671875, 0.11037063598632812, 0.12303924560546875, 0.13570785522460938, 0.14837646484375, 0.16104507446289062, 0.17371368408203125, 0.18638229370117188, 0.1990509033203125, 0.21171951293945312, 0.22438812255859375, 0.23705673217773438, 0.249725341796875, 0.2623939514160156, 0.27506256103515625, 0.2877311706542969, 0.3003997802734375, 0.3130683898925781, 0.32573699951171875, 0.3384056091308594, 0.35107421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 3.0, 3.0, 10.0, 7.0, 6.0, 9.0, 18.0, 22.0, 17.0, 19.0, 34.0, 21.0, 35.0, 47.0, 46.0, 42.0, 47.0, 52.0, 49.0, 56.0, 53.0, 54.0, 38.0, 48.0, 35.0, 36.0, 35.0, 27.0, 33.0, 23.0, 9.0, 4.0, 13.0, 8.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.295654296875, -0.285919189453125, -0.27618408203125, -0.266448974609375, -0.2567138671875, -0.246978759765625, -0.23724365234375, -0.227508544921875, -0.2177734375, -0.208038330078125, -0.19830322265625, -0.188568115234375, -0.1788330078125, -0.169097900390625, -0.15936279296875, -0.149627685546875, -0.139892578125, -0.130157470703125, -0.12042236328125, -0.110687255859375, -0.1009521484375, -0.091217041015625, -0.08148193359375, -0.071746826171875, -0.06201171875, -0.052276611328125, -0.04254150390625, -0.032806396484375, -0.0230712890625, -0.013336181640625, -0.00360107421875, 0.006134033203125, 0.015869140625, 0.025604248046875, 0.03533935546875, 0.045074462890625, 0.0548095703125, 0.064544677734375, 0.07427978515625, 0.084014892578125, 0.09375, 0.103485107421875, 0.11322021484375, 0.122955322265625, 0.1326904296875, 0.142425537109375, 0.15216064453125, 0.161895751953125, 0.171630859375, 0.181365966796875, 0.19110107421875, 0.200836181640625, 0.2105712890625, 0.220306396484375, 0.23004150390625, 0.239776611328125, 0.24951171875, 0.259246826171875, 0.26898193359375, 0.278717041015625, 0.2884521484375, 0.298187255859375, 0.30792236328125, 0.317657470703125, 0.327392578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 12.0, 12.0, 19.0, 27.0, 37.0, 79.0, 132.0, 197.0, 468.0, 1021.0, 2806.0, 11092.0, 80313.0, 710797.0, 209617.0, 24452.0, 4700.0, 1508.0, 575.0, 268.0, 147.0, 104.0, 51.0, 42.0, 21.0, 16.0, 6.0, 10.0, 7.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.261962890625, -0.2531471252441406, -0.24433135986328125, -0.23551559448242188, -0.2266998291015625, -0.21788406372070312, -0.20906829833984375, -0.20025253295898438, -0.191436767578125, -0.18262100219726562, -0.17380523681640625, -0.16498947143554688, -0.1561737060546875, -0.14735794067382812, -0.13854217529296875, -0.12972640991210938, -0.12091064453125, -0.11209487915039062, -0.10327911376953125, -0.09446334838867188, -0.0856475830078125, -0.07683181762695312, -0.06801605224609375, -0.059200286865234375, -0.050384521484375, -0.041568756103515625, -0.03275299072265625, -0.023937225341796875, -0.0151214599609375, -0.006305694580078125, 0.00251007080078125, 0.011325836181640625, 0.0201416015625, 0.028957366943359375, 0.03777313232421875, 0.046588897705078125, 0.0554046630859375, 0.06422042846679688, 0.07303619384765625, 0.08185195922851562, 0.090667724609375, 0.09948348999023438, 0.10829925537109375, 0.11711502075195312, 0.1259307861328125, 0.13474655151367188, 0.14356231689453125, 0.15237808227539062, 0.16119384765625, 0.17000961303710938, 0.17882537841796875, 0.18764114379882812, 0.1964569091796875, 0.20527267456054688, 0.21408843994140625, 0.22290420532226562, 0.231719970703125, 0.24053573608398438, 0.24935150146484375, 0.2581672668457031, 0.2669830322265625, 0.2757987976074219, 0.28461456298828125, 0.2934303283691406, 0.30224609375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 7.0, 4.0, 11.0, 16.0, 17.0, 23.0, 30.0, 44.0, 52.0, 71.0, 82.0, 81.0, 105.0, 112.0, 80.0, 67.0, 43.0, 43.0, 35.0, 27.0, 11.0, 8.0, 9.0, 7.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.422136306762695e-05, -8.10353085398674e-05, -7.784925401210785e-05, -7.46631994843483e-05, -7.147714495658875e-05, -6.829109042882919e-05, -6.510503590106964e-05, -6.191898137331009e-05, -5.873292684555054e-05, -5.5546872317790985e-05, -5.236081779003143e-05, -4.917476326227188e-05, -4.598870873451233e-05, -4.280265420675278e-05, -3.9616599678993225e-05, -3.643054515123367e-05, -3.324449062347412e-05, -3.005843609571457e-05, -2.6872381567955017e-05, -2.3686327040195465e-05, -2.0500272512435913e-05, -1.731421798467636e-05, -1.4128163456916809e-05, -1.0942108929157257e-05, -7.756054401397705e-06, -4.569999873638153e-06, -1.383945345878601e-06, 1.802109181880951e-06, 4.988163709640503e-06, 8.174218237400055e-06, 1.1360272765159607e-05, 1.4546327292919159e-05, 1.773238182067871e-05, 2.0918436348438263e-05, 2.4104490876197815e-05, 2.7290545403957367e-05, 3.047659993171692e-05, 3.366265445947647e-05, 3.684870898723602e-05, 4.0034763514995575e-05, 4.322081804275513e-05, 4.640687257051468e-05, 4.959292709827423e-05, 5.277898162603378e-05, 5.5965036153793335e-05, 5.915109068155289e-05, 6.233714520931244e-05, 6.552319973707199e-05, 6.870925426483154e-05, 7.18953087925911e-05, 7.508136332035065e-05, 7.82674178481102e-05, 8.145347237586975e-05, 8.46395269036293e-05, 8.782558143138885e-05, 9.101163595914841e-05, 9.419769048690796e-05, 9.738374501466751e-05, 0.00010056979954242706, 0.00010375585407018661, 0.00010694190859794617, 0.00011012796312570572, 0.00011331401765346527, 0.00011650007218122482, 0.00011968612670898438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 7.0, 8.0, 15.0, 20.0, 11.0, 24.0, 45.0, 58.0, 93.0, 113.0, 191.0, 334.0, 556.0, 1053.0, 2402.0, 6750.0, 30656.0, 204639.0, 658756.0, 115011.0, 18860.0, 4924.0, 1870.0, 893.0, 464.0, 281.0, 154.0, 114.0, 68.0, 55.0, 31.0, 24.0, 21.0, 15.0, 10.0, 10.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.2274341583251953, -0.22061538696289062, -0.21379661560058594, -0.20697784423828125, -0.20015907287597656, -0.19334030151367188, -0.1865215301513672, -0.1797027587890625, -0.1728839874267578, -0.16606521606445312, -0.15924644470214844, -0.15242767333984375, -0.14560890197753906, -0.13879013061523438, -0.1319713592529297, -0.125152587890625, -0.11833381652832031, -0.11151504516601562, -0.10469627380371094, -0.09787750244140625, -0.09105873107910156, -0.08423995971679688, -0.07742118835449219, -0.0706024169921875, -0.06378364562988281, -0.056964874267578125, -0.05014610290527344, -0.04332733154296875, -0.03650856018066406, -0.029689788818359375, -0.022871017456054688, -0.01605224609375, -0.009233474731445312, -0.002414703369140625, 0.0044040679931640625, 0.01122283935546875, 0.018041610717773438, 0.024860382080078125, 0.03167915344238281, 0.0384979248046875, 0.04531669616699219, 0.052135467529296875, 0.05895423889160156, 0.06577301025390625, 0.07259178161621094, 0.07941055297851562, 0.08622932434082031, 0.093048095703125, 0.09986686706542969, 0.10668563842773438, 0.11350440979003906, 0.12032318115234375, 0.12714195251464844, 0.13396072387695312, 0.1407794952392578, 0.1475982666015625, 0.1544170379638672, 0.16123580932617188, 0.16805458068847656, 0.17487335205078125, 0.18169212341308594, 0.18851089477539062, 0.1953296661376953, 0.2021484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 7.0, 5.0, 4.0, 8.0, 15.0, 28.0, 23.0, 31.0, 51.0, 49.0, 53.0, 73.0, 75.0, 106.0, 93.0, 82.0, 55.0, 42.0, 45.0, 33.0, 19.0, 28.0, 18.0, 9.0, 10.0, 7.0, 5.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.1361408233642578, -0.13153457641601562, -0.12692832946777344, -0.12232208251953125, -0.11771583557128906, -0.11310958862304688, -0.10850334167480469, -0.1038970947265625, -0.09929084777832031, -0.09468460083007812, -0.09007835388183594, -0.08547210693359375, -0.08086585998535156, -0.07625961303710938, -0.07165336608886719, -0.067047119140625, -0.06244087219238281, -0.057834625244140625, -0.05322837829589844, -0.04862213134765625, -0.04401588439941406, -0.039409637451171875, -0.03480339050292969, -0.0301971435546875, -0.025590896606445312, -0.020984649658203125, -0.016378402709960938, -0.01177215576171875, -0.0071659088134765625, -0.002559661865234375, 0.0020465850830078125, 0.00665283203125, 0.011259078979492188, 0.015865325927734375, 0.020471572875976562, 0.02507781982421875, 0.029684066772460938, 0.034290313720703125, 0.03889656066894531, 0.0435028076171875, 0.04810905456542969, 0.052715301513671875, 0.05732154846191406, 0.06192779541015625, 0.06653404235839844, 0.07114028930664062, 0.07574653625488281, 0.080352783203125, 0.08495903015136719, 0.08956527709960938, 0.09417152404785156, 0.09877777099609375, 0.10338401794433594, 0.10799026489257812, 0.11259651184082031, 0.1172027587890625, 0.12180900573730469, 0.12641525268554688, 0.13102149963378906, 0.13562774658203125, 0.14023399353027344, 0.14484024047851562, 0.1494464874267578, 0.154052734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 10.0, 9.0, 24.0, 26.0, 50.0, 87.0, 99.0, 117.0, 113.0, 125.0, 82.0, 80.0, 62.0, 33.0, 26.0, 21.0, 11.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.087712287902832, -2.019488573074341, -1.95126473903656, -1.8830409049987793, -1.814817190170288, -1.7465933561325073, -1.6783695220947266, -1.6101458072662354, -1.5419219732284546, -1.4736981391906738, -1.4054744243621826, -1.3372505903244019, -1.269026756286621, -1.2008030414581299, -1.1325792074203491, -1.0643553733825684, -0.9961316585540771, -0.9279078841209412, -0.8596841096878052, -0.7914602756500244, -0.7232365012168884, -0.6550127267837524, -0.5867888927459717, -0.5185651183128357, -0.4503413438796997, -0.3821175694465637, -0.31389376521110535, -0.24566997587680817, -0.177446186542511, -0.109222412109375, -0.040998607873916626, 0.027225196361541748, 0.09544897079467773, 0.16367276012897491, 0.2318965494632721, 0.30012035369873047, 0.36834412813186646, 0.43656790256500244, 0.5047917366027832, 0.5730155110359192, 0.6412392854690552, 0.7094630599021912, 0.7776868343353271, 0.8459106683731079, 0.9141344428062439, 0.9823582172393799, 1.0505820512771606, 1.1188058853149414, 1.1870296001434326, 1.2552534341812134, 1.3234771490097046, 1.3917009830474854, 1.4599246978759766, 1.5281485319137573, 1.596372365951538, 1.6645960807800293, 1.73281991481781, 1.8010437488555908, 1.869267463684082, 1.9374912977218628, 2.0057151317596436, 2.0739388465881348, 2.142162561416626, 2.2103865146636963, 2.2786102294921875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 4.0, 7.0, 9.0, 12.0, 21.0, 13.0, 21.0, 14.0, 25.0, 30.0, 22.0, 36.0, 43.0, 37.0, 42.0, 44.0, 43.0, 45.0, 53.0, 48.0, 38.0, 42.0, 35.0, 39.0, 49.0, 40.0, 29.0, 20.0, 21.0, 25.0, 21.0, 20.0, 10.0, 9.0, 5.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5358490943908691, -1.4835495948791504, -1.4312502145767212, -1.3789507150650024, -1.3266513347625732, -1.2743518352508545, -1.2220523357391357, -1.169752836227417, -1.1174534559249878, -1.065153956413269, -1.0128545761108398, -0.9605550765991211, -0.9082556366920471, -0.8559561967849731, -0.8036566972732544, -0.7513572573661804, -0.6990578174591064, -0.6467583775520325, -0.5944589376449585, -0.5421594381332397, -0.48985999822616577, -0.4375605583190918, -0.38526108860969543, -0.3329616189002991, -0.2806621789932251, -0.22836272418498993, -0.17606326937675476, -0.12376381456851959, -0.07146435976028442, -0.01916491985321045, 0.03313454985618591, 0.08543401956558228, 0.1377335786819458, 0.19003303349018097, 0.24233248829841614, 0.2946319580078125, 0.3469313979148865, 0.39923083782196045, 0.4515303075313568, 0.5038297772407532, 0.5561292171478271, 0.6084286570549011, 0.6607280969619751, 0.7130275964736938, 0.7653270363807678, 0.8176264762878418, 0.8699259757995605, 0.9222254157066345, 0.9745248556137085, 1.0268243551254272, 1.0791237354278564, 1.1314232349395752, 1.183722734451294, 1.2360221147537231, 1.288321614265442, 1.340620994567871, 1.3929204940795898, 1.4452199935913086, 1.4975193738937378, 1.5498188734054565, 1.6021182537078857, 1.6544177532196045, 1.7067172527313232, 1.759016752243042, 1.8113161325454712]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 18.0, 11.0, 13.0, 27.0, 46.0, 47.0, 109.0, 148.0, 255.0, 385.0, 654.0, 1183.0, 2262.0, 4695.0, 10097.0, 25642.0, 82727.0, 536415.0, 3245396.0, 204886.0, 48396.0, 16681.0, 6965.0, 3290.0, 1652.0, 916.0, 509.0, 303.0, 191.0, 119.0, 90.0, 42.0, 43.0, 22.0, 17.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.291748046875, -0.28412818908691406, -0.2765083312988281, -0.2688884735107422, -0.26126861572265625, -0.2536487579345703, -0.24602890014648438, -0.23840904235839844, -0.2307891845703125, -0.22316932678222656, -0.21554946899414062, -0.2079296112060547, -0.20030975341796875, -0.1926898956298828, -0.18507003784179688, -0.17745018005371094, -0.169830322265625, -0.16221046447753906, -0.15459060668945312, -0.1469707489013672, -0.13935089111328125, -0.1317310333251953, -0.12411117553710938, -0.11649131774902344, -0.1088714599609375, -0.10125160217285156, -0.09363174438476562, -0.08601188659667969, -0.07839202880859375, -0.07077217102050781, -0.06315231323242188, -0.05553245544433594, -0.04791259765625, -0.04029273986816406, -0.032672882080078125, -0.025053024291992188, -0.01743316650390625, -0.009813308715820312, -0.002193450927734375, 0.0054264068603515625, 0.0130462646484375, 0.020666122436523438, 0.028285980224609375, 0.03590583801269531, 0.04352569580078125, 0.05114555358886719, 0.058765411376953125, 0.06638526916503906, 0.074005126953125, 0.08162498474121094, 0.08924484252929688, 0.09686470031738281, 0.10448455810546875, 0.11210441589355469, 0.11972427368164062, 0.12734413146972656, 0.1349639892578125, 0.14258384704589844, 0.15020370483398438, 0.1578235626220703, 0.16544342041015625, 0.1730632781982422, 0.18068313598632812, 0.18830299377441406, 0.1959228515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 13.0, 8.0, 12.0, 14.0, 25.0, 24.0, 25.0, 26.0, 32.0, 45.0, 33.0, 50.0, 54.0, 50.0, 64.0, 50.0, 51.0, 49.0, 54.0, 45.0, 53.0, 43.0, 40.0, 20.0, 25.0, 13.0, 16.0, 16.0, 12.0, 8.0, 6.0, 9.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.07916259765625, -0.07714080810546875, -0.0751190185546875, -0.07309722900390625, -0.071075439453125, -0.06905364990234375, -0.0670318603515625, -0.06501007080078125, -0.06298828125, -0.06096649169921875, -0.0589447021484375, -0.05692291259765625, -0.054901123046875, -0.05287933349609375, -0.0508575439453125, -0.04883575439453125, -0.04681396484375, -0.04479217529296875, -0.0427703857421875, -0.04074859619140625, -0.038726806640625, -0.03670501708984375, -0.0346832275390625, -0.03266143798828125, -0.0306396484375, -0.02861785888671875, -0.0265960693359375, -0.02457427978515625, -0.022552490234375, -0.02053070068359375, -0.0185089111328125, -0.01648712158203125, -0.01446533203125, -0.01244354248046875, -0.0104217529296875, -0.00839996337890625, -0.006378173828125, -0.00435638427734375, -0.0023345947265625, -0.00031280517578125, 0.001708984375, 0.00373077392578125, 0.0057525634765625, 0.00777435302734375, 0.009796142578125, 0.01181793212890625, 0.0138397216796875, 0.01586151123046875, 0.01788330078125, 0.01990509033203125, 0.0219268798828125, 0.02394866943359375, 0.025970458984375, 0.02799224853515625, 0.0300140380859375, 0.03203582763671875, 0.0340576171875, 0.03607940673828125, 0.0381011962890625, 0.04012298583984375, 0.042144775390625, 0.04416656494140625, 0.0461883544921875, 0.04821014404296875, 0.05023193359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 5.0, 8.0, 11.0, 10.0, 15.0, 24.0, 21.0, 38.0, 34.0, 62.0, 107.0, 130.0, 194.0, 315.0, 525.0, 930.0, 1752.0, 4671.0, 17355.0, 95395.0, 3069894.0, 921976.0, 60967.0, 12466.0, 3719.0, 1515.0, 811.0, 454.0, 268.0, 180.0, 124.0, 77.0, 57.0, 42.0, 32.0, 26.0, 17.0, 14.0, 8.0, 8.0, 2.0, 5.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 5.0], "bins": [-0.58837890625, -0.5719833374023438, -0.5555877685546875, -0.5391921997070312, -0.522796630859375, -0.5064010620117188, -0.4900054931640625, -0.47360992431640625, -0.45721435546875, -0.44081878662109375, -0.4244232177734375, -0.40802764892578125, -0.391632080078125, -0.37523651123046875, -0.3588409423828125, -0.34244537353515625, -0.3260498046875, -0.30965423583984375, -0.2932586669921875, -0.27686309814453125, -0.260467529296875, -0.24407196044921875, -0.2276763916015625, -0.21128082275390625, -0.19488525390625, -0.17848968505859375, -0.1620941162109375, -0.14569854736328125, -0.129302978515625, -0.11290740966796875, -0.0965118408203125, -0.08011627197265625, -0.063720703125, -0.04732513427734375, -0.0309295654296875, -0.01453399658203125, 0.001861572265625, 0.01825714111328125, 0.0346527099609375, 0.05104827880859375, 0.06744384765625, 0.08383941650390625, 0.1002349853515625, 0.11663055419921875, 0.133026123046875, 0.14942169189453125, 0.1658172607421875, 0.18221282958984375, 0.1986083984375, 0.21500396728515625, 0.2313995361328125, 0.24779510498046875, 0.264190673828125, 0.28058624267578125, 0.2969818115234375, 0.31337738037109375, 0.32977294921875, 0.34616851806640625, 0.3625640869140625, 0.37895965576171875, 0.395355224609375, 0.41175079345703125, 0.4281463623046875, 0.44454193115234375, 0.4609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 11.0, 15.0, 38.0, 69.0, 100.0, 246.0, 727.0, 2020.0, 463.0, 175.0, 83.0, 35.0, 40.0, 11.0, 11.0, 5.0, 3.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3523693084716797, -0.3429222106933594, -0.33347511291503906, -0.32402801513671875, -0.31458091735839844, -0.3051338195800781, -0.2956867218017578, -0.2862396240234375, -0.2767925262451172, -0.2673454284667969, -0.25789833068847656, -0.24845123291015625, -0.23900413513183594, -0.22955703735351562, -0.2201099395751953, -0.210662841796875, -0.2012157440185547, -0.19176864624023438, -0.18232154846191406, -0.17287445068359375, -0.16342735290527344, -0.15398025512695312, -0.1445331573486328, -0.1350860595703125, -0.1256389617919922, -0.11619186401367188, -0.10674476623535156, -0.09729766845703125, -0.08785057067871094, -0.07840347290039062, -0.06895637512207031, -0.05950927734375, -0.05006217956542969, -0.040615081787109375, -0.031167984008789062, -0.02172088623046875, -0.012273788452148438, -0.002826690673828125, 0.0066204071044921875, 0.0160675048828125, 0.025514602661132812, 0.034961700439453125, 0.04440879821777344, 0.05385589599609375, 0.06330299377441406, 0.07275009155273438, 0.08219718933105469, 0.091644287109375, 0.10109138488769531, 0.11053848266601562, 0.11998558044433594, 0.12943267822265625, 0.13887977600097656, 0.14832687377929688, 0.1577739715576172, 0.1672210693359375, 0.1766681671142578, 0.18611526489257812, 0.19556236267089844, 0.20500946044921875, 0.21445655822753906, 0.22390365600585938, 0.2333507537841797, 0.2427978515625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 13.0, 49.0, 111.0, 183.0, 232.0, 205.0, 123.0, 43.0, 26.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6873784065246582, -1.61225163936615, -1.5371248722076416, -1.4619981050491333, -1.386871337890625, -1.3117444515228271, -1.2366176843643188, -1.1614909172058105, -1.0863641500473022, -1.011237382888794, -0.9361106157302856, -0.8609837889671326, -0.7858570218086243, -0.710730254650116, -0.6356034278869629, -0.5604766607284546, -0.4853498935699463, -0.410223126411438, -0.3350963294506073, -0.2599695324897766, -0.1848427653312683, -0.10971599817276001, -0.03458920121192932, 0.04053759574890137, 0.11566436290740967, 0.19079114496707916, 0.26591792702674866, 0.34104472398757935, 0.41617149114608765, 0.49129825830459595, 0.566425085067749, 0.6415518522262573, 0.7166788578033447, 0.791805624961853, 0.8669323921203613, 0.9420592188835144, 1.017185926437378, 1.0923128128051758, 1.167439579963684, 1.2425663471221924, 1.3176931142807007, 1.392819881439209, 1.4679466485977173, 1.5430734157562256, 1.6182003021240234, 1.6933269500732422, 1.76845383644104, 1.8435806035995483, 1.9187073707580566, 1.993834137916565, 2.0689609050750732, 2.144087791442871, 2.21921443939209, 2.2943413257598877, 2.3694679737091064, 2.4445948600769043, 2.519721508026123, 2.594848394393921, 2.6699750423431396, 2.7451019287109375, 2.8202285766601562, 2.895355463027954, 2.970482110977173, 3.0456089973449707, 3.1207358837127686]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 6.0, 7.0, 7.0, 18.0, 14.0, 11.0, 23.0, 20.0, 34.0, 30.0, 43.0, 38.0, 42.0, 44.0, 43.0, 41.0, 42.0, 31.0, 38.0, 41.0, 39.0, 36.0, 39.0, 38.0, 30.0, 38.0, 29.0, 21.0, 23.0, 30.0, 12.0, 16.0, 8.0, 11.0, 21.0, 7.0, 3.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6243484616279602, -0.6034522652626038, -0.5825560688972473, -0.5616599321365356, -0.5407637357711792, -0.5198675394058228, -0.4989713430404663, -0.47807514667510986, -0.4571789801120758, -0.43628278374671936, -0.4153866171836853, -0.39449042081832886, -0.3735942244529724, -0.35269805788993835, -0.3318018615245819, -0.31090569496154785, -0.2900094985961914, -0.26911330223083496, -0.2482171356678009, -0.22732093930244446, -0.2064247578382492, -0.18552857637405396, -0.1646323800086975, -0.14373619854450226, -0.122840017080307, -0.10194383561611176, -0.08104764670133591, -0.06015145778656006, -0.03925527632236481, -0.018359094858169556, 0.0025371015071868896, 0.02343328297138214, 0.04432946443557739, 0.06522564589977264, 0.08612183481454849, 0.10701802372932434, 0.1279142051935196, 0.14881038665771484, 0.1697065830230713, 0.19060276448726654, 0.2114989459514618, 0.23239512741565704, 0.2532913088798523, 0.27418750524520874, 0.2950837016105652, 0.31597986817359924, 0.3368760645389557, 0.35777223110198975, 0.3786684274673462, 0.39956462383270264, 0.4204607903957367, 0.44135698676109314, 0.4622531533241272, 0.48314934968948364, 0.5040455460548401, 0.5249417424201965, 0.5458378791809082, 0.5667340755462646, 0.5876302719116211, 0.6085264682769775, 0.6294226050376892, 0.6503188014030457, 0.6712149977684021, 0.6921111941337585, 0.713007390499115]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 9.0, 8.0, 14.0, 17.0, 23.0, 35.0, 73.0, 109.0, 182.0, 309.0, 476.0, 807.0, 1458.0, 2688.0, 4929.0, 9512.0, 19397.0, 40804.0, 89126.0, 183316.0, 278240.0, 212188.0, 107134.0, 49725.0, 23534.0, 11475.0, 5822.0, 3096.0, 1722.0, 958.0, 548.0, 303.0, 181.0, 119.0, 77.0, 44.0, 31.0, 22.0, 12.0, 8.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1981201171875, -0.1923980712890625, -0.186676025390625, -0.1809539794921875, -0.17523193359375, -0.1695098876953125, -0.163787841796875, -0.1580657958984375, -0.15234375, -0.1466217041015625, -0.140899658203125, -0.1351776123046875, -0.12945556640625, -0.1237335205078125, -0.118011474609375, -0.1122894287109375, -0.1065673828125, -0.1008453369140625, -0.095123291015625, -0.0894012451171875, -0.08367919921875, -0.0779571533203125, -0.072235107421875, -0.0665130615234375, -0.060791015625, -0.0550689697265625, -0.049346923828125, -0.0436248779296875, -0.03790283203125, -0.0321807861328125, -0.026458740234375, -0.0207366943359375, -0.0150146484375, -0.0092926025390625, -0.003570556640625, 0.0021514892578125, 0.00787353515625, 0.0135955810546875, 0.019317626953125, 0.0250396728515625, 0.03076171875, 0.0364837646484375, 0.042205810546875, 0.0479278564453125, 0.05364990234375, 0.0593719482421875, 0.065093994140625, 0.0708160400390625, 0.0765380859375, 0.0822601318359375, 0.087982177734375, 0.0937042236328125, 0.09942626953125, 0.1051483154296875, 0.110870361328125, 0.1165924072265625, 0.122314453125, 0.1280364990234375, 0.133758544921875, 0.1394805908203125, 0.14520263671875, 0.1509246826171875, 0.156646728515625, 0.1623687744140625, 0.1680908203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 7.0, 11.0, 12.0, 12.0, 17.0, 18.0, 18.0, 33.0, 37.0, 22.0, 34.0, 20.0, 38.0, 46.0, 54.0, 54.0, 48.0, 39.0, 43.0, 48.0, 50.0, 48.0, 31.0, 38.0, 32.0, 26.0, 21.0, 27.0, 15.0, 18.0, 8.0, 13.0, 16.0, 8.0, 3.0, 8.0, 4.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06913518905639648, -0.06710338592529297, -0.06507158279418945, -0.06303977966308594, -0.06100797653198242, -0.058976173400878906, -0.05694437026977539, -0.054912567138671875, -0.05288076400756836, -0.050848960876464844, -0.04881715774536133, -0.04678535461425781, -0.0447535514831543, -0.04272174835205078, -0.040689945220947266, -0.03865814208984375, -0.036626338958740234, -0.03459453582763672, -0.0325627326965332, -0.030530929565429688, -0.028499126434326172, -0.026467323303222656, -0.02443552017211914, -0.022403717041015625, -0.02037191390991211, -0.018340110778808594, -0.016308307647705078, -0.014276504516601562, -0.012244701385498047, -0.010212898254394531, -0.008181095123291016, -0.0061492919921875, -0.004117488861083984, -0.0020856857299804688, -5.3882598876953125e-05, 0.0019779205322265625, 0.004009723663330078, 0.006041526794433594, 0.00807332992553711, 0.010105133056640625, 0.01213693618774414, 0.014168739318847656, 0.016200542449951172, 0.018232345581054688, 0.020264148712158203, 0.02229595184326172, 0.024327754974365234, 0.02635955810546875, 0.028391361236572266, 0.03042316436767578, 0.0324549674987793, 0.03448677062988281, 0.03651857376098633, 0.038550376892089844, 0.04058218002319336, 0.042613983154296875, 0.04464578628540039, 0.046677589416503906, 0.04870939254760742, 0.05074119567871094, 0.05277299880981445, 0.05480480194091797, 0.056836605072021484, 0.058868408203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 8.0, 13.0, 18.0, 30.0, 34.0, 42.0, 68.0, 124.0, 140.0, 239.0, 341.0, 586.0, 1157.0, 2321.0, 5538.0, 18534.0, 110861.0, 607832.0, 250230.0, 35282.0, 8438.0, 3211.0, 1479.0, 768.0, 443.0, 286.0, 146.0, 131.0, 72.0, 60.0, 35.0, 26.0, 16.0, 14.0, 5.0, 8.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497802734375, -0.4825782775878906, -0.46735382080078125, -0.4521293640136719, -0.4369049072265625, -0.4216804504394531, -0.40645599365234375, -0.3912315368652344, -0.376007080078125, -0.3607826232910156, -0.34555816650390625, -0.3303337097167969, -0.3151092529296875, -0.2998847961425781, -0.28466033935546875, -0.2694358825683594, -0.25421142578125, -0.23898696899414062, -0.22376251220703125, -0.20853805541992188, -0.1933135986328125, -0.17808914184570312, -0.16286468505859375, -0.14764022827148438, -0.132415771484375, -0.11719131469726562, -0.10196685791015625, -0.08674240112304688, -0.0715179443359375, -0.056293487548828125, -0.04106903076171875, -0.025844573974609375, -0.0106201171875, 0.004604339599609375, 0.01982879638671875, 0.035053253173828125, 0.0502777099609375, 0.06550216674804688, 0.08072662353515625, 0.09595108032226562, 0.111175537109375, 0.12639999389648438, 0.14162445068359375, 0.15684890747070312, 0.1720733642578125, 0.18729782104492188, 0.20252227783203125, 0.21774673461914062, 0.23297119140625, 0.24819564819335938, 0.26342010498046875, 0.2786445617675781, 0.2938690185546875, 0.3090934753417969, 0.32431793212890625, 0.3395423889160156, 0.354766845703125, 0.3699913024902344, 0.38521575927734375, 0.4004402160644531, 0.4156646728515625, 0.4308891296386719, 0.44611358642578125, 0.4613380432128906, 0.4765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 13.0, 8.0, 18.0, 20.0, 18.0, 20.0, 19.0, 43.0, 31.0, 40.0, 34.0, 40.0, 39.0, 42.0, 45.0, 41.0, 44.0, 57.0, 42.0, 46.0, 54.0, 36.0, 41.0, 25.0, 27.0, 23.0, 9.0, 16.0, 15.0, 12.0, 14.0, 10.0, 9.0, 6.0, 5.0, 4.0, 2.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3857421875, -0.3733062744140625, -0.360870361328125, -0.3484344482421875, -0.33599853515625, -0.3235626220703125, -0.311126708984375, -0.2986907958984375, -0.2862548828125, -0.2738189697265625, -0.261383056640625, -0.2489471435546875, -0.23651123046875, -0.2240753173828125, -0.211639404296875, -0.1992034912109375, -0.186767578125, -0.1743316650390625, -0.161895751953125, -0.1494598388671875, -0.13702392578125, -0.1245880126953125, -0.112152099609375, -0.0997161865234375, -0.0872802734375, -0.0748443603515625, -0.062408447265625, -0.0499725341796875, -0.03753662109375, -0.0251007080078125, -0.012664794921875, -0.0002288818359375, 0.01220703125, 0.0246429443359375, 0.037078857421875, 0.0495147705078125, 0.06195068359375, 0.0743865966796875, 0.086822509765625, 0.0992584228515625, 0.1116943359375, 0.1241302490234375, 0.136566162109375, 0.1490020751953125, 0.16143798828125, 0.1738739013671875, 0.186309814453125, 0.1987457275390625, 0.211181640625, 0.2236175537109375, 0.236053466796875, 0.2484893798828125, 0.26092529296875, 0.2733612060546875, 0.285797119140625, 0.2982330322265625, 0.3106689453125, 0.3231048583984375, 0.335540771484375, 0.3479766845703125, 0.36041259765625, 0.3728485107421875, 0.385284423828125, 0.3977203369140625, 0.41015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 4.0, 9.0, 10.0, 17.0, 17.0, 36.0, 38.0, 69.0, 157.0, 414.0, 1179.0, 6748.0, 136107.0, 857404.0, 41434.0, 3526.0, 816.0, 264.0, 134.0, 52.0, 37.0, 26.0, 19.0, 13.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70703125, -0.6880950927734375, -0.669158935546875, -0.6502227783203125, -0.63128662109375, -0.6123504638671875, -0.593414306640625, -0.5744781494140625, -0.5555419921875, -0.5366058349609375, -0.517669677734375, -0.4987335205078125, -0.47979736328125, -0.4608612060546875, -0.441925048828125, -0.4229888916015625, -0.404052734375, -0.3851165771484375, -0.366180419921875, -0.3472442626953125, -0.32830810546875, -0.3093719482421875, -0.290435791015625, -0.2714996337890625, -0.2525634765625, -0.2336273193359375, -0.214691162109375, -0.1957550048828125, -0.17681884765625, -0.1578826904296875, -0.138946533203125, -0.1200103759765625, -0.10107421875, -0.0821380615234375, -0.063201904296875, -0.0442657470703125, -0.02532958984375, -0.0063934326171875, 0.012542724609375, 0.0314788818359375, 0.0504150390625, 0.0693511962890625, 0.088287353515625, 0.1072235107421875, 0.12615966796875, 0.1450958251953125, 0.164031982421875, 0.1829681396484375, 0.201904296875, 0.2208404541015625, 0.239776611328125, 0.2587127685546875, 0.27764892578125, 0.2965850830078125, 0.315521240234375, 0.3344573974609375, 0.3533935546875, 0.3723297119140625, 0.391265869140625, 0.4102020263671875, 0.42913818359375, 0.4480743408203125, 0.467010498046875, 0.4859466552734375, 0.5048828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 6.0, 6.0, 15.0, 3.0, 11.0, 11.0, 12.0, 10.0, 34.0, 24.0, 25.0, 54.0, 47.0, 51.0, 64.0, 55.0, 57.0, 68.0, 67.0, 60.0, 46.0, 49.0, 45.0, 32.0, 34.0, 24.0, 19.0, 18.0, 10.0, 7.0, 8.0, 11.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.435415267944336e-05, -9.167753159999847e-05, -8.900091052055359e-05, -8.63242894411087e-05, -8.364766836166382e-05, -8.097104728221893e-05, -7.829442620277405e-05, -7.561780512332916e-05, -7.294118404388428e-05, -7.026456296443939e-05, -6.758794188499451e-05, -6.491132080554962e-05, -6.223469972610474e-05, -5.955807864665985e-05, -5.6881457567214966e-05, -5.420483648777008e-05, -5.1528215408325195e-05, -4.885159432888031e-05, -4.6174973249435425e-05, -4.349835216999054e-05, -4.0821731090545654e-05, -3.814511001110077e-05, -3.5468488931655884e-05, -3.2791867852211e-05, -3.0115246772766113e-05, -2.7438625693321228e-05, -2.4762004613876343e-05, -2.2085383534431458e-05, -1.9408762454986572e-05, -1.6732141375541687e-05, -1.4055520296096802e-05, -1.1378899216651917e-05, -8.702278137207031e-06, -6.025657057762146e-06, -3.3490359783172607e-06, -6.724148988723755e-07, 2.0042061805725098e-06, 4.680827260017395e-06, 7.35744833946228e-06, 1.0034069418907166e-05, 1.271069049835205e-05, 1.5387311577796936e-05, 1.806393265724182e-05, 2.0740553736686707e-05, 2.3417174816131592e-05, 2.6093795895576477e-05, 2.8770416975021362e-05, 3.144703805446625e-05, 3.412365913391113e-05, 3.680028021335602e-05, 3.94769012928009e-05, 4.215352237224579e-05, 4.4830143451690674e-05, 4.750676453113556e-05, 5.0183385610580444e-05, 5.286000669002533e-05, 5.5536627769470215e-05, 5.82132488489151e-05, 6.0889869928359985e-05, 6.356649100780487e-05, 6.624311208724976e-05, 6.891973316669464e-05, 7.159635424613953e-05, 7.427297532558441e-05, 7.69495964050293e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 12.0, 21.0, 15.0, 17.0, 31.0, 50.0, 82.0, 157.0, 236.0, 448.0, 1057.0, 2765.0, 9630.0, 53305.0, 471112.0, 445701.0, 50115.0, 9012.0, 2689.0, 1050.0, 457.0, 231.0, 117.0, 80.0, 51.0, 38.0, 19.0, 10.0, 9.0, 6.0, 9.0, 3.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.359619140625, -0.34903717041015625, -0.3384552001953125, -0.32787322998046875, -0.317291259765625, -0.30670928955078125, -0.2961273193359375, -0.28554534912109375, -0.27496337890625, -0.26438140869140625, -0.2537994384765625, -0.24321746826171875, -0.232635498046875, -0.22205352783203125, -0.2114715576171875, -0.20088958740234375, -0.1903076171875, -0.17972564697265625, -0.1691436767578125, -0.15856170654296875, -0.147979736328125, -0.13739776611328125, -0.1268157958984375, -0.11623382568359375, -0.10565185546875, -0.09506988525390625, -0.0844879150390625, -0.07390594482421875, -0.063323974609375, -0.05274200439453125, -0.0421600341796875, -0.03157806396484375, -0.02099609375, -0.01041412353515625, 0.0001678466796875, 0.01074981689453125, 0.021331787109375, 0.03191375732421875, 0.0424957275390625, 0.05307769775390625, 0.06365966796875, 0.07424163818359375, 0.0848236083984375, 0.09540557861328125, 0.105987548828125, 0.11656951904296875, 0.1271514892578125, 0.13773345947265625, 0.1483154296875, 0.15889739990234375, 0.1694793701171875, 0.18006134033203125, 0.190643310546875, 0.20122528076171875, 0.2118072509765625, 0.22238922119140625, 0.23297119140625, 0.24355316162109375, 0.2541351318359375, 0.26471710205078125, 0.275299072265625, 0.28588104248046875, 0.2964630126953125, 0.30704498291015625, 0.317626953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 17.0, 12.0, 11.0, 18.0, 23.0, 21.0, 37.0, 40.0, 47.0, 55.0, 67.0, 71.0, 64.0, 67.0, 80.0, 54.0, 64.0, 38.0, 30.0, 30.0, 26.0, 21.0, 15.0, 14.0, 13.0, 9.0, 11.0, 2.0, 4.0, 7.0, 2.0, 0.0, 5.0, 0.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.205810546875, -0.2002391815185547, -0.19466781616210938, -0.18909645080566406, -0.18352508544921875, -0.17795372009277344, -0.17238235473632812, -0.1668109893798828, -0.1612396240234375, -0.1556682586669922, -0.15009689331054688, -0.14452552795410156, -0.13895416259765625, -0.13338279724121094, -0.12781143188476562, -0.12224006652832031, -0.116668701171875, -0.11109733581542969, -0.10552597045898438, -0.09995460510253906, -0.09438323974609375, -0.08881187438964844, -0.08324050903320312, -0.07766914367675781, -0.0720977783203125, -0.06652641296386719, -0.060955047607421875, -0.05538368225097656, -0.04981231689453125, -0.04424095153808594, -0.038669586181640625, -0.03309822082519531, -0.02752685546875, -0.021955490112304688, -0.016384124755859375, -0.010812759399414062, -0.00524139404296875, 0.0003299713134765625, 0.005901336669921875, 0.011472702026367188, 0.0170440673828125, 0.022615432739257812, 0.028186798095703125, 0.03375816345214844, 0.03932952880859375, 0.04490089416503906, 0.050472259521484375, 0.05604362487792969, 0.061614990234375, 0.06718635559082031, 0.07275772094726562, 0.07832908630371094, 0.08390045166015625, 0.08947181701660156, 0.09504318237304688, 0.10061454772949219, 0.1061859130859375, 0.11175727844238281, 0.11732864379882812, 0.12290000915527344, 0.12847137451171875, 0.13404273986816406, 0.13961410522460938, 0.1451854705810547, 0.1507568359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 26.0, 57.0, 126.0, 191.0, 268.0, 193.0, 92.0, 34.0, 11.0, 7.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3618974685668945, -3.1553597450256348, -2.948822259902954, -2.7422845363616943, -2.5357470512390137, -2.329209327697754, -2.122671604156494, -1.9161341190338135, -1.7095965147018433, -1.503058910369873, -1.2965213060379028, -1.0899837017059326, -0.8834460377693176, -0.6769083738327026, -0.4703707695007324, -0.2638331651687622, -0.05729556083679199, 0.14924205839633942, 0.3557796776294708, 0.5623173117637634, 0.7688549160957336, 0.9753925800323486, 1.1819301843643188, 1.388467788696289, 1.5950053930282593, 1.8015429973602295, 2.0080807209014893, 2.21461820602417, 2.4211559295654297, 2.6276936531066895, 2.83423113822937, 3.040768623352051, 3.2473063468933105, 3.4538440704345703, 3.660381555557251, 3.8669192790985107, 4.073456764221191, 4.279994487762451, 4.486532211303711, 4.6930694580078125, 4.899607181549072, 5.106144905090332, 5.312682628631592, 5.519219875335693, 5.725757598876953, 5.932295322418213, 6.138833045959473, 6.345370292663574, 6.551908493041992, 6.758446216583252, 6.964983940124512, 7.171521186828613, 7.378058910369873, 7.584596633911133, 7.791134357452393, 7.997672080993652, 8.204209327697754, 8.410746574401855, 8.617284774780273, 8.823822021484375, 9.030360221862793, 9.236897468566895, 9.443434715270996, 9.649972915649414, 9.856510162353516]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 0.0, 16.0, 13.0, 19.0, 16.0, 16.0, 36.0, 17.0, 16.0, 35.0, 26.0, 47.0, 39.0, 44.0, 39.0, 43.0, 44.0, 60.0, 53.0, 39.0, 42.0, 47.0, 42.0, 38.0, 31.0, 25.0, 22.0, 30.0, 24.0, 17.0, 14.0, 8.0, 12.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.162202835083008, -2.088597059249878, -2.014991283416748, -1.9413857460021973, -1.8677799701690674, -1.7941741943359375, -1.7205685377120972, -1.6469628810882568, -1.573357105255127, -1.499751329421997, -1.4261456727981567, -1.3525400161743164, -1.2789342403411865, -1.2053284645080566, -1.1317228078842163, -1.058117151260376, -0.9845113754272461, -0.910905659198761, -0.8372999429702759, -0.7636942267417908, -0.6900885105133057, -0.6164827942848206, -0.5428770780563354, -0.46927136182785034, -0.39566564559936523, -0.3220599293708801, -0.24845421314239502, -0.1748484969139099, -0.1012427806854248, -0.027637064456939697, 0.04596865177154541, 0.11957436800003052, 0.19317984580993652, 0.26678556203842163, 0.34039127826690674, 0.41399699449539185, 0.48760271072387695, 0.5612084269523621, 0.6348141431808472, 0.7084198594093323, 0.7820255756378174, 0.8556312918663025, 0.9292370080947876, 1.002842664718628, 1.0764484405517578, 1.1500542163848877, 1.223659873008728, 1.2972655296325684, 1.3708713054656982, 1.4444770812988281, 1.5180827379226685, 1.5916883945465088, 1.6652941703796387, 1.7388999462127686, 1.8125056028366089, 1.8861112594604492, 1.959717035293579, 2.033322811126709, 2.1069283485412598, 2.1805341243743896, 2.2541399002075195, 2.3277456760406494, 2.4013514518737793, 2.47495698928833, 2.54856276512146]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 11.0, 8.0, 16.0, 24.0, 23.0, 33.0, 41.0, 82.0, 123.0, 185.0, 347.0, 678.0, 1743.0, 5552.0, 36827.0, 4084135.0, 54004.0, 6688.0, 1918.0, 807.0, 412.0, 205.0, 132.0, 92.0, 47.0, 42.0, 25.0, 24.0, 26.0, 6.0, 3.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.0244140625, -0.9991607666015625, -0.973907470703125, -0.9486541748046875, -0.92340087890625, -0.8981475830078125, -0.872894287109375, -0.8476409912109375, -0.8223876953125, -0.7971343994140625, -0.771881103515625, -0.7466278076171875, -0.72137451171875, -0.6961212158203125, -0.670867919921875, -0.6456146240234375, -0.620361328125, -0.5951080322265625, -0.569854736328125, -0.5446014404296875, -0.51934814453125, -0.4940948486328125, -0.468841552734375, -0.4435882568359375, -0.4183349609375, -0.3930816650390625, -0.367828369140625, -0.3425750732421875, -0.31732177734375, -0.2920684814453125, -0.266815185546875, -0.2415618896484375, -0.21630859375, -0.1910552978515625, -0.165802001953125, -0.1405487060546875, -0.11529541015625, -0.0900421142578125, -0.064788818359375, -0.0395355224609375, -0.0142822265625, 0.0109710693359375, 0.036224365234375, 0.0614776611328125, 0.08673095703125, 0.1119842529296875, 0.137237548828125, 0.1624908447265625, 0.187744140625, 0.2129974365234375, 0.238250732421875, 0.2635040283203125, 0.28875732421875, 0.3140106201171875, 0.339263916015625, 0.3645172119140625, 0.3897705078125, 0.4150238037109375, 0.440277099609375, 0.4655303955078125, 0.49078369140625, 0.5160369873046875, 0.541290283203125, 0.5665435791015625, 0.591796875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 9.0, 9.0, 6.0, 15.0, 18.0, 18.0, 19.0, 27.0, 32.0, 36.0, 40.0, 51.0, 51.0, 58.0, 66.0, 61.0, 52.0, 74.0, 58.0, 57.0, 40.0, 46.0, 26.0, 32.0, 23.0, 17.0, 15.0, 14.0, 10.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.109619140625, -0.10661125183105469, -0.10360336303710938, -0.10059547424316406, -0.09758758544921875, -0.09457969665527344, -0.09157180786132812, -0.08856391906738281, -0.0855560302734375, -0.08254814147949219, -0.07954025268554688, -0.07653236389160156, -0.07352447509765625, -0.07051658630371094, -0.06750869750976562, -0.06450080871582031, -0.061492919921875, -0.05848503112792969, -0.055477142333984375, -0.05246925354003906, -0.04946136474609375, -0.04645347595214844, -0.043445587158203125, -0.04043769836425781, -0.0374298095703125, -0.03442192077636719, -0.031414031982421875, -0.028406143188476562, -0.02539825439453125, -0.022390365600585938, -0.019382476806640625, -0.016374588012695312, -0.01336669921875, -0.010358810424804688, -0.007350921630859375, -0.0043430328369140625, -0.00133514404296875, 0.0016727447509765625, 0.004680633544921875, 0.0076885223388671875, 0.0106964111328125, 0.013704299926757812, 0.016712188720703125, 0.019720077514648438, 0.02272796630859375, 0.025735855102539062, 0.028743743896484375, 0.03175163269042969, 0.034759521484375, 0.03776741027832031, 0.040775299072265625, 0.04378318786621094, 0.04679107666015625, 0.04979896545410156, 0.052806854248046875, 0.05581474304199219, 0.0588226318359375, 0.06183052062988281, 0.06483840942382812, 0.06784629821777344, 0.07085418701171875, 0.07386207580566406, 0.07686996459960938, 0.07987785339355469, 0.0828857421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 10.0, 6.0, 25.0, 19.0, 23.0, 39.0, 48.0, 96.0, 154.0, 258.0, 534.0, 1151.0, 2647.0, 9558.0, 97358.0, 4049571.0, 24102.0, 4984.0, 1877.0, 788.0, 393.0, 245.0, 126.0, 90.0, 55.0, 23.0, 27.0, 15.0, 13.0, 9.0, 8.0, 5.0, 7.0, 3.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.04296875, -1.0047149658203125, -0.966461181640625, -0.9282073974609375, -0.88995361328125, -0.8516998291015625, -0.813446044921875, -0.7751922607421875, -0.7369384765625, -0.6986846923828125, -0.660430908203125, -0.6221771240234375, -0.58392333984375, -0.5456695556640625, -0.507415771484375, -0.4691619873046875, -0.430908203125, -0.3926544189453125, -0.354400634765625, -0.3161468505859375, -0.27789306640625, -0.2396392822265625, -0.201385498046875, -0.1631317138671875, -0.1248779296875, -0.0866241455078125, -0.048370361328125, -0.0101165771484375, 0.02813720703125, 0.0663909912109375, 0.104644775390625, 0.1428985595703125, 0.18115234375, 0.2194061279296875, 0.257659912109375, 0.2959136962890625, 0.33416748046875, 0.3724212646484375, 0.410675048828125, 0.4489288330078125, 0.4871826171875, 0.5254364013671875, 0.563690185546875, 0.6019439697265625, 0.64019775390625, 0.6784515380859375, 0.716705322265625, 0.7549591064453125, 0.793212890625, 0.8314666748046875, 0.869720458984375, 0.9079742431640625, 0.94622802734375, 0.9844818115234375, 1.022735595703125, 1.0609893798828125, 1.0992431640625, 1.1374969482421875, 1.175750732421875, 1.2140045166015625, 1.25225830078125, 1.2905120849609375, 1.328765869140625, 1.3670196533203125, 1.4052734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 8.0, 6.0, 11.0, 17.0, 28.0, 75.0, 294.0, 3355.0, 163.0, 51.0, 26.0, 3.0, 14.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1351318359375, -0.1290760040283203, -0.12302017211914062, -0.11696434020996094, -0.11090850830078125, -0.10485267639160156, -0.09879684448242188, -0.09274101257324219, -0.0866851806640625, -0.08062934875488281, -0.07457351684570312, -0.06851768493652344, -0.06246185302734375, -0.05640602111816406, -0.050350189208984375, -0.04429435729980469, -0.038238525390625, -0.03218269348144531, -0.026126861572265625, -0.020071029663085938, -0.01401519775390625, -0.007959365844726562, -0.001903533935546875, 0.0041522979736328125, 0.0102081298828125, 0.016263961791992188, 0.022319793701171875, 0.028375625610351562, 0.03443145751953125, 0.04048728942871094, 0.046543121337890625, 0.05259895324707031, 0.05865478515625, 0.06471061706542969, 0.07076644897460938, 0.07682228088378906, 0.08287811279296875, 0.08893394470214844, 0.09498977661132812, 0.10104560852050781, 0.1071014404296875, 0.11315727233886719, 0.11921310424804688, 0.12526893615722656, 0.13132476806640625, 0.13738059997558594, 0.14343643188476562, 0.1494922637939453, 0.155548095703125, 0.1616039276123047, 0.16765975952148438, 0.17371559143066406, 0.17977142333984375, 0.18582725524902344, 0.19188308715820312, 0.1979389190673828, 0.2039947509765625, 0.2100505828857422, 0.21610641479492188, 0.22216224670410156, 0.22821807861328125, 0.23427391052246094, 0.24032974243164062, 0.2463855743408203, 0.25244140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 10.0, 10.0, 17.0, 16.0, 22.0, 39.0, 64.0, 60.0, 95.0, 119.0, 116.0, 106.0, 95.0, 70.0, 52.0, 39.0, 37.0, 13.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4850998520851135, -0.4657883942127228, -0.4464769661426544, -0.42716550827026367, -0.4078540802001953, -0.38854262232780457, -0.3692311644554138, -0.34991973638534546, -0.3306082785129547, -0.31129682064056396, -0.2919853925704956, -0.27267393469810486, -0.2533624768257141, -0.23405104875564575, -0.214739590883255, -0.19542814791202545, -0.1761167049407959, -0.15680526196956635, -0.1374938189983368, -0.11818236112594604, -0.09887091815471649, -0.07955947518348694, -0.06024802476167679, -0.04093657433986664, -0.021625131368637085, -0.0023136846721172333, 0.01699776202440262, 0.03630920872092247, 0.05562065541744232, 0.07493209838867188, 0.09424354881048203, 0.11355499923229218, 0.1328665018081665, 0.15217794477939606, 0.1714893877506256, 0.19080084562301636, 0.2101122885942459, 0.22942373156547546, 0.2487351894378662, 0.26804661750793457, 0.2873580753803253, 0.30666953325271606, 0.3259809613227844, 0.34529241919517517, 0.3646038770675659, 0.3839153051376343, 0.403226763010025, 0.42253822088241577, 0.44184964895248413, 0.4611611068248749, 0.48047253489494324, 0.499783992767334, 0.5190954208374023, 0.5384068489074707, 0.5577183365821838, 0.5770297646522522, 0.5963412523269653, 0.6156526803970337, 0.6349641680717468, 0.6542755961418152, 0.6735870242118835, 0.6928985118865967, 0.712209939956665, 0.7315213680267334, 0.7508327960968018]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 10.0, 13.0, 4.0, 10.0, 17.0, 21.0, 20.0, 34.0, 30.0, 20.0, 25.0, 34.0, 30.0, 37.0, 42.0, 34.0, 38.0, 46.0, 45.0, 40.0, 40.0, 28.0, 41.0, 37.0, 35.0, 26.0, 37.0, 18.0, 32.0, 22.0, 20.0, 22.0, 17.0, 11.0, 9.0, 9.0, 6.0, 7.0, 4.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2593414783477783, -0.2508465051651001, -0.24235151708126068, -0.23385652899742126, -0.22536155581474304, -0.21686656773090363, -0.2083715796470642, -0.199876606464386, -0.19138161838054657, -0.18288663029670715, -0.17439165711402893, -0.16589666903018951, -0.1574016809463501, -0.14890670776367188, -0.14041171967983246, -0.13191673159599304, -0.12342175841331482, -0.114926777780056, -0.10643179714679718, -0.09793680906295776, -0.08944182842969894, -0.08094684779644012, -0.07245185971260071, -0.06395687907934189, -0.05546189844608307, -0.04696691781282425, -0.03847193345427513, -0.029976950958371162, -0.021481968462467194, -0.012986987829208374, -0.004492003470659256, 0.004002980887889862, 0.012497961521148682, 0.02099294401705265, 0.02948792651295662, 0.03798291087150574, 0.04647789150476456, 0.054972872138023376, 0.06346786022186279, 0.07196284085512161, 0.08045782148838043, 0.08895280212163925, 0.09744778275489807, 0.10594277083873749, 0.11443775147199631, 0.12293273210525513, 0.13142772018909454, 0.13992270827293396, 0.14841768145561218, 0.1569126695394516, 0.16540764272212982, 0.17390263080596924, 0.18239760398864746, 0.19089259207248688, 0.1993875801563263, 0.20788255333900452, 0.21637754142284393, 0.22487252950668335, 0.23336750268936157, 0.241862490773201, 0.2503574788570404, 0.25885245203971863, 0.26734742522239685, 0.27584242820739746, 0.2843374013900757]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 8.0, 7.0, 18.0, 29.0, 34.0, 78.0, 115.0, 211.0, 443.0, 811.0, 1516.0, 2996.0, 6245.0, 13868.0, 32511.0, 79858.0, 190361.0, 317449.0, 229091.0, 100626.0, 40363.0, 16948.0, 7539.0, 3535.0, 1820.0, 928.0, 485.0, 272.0, 168.0, 99.0, 51.0, 27.0, 19.0, 9.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26806640625, -0.25984954833984375, -0.2516326904296875, -0.24341583251953125, -0.235198974609375, -0.22698211669921875, -0.2187652587890625, -0.21054840087890625, -0.20233154296875, -0.19411468505859375, -0.1858978271484375, -0.17768096923828125, -0.169464111328125, -0.16124725341796875, -0.1530303955078125, -0.14481353759765625, -0.1365966796875, -0.12837982177734375, -0.1201629638671875, -0.11194610595703125, -0.103729248046875, -0.09551239013671875, -0.0872955322265625, -0.07907867431640625, -0.07086181640625, -0.06264495849609375, -0.0544281005859375, -0.04621124267578125, -0.037994384765625, -0.02977752685546875, -0.0215606689453125, -0.01334381103515625, -0.005126953125, 0.00308990478515625, 0.0113067626953125, 0.01952362060546875, 0.027740478515625, 0.03595733642578125, 0.0441741943359375, 0.05239105224609375, 0.06060791015625, 0.06882476806640625, 0.0770416259765625, 0.08525848388671875, 0.093475341796875, 0.10169219970703125, 0.1099090576171875, 0.11812591552734375, 0.1263427734375, 0.13455963134765625, 0.1427764892578125, 0.15099334716796875, 0.159210205078125, 0.16742706298828125, 0.1756439208984375, 0.18386077880859375, 0.19207763671875, 0.20029449462890625, 0.2085113525390625, 0.21672821044921875, 0.224945068359375, 0.23316192626953125, 0.2413787841796875, 0.24959564208984375, 0.2578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 10.0, 11.0, 13.0, 8.0, 10.0, 10.0, 23.0, 22.0, 29.0, 29.0, 35.0, 43.0, 41.0, 47.0, 31.0, 50.0, 52.0, 48.0, 51.0, 50.0, 58.0, 42.0, 46.0, 27.0, 31.0, 26.0, 31.0, 19.0, 19.0, 14.0, 18.0, 14.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.10137939453125, -0.09858417510986328, -0.09578895568847656, -0.09299373626708984, -0.09019851684570312, -0.0874032974243164, -0.08460807800292969, -0.08181285858154297, -0.07901763916015625, -0.07622241973876953, -0.07342720031738281, -0.0706319808959961, -0.06783676147460938, -0.06504154205322266, -0.06224632263183594, -0.05945110321044922, -0.0566558837890625, -0.05386066436767578, -0.05106544494628906, -0.048270225524902344, -0.045475006103515625, -0.042679786682128906, -0.03988456726074219, -0.03708934783935547, -0.03429412841796875, -0.03149890899658203, -0.028703689575195312, -0.025908470153808594, -0.023113250732421875, -0.020318031311035156, -0.017522811889648438, -0.014727592468261719, -0.011932373046875, -0.009137153625488281, -0.0063419342041015625, -0.0035467147827148438, -0.000751495361328125, 0.0020437240600585938, 0.0048389434814453125, 0.007634162902832031, 0.01042938232421875, 0.013224601745605469, 0.016019821166992188, 0.018815040588378906, 0.021610260009765625, 0.024405479431152344, 0.027200698852539062, 0.02999591827392578, 0.0327911376953125, 0.03558635711669922, 0.03838157653808594, 0.041176795959472656, 0.043972015380859375, 0.046767234802246094, 0.04956245422363281, 0.05235767364501953, 0.05515289306640625, 0.05794811248779297, 0.06074333190917969, 0.0635385513305664, 0.06633377075195312, 0.06912899017333984, 0.07192420959472656, 0.07471942901611328, 0.0775146484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 0.0, 9.0, 6.0, 11.0, 12.0, 20.0, 29.0, 30.0, 51.0, 53.0, 98.0, 111.0, 140.0, 189.0, 308.0, 474.0, 809.0, 1389.0, 2725.0, 6882.0, 22278.0, 93846.0, 454816.0, 362200.0, 72453.0, 17730.0, 5963.0, 2476.0, 1254.0, 689.0, 446.0, 292.0, 197.0, 140.0, 119.0, 89.0, 60.0, 34.0, 32.0, 28.0, 10.0, 16.0, 4.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.421875, -0.4082298278808594, -0.39458465576171875, -0.3809394836425781, -0.3672943115234375, -0.3536491394042969, -0.34000396728515625, -0.3263587951660156, -0.312713623046875, -0.2990684509277344, -0.28542327880859375, -0.2717781066894531, -0.2581329345703125, -0.24448776245117188, -0.23084259033203125, -0.21719741821289062, -0.20355224609375, -0.18990707397460938, -0.17626190185546875, -0.16261672973632812, -0.1489715576171875, -0.13532638549804688, -0.12168121337890625, -0.10803604125976562, -0.094390869140625, -0.08074569702148438, -0.06710052490234375, -0.053455352783203125, -0.0398101806640625, -0.026165008544921875, -0.01251983642578125, 0.001125335693359375, 0.0147705078125, 0.028415679931640625, 0.04206085205078125, 0.055706024169921875, 0.0693511962890625, 0.08299636840820312, 0.09664154052734375, 0.11028671264648438, 0.123931884765625, 0.13757705688476562, 0.15122222900390625, 0.16486740112304688, 0.1785125732421875, 0.19215774536132812, 0.20580291748046875, 0.21944808959960938, 0.23309326171875, 0.24673843383789062, 0.26038360595703125, 0.2740287780761719, 0.2876739501953125, 0.3013191223144531, 0.31496429443359375, 0.3286094665527344, 0.342254638671875, 0.3558998107910156, 0.36954498291015625, 0.3831901550292969, 0.3968353271484375, 0.4104804992675781, 0.42412567138671875, 0.4377708435058594, 0.451416015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 0.0, 5.0, 13.0, 6.0, 9.0, 8.0, 13.0, 10.0, 16.0, 21.0, 24.0, 24.0, 33.0, 41.0, 42.0, 37.0, 49.0, 50.0, 55.0, 41.0, 40.0, 48.0, 41.0, 47.0, 34.0, 37.0, 29.0, 40.0, 28.0, 25.0, 20.0, 20.0, 18.0, 14.0, 13.0, 20.0, 5.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4308319091796875, -0.416595458984375, -0.4023590087890625, -0.38812255859375, -0.3738861083984375, -0.359649658203125, -0.3454132080078125, -0.3311767578125, -0.3169403076171875, -0.302703857421875, -0.2884674072265625, -0.27423095703125, -0.2599945068359375, -0.245758056640625, -0.2315216064453125, -0.21728515625, -0.2030487060546875, -0.188812255859375, -0.1745758056640625, -0.16033935546875, -0.1461029052734375, -0.131866455078125, -0.1176300048828125, -0.1033935546875, -0.0891571044921875, -0.074920654296875, -0.0606842041015625, -0.04644775390625, -0.0322113037109375, -0.017974853515625, -0.0037384033203125, 0.010498046875, 0.0247344970703125, 0.038970947265625, 0.0532073974609375, 0.06744384765625, 0.0816802978515625, 0.095916748046875, 0.1101531982421875, 0.1243896484375, 0.1386260986328125, 0.152862548828125, 0.1670989990234375, 0.18133544921875, 0.1955718994140625, 0.209808349609375, 0.2240447998046875, 0.23828125, 0.2525177001953125, 0.266754150390625, 0.2809906005859375, 0.29522705078125, 0.3094635009765625, 0.323699951171875, 0.3379364013671875, 0.3521728515625, 0.3664093017578125, 0.380645751953125, 0.3948822021484375, 0.40911865234375, 0.4233551025390625, 0.437591552734375, 0.4518280029296875, 0.466064453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 8.0, 10.0, 23.0, 22.0, 38.0, 67.0, 66.0, 151.0, 253.0, 414.0, 722.0, 1402.0, 3056.0, 7500.0, 22287.0, 80187.0, 316700.0, 442022.0, 123069.0, 32155.0, 10367.0, 4141.0, 1817.0, 861.0, 512.0, 262.0, 156.0, 105.0, 54.0, 45.0, 29.0, 14.0, 14.0, 6.0, 2.0, 9.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.18717193603515625, -0.1813507080078125, -0.17552947998046875, -0.169708251953125, -0.16388702392578125, -0.1580657958984375, -0.15224456787109375, -0.14642333984375, -0.14060211181640625, -0.1347808837890625, -0.12895965576171875, -0.123138427734375, -0.11731719970703125, -0.1114959716796875, -0.10567474365234375, -0.099853515625, -0.09403228759765625, -0.0882110595703125, -0.08238983154296875, -0.076568603515625, -0.07074737548828125, -0.0649261474609375, -0.05910491943359375, -0.05328369140625, -0.04746246337890625, -0.0416412353515625, -0.03582000732421875, -0.029998779296875, -0.02417755126953125, -0.0183563232421875, -0.01253509521484375, -0.0067138671875, -0.00089263916015625, 0.0049285888671875, 0.01074981689453125, 0.016571044921875, 0.02239227294921875, 0.0282135009765625, 0.03403472900390625, 0.03985595703125, 0.04567718505859375, 0.0514984130859375, 0.05731964111328125, 0.063140869140625, 0.06896209716796875, 0.0747833251953125, 0.08060455322265625, 0.08642578125, 0.09224700927734375, 0.0980682373046875, 0.10388946533203125, 0.109710693359375, 0.11553192138671875, 0.1213531494140625, 0.12717437744140625, 0.13299560546875, 0.13881683349609375, 0.1446380615234375, 0.15045928955078125, 0.156280517578125, 0.16210174560546875, 0.1679229736328125, 0.17374420166015625, 0.1795654296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 14.0, 13.0, 15.0, 19.0, 28.0, 36.0, 39.0, 46.0, 50.0, 50.0, 73.0, 80.0, 69.0, 59.0, 62.0, 47.0, 44.0, 36.0, 46.0, 36.0, 26.0, 13.0, 23.0, 14.0, 7.0, 8.0, 8.0, 3.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.101629257202148e-05, -8.804164826869965e-05, -8.506700396537781e-05, -8.209235966205597e-05, -7.911771535873413e-05, -7.614307105541229e-05, -7.316842675209045e-05, -7.019378244876862e-05, -6.721913814544678e-05, -6.424449384212494e-05, -6.12698495388031e-05, -5.829520523548126e-05, -5.5320560932159424e-05, -5.2345916628837585e-05, -4.937127232551575e-05, -4.639662802219391e-05, -4.342198371887207e-05, -4.044733941555023e-05, -3.7472695112228394e-05, -3.4498050808906555e-05, -3.152340650558472e-05, -2.854876220226288e-05, -2.557411789894104e-05, -2.25994735956192e-05, -1.9624829292297363e-05, -1.6650184988975525e-05, -1.3675540685653687e-05, -1.0700896382331848e-05, -7.72625207901001e-06, -4.751607775688171e-06, -1.776963472366333e-06, 1.1976808309555054e-06, 4.172325134277344e-06, 7.146969437599182e-06, 1.012161374092102e-05, 1.3096258044242859e-05, 1.6070902347564697e-05, 1.9045546650886536e-05, 2.2020190954208374e-05, 2.4994835257530212e-05, 2.796947956085205e-05, 3.094412386417389e-05, 3.391876816749573e-05, 3.6893412470817566e-05, 3.9868056774139404e-05, 4.284270107746124e-05, 4.581734538078308e-05, 4.879198968410492e-05, 5.176663398742676e-05, 5.4741278290748596e-05, 5.7715922594070435e-05, 6.069056689739227e-05, 6.366521120071411e-05, 6.663985550403595e-05, 6.961449980735779e-05, 7.258914411067963e-05, 7.556378841400146e-05, 7.85384327173233e-05, 8.151307702064514e-05, 8.448772132396698e-05, 8.746236562728882e-05, 9.043700993061066e-05, 9.34116542339325e-05, 9.638629853725433e-05, 9.936094284057617e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 11.0, 14.0, 14.0, 14.0, 21.0, 32.0, 57.0, 62.0, 140.0, 224.0, 390.0, 722.0, 1394.0, 3116.0, 9088.0, 39226.0, 257990.0, 585520.0, 119778.0, 20550.0, 5712.0, 2148.0, 1019.0, 536.0, 281.0, 168.0, 111.0, 72.0, 35.0, 30.0, 17.0, 14.0, 6.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.238525390625, -0.23038482666015625, -0.2222442626953125, -0.21410369873046875, -0.205963134765625, -0.19782257080078125, -0.1896820068359375, -0.18154144287109375, -0.17340087890625, -0.16526031494140625, -0.1571197509765625, -0.14897918701171875, -0.140838623046875, -0.13269805908203125, -0.1245574951171875, -0.11641693115234375, -0.1082763671875, -0.10013580322265625, -0.0919952392578125, -0.08385467529296875, -0.075714111328125, -0.06757354736328125, -0.0594329833984375, -0.05129241943359375, -0.04315185546875, -0.03501129150390625, -0.0268707275390625, -0.01873016357421875, -0.010589599609375, -0.00244903564453125, 0.0056915283203125, 0.01383209228515625, 0.02197265625, 0.03011322021484375, 0.0382537841796875, 0.04639434814453125, 0.054534912109375, 0.06267547607421875, 0.0708160400390625, 0.07895660400390625, 0.08709716796875, 0.09523773193359375, 0.1033782958984375, 0.11151885986328125, 0.119659423828125, 0.12779998779296875, 0.1359405517578125, 0.14408111572265625, 0.1522216796875, 0.16036224365234375, 0.1685028076171875, 0.17664337158203125, 0.184783935546875, 0.19292449951171875, 0.2010650634765625, 0.20920562744140625, 0.21734619140625, 0.22548675537109375, 0.2336273193359375, 0.24176788330078125, 0.249908447265625, 0.25804901123046875, 0.2661895751953125, 0.27433013916015625, 0.282470703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 7.0, 7.0, 28.0, 23.0, 33.0, 35.0, 62.0, 73.0, 96.0, 97.0, 85.0, 78.0, 83.0, 75.0, 55.0, 42.0, 31.0, 26.0, 9.0, 15.0, 13.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.20862388610839844, -0.20130538940429688, -0.1939868927001953, -0.18666839599609375, -0.1793498992919922, -0.17203140258789062, -0.16471290588378906, -0.1573944091796875, -0.15007591247558594, -0.14275741577148438, -0.1354389190673828, -0.12812042236328125, -0.12080192565917969, -0.11348342895507812, -0.10616493225097656, -0.098846435546875, -0.09152793884277344, -0.08420944213867188, -0.07689094543457031, -0.06957244873046875, -0.06225395202636719, -0.054935455322265625, -0.04761695861816406, -0.0402984619140625, -0.03297996520996094, -0.025661468505859375, -0.018342971801757812, -0.01102447509765625, -0.0037059783935546875, 0.003612518310546875, 0.010931015014648438, 0.01824951171875, 0.025568008422851562, 0.032886505126953125, 0.04020500183105469, 0.04752349853515625, 0.05484199523925781, 0.062160491943359375, 0.06947898864746094, 0.0767974853515625, 0.08411598205566406, 0.09143447875976562, 0.09875297546386719, 0.10607147216796875, 0.11338996887207031, 0.12070846557617188, 0.12802696228027344, 0.135345458984375, 0.14266395568847656, 0.14998245239257812, 0.1573009490966797, 0.16461944580078125, 0.1719379425048828, 0.17925643920898438, 0.18657493591308594, 0.1938934326171875, 0.20121192932128906, 0.20853042602539062, 0.2158489227294922, 0.22316741943359375, 0.2304859161376953, 0.23780441284179688, 0.24512290954589844, 0.25244140625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 10.0, 12.0, 24.0, 29.0, 56.0, 78.0, 102.0, 159.0, 111.0, 120.0, 101.0, 80.0, 46.0, 30.0, 17.0, 13.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.838349342346191, -5.717735767364502, -5.5971221923828125, -5.476508617401123, -5.355895042419434, -5.235281467437744, -5.114667892456055, -4.994054317474365, -4.873440742492676, -4.752827167510986, -4.632213592529297, -4.511600017547607, -4.390986442565918, -4.2703728675842285, -4.149759292602539, -4.02914571762085, -3.90853214263916, -3.7879185676574707, -3.6673049926757812, -3.546691417694092, -3.4260778427124023, -3.305464267730713, -3.1848506927490234, -3.064237117767334, -2.9436235427856445, -2.823009967803955, -2.7023963928222656, -2.581782817840576, -2.4611692428588867, -2.3405556678771973, -2.219942092895508, -2.0993285179138184, -1.978714942932129, -1.8581013679504395, -1.73748779296875, -1.6168742179870605, -1.496260643005371, -1.3756470680236816, -1.2550334930419922, -1.1344199180603027, -1.0138063430786133, -0.8931927680969238, -0.7725791931152344, -0.6519656181335449, -0.5313520431518555, -0.410738468170166, -0.29012489318847656, -0.1695113182067871, -0.048897743225097656, 0.0717158317565918, 0.19232940673828125, 0.3129429817199707, 0.43355655670166016, 0.5541701316833496, 0.6747837066650391, 0.7953972816467285, 0.916010856628418, 1.0366244316101074, 1.1572380065917969, 1.2778515815734863, 1.3984651565551758, 1.5190787315368652, 1.6396923065185547, 1.7603058815002441, 1.8809194564819336]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 12.0, 8.0, 5.0, 8.0, 12.0, 9.0, 11.0, 14.0, 20.0, 31.0, 37.0, 34.0, 38.0, 48.0, 48.0, 64.0, 49.0, 62.0, 59.0, 64.0, 59.0, 39.0, 41.0, 30.0, 27.0, 26.0, 24.0, 28.0, 22.0, 14.0, 11.0, 5.0, 8.0, 3.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.7498106956481934, -2.6682560443878174, -2.5867013931274414, -2.5051467418670654, -2.4235920906066895, -2.3420374393463135, -2.2604827880859375, -2.1789278984069824, -2.0973734855651855, -2.0158188343048096, -1.9342641830444336, -1.8527095317840576, -1.7711548805236816, -1.6896002292633057, -1.6080454587936401, -1.5264908075332642, -1.4449360370635986, -1.3633813858032227, -1.2818267345428467, -1.2002720832824707, -1.1187174320220947, -1.0371627807617188, -0.9556080102920532, -0.8740533590316772, -0.7924987077713013, -0.7109440565109253, -0.6293894052505493, -0.5478346943855286, -0.4662800431251526, -0.3847253918647766, -0.30317071080207825, -0.22161602973937988, -0.1400611400604248, -0.058506473898887634, 0.023048192262649536, 0.1046028584241867, 0.18615752458572388, 0.26771217584609985, 0.3492668569087982, 0.4308215379714966, 0.5123761892318726, 0.5939308404922485, 0.6754854917526245, 0.7570402026176453, 0.8385948538780212, 0.9201495051383972, 1.001704216003418, 1.083258867263794, 1.16481351852417, 1.246368169784546, 1.3279228210449219, 1.4094774723052979, 1.4910321235656738, 1.5725867748260498, 1.6541415452957153, 1.7356961965560913, 1.8172508478164673, 1.8988054990768433, 1.9803601503372192, 2.0619149208068848, 2.1434695720672607, 2.2250242233276367, 2.3065788745880127, 2.3881335258483887, 2.4696881771087646]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 16.0, 12.0, 27.0, 43.0, 53.0, 59.0, 115.0, 155.0, 244.0, 384.0, 613.0, 928.0, 1736.0, 3110.0, 6795.0, 17713.0, 79660.0, 3908481.0, 134127.0, 23047.0, 8045.0, 3675.0, 2001.0, 1122.0, 709.0, 436.0, 287.0, 202.0, 130.0, 93.0, 76.0, 42.0, 30.0, 28.0, 21.0, 11.0, 8.0, 11.0, 2.0, 9.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.366455078125, -0.3540802001953125, -0.341705322265625, -0.3293304443359375, -0.31695556640625, -0.3045806884765625, -0.292205810546875, -0.2798309326171875, -0.2674560546875, -0.2550811767578125, -0.242706298828125, -0.2303314208984375, -0.21795654296875, -0.2055816650390625, -0.193206787109375, -0.1808319091796875, -0.16845703125, -0.1560821533203125, -0.143707275390625, -0.1313323974609375, -0.11895751953125, -0.1065826416015625, -0.094207763671875, -0.0818328857421875, -0.0694580078125, -0.0570831298828125, -0.044708251953125, -0.0323333740234375, -0.01995849609375, -0.0075836181640625, 0.004791259765625, 0.0171661376953125, 0.029541015625, 0.0419158935546875, 0.054290771484375, 0.0666656494140625, 0.07904052734375, 0.0914154052734375, 0.103790283203125, 0.1161651611328125, 0.1285400390625, 0.1409149169921875, 0.153289794921875, 0.1656646728515625, 0.17803955078125, 0.1904144287109375, 0.202789306640625, 0.2151641845703125, 0.2275390625, 0.2399139404296875, 0.252288818359375, 0.2646636962890625, 0.27703857421875, 0.2894134521484375, 0.301788330078125, 0.3141632080078125, 0.3265380859375, 0.3389129638671875, 0.351287841796875, 0.3636627197265625, 0.37603759765625, 0.3884124755859375, 0.400787353515625, 0.4131622314453125, 0.425537109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 7.0, 9.0, 13.0, 13.0, 18.0, 28.0, 22.0, 37.0, 50.0, 42.0, 66.0, 72.0, 62.0, 84.0, 60.0, 63.0, 54.0, 53.0, 38.0, 53.0, 36.0, 23.0, 28.0, 15.0, 9.0, 10.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1165771484375, -0.11277580261230469, -0.10897445678710938, -0.10517311096191406, -0.10137176513671875, -0.09757041931152344, -0.09376907348632812, -0.08996772766113281, -0.0861663818359375, -0.08236503601074219, -0.07856369018554688, -0.07476234436035156, -0.07096099853515625, -0.06715965270996094, -0.06335830688476562, -0.05955696105957031, -0.055755615234375, -0.05195426940917969, -0.048152923583984375, -0.04435157775878906, -0.04055023193359375, -0.03674888610839844, -0.032947540283203125, -0.029146194458007812, -0.0253448486328125, -0.021543502807617188, -0.017742156982421875, -0.013940811157226562, -0.01013946533203125, -0.0063381195068359375, -0.002536773681640625, 0.0012645721435546875, 0.00506591796875, 0.008867263793945312, 0.012668609619140625, 0.016469955444335938, 0.02027130126953125, 0.024072647094726562, 0.027873992919921875, 0.03167533874511719, 0.0354766845703125, 0.03927803039550781, 0.043079376220703125, 0.04688072204589844, 0.05068206787109375, 0.05448341369628906, 0.058284759521484375, 0.06208610534667969, 0.065887451171875, 0.06968879699707031, 0.07349014282226562, 0.07729148864746094, 0.08109283447265625, 0.08489418029785156, 0.08869552612304688, 0.09249687194824219, 0.0962982177734375, 0.10009956359863281, 0.10390090942382812, 0.10770225524902344, 0.11150360107421875, 0.11530494689941406, 0.11910629272460938, 0.12290763854980469, 0.126708984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 9.0, 18.0, 15.0, 15.0, 20.0, 40.0, 56.0, 80.0, 81.0, 125.0, 198.0, 251.0, 434.0, 1020.0, 3584.0, 38146.0, 4117639.0, 27298.0, 3104.0, 838.0, 362.0, 286.0, 186.0, 124.0, 95.0, 72.0, 54.0, 34.0, 25.0, 21.0, 13.0, 13.0, 6.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2041015625, -1.1527557373046875, -1.101409912109375, -1.0500640869140625, -0.99871826171875, -0.9473724365234375, -0.896026611328125, -0.8446807861328125, -0.7933349609375, -0.7419891357421875, -0.690643310546875, -0.6392974853515625, -0.58795166015625, -0.5366058349609375, -0.485260009765625, -0.4339141845703125, -0.382568359375, -0.3312225341796875, -0.279876708984375, -0.2285308837890625, -0.17718505859375, -0.1258392333984375, -0.074493408203125, -0.0231475830078125, 0.0281982421875, 0.0795440673828125, 0.130889892578125, 0.1822357177734375, 0.23358154296875, 0.2849273681640625, 0.336273193359375, 0.3876190185546875, 0.43896484375, 0.4903106689453125, 0.541656494140625, 0.5930023193359375, 0.64434814453125, 0.6956939697265625, 0.747039794921875, 0.7983856201171875, 0.8497314453125, 0.9010772705078125, 0.952423095703125, 1.0037689208984375, 1.05511474609375, 1.1064605712890625, 1.157806396484375, 1.2091522216796875, 1.260498046875, 1.3118438720703125, 1.363189697265625, 1.4145355224609375, 1.46588134765625, 1.5172271728515625, 1.568572998046875, 1.6199188232421875, 1.6712646484375, 1.7226104736328125, 1.773956298828125, 1.8253021240234375, 1.87664794921875, 1.9279937744140625, 1.979339599609375, 2.0306854248046875, 2.08203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 19.0, 31.0, 80.0, 471.0, 3291.0, 110.0, 32.0, 14.0, 10.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213623046875, -0.20352935791015625, -0.1934356689453125, -0.18334197998046875, -0.173248291015625, -0.16315460205078125, -0.1530609130859375, -0.14296722412109375, -0.13287353515625, -0.12277984619140625, -0.1126861572265625, -0.10259246826171875, -0.092498779296875, -0.08240509033203125, -0.0723114013671875, -0.06221771240234375, -0.0521240234375, -0.04203033447265625, -0.0319366455078125, -0.02184295654296875, -0.011749267578125, -0.00165557861328125, 0.0084381103515625, 0.01853179931640625, 0.02862548828125, 0.03871917724609375, 0.0488128662109375, 0.05890655517578125, 0.069000244140625, 0.07909393310546875, 0.0891876220703125, 0.09928131103515625, 0.109375, 0.11946868896484375, 0.1295623779296875, 0.13965606689453125, 0.149749755859375, 0.15984344482421875, 0.1699371337890625, 0.18003082275390625, 0.19012451171875, 0.20021820068359375, 0.2103118896484375, 0.22040557861328125, 0.230499267578125, 0.24059295654296875, 0.2506866455078125, 0.26078033447265625, 0.2708740234375, 0.28096771240234375, 0.2910614013671875, 0.30115509033203125, 0.311248779296875, 0.32134246826171875, 0.3314361572265625, 0.34152984619140625, 0.35162353515625, 0.36171722412109375, 0.3718109130859375, 0.38190460205078125, 0.391998291015625, 0.40209197998046875, 0.4121856689453125, 0.42227935791015625, 0.432373046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 19.0, 30.0, 40.0, 61.0, 86.0, 139.0, 137.0, 141.0, 118.0, 80.0, 51.0, 26.0, 24.0, 11.0, 8.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1902225017547607, -1.1590852737426758, -1.1279481649398804, -1.0968109369277954, -1.065673828125, -1.034536600112915, -1.00339937210083, -0.9722622036933899, -0.9411250352859497, -0.9099878668785095, -0.8788506984710693, -0.8477134704589844, -0.8165763020515442, -0.785439133644104, -0.754301905632019, -0.7231647372245789, -0.6920275688171387, -0.6608904004096985, -0.6297532320022583, -0.5986160039901733, -0.5674788355827332, -0.536341667175293, -0.505204439163208, -0.4740672707557678, -0.44293010234832764, -0.41179293394088745, -0.3806557357311249, -0.3495185375213623, -0.3183813691139221, -0.28724420070648193, -0.25610700249671936, -0.22496981918811798, -0.1938326358795166, -0.16269545257091522, -0.13155826926231384, -0.10042108595371246, -0.06928390264511108, -0.038146719336509705, -0.007009536027908325, 0.024127647280693054, 0.055264830589294434, 0.08640201389789581, 0.11753919720649719, 0.14867638051509857, 0.17981356382369995, 0.21095074713230133, 0.2420879304409027, 0.2732251286506653, 0.30436229705810547, 0.33549946546554565, 0.3666366636753082, 0.3977738618850708, 0.428911030292511, 0.46004819869995117, 0.49118539690971375, 0.5223225951194763, 0.5534597635269165, 0.5845969319343567, 0.6157341003417969, 0.6468713283538818, 0.678008496761322, 0.7091456651687622, 0.7402828931808472, 0.7714200615882874, 0.8025572299957275]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 2.0, 7.0, 5.0, 7.0, 4.0, 7.0, 10.0, 12.0, 9.0, 17.0, 15.0, 21.0, 25.0, 25.0, 28.0, 33.0, 44.0, 37.0, 31.0, 49.0, 39.0, 38.0, 49.0, 48.0, 36.0, 35.0, 30.0, 29.0, 49.0, 29.0, 32.0, 36.0, 34.0, 22.0, 20.0, 14.0, 15.0, 10.0, 8.0, 9.0, 12.0, 2.0, 4.0, 5.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4357149004936218, -0.4222544729709625, -0.4087940454483032, -0.3953336179256439, -0.3818731904029846, -0.3684127926826477, -0.3549523651599884, -0.3414919376373291, -0.3280315101146698, -0.3145710825920105, -0.3011106550693512, -0.2876502275466919, -0.274189829826355, -0.2607293725013733, -0.24726897478103638, -0.23380854725837708, -0.22034811973571777, -0.20688769221305847, -0.19342726469039917, -0.17996685206890106, -0.16650642454624176, -0.15304599702358246, -0.13958558440208435, -0.12612515687942505, -0.11266472935676575, -0.09920430183410645, -0.08574388176202774, -0.07228346168994904, -0.058823034167289734, -0.04536260664463043, -0.03190218657255173, -0.018441766500473022, -0.004981338977813721, 0.008479084819555283, 0.021939508616924286, 0.03539993241429329, 0.04886035621166229, 0.062320783734321594, 0.0757812038064003, 0.089241623878479, 0.1027020514011383, 0.11616247892379761, 0.1296229064464569, 0.14308331906795502, 0.15654374659061432, 0.17000417411327362, 0.18346458673477173, 0.19692501425743103, 0.21038544178009033, 0.22384586930274963, 0.23730629682540894, 0.25076672434806824, 0.26422715187072754, 0.27768754959106445, 0.29114797711372375, 0.30460840463638306, 0.31806883215904236, 0.33152925968170166, 0.34498968720436096, 0.35845011472702026, 0.3719105124473572, 0.38537096977233887, 0.3988313674926758, 0.4122917950153351, 0.4257522225379944]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 12.0, 18.0, 18.0, 26.0, 45.0, 44.0, 66.0, 122.0, 187.0, 270.0, 453.0, 685.0, 1103.0, 2045.0, 3532.0, 6638.0, 12973.0, 27466.0, 61885.0, 149805.0, 309218.0, 263831.0, 114376.0, 48239.0, 21666.0, 10741.0, 5633.0, 2935.0, 1759.0, 961.0, 629.0, 380.0, 268.0, 165.0, 113.0, 66.0, 56.0, 42.0, 25.0, 21.0, 14.0, 13.0, 1.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.266845703125, -0.2594032287597656, -0.25196075439453125, -0.24451828002929688, -0.2370758056640625, -0.22963333129882812, -0.22219085693359375, -0.21474838256835938, -0.207305908203125, -0.19986343383789062, -0.19242095947265625, -0.18497848510742188, -0.1775360107421875, -0.17009353637695312, -0.16265106201171875, -0.15520858764648438, -0.14776611328125, -0.14032363891601562, -0.13288116455078125, -0.12543869018554688, -0.1179962158203125, -0.11055374145507812, -0.10311126708984375, -0.09566879272460938, -0.088226318359375, -0.08078384399414062, -0.07334136962890625, -0.06589889526367188, -0.0584564208984375, -0.051013946533203125, -0.04357147216796875, -0.036128997802734375, -0.0286865234375, -0.021244049072265625, -0.01380157470703125, -0.006359100341796875, 0.0010833740234375, 0.008525848388671875, 0.01596832275390625, 0.023410797119140625, 0.030853271484375, 0.038295745849609375, 0.04573822021484375, 0.053180694580078125, 0.0606231689453125, 0.06806564331054688, 0.07550811767578125, 0.08295059204101562, 0.09039306640625, 0.09783554077148438, 0.10527801513671875, 0.11272048950195312, 0.1201629638671875, 0.12760543823242188, 0.13504791259765625, 0.14249038696289062, 0.149932861328125, 0.15737533569335938, 0.16481781005859375, 0.17226028442382812, 0.1797027587890625, 0.18714523315429688, 0.19458770751953125, 0.20203018188476562, 0.20947265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 5.0, 8.0, 10.0, 15.0, 12.0, 20.0, 23.0, 24.0, 33.0, 34.0, 40.0, 37.0, 53.0, 51.0, 63.0, 59.0, 65.0, 71.0, 55.0, 39.0, 41.0, 39.0, 46.0, 23.0, 31.0, 20.0, 14.0, 14.0, 12.0, 11.0, 7.0, 6.0, 3.0, 3.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11773681640625, -0.11355876922607422, -0.10938072204589844, -0.10520267486572266, -0.10102462768554688, -0.0968465805053711, -0.09266853332519531, -0.08849048614501953, -0.08431243896484375, -0.08013439178466797, -0.07595634460449219, -0.0717782974243164, -0.06760025024414062, -0.06342220306396484, -0.05924415588378906, -0.05506610870361328, -0.0508880615234375, -0.04671001434326172, -0.04253196716308594, -0.038353919982910156, -0.034175872802734375, -0.029997825622558594, -0.025819778442382812, -0.02164173126220703, -0.01746368408203125, -0.013285636901855469, -0.009107589721679688, -0.004929542541503906, -0.000751495361328125, 0.0034265518188476562, 0.0076045989990234375, 0.011782646179199219, 0.015960693359375, 0.02013874053955078, 0.024316787719726562, 0.028494834899902344, 0.032672882080078125, 0.036850929260253906, 0.04102897644042969, 0.04520702362060547, 0.04938507080078125, 0.05356311798095703, 0.05774116516113281, 0.061919212341308594, 0.06609725952148438, 0.07027530670166016, 0.07445335388183594, 0.07863140106201172, 0.0828094482421875, 0.08698749542236328, 0.09116554260253906, 0.09534358978271484, 0.09952163696289062, 0.1036996841430664, 0.10787773132324219, 0.11205577850341797, 0.11623382568359375, 0.12041187286376953, 0.12458992004394531, 0.1287679672241211, 0.13294601440429688, 0.13712406158447266, 0.14130210876464844, 0.14548015594482422, 0.149658203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 3.0, 9.0, 17.0, 26.0, 43.0, 48.0, 67.0, 125.0, 168.0, 260.0, 427.0, 761.0, 1556.0, 3937.0, 17239.0, 145430.0, 754674.0, 103812.0, 13497.0, 3289.0, 1338.0, 672.0, 413.0, 239.0, 161.0, 109.0, 71.0, 57.0, 28.0, 27.0, 15.0, 14.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63037109375, -0.6096572875976562, -0.5889434814453125, -0.5682296752929688, -0.547515869140625, -0.5268020629882812, -0.5060882568359375, -0.48537445068359375, -0.46466064453125, -0.44394683837890625, -0.4232330322265625, -0.40251922607421875, -0.381805419921875, -0.36109161376953125, -0.3403778076171875, -0.31966400146484375, -0.2989501953125, -0.27823638916015625, -0.2575225830078125, -0.23680877685546875, -0.216094970703125, -0.19538116455078125, -0.1746673583984375, -0.15395355224609375, -0.13323974609375, -0.11252593994140625, -0.0918121337890625, -0.07109832763671875, -0.050384521484375, -0.02967071533203125, -0.0089569091796875, 0.01175689697265625, 0.032470703125, 0.05318450927734375, 0.0738983154296875, 0.09461212158203125, 0.115325927734375, 0.13603973388671875, 0.1567535400390625, 0.17746734619140625, 0.19818115234375, 0.21889495849609375, 0.2396087646484375, 0.26032257080078125, 0.281036376953125, 0.30175018310546875, 0.3224639892578125, 0.34317779541015625, 0.3638916015625, 0.38460540771484375, 0.4053192138671875, 0.42603302001953125, 0.446746826171875, 0.46746063232421875, 0.4881744384765625, 0.5088882446289062, 0.52960205078125, 0.5503158569335938, 0.5710296630859375, 0.5917434692382812, 0.612457275390625, 0.6331710815429688, 0.6538848876953125, 0.6745986938476562, 0.6953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 15.0, 10.0, 19.0, 25.0, 26.0, 29.0, 34.0, 42.0, 37.0, 53.0, 54.0, 71.0, 64.0, 87.0, 57.0, 44.0, 63.0, 59.0, 42.0, 41.0, 29.0, 20.0, 21.0, 18.0, 11.0, 8.0, 11.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.05621337890625, -1.0303955078125, -1.00457763671875, -0.978759765625, -0.95294189453125, -0.9271240234375, -0.90130615234375, -0.87548828125, -0.84967041015625, -0.8238525390625, -0.79803466796875, -0.772216796875, -0.74639892578125, -0.7205810546875, -0.69476318359375, -0.6689453125, -0.64312744140625, -0.6173095703125, -0.59149169921875, -0.565673828125, -0.53985595703125, -0.5140380859375, -0.48822021484375, -0.46240234375, -0.43658447265625, -0.4107666015625, -0.38494873046875, -0.359130859375, -0.33331298828125, -0.3074951171875, -0.28167724609375, -0.255859375, -0.23004150390625, -0.2042236328125, -0.17840576171875, -0.152587890625, -0.12677001953125, -0.1009521484375, -0.07513427734375, -0.04931640625, -0.02349853515625, 0.0023193359375, 0.02813720703125, 0.053955078125, 0.07977294921875, 0.1055908203125, 0.13140869140625, 0.1572265625, 0.18304443359375, 0.2088623046875, 0.23468017578125, 0.260498046875, 0.28631591796875, 0.3121337890625, 0.33795166015625, 0.36376953125, 0.38958740234375, 0.4154052734375, 0.44122314453125, 0.467041015625, 0.49285888671875, 0.5186767578125, 0.54449462890625, 0.5703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 4.0, 4.0, 10.0, 14.0, 23.0, 29.0, 38.0, 63.0, 110.0, 188.0, 330.0, 648.0, 1255.0, 2803.0, 8290.0, 36501.0, 295260.0, 601107.0, 79780.0, 14312.0, 4191.0, 1686.0, 818.0, 403.0, 250.0, 147.0, 105.0, 59.0, 37.0, 24.0, 19.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0], "bins": [-0.317626953125, -0.3093128204345703, -0.3009986877441406, -0.29268455505371094, -0.28437042236328125, -0.27605628967285156, -0.2677421569824219, -0.2594280242919922, -0.2511138916015625, -0.2427997589111328, -0.23448562622070312, -0.22617149353027344, -0.21785736083984375, -0.20954322814941406, -0.20122909545898438, -0.1929149627685547, -0.184600830078125, -0.1762866973876953, -0.16797256469726562, -0.15965843200683594, -0.15134429931640625, -0.14303016662597656, -0.13471603393554688, -0.1264019012451172, -0.1180877685546875, -0.10977363586425781, -0.10145950317382812, -0.09314537048339844, -0.08483123779296875, -0.07651710510253906, -0.06820297241210938, -0.05988883972167969, -0.05157470703125, -0.04326057434082031, -0.034946441650390625, -0.026632308959960938, -0.01831817626953125, -0.010004043579101562, -0.001689910888671875, 0.0066242218017578125, 0.0149383544921875, 0.023252487182617188, 0.031566619873046875, 0.03988075256347656, 0.04819488525390625, 0.05650901794433594, 0.06482315063476562, 0.07313728332519531, 0.081451416015625, 0.08976554870605469, 0.09807968139648438, 0.10639381408691406, 0.11470794677734375, 0.12302207946777344, 0.13133621215820312, 0.1396503448486328, 0.1479644775390625, 0.1562786102294922, 0.16459274291992188, 0.17290687561035156, 0.18122100830078125, 0.18953514099121094, 0.19784927368164062, 0.2061634063720703, 0.2144775390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 11.0, 18.0, 19.0, 16.0, 29.0, 39.0, 34.0, 68.0, 72.0, 88.0, 107.0, 104.0, 89.0, 58.0, 59.0, 46.0, 28.0, 20.0, 21.0, 16.0, 15.0, 8.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00010162591934204102, -9.851623326539993e-05, -9.540654718875885e-05, -9.229686111211777e-05, -8.918717503547668e-05, -8.60774889588356e-05, -8.296780288219452e-05, -7.985811680555344e-05, -7.674843072891235e-05, -7.363874465227127e-05, -7.052905857563019e-05, -6.74193724989891e-05, -6.430968642234802e-05, -6.120000034570694e-05, -5.809031426906586e-05, -5.4980628192424774e-05, -5.187094211578369e-05, -4.876125603914261e-05, -4.5651569962501526e-05, -4.254188388586044e-05, -3.943219780921936e-05, -3.632251173257828e-05, -3.3212825655937195e-05, -3.0103139579296112e-05, -2.699345350265503e-05, -2.3883767426013947e-05, -2.0774081349372864e-05, -1.766439527273178e-05, -1.4554709196090698e-05, -1.1445023119449615e-05, -8.335337042808533e-06, -5.22565096616745e-06, -2.115964889526367e-06, 9.937211871147156e-07, 4.103407263755798e-06, 7.213093340396881e-06, 1.0322779417037964e-05, 1.3432465493679047e-05, 1.654215157032013e-05, 1.9651837646961212e-05, 2.2761523723602295e-05, 2.5871209800243378e-05, 2.898089587688446e-05, 3.209058195352554e-05, 3.5200268030166626e-05, 3.830995410680771e-05, 4.141964018344879e-05, 4.4529326260089874e-05, 4.763901233673096e-05, 5.074869841337204e-05, 5.385838449001312e-05, 5.6968070566654205e-05, 6.007775664329529e-05, 6.318744271993637e-05, 6.629712879657745e-05, 6.940681487321854e-05, 7.251650094985962e-05, 7.56261870265007e-05, 7.873587310314178e-05, 8.184555917978287e-05, 8.495524525642395e-05, 8.806493133306503e-05, 9.117461740970612e-05, 9.42843034863472e-05, 9.739398956298828e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 9.0, 9.0, 14.0, 25.0, 31.0, 94.0, 156.0, 343.0, 825.0, 2297.0, 9335.0, 110862.0, 834830.0, 78406.0, 7925.0, 1990.0, 710.0, 319.0, 170.0, 73.0, 54.0, 22.0, 14.0, 8.0, 9.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387451171875, -0.374725341796875, -0.36199951171875, -0.349273681640625, -0.3365478515625, -0.323822021484375, -0.31109619140625, -0.298370361328125, -0.28564453125, -0.272918701171875, -0.26019287109375, -0.247467041015625, -0.2347412109375, -0.222015380859375, -0.20928955078125, -0.196563720703125, -0.183837890625, -0.171112060546875, -0.15838623046875, -0.145660400390625, -0.1329345703125, -0.120208740234375, -0.10748291015625, -0.094757080078125, -0.08203125, -0.069305419921875, -0.05657958984375, -0.043853759765625, -0.0311279296875, -0.018402099609375, -0.00567626953125, 0.007049560546875, 0.019775390625, 0.032501220703125, 0.04522705078125, 0.057952880859375, 0.0706787109375, 0.083404541015625, 0.09613037109375, 0.108856201171875, 0.12158203125, 0.134307861328125, 0.14703369140625, 0.159759521484375, 0.1724853515625, 0.185211181640625, 0.19793701171875, 0.210662841796875, 0.223388671875, 0.236114501953125, 0.24884033203125, 0.261566162109375, 0.2742919921875, 0.287017822265625, 0.29974365234375, 0.312469482421875, 0.3251953125, 0.337921142578125, 0.35064697265625, 0.363372802734375, 0.3760986328125, 0.388824462890625, 0.40155029296875, 0.414276123046875, 0.427001953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 12.0, 17.0, 14.0, 27.0, 29.0, 45.0, 56.0, 69.0, 76.0, 81.0, 86.0, 91.0, 78.0, 72.0, 54.0, 48.0, 35.0, 24.0, 13.0, 20.0, 12.0, 9.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1956787109375, -0.18885231018066406, -0.18202590942382812, -0.1751995086669922, -0.16837310791015625, -0.1615467071533203, -0.15472030639648438, -0.14789390563964844, -0.1410675048828125, -0.13424110412597656, -0.12741470336914062, -0.12058830261230469, -0.11376190185546875, -0.10693550109863281, -0.10010910034179688, -0.09328269958496094, -0.086456298828125, -0.07962989807128906, -0.07280349731445312, -0.06597709655761719, -0.05915069580078125, -0.05232429504394531, -0.045497894287109375, -0.03867149353027344, -0.0318450927734375, -0.025018692016601562, -0.018192291259765625, -0.011365890502929688, -0.00453948974609375, 0.0022869110107421875, 0.009113311767578125, 0.015939712524414062, 0.02276611328125, 0.029592514038085938, 0.036418914794921875, 0.04324531555175781, 0.05007171630859375, 0.05689811706542969, 0.06372451782226562, 0.07055091857910156, 0.0773773193359375, 0.08420372009277344, 0.09103012084960938, 0.09785652160644531, 0.10468292236328125, 0.11150932312011719, 0.11833572387695312, 0.12516212463378906, 0.131988525390625, 0.13881492614746094, 0.14564132690429688, 0.1524677276611328, 0.15929412841796875, 0.1661205291748047, 0.17294692993164062, 0.17977333068847656, 0.1865997314453125, 0.19342613220214844, 0.20025253295898438, 0.2070789337158203, 0.21390533447265625, 0.2207317352294922, 0.22755813598632812, 0.23438453674316406, 0.2412109375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 8.0, 54.0, 209.0, 340.0, 283.0, 86.0, 18.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.757955074310303, -6.4166178703308105, -6.075280666351318, -5.733943462371826, -5.392606258392334, -5.051269054412842, -4.709931373596191, -4.368594169616699, -4.027256965637207, -3.685919761657715, -3.3445825576782227, -3.0032453536987305, -2.6619081497192383, -2.320570945739746, -1.9792335033416748, -1.6378962993621826, -1.2965593338012695, -0.9552221298217773, -0.6138848662376404, -0.2725476026535034, 0.06878960132598877, 0.41012680530548096, 0.7514641284942627, 1.0928013324737549, 1.434138536453247, 1.7754757404327393, 2.1168129444122314, 2.4581503868103027, 2.799487590789795, 3.140824794769287, 3.4821619987487793, 3.8234992027282715, 4.1648359298706055, 4.506173133850098, 4.84751033782959, 5.188847541809082, 5.530184745788574, 5.871521949768066, 6.212859153747559, 6.554196357727051, 6.895533561706543, 7.236870765686035, 7.578207969665527, 7.9195451736450195, 8.260882377624512, 8.602219581604004, 8.943556785583496, 9.284893989562988, 9.626232147216797, 9.967569351196289, 10.308906555175781, 10.650243759155273, 10.991580963134766, 11.332918167114258, 11.67425537109375, 12.015592575073242, 12.356929779052734, 12.698266983032227, 13.039604187011719, 13.380941390991211, 13.722278594970703, 14.063615798950195, 14.404953002929688, 14.74629020690918, 15.087627410888672]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 12.0, 9.0, 10.0, 14.0, 14.0, 18.0, 22.0, 23.0, 29.0, 30.0, 40.0, 43.0, 69.0, 55.0, 70.0, 49.0, 55.0, 51.0, 56.0, 45.0, 39.0, 50.0, 39.0, 31.0, 24.0, 25.0, 16.0, 14.0, 13.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.4993457794189453, -3.3902835845947266, -3.281221628189087, -3.172159433364868, -3.0630974769592285, -2.9540352821350098, -2.844973087310791, -2.7359111309051514, -2.6268489360809326, -2.517786741256714, -2.408724784851074, -2.2996625900268555, -2.190600633621216, -2.081538438796997, -1.9724763631820679, -1.8634142875671387, -1.7543522119522095, -1.6452901363372803, -1.536228060722351, -1.4271659851074219, -1.3181037902832031, -1.209041714668274, -1.0999796390533447, -0.9909175038337708, -0.8818554282188416, -0.7727933526039124, -0.6637312173843384, -0.5546691417694092, -0.4456070363521576, -0.336544930934906, -0.2274828553199768, -0.11842072010040283, -0.009358644485473633, 0.09970345348119736, 0.20876555144786835, 0.31782764196395874, 0.4268897473812103, 0.5359518527984619, 0.6450139284133911, 0.7540760636329651, 0.8631381392478943, 0.9722002148628235, 1.0812623500823975, 1.1903244256973267, 1.2993865013122559, 1.4084486961364746, 1.5175106525421143, 1.626572847366333, 1.7356349229812622, 1.8446969985961914, 1.9537590742111206, 2.06282114982605, 2.1718833446502686, 2.280945301055908, 2.390007495880127, 2.4990696907043457, 2.6081316471099854, 2.717193841934204, 2.8262557983398438, 2.9353179931640625, 3.044379949569702, 3.153442144393921, 3.2625041007995605, 3.3715662956237793, 3.480628490447998]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 11.0, 17.0, 15.0, 30.0, 50.0, 59.0, 113.0, 193.0, 417.0, 942.0, 2783.0, 14006.0, 4075460.0, 90372.0, 6607.0, 1723.0, 694.0, 332.0, 170.0, 88.0, 65.0, 47.0, 25.0, 19.0, 11.0, 13.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.21484375, -1.1857833862304688, -1.1567230224609375, -1.1276626586914062, -1.098602294921875, -1.0695419311523438, -1.0404815673828125, -1.0114212036132812, -0.98236083984375, -0.9533004760742188, -0.9242401123046875, -0.8951797485351562, -0.866119384765625, -0.8370590209960938, -0.8079986572265625, -0.7789382934570312, -0.7498779296875, -0.7208175659179688, -0.6917572021484375, -0.6626968383789062, -0.633636474609375, -0.6045761108398438, -0.5755157470703125, -0.5464553833007812, -0.51739501953125, -0.48833465576171875, -0.4592742919921875, -0.43021392822265625, -0.401153564453125, -0.37209320068359375, -0.3430328369140625, -0.31397247314453125, -0.284912109375, -0.25585174560546875, -0.2267913818359375, -0.19773101806640625, -0.168670654296875, -0.13961029052734375, -0.1105499267578125, -0.08148956298828125, -0.05242919921875, -0.02336883544921875, 0.0056915283203125, 0.03475189208984375, 0.063812255859375, 0.09287261962890625, 0.1219329833984375, 0.15099334716796875, 0.1800537109375, 0.20911407470703125, 0.2381744384765625, 0.26723480224609375, 0.296295166015625, 0.32535552978515625, 0.3544158935546875, 0.38347625732421875, 0.41253662109375, 0.44159698486328125, 0.4706573486328125, 0.49971771240234375, 0.528778076171875, 0.5578384399414062, 0.5868988037109375, 0.6159591674804688, 0.64501953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 7.0, 3.0, 8.0, 5.0, 14.0, 7.0, 22.0, 29.0, 26.0, 36.0, 30.0, 58.0, 60.0, 57.0, 60.0, 68.0, 71.0, 58.0, 66.0, 63.0, 55.0, 45.0, 36.0, 20.0, 21.0, 17.0, 17.0, 11.0, 10.0, 12.0, 2.0, 1.0, 0.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1279296875, -0.123046875, -0.1181640625, -0.11328125, -0.1083984375, -0.103515625, -0.0986328125, -0.09375, -0.0888671875, -0.083984375, -0.0791015625, -0.07421875, -0.0693359375, -0.064453125, -0.0595703125, -0.0546875, -0.0498046875, -0.044921875, -0.0400390625, -0.03515625, -0.0302734375, -0.025390625, -0.0205078125, -0.015625, -0.0107421875, -0.005859375, -0.0009765625, 0.00390625, 0.0087890625, 0.013671875, 0.0185546875, 0.0234375, 0.0283203125, 0.033203125, 0.0380859375, 0.04296875, 0.0478515625, 0.052734375, 0.0576171875, 0.0625, 0.0673828125, 0.072265625, 0.0771484375, 0.08203125, 0.0869140625, 0.091796875, 0.0966796875, 0.1015625, 0.1064453125, 0.111328125, 0.1162109375, 0.12109375, 0.1259765625, 0.130859375, 0.1357421875, 0.140625, 0.1455078125, 0.150390625, 0.1552734375, 0.16015625, 0.1650390625, 0.169921875, 0.1748046875, 0.1796875, 0.1845703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 12.0, 12.0, 8.0, 14.0, 20.0, 24.0, 44.0, 61.0, 80.0, 120.0, 182.0, 262.0, 380.0, 525.0, 862.0, 1490.0, 2920.0, 7676.0, 34201.0, 4047887.0, 78226.0, 10938.0, 3708.0, 1744.0, 916.0, 600.0, 426.0, 277.0, 182.0, 142.0, 84.0, 71.0, 60.0, 32.0, 24.0, 20.0, 12.0, 12.0, 6.0, 10.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80078125, -0.7769851684570312, -0.7531890869140625, -0.7293930053710938, -0.705596923828125, -0.6818008422851562, -0.6580047607421875, -0.6342086791992188, -0.61041259765625, -0.5866165161132812, -0.5628204345703125, -0.5390243530273438, -0.515228271484375, -0.49143218994140625, -0.4676361083984375, -0.44384002685546875, -0.4200439453125, -0.39624786376953125, -0.3724517822265625, -0.34865570068359375, -0.324859619140625, -0.30106353759765625, -0.2772674560546875, -0.25347137451171875, -0.22967529296875, -0.20587921142578125, -0.1820831298828125, -0.15828704833984375, -0.134490966796875, -0.11069488525390625, -0.0868988037109375, -0.06310272216796875, -0.039306640625, -0.01551055908203125, 0.0082855224609375, 0.03208160400390625, 0.055877685546875, 0.07967376708984375, 0.1034698486328125, 0.12726593017578125, 0.15106201171875, 0.17485809326171875, 0.1986541748046875, 0.22245025634765625, 0.246246337890625, 0.27004241943359375, 0.2938385009765625, 0.31763458251953125, 0.3414306640625, 0.36522674560546875, 0.3890228271484375, 0.41281890869140625, 0.436614990234375, 0.46041107177734375, 0.4842071533203125, 0.5080032348632812, 0.53179931640625, 0.5555953979492188, 0.5793914794921875, 0.6031875610351562, 0.626983642578125, 0.6507797241210938, 0.6745758056640625, 0.6983718872070312, 0.72216796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 4.0, 4.0, 7.0, 13.0, 21.0, 45.0, 180.0, 3454.0, 214.0, 60.0, 19.0, 16.0, 12.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1416015625, -0.13605880737304688, -0.13051605224609375, -0.12497329711914062, -0.1194305419921875, -0.11388778686523438, -0.10834503173828125, -0.10280227661132812, -0.097259521484375, -0.09171676635742188, -0.08617401123046875, -0.08063125610351562, -0.0750885009765625, -0.06954574584960938, -0.06400299072265625, -0.058460235595703125, -0.05291748046875, -0.047374725341796875, -0.04183197021484375, -0.036289215087890625, -0.0307464599609375, -0.025203704833984375, -0.01966094970703125, -0.014118194580078125, -0.008575439453125, -0.003032684326171875, 0.00251007080078125, 0.008052825927734375, 0.0135955810546875, 0.019138336181640625, 0.02468109130859375, 0.030223846435546875, 0.0357666015625, 0.041309356689453125, 0.04685211181640625, 0.052394866943359375, 0.0579376220703125, 0.06348037719726562, 0.06902313232421875, 0.07456588745117188, 0.080108642578125, 0.08565139770507812, 0.09119415283203125, 0.09673690795898438, 0.1022796630859375, 0.10782241821289062, 0.11336517333984375, 0.11890792846679688, 0.12445068359375, 0.12999343872070312, 0.13553619384765625, 0.14107894897460938, 0.1466217041015625, 0.15216445922851562, 0.15770721435546875, 0.16324996948242188, 0.168792724609375, 0.17433547973632812, 0.17987823486328125, 0.18542098999023438, 0.1909637451171875, 0.19650650024414062, 0.20204925537109375, 0.20759201049804688, 0.213134765625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 19.0, 20.0, 44.0, 40.0, 83.0, 99.0, 136.0, 137.0, 117.0, 86.0, 66.0, 54.0, 36.0, 21.0, 9.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5913881063461304, -0.5717244148254395, -0.5520606637001038, -0.5323969721794128, -0.5127332210540771, -0.49306952953338623, -0.4734058082103729, -0.4537420868873596, -0.4340783953666687, -0.4144146740436554, -0.3947509527206421, -0.37508726119995117, -0.35542353987693787, -0.33575981855392456, -0.31609609723091125, -0.29643237590789795, -0.27676865458488464, -0.25710493326187134, -0.23744122684001923, -0.21777750551700592, -0.1981137990951538, -0.1784500777721405, -0.1587863564491272, -0.13912265002727509, -0.11945892870426178, -0.09979521483182907, -0.08013150095939636, -0.06046777963638306, -0.04080406576395035, -0.02114035189151764, -0.0014766305685043335, 0.01818707585334778, 0.037850797176361084, 0.05751451104879379, 0.0771782249212265, 0.09684194624423981, 0.11650566011667252, 0.13616937398910522, 0.15583309531211853, 0.17549680173397064, 0.19516052305698395, 0.21482424437999725, 0.23448795080184937, 0.25415167212486267, 0.273815393447876, 0.2934790849685669, 0.3131428360939026, 0.3328065276145935, 0.3524702489376068, 0.3721339702606201, 0.3917976915836334, 0.41146141290664673, 0.43112510442733765, 0.45078882575035095, 0.47045254707336426, 0.4901162385940552, 0.5097799897193909, 0.5294436812400818, 0.5491074323654175, 0.5687711238861084, 0.5884348750114441, 0.608098566532135, 0.6277623176574707, 0.6474260091781616, 0.6670897006988525]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 11.0, 8.0, 13.0, 13.0, 11.0, 16.0, 17.0, 23.0, 30.0, 30.0, 23.0, 36.0, 26.0, 27.0, 39.0, 34.0, 40.0, 44.0, 48.0, 43.0, 37.0, 46.0, 32.0, 45.0, 31.0, 35.0, 29.0, 31.0, 28.0, 22.0, 14.0, 17.0, 15.0, 16.0, 16.0, 11.0, 5.0, 5.0, 8.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32902616262435913, -0.3189006745815277, -0.3087752163410187, -0.29864972829818726, -0.2885242700576782, -0.2783987820148468, -0.2682732939720154, -0.25814783573150635, -0.24802234768867493, -0.2378968745470047, -0.22777140140533447, -0.21764591336250305, -0.20752044022083282, -0.1973949670791626, -0.18726947903633118, -0.17714400589466095, -0.16701853275299072, -0.1568930596113205, -0.14676758646965027, -0.13664209842681885, -0.12651662528514862, -0.1163911521434784, -0.10626567155122757, -0.09614019095897675, -0.08601471781730652, -0.07588924467563629, -0.06576376408338547, -0.05563828721642494, -0.045512810349464417, -0.03538733348250389, -0.025261856615543365, -0.015136376023292542, -0.0050109028816223145, 0.005114573985338211, 0.015240050852298737, 0.025365527719259262, 0.03549100458621979, 0.04561648145318031, 0.05574195832014084, 0.06586743891239166, 0.07599291205406189, 0.08611838519573212, 0.09624386578798294, 0.10636934638023376, 0.11649481952190399, 0.12662029266357422, 0.13674578070640564, 0.14687125384807587, 0.1569967269897461, 0.16712220013141632, 0.17724767327308655, 0.18737316131591797, 0.1974986344575882, 0.20762410759925842, 0.21774959564208984, 0.22787506878376007, 0.2380005419254303, 0.24812601506710052, 0.25825148820877075, 0.2683769762516022, 0.2785024642944336, 0.2886279225349426, 0.29875341057777405, 0.30887889862060547, 0.3190043568611145]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 10.0, 14.0, 14.0, 24.0, 34.0, 47.0, 71.0, 95.0, 147.0, 190.0, 289.0, 421.0, 629.0, 940.0, 1474.0, 2392.0, 3953.0, 6442.0, 11051.0, 19549.0, 35633.0, 70523.0, 149028.0, 286302.0, 231427.0, 108700.0, 52945.0, 27939.0, 15294.0, 8818.0, 5188.0, 3291.0, 1935.0, 1280.0, 832.0, 497.0, 319.0, 240.0, 164.0, 135.0, 70.0, 50.0, 38.0, 31.0, 21.0, 13.0, 12.0, 14.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0], "bins": [-0.1964111328125, -0.19042205810546875, -0.1844329833984375, -0.17844390869140625, -0.172454833984375, -0.16646575927734375, -0.1604766845703125, -0.15448760986328125, -0.14849853515625, -0.14250946044921875, -0.1365203857421875, -0.13053131103515625, -0.124542236328125, -0.11855316162109375, -0.1125640869140625, -0.10657501220703125, -0.1005859375, -0.09459686279296875, -0.0886077880859375, -0.08261871337890625, -0.076629638671875, -0.07064056396484375, -0.0646514892578125, -0.05866241455078125, -0.05267333984375, -0.04668426513671875, -0.0406951904296875, -0.03470611572265625, -0.028717041015625, -0.02272796630859375, -0.0167388916015625, -0.01074981689453125, -0.0047607421875, 0.00122833251953125, 0.0072174072265625, 0.01320648193359375, 0.019195556640625, 0.02518463134765625, 0.0311737060546875, 0.03716278076171875, 0.04315185546875, 0.04914093017578125, 0.0551300048828125, 0.06111907958984375, 0.067108154296875, 0.07309722900390625, 0.0790863037109375, 0.08507537841796875, 0.091064453125, 0.09705352783203125, 0.1030426025390625, 0.10903167724609375, 0.115020751953125, 0.12100982666015625, 0.1269989013671875, 0.13298797607421875, 0.13897705078125, 0.14496612548828125, 0.1509552001953125, 0.15694427490234375, 0.162933349609375, 0.16892242431640625, 0.1749114990234375, 0.18090057373046875, 0.1868896484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 2.0, 14.0, 12.0, 21.0, 12.0, 15.0, 26.0, 26.0, 34.0, 30.0, 38.0, 43.0, 49.0, 39.0, 67.0, 56.0, 55.0, 61.0, 57.0, 49.0, 51.0, 41.0, 19.0, 34.0, 18.0, 15.0, 26.0, 13.0, 17.0, 10.0, 9.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11053466796875, -0.1063089370727539, -0.10208320617675781, -0.09785747528076172, -0.09363174438476562, -0.08940601348876953, -0.08518028259277344, -0.08095455169677734, -0.07672882080078125, -0.07250308990478516, -0.06827735900878906, -0.06405162811279297, -0.059825897216796875, -0.05560016632080078, -0.05137443542480469, -0.047148704528808594, -0.0429229736328125, -0.038697242736816406, -0.03447151184082031, -0.03024578094482422, -0.026020050048828125, -0.02179431915283203, -0.017568588256835938, -0.013342857360839844, -0.00911712646484375, -0.004891395568847656, -0.0006656646728515625, 0.0035600662231445312, 0.007785797119140625, 0.012011528015136719, 0.016237258911132812, 0.020462989807128906, 0.024688720703125, 0.028914451599121094, 0.03314018249511719, 0.03736591339111328, 0.041591644287109375, 0.04581737518310547, 0.05004310607910156, 0.054268836975097656, 0.05849456787109375, 0.06272029876708984, 0.06694602966308594, 0.07117176055908203, 0.07539749145507812, 0.07962322235107422, 0.08384895324707031, 0.0880746841430664, 0.0923004150390625, 0.0965261459350586, 0.10075187683105469, 0.10497760772705078, 0.10920333862304688, 0.11342906951904297, 0.11765480041503906, 0.12188053131103516, 0.12610626220703125, 0.13033199310302734, 0.13455772399902344, 0.13878345489501953, 0.14300918579101562, 0.14723491668701172, 0.1514606475830078, 0.1556863784790039, 0.159912109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 6.0, 3.0, 12.0, 8.0, 16.0, 24.0, 31.0, 47.0, 68.0, 96.0, 119.0, 164.0, 272.0, 391.0, 680.0, 1301.0, 3283.0, 12575.0, 85208.0, 752964.0, 163484.0, 19571.0, 4418.0, 1629.0, 787.0, 433.0, 310.0, 190.0, 136.0, 98.0, 61.0, 57.0, 28.0, 33.0, 17.0, 13.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.4844207763671875, -0.466888427734375, -0.4493560791015625, -0.43182373046875, -0.4142913818359375, -0.396759033203125, -0.3792266845703125, -0.3616943359375, -0.3441619873046875, -0.326629638671875, -0.3090972900390625, -0.29156494140625, -0.2740325927734375, -0.256500244140625, -0.2389678955078125, -0.221435546875, -0.2039031982421875, -0.186370849609375, -0.1688385009765625, -0.15130615234375, -0.1337738037109375, -0.116241455078125, -0.0987091064453125, -0.0811767578125, -0.0636444091796875, -0.046112060546875, -0.0285797119140625, -0.01104736328125, 0.0064849853515625, 0.024017333984375, 0.0415496826171875, 0.05908203125, 0.0766143798828125, 0.094146728515625, 0.1116790771484375, 0.12921142578125, 0.1467437744140625, 0.164276123046875, 0.1818084716796875, 0.1993408203125, 0.2168731689453125, 0.234405517578125, 0.2519378662109375, 0.26947021484375, 0.2870025634765625, 0.304534912109375, 0.3220672607421875, 0.339599609375, 0.3571319580078125, 0.374664306640625, 0.3921966552734375, 0.40972900390625, 0.4272613525390625, 0.444793701171875, 0.4623260498046875, 0.4798583984375, 0.4973907470703125, 0.514923095703125, 0.5324554443359375, 0.54998779296875, 0.5675201416015625, 0.585052490234375, 0.6025848388671875, 0.6201171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 11.0, 11.0, 14.0, 16.0, 20.0, 27.0, 21.0, 32.0, 45.0, 32.0, 43.0, 58.0, 55.0, 44.0, 52.0, 47.0, 47.0, 45.0, 50.0, 45.0, 40.0, 30.0, 35.0, 27.0, 30.0, 22.0, 13.0, 16.0, 14.0, 7.0, 8.0, 7.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6177597045898438, -0.5978240966796875, -0.5778884887695312, -0.557952880859375, -0.5380172729492188, -0.5180816650390625, -0.49814605712890625, -0.47821044921875, -0.45827484130859375, -0.4383392333984375, -0.41840362548828125, -0.398468017578125, -0.37853240966796875, -0.3585968017578125, -0.33866119384765625, -0.3187255859375, -0.29878997802734375, -0.2788543701171875, -0.25891876220703125, -0.238983154296875, -0.21904754638671875, -0.1991119384765625, -0.17917633056640625, -0.15924072265625, -0.13930511474609375, -0.1193695068359375, -0.09943389892578125, -0.079498291015625, -0.05956268310546875, -0.0396270751953125, -0.01969146728515625, 0.000244140625, 0.02017974853515625, 0.0401153564453125, 0.06005096435546875, 0.079986572265625, 0.09992218017578125, 0.1198577880859375, 0.13979339599609375, 0.15972900390625, 0.17966461181640625, 0.1996002197265625, 0.21953582763671875, 0.239471435546875, 0.25940704345703125, 0.2793426513671875, 0.29927825927734375, 0.3192138671875, 0.33914947509765625, 0.3590850830078125, 0.37902069091796875, 0.398956298828125, 0.41889190673828125, 0.4388275146484375, 0.45876312255859375, 0.47869873046875, 0.49863433837890625, 0.5185699462890625, 0.5385055541992188, 0.558441162109375, 0.5783767700195312, 0.5983123779296875, 0.6182479858398438, 0.63818359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 1.0, 12.0, 7.0, 9.0, 19.0, 26.0, 52.0, 74.0, 109.0, 276.0, 567.0, 1580.0, 6224.0, 52814.0, 814138.0, 156505.0, 12220.0, 2349.0, 809.0, 346.0, 168.0, 96.0, 57.0, 23.0, 19.0, 15.0, 15.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415771484375, -0.4034271240234375, -0.391082763671875, -0.3787384033203125, -0.36639404296875, -0.3540496826171875, -0.341705322265625, -0.3293609619140625, -0.3170166015625, -0.3046722412109375, -0.292327880859375, -0.2799835205078125, -0.26763916015625, -0.2552947998046875, -0.242950439453125, -0.2306060791015625, -0.21826171875, -0.2059173583984375, -0.193572998046875, -0.1812286376953125, -0.16888427734375, -0.1565399169921875, -0.144195556640625, -0.1318511962890625, -0.1195068359375, -0.1071624755859375, -0.094818115234375, -0.0824737548828125, -0.07012939453125, -0.0577850341796875, -0.045440673828125, -0.0330963134765625, -0.020751953125, -0.0084075927734375, 0.003936767578125, 0.0162811279296875, 0.02862548828125, 0.0409698486328125, 0.053314208984375, 0.0656585693359375, 0.0780029296875, 0.0903472900390625, 0.102691650390625, 0.1150360107421875, 0.12738037109375, 0.1397247314453125, 0.152069091796875, 0.1644134521484375, 0.1767578125, 0.1891021728515625, 0.201446533203125, 0.2137908935546875, 0.22613525390625, 0.2384796142578125, 0.250823974609375, 0.2631683349609375, 0.2755126953125, 0.2878570556640625, 0.300201416015625, 0.3125457763671875, 0.32489013671875, 0.3372344970703125, 0.349578857421875, 0.3619232177734375, 0.374267578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 7.0, 13.0, 10.0, 13.0, 14.0, 17.0, 30.0, 28.0, 38.0, 59.0, 82.0, 119.0, 106.0, 108.0, 84.0, 54.0, 46.0, 40.0, 24.0, 21.0, 19.0, 10.0, 7.0, 12.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.106231689453125e-05, -7.811468094587326e-05, -7.516704499721527e-05, -7.221940904855728e-05, -6.927177309989929e-05, -6.63241371512413e-05, -6.337650120258331e-05, -6.0428865253925323e-05, -5.7481229305267334e-05, -5.4533593356609344e-05, -5.1585957407951355e-05, -4.8638321459293365e-05, -4.5690685510635376e-05, -4.2743049561977386e-05, -3.97954136133194e-05, -3.684777766466141e-05, -3.390014171600342e-05, -3.095250576734543e-05, -2.800486981868744e-05, -2.505723387002945e-05, -2.210959792137146e-05, -1.916196197271347e-05, -1.621432602405548e-05, -1.3266690075397491e-05, -1.0319054126739502e-05, -7.3714181780815125e-06, -4.423782229423523e-06, -1.4761462807655334e-06, 1.471489667892456e-06, 4.4191256165504456e-06, 7.366761565208435e-06, 1.0314397513866425e-05, 1.3262033462524414e-05, 1.6209669411182404e-05, 1.9157305359840393e-05, 2.2104941308498383e-05, 2.5052577257156372e-05, 2.800021320581436e-05, 3.094784915447235e-05, 3.389548510313034e-05, 3.684312105178833e-05, 3.979075700044632e-05, 4.273839294910431e-05, 4.56860288977623e-05, 4.863366484642029e-05, 5.158130079507828e-05, 5.452893674373627e-05, 5.7476572692394257e-05, 6.0424208641052246e-05, 6.337184458971024e-05, 6.631948053836823e-05, 6.926711648702621e-05, 7.22147524356842e-05, 7.51623883843422e-05, 7.811002433300018e-05, 8.105766028165817e-05, 8.400529623031616e-05, 8.695293217897415e-05, 8.990056812763214e-05, 9.284820407629013e-05, 9.579584002494812e-05, 9.874347597360611e-05, 0.0001016911119222641, 0.00010463874787092209, 0.00010758638381958008]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 2.0, 8.0, 9.0, 15.0, 22.0, 38.0, 74.0, 126.0, 275.0, 575.0, 1417.0, 4792.0, 31626.0, 650197.0, 335117.0, 18798.0, 3354.0, 1144.0, 436.0, 222.0, 129.0, 55.0, 41.0, 17.0, 19.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37646484375, -0.36386871337890625, -0.3512725830078125, -0.33867645263671875, -0.326080322265625, -0.31348419189453125, -0.3008880615234375, -0.28829193115234375, -0.27569580078125, -0.26309967041015625, -0.2505035400390625, -0.23790740966796875, -0.225311279296875, -0.21271514892578125, -0.2001190185546875, -0.18752288818359375, -0.1749267578125, -0.16233062744140625, -0.1497344970703125, -0.13713836669921875, -0.124542236328125, -0.11194610595703125, -0.0993499755859375, -0.08675384521484375, -0.07415771484375, -0.06156158447265625, -0.0489654541015625, -0.03636932373046875, -0.023773193359375, -0.01117706298828125, 0.0014190673828125, 0.01401519775390625, 0.026611328125, 0.03920745849609375, 0.0518035888671875, 0.06439971923828125, 0.076995849609375, 0.08959197998046875, 0.1021881103515625, 0.11478424072265625, 0.12738037109375, 0.13997650146484375, 0.1525726318359375, 0.16516876220703125, 0.177764892578125, 0.19036102294921875, 0.2029571533203125, 0.21555328369140625, 0.2281494140625, 0.24074554443359375, 0.2533416748046875, 0.26593780517578125, 0.278533935546875, 0.29113006591796875, 0.3037261962890625, 0.31632232666015625, 0.32891845703125, 0.34151458740234375, 0.3541107177734375, 0.36670684814453125, 0.379302978515625, 0.39189910888671875, 0.4044952392578125, 0.41709136962890625, 0.4296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 9.0, 11.0, 16.0, 23.0, 39.0, 50.0, 57.0, 85.0, 80.0, 122.0, 134.0, 90.0, 70.0, 58.0, 40.0, 32.0, 17.0, 18.0, 6.0, 9.0, 9.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2449951171875, -0.23580360412597656, -0.22661209106445312, -0.2174205780029297, -0.20822906494140625, -0.1990375518798828, -0.18984603881835938, -0.18065452575683594, -0.1714630126953125, -0.16227149963378906, -0.15307998657226562, -0.1438884735107422, -0.13469696044921875, -0.1255054473876953, -0.11631393432617188, -0.10712242126464844, -0.097930908203125, -0.08873939514160156, -0.07954788208007812, -0.07035636901855469, -0.06116485595703125, -0.05197334289550781, -0.042781829833984375, -0.03359031677246094, -0.0243988037109375, -0.015207290649414062, -0.006015777587890625, 0.0031757354736328125, 0.01236724853515625, 0.021558761596679688, 0.030750274658203125, 0.03994178771972656, 0.04913330078125, 0.05832481384277344, 0.06751632690429688, 0.07670783996582031, 0.08589935302734375, 0.09509086608886719, 0.10428237915039062, 0.11347389221191406, 0.1226654052734375, 0.13185691833496094, 0.14104843139648438, 0.1502399444580078, 0.15943145751953125, 0.1686229705810547, 0.17781448364257812, 0.18700599670410156, 0.196197509765625, 0.20538902282714844, 0.21458053588867188, 0.2237720489501953, 0.23296356201171875, 0.2421550750732422, 0.2513465881347656, 0.26053810119628906, 0.2697296142578125, 0.27892112731933594, 0.2881126403808594, 0.2973041534423828, 0.30649566650390625, 0.3156871795654297, 0.3248786926269531, 0.33407020568847656, 0.34326171875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 28.0, 58.0, 114.0, 206.0, 232.0, 179.0, 93.0, 51.0, 15.0, 11.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.85068416595459, -9.663383483886719, -9.476083755493164, -9.288783073425293, -9.101483345031738, -8.914182662963867, -8.726882934570312, -8.539582252502441, -8.352282524108887, -8.164981842041016, -7.977682113647461, -7.790381908416748, -7.603081703186035, -7.415781021118164, -7.228481292724609, -7.041180610656738, -6.853879928588867, -6.666579723358154, -6.479279518127441, -6.2919793128967285, -6.104679107666016, -5.9173784255981445, -5.73007869720459, -5.542778015136719, -5.355478286743164, -5.168178081512451, -4.980877876281738, -4.793577671051025, -4.6062774658203125, -4.418976783752441, -4.231677055358887, -4.044376373291016, -3.8570761680603027, -3.66977596282959, -3.482475757598877, -3.295175552368164, -3.107875108718872, -2.920574903488159, -2.7332746982574463, -2.5459742546081543, -2.3586740493774414, -2.1713738441467285, -1.984073519706726, -1.7967733144760132, -1.6094729900360107, -1.4221727848052979, -1.234872579574585, -1.0475722551345825, -0.8602721691131592, -0.6729719042778015, -0.48567166924476624, -0.29837143421173096, -0.11107116937637329, 0.07622909545898438, 0.26352930068969727, 0.4508296251296997, 0.6381298303604126, 0.8254300951957703, 1.012730360031128, 1.2000305652618408, 1.3873307704925537, 1.5746310949325562, 1.761931300163269, 1.9492316246032715, 2.1365318298339844]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 4.0, 2.0, 6.0, 7.0, 11.0, 15.0, 10.0, 20.0, 15.0, 20.0, 27.0, 22.0, 33.0, 45.0, 54.0, 42.0, 55.0, 35.0, 47.0, 74.0, 60.0, 49.0, 60.0, 39.0, 47.0, 30.0, 29.0, 28.0, 26.0, 13.0, 16.0, 13.0, 13.0, 8.0, 7.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.6820220947265625, -3.584946632385254, -3.4878711700439453, -3.3907957077026367, -3.293720245361328, -3.1966445446014404, -3.099569082260132, -3.0024936199188232, -2.9054181575775146, -2.808342695236206, -2.7112672328948975, -2.614191770553589, -2.517116069793701, -2.4200406074523926, -2.322965145111084, -2.2258896827697754, -2.128814220428467, -2.031738758087158, -1.9346632957458496, -1.8375877141952515, -1.7405122518539429, -1.6434367895126343, -1.5463612079620361, -1.4492857456207275, -1.352210283279419, -1.2551348209381104, -1.1580593585968018, -1.0609837770462036, -0.963908314704895, -0.8668328523635864, -0.7697573304176331, -0.6726818084716797, -0.5756065845489502, -0.4785310924053192, -0.38145560026168823, -0.28438010811805725, -0.18730461597442627, -0.09022912383079529, 0.006846368312835693, 0.10392189025878906, 0.20099735260009766, 0.29807284474372864, 0.3951483368873596, 0.4922238290309906, 0.5892993211746216, 0.6863747835159302, 0.7834503054618835, 0.8805258274078369, 0.9776012897491455, 1.074676752090454, 1.1717522144317627, 1.2688277959823608, 1.3659032583236694, 1.462978720664978, 1.5600543022155762, 1.6571297645568848, 1.7542052268981934, 1.851280689239502, 1.9483561515808105, 2.045431613922119, 2.1425070762634277, 2.2395827770233154, 2.336658239364624, 2.4337337017059326, 2.530809164047241]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 7.0, 6.0, 6.0, 3.0, 8.0, 7.0, 9.0, 6.0, 12.0, 17.0, 23.0, 30.0, 29.0, 40.0, 81.0, 96.0, 217.0, 365.0, 799.0, 1722.0, 5176.0, 26822.0, 3905897.0, 232629.0, 14101.0, 3383.0, 1300.0, 613.0, 307.0, 180.0, 126.0, 78.0, 40.0, 30.0, 26.0, 15.0, 9.0, 11.0, 7.0, 13.0, 10.0, 3.0, 8.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.763671875, -0.7411041259765625, -0.718536376953125, -0.6959686279296875, -0.67340087890625, -0.6508331298828125, -0.628265380859375, -0.6056976318359375, -0.5831298828125, -0.5605621337890625, -0.537994384765625, -0.5154266357421875, -0.49285888671875, -0.4702911376953125, -0.447723388671875, -0.4251556396484375, -0.402587890625, -0.3800201416015625, -0.357452392578125, -0.3348846435546875, -0.31231689453125, -0.2897491455078125, -0.267181396484375, -0.2446136474609375, -0.2220458984375, -0.1994781494140625, -0.176910400390625, -0.1543426513671875, -0.13177490234375, -0.1092071533203125, -0.086639404296875, -0.0640716552734375, -0.04150390625, -0.0189361572265625, 0.003631591796875, 0.0261993408203125, 0.04876708984375, 0.0713348388671875, 0.093902587890625, 0.1164703369140625, 0.1390380859375, 0.1616058349609375, 0.184173583984375, 0.2067413330078125, 0.22930908203125, 0.2518768310546875, 0.274444580078125, 0.2970123291015625, 0.319580078125, 0.3421478271484375, 0.364715576171875, 0.3872833251953125, 0.40985107421875, 0.4324188232421875, 0.454986572265625, 0.4775543212890625, 0.5001220703125, 0.5226898193359375, 0.545257568359375, 0.5678253173828125, 0.59039306640625, 0.6129608154296875, 0.635528564453125, 0.6580963134765625, 0.6806640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 7.0, 7.0, 9.0, 16.0, 24.0, 20.0, 24.0, 25.0, 34.0, 56.0, 57.0, 78.0, 81.0, 90.0, 76.0, 77.0, 48.0, 56.0, 44.0, 42.0, 35.0, 22.0, 24.0, 9.0, 11.0, 5.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12335205078125, -0.11765003204345703, -0.11194801330566406, -0.1062459945678711, -0.10054397583007812, -0.09484195709228516, -0.08913993835449219, -0.08343791961669922, -0.07773590087890625, -0.07203388214111328, -0.06633186340332031, -0.060629844665527344, -0.054927825927734375, -0.049225807189941406, -0.04352378845214844, -0.03782176971435547, -0.0321197509765625, -0.02641773223876953, -0.020715713500976562, -0.015013694763183594, -0.009311676025390625, -0.0036096572875976562, 0.0020923614501953125, 0.007794380187988281, 0.01349639892578125, 0.01919841766357422, 0.024900436401367188, 0.030602455139160156, 0.036304473876953125, 0.042006492614746094, 0.04770851135253906, 0.05341053009033203, 0.059112548828125, 0.06481456756591797, 0.07051658630371094, 0.0762186050415039, 0.08192062377929688, 0.08762264251708984, 0.09332466125488281, 0.09902667999267578, 0.10472869873046875, 0.11043071746826172, 0.11613273620605469, 0.12183475494384766, 0.12753677368164062, 0.1332387924194336, 0.13894081115722656, 0.14464282989501953, 0.1503448486328125, 0.15604686737060547, 0.16174888610839844, 0.1674509048461914, 0.17315292358398438, 0.17885494232177734, 0.1845569610595703, 0.19025897979736328, 0.19596099853515625, 0.20166301727294922, 0.2073650360107422, 0.21306705474853516, 0.21876907348632812, 0.2244710922241211, 0.23017311096191406, 0.23587512969970703, 0.2415771484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 1.0, 7.0, 6.0, 10.0, 20.0, 21.0, 41.0, 48.0, 59.0, 95.0, 140.0, 226.0, 314.0, 477.0, 820.0, 1413.0, 2570.0, 4907.0, 11385.0, 31811.0, 203897.0, 3792123.0, 101988.0, 23358.0, 8891.0, 4202.0, 2207.0, 1203.0, 726.0, 470.0, 285.0, 150.0, 111.0, 87.0, 57.0, 37.0, 33.0, 27.0, 19.0, 13.0, 9.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.4775390625, -0.4640350341796875, -0.450531005859375, -0.4370269775390625, -0.42352294921875, -0.4100189208984375, -0.396514892578125, -0.3830108642578125, -0.3695068359375, -0.3560028076171875, -0.342498779296875, -0.3289947509765625, -0.31549072265625, -0.3019866943359375, -0.288482666015625, -0.2749786376953125, -0.261474609375, -0.2479705810546875, -0.234466552734375, -0.2209625244140625, -0.20745849609375, -0.1939544677734375, -0.180450439453125, -0.1669464111328125, -0.1534423828125, -0.1399383544921875, -0.126434326171875, -0.1129302978515625, -0.09942626953125, -0.0859222412109375, -0.072418212890625, -0.0589141845703125, -0.04541015625, -0.0319061279296875, -0.018402099609375, -0.0048980712890625, 0.00860595703125, 0.0221099853515625, 0.035614013671875, 0.0491180419921875, 0.0626220703125, 0.0761260986328125, 0.089630126953125, 0.1031341552734375, 0.11663818359375, 0.1301422119140625, 0.143646240234375, 0.1571502685546875, 0.170654296875, 0.1841583251953125, 0.197662353515625, 0.2111663818359375, 0.22467041015625, 0.2381744384765625, 0.251678466796875, 0.2651824951171875, 0.2786865234375, 0.2921905517578125, 0.305694580078125, 0.3191986083984375, 0.33270263671875, 0.3462066650390625, 0.359710693359375, 0.3732147216796875, 0.38671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 12.0, 9.0, 15.0, 17.0, 40.0, 78.0, 190.0, 2378.0, 958.0, 160.0, 75.0, 36.0, 22.0, 15.0, 14.0, 9.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.239501953125, -0.23175048828125, -0.2239990234375, -0.21624755859375, -0.20849609375, -0.20074462890625, -0.1929931640625, -0.18524169921875, -0.177490234375, -0.16973876953125, -0.1619873046875, -0.15423583984375, -0.146484375, -0.13873291015625, -0.1309814453125, -0.12322998046875, -0.115478515625, -0.10772705078125, -0.0999755859375, -0.09222412109375, -0.08447265625, -0.07672119140625, -0.0689697265625, -0.06121826171875, -0.053466796875, -0.04571533203125, -0.0379638671875, -0.03021240234375, -0.0224609375, -0.01470947265625, -0.0069580078125, 0.00079345703125, 0.008544921875, 0.01629638671875, 0.0240478515625, 0.03179931640625, 0.03955078125, 0.04730224609375, 0.0550537109375, 0.06280517578125, 0.070556640625, 0.07830810546875, 0.0860595703125, 0.09381103515625, 0.1015625, 0.10931396484375, 0.1170654296875, 0.12481689453125, 0.132568359375, 0.14031982421875, 0.1480712890625, 0.15582275390625, 0.16357421875, 0.17132568359375, 0.1790771484375, 0.18682861328125, 0.194580078125, 0.20233154296875, 0.2100830078125, 0.21783447265625, 0.2255859375, 0.23333740234375, 0.2410888671875, 0.24884033203125, 0.256591796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 2.0, 6.0, 7.0, 17.0, 28.0, 46.0, 92.0, 124.0, 136.0, 156.0, 140.0, 108.0, 60.0, 31.0, 25.0, 15.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8327465057373047, -1.7911361455917358, -1.7495256662368774, -1.7079153060913086, -1.6663049459457397, -1.6246944665908813, -1.5830841064453125, -1.541473627090454, -1.4998632669448853, -1.4582529067993164, -1.416642427444458, -1.3750320672988892, -1.3334217071533203, -1.291811227798462, -1.250200867652893, -1.2085905075073242, -1.1669800281524658, -1.125369668006897, -1.0837591886520386, -1.0421488285064697, -1.0005384683609009, -0.9589279890060425, -0.9173176288604736, -0.87570720911026, -0.8340969085693359, -0.7924864888191223, -0.7508761286735535, -0.7092657089233398, -0.6676552891731262, -0.6260448694229126, -0.5844345092773438, -0.5428240895271301, -0.5012137293815613, -0.45960333943367004, -0.4179929196834564, -0.3763825297355652, -0.33477210998535156, -0.2931617200374603, -0.2515513300895691, -0.20994091033935547, -0.16833052039146423, -0.1267201155424118, -0.08510971814393997, -0.04349932074546814, -0.0018889158964157104, 0.03972148895263672, 0.08133187890052795, 0.12294229865074158, 0.1645526885986328, 0.20616309344768524, 0.24777349829673767, 0.2893838882446289, 0.33099430799484253, 0.37260469794273376, 0.414215087890625, 0.4558255076408386, 0.49743589758872986, 0.5390462875366211, 0.5806567072868347, 0.6222671270370483, 0.6638774871826172, 0.7054879069328308, 0.7470983266830444, 0.7887086868286133, 0.8303191065788269]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 7.0, 12.0, 8.0, 6.0, 12.0, 14.0, 18.0, 23.0, 24.0, 23.0, 22.0, 30.0, 27.0, 36.0, 40.0, 43.0, 39.0, 42.0, 40.0, 44.0, 56.0, 42.0, 44.0, 39.0, 33.0, 39.0, 33.0, 27.0, 28.0, 15.0, 26.0, 13.0, 16.0, 11.0, 13.0, 11.0, 7.0, 13.0, 4.0, 5.0, 5.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5308579802513123, -0.5140323042869568, -0.4972066879272461, -0.4803810119628906, -0.46355536580085754, -0.44672971963882446, -0.429904043674469, -0.4130783975124359, -0.39625275135040283, -0.37942710518836975, -0.36260145902633667, -0.3457757830619812, -0.3289501368999481, -0.31212449073791504, -0.29529881477355957, -0.2784731686115265, -0.2616475224494934, -0.24482187628746033, -0.22799621522426605, -0.21117055416107178, -0.1943449079990387, -0.17751926183700562, -0.16069360077381134, -0.14386793971061707, -0.12704229354858398, -0.1102166399359703, -0.09339098632335663, -0.07656533271074295, -0.05973967909812927, -0.042914025485515594, -0.026088371872901917, -0.009262718260288239, 0.007562994956970215, 0.024388648569583893, 0.04121430218219757, 0.05803995579481125, 0.07486560940742493, 0.0916912630200386, 0.10851691663265228, 0.12534257769584656, 0.14216822385787964, 0.15899387001991272, 0.175819531083107, 0.19264519214630127, 0.20947083830833435, 0.22629648447036743, 0.2431221455335617, 0.259947806596756, 0.27677345275878906, 0.29359909892082214, 0.3104247450828552, 0.3272504210472107, 0.3440760672092438, 0.36090171337127686, 0.3777273893356323, 0.3945530354976654, 0.4113786816596985, 0.42820432782173157, 0.44502997398376465, 0.4618556499481201, 0.4786812961101532, 0.4955069422721863, 0.5123326182365417, 0.5291582345962524, 0.5459839105606079]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 11.0, 10.0, 26.0, 27.0, 42.0, 54.0, 97.0, 159.0, 253.0, 429.0, 705.0, 1141.0, 1947.0, 3441.0, 6447.0, 12515.0, 25223.0, 53307.0, 114943.0, 270169.0, 306454.0, 131865.0, 60016.0, 28703.0, 14091.0, 7254.0, 3894.0, 2111.0, 1245.0, 744.0, 427.0, 302.0, 178.0, 102.0, 86.0, 45.0, 27.0, 18.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2203369140625, -0.2122020721435547, -0.20406723022460938, -0.19593238830566406, -0.18779754638671875, -0.17966270446777344, -0.17152786254882812, -0.1633930206298828, -0.1552581787109375, -0.1471233367919922, -0.13898849487304688, -0.13085365295410156, -0.12271881103515625, -0.11458396911621094, -0.10644912719726562, -0.09831428527832031, -0.090179443359375, -0.08204460144042969, -0.07390975952148438, -0.06577491760253906, -0.05764007568359375, -0.04950523376464844, -0.041370391845703125, -0.03323554992675781, -0.0251007080078125, -0.016965866088867188, -0.008831024169921875, -0.0006961822509765625, 0.00743865966796875, 0.015573501586914062, 0.023708343505859375, 0.03184318542480469, 0.03997802734375, 0.04811286926269531, 0.056247711181640625, 0.06438255310058594, 0.07251739501953125, 0.08065223693847656, 0.08878707885742188, 0.09692192077636719, 0.1050567626953125, 0.11319160461425781, 0.12132644653320312, 0.12946128845214844, 0.13759613037109375, 0.14573097229003906, 0.15386581420898438, 0.1620006561279297, 0.170135498046875, 0.1782703399658203, 0.18640518188476562, 0.19454002380371094, 0.20267486572265625, 0.21080970764160156, 0.21894454956054688, 0.2270793914794922, 0.2352142333984375, 0.2433490753173828, 0.2514839172363281, 0.25961875915527344, 0.26775360107421875, 0.27588844299316406, 0.2840232849121094, 0.2921581268310547, 0.30029296875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 12.0, 2.0, 8.0, 9.0, 14.0, 14.0, 23.0, 23.0, 36.0, 33.0, 42.0, 50.0, 47.0, 57.0, 67.0, 66.0, 65.0, 60.0, 55.0, 62.0, 41.0, 39.0, 30.0, 40.0, 22.0, 19.0, 18.0, 11.0, 10.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142333984375, -0.13721847534179688, -0.13210296630859375, -0.12698745727539062, -0.1218719482421875, -0.11675643920898438, -0.11164093017578125, -0.10652542114257812, -0.101409912109375, -0.09629440307617188, -0.09117889404296875, -0.08606338500976562, -0.0809478759765625, -0.07583236694335938, -0.07071685791015625, -0.06560134887695312, -0.06048583984375, -0.055370330810546875, -0.05025482177734375, -0.045139312744140625, -0.0400238037109375, -0.034908294677734375, -0.02979278564453125, -0.024677276611328125, -0.019561767578125, -0.014446258544921875, -0.00933074951171875, -0.004215240478515625, 0.0009002685546875, 0.006015777587890625, 0.01113128662109375, 0.016246795654296875, 0.0213623046875, 0.026477813720703125, 0.03159332275390625, 0.036708831787109375, 0.0418243408203125, 0.046939849853515625, 0.05205535888671875, 0.057170867919921875, 0.062286376953125, 0.06740188598632812, 0.07251739501953125, 0.07763290405273438, 0.0827484130859375, 0.08786392211914062, 0.09297943115234375, 0.09809494018554688, 0.10321044921875, 0.10832595825195312, 0.11344146728515625, 0.11855697631835938, 0.1236724853515625, 0.12878799438476562, 0.13390350341796875, 0.13901901245117188, 0.144134521484375, 0.14925003051757812, 0.15436553955078125, 0.15948104858398438, 0.1645965576171875, 0.16971206665039062, 0.17482757568359375, 0.17994308471679688, 0.18505859375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 24.0, 31.0, 39.0, 101.0, 192.0, 331.0, 648.0, 1557.0, 5427.0, 65292.0, 890280.0, 75467.0, 5969.0, 1651.0, 734.0, 364.0, 166.0, 117.0, 53.0, 29.0, 20.0, 10.0, 7.0, 3.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.11328125, -1.081939697265625, -1.05059814453125, -1.019256591796875, -0.9879150390625, -0.956573486328125, -0.92523193359375, -0.893890380859375, -0.862548828125, -0.831207275390625, -0.79986572265625, -0.768524169921875, -0.7371826171875, -0.705841064453125, -0.67449951171875, -0.643157958984375, -0.61181640625, -0.580474853515625, -0.54913330078125, -0.517791748046875, -0.4864501953125, -0.455108642578125, -0.42376708984375, -0.392425537109375, -0.361083984375, -0.329742431640625, -0.29840087890625, -0.267059326171875, -0.2357177734375, -0.204376220703125, -0.17303466796875, -0.141693115234375, -0.1103515625, -0.079010009765625, -0.04766845703125, -0.016326904296875, 0.0150146484375, 0.046356201171875, 0.07769775390625, 0.109039306640625, 0.140380859375, 0.171722412109375, 0.20306396484375, 0.234405517578125, 0.2657470703125, 0.297088623046875, 0.32843017578125, 0.359771728515625, 0.39111328125, 0.422454833984375, 0.45379638671875, 0.485137939453125, 0.5164794921875, 0.547821044921875, 0.57916259765625, 0.610504150390625, 0.641845703125, 0.673187255859375, 0.70452880859375, 0.735870361328125, 0.7672119140625, 0.798553466796875, 0.82989501953125, 0.861236572265625, 0.892578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 9.0, 10.0, 14.0, 15.0, 14.0, 17.0, 22.0, 22.0, 29.0, 20.0, 31.0, 30.0, 35.0, 41.0, 24.0, 35.0, 47.0, 34.0, 59.0, 33.0, 58.0, 32.0, 33.0, 39.0, 27.0, 35.0, 27.0, 34.0, 23.0, 20.0, 16.0, 18.0, 15.0, 16.0, 9.0, 7.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5068359375, -0.4908447265625, -0.474853515625, -0.4588623046875, -0.44287109375, -0.4268798828125, -0.410888671875, -0.3948974609375, -0.37890625, -0.3629150390625, -0.346923828125, -0.3309326171875, -0.31494140625, -0.2989501953125, -0.282958984375, -0.2669677734375, -0.2509765625, -0.2349853515625, -0.218994140625, -0.2030029296875, -0.18701171875, -0.1710205078125, -0.155029296875, -0.1390380859375, -0.123046875, -0.1070556640625, -0.091064453125, -0.0750732421875, -0.05908203125, -0.0430908203125, -0.027099609375, -0.0111083984375, 0.0048828125, 0.0208740234375, 0.036865234375, 0.0528564453125, 0.06884765625, 0.0848388671875, 0.100830078125, 0.1168212890625, 0.1328125, 0.1488037109375, 0.164794921875, 0.1807861328125, 0.19677734375, 0.2127685546875, 0.228759765625, 0.2447509765625, 0.2607421875, 0.2767333984375, 0.292724609375, 0.3087158203125, 0.32470703125, 0.3406982421875, 0.356689453125, 0.3726806640625, 0.388671875, 0.4046630859375, 0.420654296875, 0.4366455078125, 0.45263671875, 0.4686279296875, 0.484619140625, 0.5006103515625, 0.5166015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 5.0, 13.0, 11.0, 14.0, 22.0, 32.0, 52.0, 102.0, 186.0, 353.0, 824.0, 2203.0, 7644.0, 49613.0, 748953.0, 214032.0, 17872.0, 4104.0, 1334.0, 547.0, 252.0, 141.0, 79.0, 48.0, 33.0, 27.0, 12.0, 7.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.33251953125, -0.3213462829589844, -0.31017303466796875, -0.2989997863769531, -0.2878265380859375, -0.2766532897949219, -0.26548004150390625, -0.2543067932128906, -0.243133544921875, -0.23196029663085938, -0.22078704833984375, -0.20961380004882812, -0.1984405517578125, -0.18726730346679688, -0.17609405517578125, -0.16492080688476562, -0.15374755859375, -0.14257431030273438, -0.13140106201171875, -0.12022781372070312, -0.1090545654296875, -0.09788131713867188, -0.08670806884765625, -0.07553482055664062, -0.064361572265625, -0.053188323974609375, -0.04201507568359375, -0.030841827392578125, -0.0196685791015625, -0.008495330810546875, 0.00267791748046875, 0.013851165771484375, 0.0250244140625, 0.036197662353515625, 0.04737091064453125, 0.058544158935546875, 0.0697174072265625, 0.08089065551757812, 0.09206390380859375, 0.10323715209960938, 0.114410400390625, 0.12558364868164062, 0.13675689697265625, 0.14793014526367188, 0.1591033935546875, 0.17027664184570312, 0.18144989013671875, 0.19262313842773438, 0.20379638671875, 0.21496963500976562, 0.22614288330078125, 0.23731613159179688, 0.2484893798828125, 0.2596626281738281, 0.27083587646484375, 0.2820091247558594, 0.293182373046875, 0.3043556213378906, 0.31552886962890625, 0.3267021179199219, 0.3378753662109375, 0.3490486145019531, 0.36022186279296875, 0.3713951110839844, 0.382568359375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 10.0, 9.0, 9.0, 9.0, 16.0, 27.0, 28.0, 24.0, 36.0, 35.0, 46.0, 68.0, 92.0, 107.0, 109.0, 77.0, 71.0, 49.0, 44.0, 22.0, 28.0, 18.0, 11.0, 8.0, 11.0, 7.0, 9.0, 9.0, 6.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.971857070922852e-05, -9.685847908258438e-05, -9.399838745594025e-05, -9.113829582929611e-05, -8.827820420265198e-05, -8.541811257600784e-05, -8.255802094936371e-05, -7.969792932271957e-05, -7.683783769607544e-05, -7.39777460694313e-05, -7.111765444278717e-05, -6.825756281614304e-05, -6.53974711894989e-05, -6.253737956285477e-05, -5.967728793621063e-05, -5.68171963095665e-05, -5.395710468292236e-05, -5.109701305627823e-05, -4.8236921429634094e-05, -4.537682980298996e-05, -4.2516738176345825e-05, -3.965664654970169e-05, -3.6796554923057556e-05, -3.393646329641342e-05, -3.107637166976929e-05, -2.8216280043125153e-05, -2.5356188416481018e-05, -2.2496096789836884e-05, -1.963600516319275e-05, -1.6775913536548615e-05, -1.391582190990448e-05, -1.1055730283260345e-05, -8.195638656616211e-06, -5.335547029972076e-06, -2.475455403327942e-06, 3.8463622331619263e-07, 3.244727849960327e-06, 6.104819476604462e-06, 8.964911103248596e-06, 1.182500272989273e-05, 1.4685094356536865e-05, 1.7545185983181e-05, 2.0405277609825134e-05, 2.326536923646927e-05, 2.6125460863113403e-05, 2.8985552489757538e-05, 3.184564411640167e-05, 3.470573574304581e-05, 3.756582736968994e-05, 4.0425918996334076e-05, 4.328601062297821e-05, 4.6146102249622345e-05, 4.900619387626648e-05, 5.1866285502910614e-05, 5.472637712955475e-05, 5.758646875619888e-05, 6.044656038284302e-05, 6.330665200948715e-05, 6.616674363613129e-05, 6.902683526277542e-05, 7.188692688941956e-05, 7.474701851606369e-05, 7.760711014270782e-05, 8.046720176935196e-05, 8.33272933959961e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 11.0, 8.0, 20.0, 25.0, 46.0, 34.0, 55.0, 78.0, 151.0, 231.0, 385.0, 701.0, 1430.0, 3151.0, 8984.0, 40878.0, 445307.0, 488049.0, 42923.0, 9491.0, 3362.0, 1476.0, 684.0, 391.0, 211.0, 135.0, 103.0, 56.0, 31.0, 37.0, 32.0, 16.0, 18.0, 13.0, 5.0, 6.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3057098388671875, -0.296722412109375, -0.2877349853515625, -0.27874755859375, -0.2697601318359375, -0.260772705078125, -0.2517852783203125, -0.2427978515625, -0.2338104248046875, -0.224822998046875, -0.2158355712890625, -0.20684814453125, -0.1978607177734375, -0.188873291015625, -0.1798858642578125, -0.1708984375, -0.1619110107421875, -0.152923583984375, -0.1439361572265625, -0.13494873046875, -0.1259613037109375, -0.116973876953125, -0.1079864501953125, -0.0989990234375, -0.0900115966796875, -0.081024169921875, -0.0720367431640625, -0.06304931640625, -0.0540618896484375, -0.045074462890625, -0.0360870361328125, -0.027099609375, -0.0181121826171875, -0.009124755859375, -0.0001373291015625, 0.00885009765625, 0.0178375244140625, 0.026824951171875, 0.0358123779296875, 0.0447998046875, 0.0537872314453125, 0.062774658203125, 0.0717620849609375, 0.08074951171875, 0.0897369384765625, 0.098724365234375, 0.1077117919921875, 0.11669921875, 0.1256866455078125, 0.134674072265625, 0.1436614990234375, 0.15264892578125, 0.1616363525390625, 0.170623779296875, 0.1796112060546875, 0.1885986328125, 0.1975860595703125, 0.206573486328125, 0.2155609130859375, 0.22454833984375, 0.2335357666015625, 0.242523193359375, 0.2515106201171875, 0.260498046875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 8.0, 4.0, 7.0, 13.0, 10.0, 19.0, 32.0, 34.0, 45.0, 72.0, 92.0, 102.0, 120.0, 98.0, 85.0, 57.0, 63.0, 33.0, 36.0, 24.0, 14.0, 6.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2609977722167969, -0.25270843505859375, -0.24441909790039062, -0.2361297607421875, -0.22784042358398438, -0.21955108642578125, -0.21126174926757812, -0.202972412109375, -0.19468307495117188, -0.18639373779296875, -0.17810440063476562, -0.1698150634765625, -0.16152572631835938, -0.15323638916015625, -0.14494705200195312, -0.13665771484375, -0.12836837768554688, -0.12007904052734375, -0.11178970336914062, -0.1035003662109375, -0.09521102905273438, -0.08692169189453125, -0.07863235473632812, -0.070343017578125, -0.062053680419921875, -0.05376434326171875, -0.045475006103515625, -0.0371856689453125, -0.028896331787109375, -0.02060699462890625, -0.012317657470703125, -0.0040283203125, 0.004261016845703125, 0.01255035400390625, 0.020839691162109375, 0.0291290283203125, 0.037418365478515625, 0.04570770263671875, 0.053997039794921875, 0.062286376953125, 0.07057571411132812, 0.07886505126953125, 0.08715438842773438, 0.0954437255859375, 0.10373306274414062, 0.11202239990234375, 0.12031173706054688, 0.12860107421875, 0.13689041137695312, 0.14517974853515625, 0.15346908569335938, 0.1617584228515625, 0.17004776000976562, 0.17833709716796875, 0.18662643432617188, 0.194915771484375, 0.20320510864257812, 0.21149444580078125, 0.21978378295898438, 0.2280731201171875, 0.23636245727539062, 0.24465179443359375, 0.2529411315917969, 0.26123046875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 15.0, 11.0, 36.0, 58.0, 87.0, 127.0, 141.0, 154.0, 117.0, 88.0, 73.0, 40.0, 14.0, 11.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.223482608795166, -4.087703227996826, -3.9519243240356445, -3.8161449432373047, -3.680365800857544, -3.544586658477783, -3.4088072776794434, -3.2730281352996826, -3.137248992919922, -3.001469850540161, -2.8656907081604004, -2.7299113273620605, -2.5941321849823, -2.458353042602539, -2.322573661804199, -2.1867945194244385, -2.0510153770446777, -1.915236234664917, -1.7794569730758667, -1.6436777114868164, -1.5078985691070557, -1.372119426727295, -1.2363401651382446, -1.1005609035491943, -0.9647817611694336, -0.8290025591850281, -0.6932233572006226, -0.557444155216217, -0.4216649532318115, -0.285885751247406, -0.1501065492630005, -0.01432734727859497, 0.12145233154296875, 0.25723153352737427, 0.3930107355117798, 0.5287899374961853, 0.6645691394805908, 0.8003483414649963, 0.9361275434494019, 1.0719068050384521, 1.207685947418213, 1.3434650897979736, 1.479244351387024, 1.6150236129760742, 1.750802755355835, 1.8865818977355957, 2.0223612785339355, 2.1581404209136963, 2.293919563293457, 2.4296987056732178, 2.5654778480529785, 2.7012572288513184, 2.837036371231079, 2.97281551361084, 3.1085948944091797, 3.2443740367889404, 3.380153179168701, 3.515932321548462, 3.6517114639282227, 3.7874908447265625, 3.9232699871063232, 4.059049129486084, 4.194828510284424, 4.3306074142456055, 4.466386795043945]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 11.0, 10.0, 22.0, 14.0, 19.0, 27.0, 33.0, 33.0, 44.0, 40.0, 53.0, 43.0, 43.0, 40.0, 54.0, 67.0, 47.0, 58.0, 44.0, 47.0, 40.0, 33.0, 33.0, 20.0, 23.0, 23.0, 13.0, 11.0, 8.0, 12.0, 7.0, 7.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.822504997253418, -3.7261927127838135, -3.629880428314209, -3.5335681438446045, -3.437255859375, -3.3409438133239746, -3.24463152885437, -3.1483192443847656, -3.052006959915161, -2.9556946754455566, -2.859382390975952, -2.7630701065063477, -2.6667580604553223, -2.5704457759857178, -2.4741334915161133, -2.377821207046509, -2.2815089225769043, -2.1851966381073, -2.0888843536376953, -1.9925721883773804, -1.8962599039077759, -1.7999476194381714, -1.7036354541778564, -1.607323169708252, -1.5110108852386475, -1.414698600769043, -1.3183863162994385, -1.2220741510391235, -1.125761866569519, -1.0294495820999146, -0.9331373572349548, -0.8368251323699951, -0.7405128479003906, -0.6442005634307861, -0.5478883385658264, -0.4515760838985443, -0.3552638292312622, -0.2589515745639801, -0.162639319896698, -0.06632709503173828, 0.02998518943786621, 0.12629744410514832, 0.22260969877243042, 0.3189219534397125, 0.41523420810699463, 0.5115464925765991, 0.6078587174415588, 0.7041709423065186, 0.800483226776123, 0.8967955112457275, 0.9931077361106873, 1.089419960975647, 1.1857322454452515, 1.282044529914856, 1.378356695175171, 1.4746689796447754, 1.5709812641143799, 1.6672935485839844, 1.7636058330535889, 1.8599179983139038, 1.9562302827835083, 2.0525424480438232, 2.1488547325134277, 2.2451670169830322, 2.3414793014526367]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 10.0, 10.0, 14.0, 19.0, 24.0, 52.0, 61.0, 80.0, 116.0, 131.0, 228.0, 360.0, 566.0, 895.0, 1610.0, 3157.0, 6901.0, 17146.0, 53548.0, 294204.0, 2879376.0, 799074.0, 92588.0, 25364.0, 9488.0, 4064.0, 2082.0, 1083.0, 653.0, 412.0, 257.0, 203.0, 127.0, 88.0, 65.0, 50.0, 44.0, 25.0, 22.0, 13.0, 14.0, 14.0, 10.0, 6.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.25927734375, -0.2505455017089844, -0.24181365966796875, -0.23308181762695312, -0.2243499755859375, -0.21561813354492188, -0.20688629150390625, -0.19815444946289062, -0.189422607421875, -0.18069076538085938, -0.17195892333984375, -0.16322708129882812, -0.1544952392578125, -0.14576339721679688, -0.13703155517578125, -0.12829971313476562, -0.11956787109375, -0.11083602905273438, -0.10210418701171875, -0.09337234497070312, -0.0846405029296875, -0.07590866088867188, -0.06717681884765625, -0.058444976806640625, -0.049713134765625, -0.040981292724609375, -0.03224945068359375, -0.023517608642578125, -0.0147857666015625, -0.006053924560546875, 0.00267791748046875, 0.011409759521484375, 0.0201416015625, 0.028873443603515625, 0.03760528564453125, 0.046337127685546875, 0.0550689697265625, 0.06380081176757812, 0.07253265380859375, 0.08126449584960938, 0.089996337890625, 0.09872817993164062, 0.10746002197265625, 0.11619186401367188, 0.1249237060546875, 0.13365554809570312, 0.14238739013671875, 0.15111923217773438, 0.15985107421875, 0.16858291625976562, 0.17731475830078125, 0.18604660034179688, 0.1947784423828125, 0.20351028442382812, 0.21224212646484375, 0.22097396850585938, 0.229705810546875, 0.23843765258789062, 0.24716949462890625, 0.2559013366699219, 0.2646331787109375, 0.2733650207519531, 0.28209686279296875, 0.2908287048339844, 0.299560546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 5.0, 9.0, 11.0, 15.0, 15.0, 14.0, 12.0, 19.0, 19.0, 32.0, 32.0, 43.0, 38.0, 45.0, 46.0, 56.0, 63.0, 52.0, 56.0, 58.0, 53.0, 43.0, 44.0, 37.0, 31.0, 24.0, 22.0, 14.0, 16.0, 14.0, 15.0, 13.0, 6.0, 5.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.15087890625, -0.14672088623046875, -0.1425628662109375, -0.13840484619140625, -0.134246826171875, -0.13008880615234375, -0.1259307861328125, -0.12177276611328125, -0.11761474609375, -0.11345672607421875, -0.1092987060546875, -0.10514068603515625, -0.100982666015625, -0.09682464599609375, -0.0926666259765625, -0.08850860595703125, -0.0843505859375, -0.08019256591796875, -0.0760345458984375, -0.07187652587890625, -0.067718505859375, -0.06356048583984375, -0.0594024658203125, -0.05524444580078125, -0.05108642578125, -0.04692840576171875, -0.0427703857421875, -0.03861236572265625, -0.034454345703125, -0.03029632568359375, -0.0261383056640625, -0.02198028564453125, -0.017822265625, -0.01366424560546875, -0.0095062255859375, -0.00534820556640625, -0.001190185546875, 0.00296783447265625, 0.0071258544921875, 0.01128387451171875, 0.01544189453125, 0.01959991455078125, 0.0237579345703125, 0.02791595458984375, 0.032073974609375, 0.03623199462890625, 0.0403900146484375, 0.04454803466796875, 0.0487060546875, 0.05286407470703125, 0.0570220947265625, 0.06118011474609375, 0.065338134765625, 0.06949615478515625, 0.0736541748046875, 0.07781219482421875, 0.08197021484375, 0.08612823486328125, 0.0902862548828125, 0.09444427490234375, 0.098602294921875, 0.10276031494140625, 0.1069183349609375, 0.11107635498046875, 0.115234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 7.0, 4.0, 10.0, 22.0, 31.0, 48.0, 69.0, 141.0, 238.0, 510.0, 1274.0, 3781.0, 12934.0, 58179.0, 685604.0, 3247769.0, 148657.0, 24958.0, 6610.0, 1985.0, 751.0, 310.0, 143.0, 105.0, 52.0, 30.0, 21.0, 10.0, 11.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43701171875, -0.42206573486328125, -0.4071197509765625, -0.39217376708984375, -0.377227783203125, -0.36228179931640625, -0.3473358154296875, -0.33238983154296875, -0.31744384765625, -0.30249786376953125, -0.2875518798828125, -0.27260589599609375, -0.257659912109375, -0.24271392822265625, -0.2277679443359375, -0.21282196044921875, -0.1978759765625, -0.18292999267578125, -0.1679840087890625, -0.15303802490234375, -0.138092041015625, -0.12314605712890625, -0.1082000732421875, -0.09325408935546875, -0.07830810546875, -0.06336212158203125, -0.0484161376953125, -0.03347015380859375, -0.018524169921875, -0.00357818603515625, 0.0113677978515625, 0.02631378173828125, 0.041259765625, 0.05620574951171875, 0.0711517333984375, 0.08609771728515625, 0.101043701171875, 0.11598968505859375, 0.1309356689453125, 0.14588165283203125, 0.16082763671875, 0.17577362060546875, 0.1907196044921875, 0.20566558837890625, 0.220611572265625, 0.23555755615234375, 0.2505035400390625, 0.26544952392578125, 0.2803955078125, 0.29534149169921875, 0.3102874755859375, 0.32523345947265625, 0.340179443359375, 0.35512542724609375, 0.3700714111328125, 0.38501739501953125, 0.39996337890625, 0.41490936279296875, 0.4298553466796875, 0.44480133056640625, 0.459747314453125, 0.47469329833984375, 0.4896392822265625, 0.5045852661132812, 0.51953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 2.0, 5.0, 3.0, 6.0, 8.0, 19.0, 15.0, 33.0, 36.0, 81.0, 103.0, 222.0, 377.0, 851.0, 1104.0, 573.0, 255.0, 139.0, 70.0, 45.0, 44.0, 20.0, 17.0, 12.0, 11.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.71728515625, -0.7010765075683594, -0.6848678588867188, -0.6686592102050781, -0.6524505615234375, -0.6362419128417969, -0.6200332641601562, -0.6038246154785156, -0.587615966796875, -0.5714073181152344, -0.5551986694335938, -0.5389900207519531, -0.5227813720703125, -0.5065727233886719, -0.49036407470703125, -0.4741554260253906, -0.45794677734375, -0.4417381286621094, -0.42552947998046875, -0.4093208312988281, -0.3931121826171875, -0.3769035339355469, -0.36069488525390625, -0.3444862365722656, -0.328277587890625, -0.3120689392089844, -0.29586029052734375, -0.2796516418457031, -0.2634429931640625, -0.24723434448242188, -0.23102569580078125, -0.21481704711914062, -0.1986083984375, -0.18239974975585938, -0.16619110107421875, -0.14998245239257812, -0.1337738037109375, -0.11756515502929688, -0.10135650634765625, -0.08514785766601562, -0.068939208984375, -0.052730560302734375, -0.03652191162109375, -0.020313262939453125, -0.0041046142578125, 0.012104034423828125, 0.02831268310546875, 0.044521331787109375, 0.06072998046875, 0.07693862915039062, 0.09314727783203125, 0.10935592651367188, 0.1255645751953125, 0.14177322387695312, 0.15798187255859375, 0.17419052124023438, 0.190399169921875, 0.20660781860351562, 0.22281646728515625, 0.23902511596679688, 0.2552337646484375, 0.2714424133300781, 0.28765106201171875, 0.3038597106933594, 0.320068359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 6.0, 18.0, 36.0, 97.0, 194.0, 294.0, 223.0, 79.0, 27.0, 9.0, 12.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.782614707946777, -10.57011890411377, -10.357623100280762, -10.145127296447754, -9.932631492614746, -9.720135688781738, -9.50763988494873, -9.295145034790039, -9.082649230957031, -8.870153427124023, -8.657657623291016, -8.445161819458008, -8.232666015625, -8.020170211791992, -7.807674884796143, -7.595179080963135, -7.382682800292969, -7.170186996459961, -6.957691192626953, -6.745195388793945, -6.5326995849609375, -6.32020378112793, -6.10770845413208, -5.895212650299072, -5.6827168464660645, -5.470221042633057, -5.257725238800049, -5.045229434967041, -4.832734107971191, -4.620238304138184, -4.407742500305176, -4.195246696472168, -3.982750654220581, -3.7702548503875732, -3.5577592849731445, -3.3452634811401367, -3.132767677307129, -2.920271873474121, -2.7077760696411133, -2.4952805042266846, -2.2827847003936768, -2.070288896560669, -1.8577932119369507, -1.6452975273132324, -1.4328017234802246, -1.2203059196472168, -1.0078102350234985, -0.7953145503997803, -0.5828187465667725, -0.3703230023384094, -0.1578272581100464, 0.05466848611831665, 0.2671642303466797, 0.4796600341796875, 0.6921557188034058, 0.904651403427124, 1.1171472072601318, 1.3296430110931396, 1.542138695716858, 1.7546343803405762, 1.967130184173584, 2.179625988006592, 2.3921217918395996, 2.6046173572540283, 2.817113161087036]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 10.0, 10.0, 18.0, 14.0, 14.0, 19.0, 28.0, 36.0, 46.0, 32.0, 53.0, 53.0, 49.0, 49.0, 65.0, 53.0, 72.0, 57.0, 44.0, 41.0, 31.0, 40.0, 33.0, 22.0, 21.0, 18.0, 13.0, 15.0, 7.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.040464401245117, -1.9735764265060425, -1.9066885709762573, -1.8398005962371826, -1.7729127407073975, -1.7060247659683228, -1.639136791229248, -1.572248935699463, -1.5053609609603882, -1.4384729862213135, -1.3715851306915283, -1.3046971559524536, -1.237809181213379, -1.1709213256835938, -1.104033350944519, -1.0371453762054443, -0.9702575206756592, -0.9033696055412292, -0.8364816904067993, -0.7695937156677246, -0.7027058005332947, -0.6358178853988647, -0.56892991065979, -0.5020419955253601, -0.4351540803909302, -0.36826616525650024, -0.3013782203197479, -0.2344902902841568, -0.16760236024856567, -0.10071444511413574, -0.03382650017738342, 0.033061444759368896, 0.09994959831237793, 0.16683752834796906, 0.23372545838356018, 0.3006134033203125, 0.36750131845474243, 0.43438923358917236, 0.5012772083282471, 0.568165123462677, 0.6350530385971069, 0.7019409537315369, 0.7688288688659668, 0.8357168436050415, 0.9026047587394714, 0.9694926738739014, 1.036380648612976, 1.1032686233520508, 1.170156478881836, 1.2370444536209106, 1.3039323091506958, 1.3708202838897705, 1.4377081394195557, 1.5045961141586304, 1.571484088897705, 1.6383719444274902, 1.705259919166565, 1.7721478939056396, 1.8390357494354248, 1.9059237241744995, 1.9728116989135742, 2.0396995544433594, 2.1065874099731445, 2.173475503921509, 2.240363359451294]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 7.0, 27.0, 33.0, 48.0, 85.0, 145.0, 198.0, 351.0, 572.0, 947.0, 1613.0, 2887.0, 5011.0, 9437.0, 18309.0, 38485.0, 91433.0, 317086.0, 371813.0, 103210.0, 43108.0, 20466.0, 10278.0, 5571.0, 3112.0, 1689.0, 1003.0, 599.0, 350.0, 247.0, 161.0, 91.0, 47.0, 39.0, 27.0, 10.0, 12.0, 9.0, 10.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25390625, -0.24452590942382812, -0.23514556884765625, -0.22576522827148438, -0.2163848876953125, -0.20700454711914062, -0.19762420654296875, -0.18824386596679688, -0.178863525390625, -0.16948318481445312, -0.16010284423828125, -0.15072250366210938, -0.1413421630859375, -0.13196182250976562, -0.12258148193359375, -0.11320114135742188, -0.10382080078125, -0.09444046020507812, -0.08506011962890625, -0.07567977905273438, -0.0662994384765625, -0.056919097900390625, -0.04753875732421875, -0.038158416748046875, -0.028778076171875, -0.019397735595703125, -0.01001739501953125, -0.000637054443359375, 0.0087432861328125, 0.018123626708984375, 0.02750396728515625, 0.036884307861328125, 0.0462646484375, 0.055644989013671875, 0.06502532958984375, 0.07440567016601562, 0.0837860107421875, 0.09316635131835938, 0.10254669189453125, 0.11192703247070312, 0.121307373046875, 0.13068771362304688, 0.14006805419921875, 0.14944839477539062, 0.1588287353515625, 0.16820907592773438, 0.17758941650390625, 0.18696975708007812, 0.19635009765625, 0.20573043823242188, 0.21511077880859375, 0.22449111938476562, 0.2338714599609375, 0.24325180053710938, 0.25263214111328125, 0.2620124816894531, 0.271392822265625, 0.2807731628417969, 0.29015350341796875, 0.2995338439941406, 0.3089141845703125, 0.3182945251464844, 0.32767486572265625, 0.3370552062988281, 0.346435546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 7.0, 7.0, 9.0, 11.0, 17.0, 10.0, 34.0, 25.0, 40.0, 33.0, 51.0, 65.0, 52.0, 52.0, 68.0, 75.0, 59.0, 59.0, 46.0, 53.0, 50.0, 39.0, 25.0, 24.0, 22.0, 16.0, 5.0, 16.0, 10.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.21044921875, -0.20530033111572266, -0.2001514434814453, -0.19500255584716797, -0.18985366821289062, -0.18470478057861328, -0.17955589294433594, -0.1744070053100586, -0.16925811767578125, -0.1641092300415039, -0.15896034240722656, -0.15381145477294922, -0.14866256713867188, -0.14351367950439453, -0.1383647918701172, -0.13321590423583984, -0.1280670166015625, -0.12291812896728516, -0.11776924133300781, -0.11262035369873047, -0.10747146606445312, -0.10232257843017578, -0.09717369079589844, -0.0920248031616211, -0.08687591552734375, -0.0817270278930664, -0.07657814025878906, -0.07142925262451172, -0.06628036499023438, -0.06113147735595703, -0.05598258972167969, -0.050833702087402344, -0.045684814453125, -0.040535926818847656, -0.03538703918457031, -0.03023815155029297, -0.025089263916015625, -0.01994037628173828, -0.014791488647460938, -0.009642601013183594, -0.00449371337890625, 0.0006551742553710938, 0.0058040618896484375, 0.010952949523925781, 0.016101837158203125, 0.02125072479248047, 0.026399612426757812, 0.031548500061035156, 0.0366973876953125, 0.041846275329589844, 0.04699516296386719, 0.05214405059814453, 0.057292938232421875, 0.06244182586669922, 0.06759071350097656, 0.0727396011352539, 0.07788848876953125, 0.0830373764038086, 0.08818626403808594, 0.09333515167236328, 0.09848403930664062, 0.10363292694091797, 0.10878181457519531, 0.11393070220947266, 0.11907958984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 9.0, 11.0, 16.0, 27.0, 55.0, 69.0, 137.0, 186.0, 308.0, 535.0, 1029.0, 2325.0, 7467.0, 45949.0, 820393.0, 147969.0, 15040.0, 3760.0, 1442.0, 723.0, 399.0, 249.0, 153.0, 88.0, 59.0, 37.0, 17.0, 26.0, 15.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.5969085693359375, -0.571746826171875, -0.5465850830078125, -0.52142333984375, -0.4962615966796875, -0.471099853515625, -0.4459381103515625, -0.4207763671875, -0.3956146240234375, -0.370452880859375, -0.3452911376953125, -0.32012939453125, -0.2949676513671875, -0.269805908203125, -0.2446441650390625, -0.219482421875, -0.1943206787109375, -0.169158935546875, -0.1439971923828125, -0.11883544921875, -0.0936737060546875, -0.068511962890625, -0.0433502197265625, -0.0181884765625, 0.0069732666015625, 0.032135009765625, 0.0572967529296875, 0.08245849609375, 0.1076202392578125, 0.132781982421875, 0.1579437255859375, 0.18310546875, 0.2082672119140625, 0.233428955078125, 0.2585906982421875, 0.28375244140625, 0.3089141845703125, 0.334075927734375, 0.3592376708984375, 0.3843994140625, 0.4095611572265625, 0.434722900390625, 0.4598846435546875, 0.48504638671875, 0.5102081298828125, 0.535369873046875, 0.5605316162109375, 0.585693359375, 0.6108551025390625, 0.636016845703125, 0.6611785888671875, 0.68634033203125, 0.7115020751953125, 0.736663818359375, 0.7618255615234375, 0.7869873046875, 0.8121490478515625, 0.837310791015625, 0.8624725341796875, 0.88763427734375, 0.9127960205078125, 0.937957763671875, 0.9631195068359375, 0.98828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 8.0, 10.0, 27.0, 14.0, 31.0, 28.0, 35.0, 41.0, 46.0, 50.0, 58.0, 59.0, 56.0, 65.0, 60.0, 55.0, 60.0, 51.0, 29.0, 35.0, 23.0, 24.0, 23.0, 22.0, 17.0, 6.0, 4.0, 10.0, 4.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.6257400512695312, -0.6035308837890625, -0.5813217163085938, -0.559112548828125, -0.5369033813476562, -0.5146942138671875, -0.49248504638671875, -0.47027587890625, -0.44806671142578125, -0.4258575439453125, -0.40364837646484375, -0.381439208984375, -0.35923004150390625, -0.3370208740234375, -0.31481170654296875, -0.2926025390625, -0.27039337158203125, -0.2481842041015625, -0.22597503662109375, -0.203765869140625, -0.18155670166015625, -0.1593475341796875, -0.13713836669921875, -0.11492919921875, -0.09272003173828125, -0.0705108642578125, -0.04830169677734375, -0.026092529296875, -0.00388336181640625, 0.0183258056640625, 0.04053497314453125, 0.062744140625, 0.08495330810546875, 0.1071624755859375, 0.12937164306640625, 0.151580810546875, 0.17378997802734375, 0.1959991455078125, 0.21820831298828125, 0.24041748046875, 0.26262664794921875, 0.2848358154296875, 0.30704498291015625, 0.329254150390625, 0.35146331787109375, 0.3736724853515625, 0.39588165283203125, 0.4180908203125, 0.44029998779296875, 0.4625091552734375, 0.48471832275390625, 0.506927490234375, 0.5291366577148438, 0.5513458251953125, 0.5735549926757812, 0.59576416015625, 0.6179733276367188, 0.6401824951171875, 0.6623916625976562, 0.684600830078125, 0.7068099975585938, 0.7290191650390625, 0.7512283325195312, 0.7734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 4.0, 9.0, 10.0, 19.0, 26.0, 35.0, 47.0, 56.0, 100.0, 164.0, 312.0, 615.0, 1230.0, 3023.0, 9315.0, 38837.0, 368735.0, 563588.0, 45587.0, 10459.0, 3452.0, 1422.0, 634.0, 308.0, 189.0, 106.0, 75.0, 49.0, 31.0, 24.0, 16.0, 12.0, 7.0, 9.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.263671875, -0.25518035888671875, -0.2466888427734375, -0.23819732666015625, -0.229705810546875, -0.22121429443359375, -0.2127227783203125, -0.20423126220703125, -0.19573974609375, -0.18724822998046875, -0.1787567138671875, -0.17026519775390625, -0.161773681640625, -0.15328216552734375, -0.1447906494140625, -0.13629913330078125, -0.1278076171875, -0.11931610107421875, -0.1108245849609375, -0.10233306884765625, -0.093841552734375, -0.08535003662109375, -0.0768585205078125, -0.06836700439453125, -0.05987548828125, -0.05138397216796875, -0.0428924560546875, -0.03440093994140625, -0.025909423828125, -0.01741790771484375, -0.0089263916015625, -0.00043487548828125, 0.008056640625, 0.01654815673828125, 0.0250396728515625, 0.03353118896484375, 0.042022705078125, 0.05051422119140625, 0.0590057373046875, 0.06749725341796875, 0.07598876953125, 0.08448028564453125, 0.0929718017578125, 0.10146331787109375, 0.109954833984375, 0.11844635009765625, 0.1269378662109375, 0.13542938232421875, 0.1439208984375, 0.15241241455078125, 0.1609039306640625, 0.16939544677734375, 0.177886962890625, 0.18637847900390625, 0.1948699951171875, 0.20336151123046875, 0.21185302734375, 0.22034454345703125, 0.2288360595703125, 0.23732757568359375, 0.245819091796875, 0.25431060791015625, 0.2628021240234375, 0.27129364013671875, 0.27978515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 1.0, 5.0, 10.0, 4.0, 7.0, 15.0, 7.0, 18.0, 15.0, 17.0, 18.0, 24.0, 37.0, 78.0, 90.0, 131.0, 112.0, 105.0, 70.0, 44.0, 44.0, 21.0, 26.0, 13.0, 13.0, 18.0, 14.0, 5.0, 7.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.480382919311523e-05, -7.224828004837036e-05, -6.969273090362549e-05, -6.713718175888062e-05, -6.458163261413574e-05, -6.202608346939087e-05, -5.9470534324645996e-05, -5.691498517990112e-05, -5.435943603515625e-05, -5.180388689041138e-05, -4.9248337745666504e-05, -4.669278860092163e-05, -4.413723945617676e-05, -4.1581690311431885e-05, -3.902614116668701e-05, -3.647059202194214e-05, -3.3915042877197266e-05, -3.135949373245239e-05, -2.880394458770752e-05, -2.6248395442962646e-05, -2.3692846298217773e-05, -2.11372971534729e-05, -1.8581748008728027e-05, -1.6026198863983154e-05, -1.3470649719238281e-05, -1.0915100574493408e-05, -8.359551429748535e-06, -5.804002285003662e-06, -3.248453140258789e-06, -6.92903995513916e-07, 1.862645149230957e-06, 4.41819429397583e-06, 6.973743438720703e-06, 9.529292583465576e-06, 1.208484172821045e-05, 1.4640390872955322e-05, 1.7195940017700195e-05, 1.975148916244507e-05, 2.230703830718994e-05, 2.4862587451934814e-05, 2.7418136596679688e-05, 2.997368574142456e-05, 3.2529234886169434e-05, 3.508478403091431e-05, 3.764033317565918e-05, 4.019588232040405e-05, 4.2751431465148926e-05, 4.53069806098938e-05, 4.786252975463867e-05, 5.0418078899383545e-05, 5.297362804412842e-05, 5.552917718887329e-05, 5.8084726333618164e-05, 6.064027547836304e-05, 6.319582462310791e-05, 6.575137376785278e-05, 6.830692291259766e-05, 7.086247205734253e-05, 7.34180212020874e-05, 7.597357034683228e-05, 7.852911949157715e-05, 8.108466863632202e-05, 8.36402177810669e-05, 8.619576692581177e-05, 8.875131607055664e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 9.0, 23.0, 27.0, 32.0, 50.0, 68.0, 98.0, 132.0, 177.0, 309.0, 484.0, 815.0, 1445.0, 2989.0, 7436.0, 24553.0, 149148.0, 729893.0, 99096.0, 19613.0, 6252.0, 2514.0, 1327.0, 736.0, 418.0, 290.0, 182.0, 111.0, 92.0, 59.0, 48.0, 29.0, 24.0, 16.0, 12.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.28173828125, -0.2740001678466797, -0.2662620544433594, -0.25852394104003906, -0.25078582763671875, -0.24304771423339844, -0.23530960083007812, -0.2275714874267578, -0.2198333740234375, -0.2120952606201172, -0.20435714721679688, -0.19661903381347656, -0.18888092041015625, -0.18114280700683594, -0.17340469360351562, -0.1656665802001953, -0.157928466796875, -0.1501903533935547, -0.14245223999023438, -0.13471412658691406, -0.12697601318359375, -0.11923789978027344, -0.11149978637695312, -0.10376167297363281, -0.0960235595703125, -0.08828544616699219, -0.08054733276367188, -0.07280921936035156, -0.06507110595703125, -0.05733299255371094, -0.049594879150390625, -0.04185676574707031, -0.03411865234375, -0.026380538940429688, -0.018642425537109375, -0.010904312133789062, -0.00316619873046875, 0.0045719146728515625, 0.012310028076171875, 0.020048141479492188, 0.0277862548828125, 0.03552436828613281, 0.043262481689453125, 0.05100059509277344, 0.05873870849609375, 0.06647682189941406, 0.07421493530273438, 0.08195304870605469, 0.089691162109375, 0.09742927551269531, 0.10516738891601562, 0.11290550231933594, 0.12064361572265625, 0.12838172912597656, 0.13611984252929688, 0.1438579559326172, 0.1515960693359375, 0.1593341827392578, 0.16707229614257812, 0.17481040954589844, 0.18254852294921875, 0.19028663635253906, 0.19802474975585938, 0.2057628631591797, 0.2135009765625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 11.0, 12.0, 20.0, 31.0, 54.0, 46.0, 63.0, 104.0, 146.0, 129.0, 82.0, 79.0, 47.0, 39.0, 26.0, 20.0, 18.0, 13.0, 12.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.260986328125, -0.2522735595703125, -0.243560791015625, -0.2348480224609375, -0.22613525390625, -0.2174224853515625, -0.208709716796875, -0.1999969482421875, -0.1912841796875, -0.1825714111328125, -0.173858642578125, -0.1651458740234375, -0.15643310546875, -0.1477203369140625, -0.139007568359375, -0.1302947998046875, -0.12158203125, -0.1128692626953125, -0.104156494140625, -0.0954437255859375, -0.08673095703125, -0.0780181884765625, -0.069305419921875, -0.0605926513671875, -0.0518798828125, -0.0431671142578125, -0.034454345703125, -0.0257415771484375, -0.01702880859375, -0.0083160400390625, 0.000396728515625, 0.0091094970703125, 0.017822265625, 0.0265350341796875, 0.035247802734375, 0.0439605712890625, 0.05267333984375, 0.0613861083984375, 0.070098876953125, 0.0788116455078125, 0.0875244140625, 0.0962371826171875, 0.104949951171875, 0.1136627197265625, 0.12237548828125, 0.1310882568359375, 0.139801025390625, 0.1485137939453125, 0.1572265625, 0.1659393310546875, 0.174652099609375, 0.1833648681640625, 0.19207763671875, 0.2007904052734375, 0.209503173828125, 0.2182159423828125, 0.2269287109375, 0.2356414794921875, 0.244354248046875, 0.2530670166015625, 0.26177978515625, 0.2704925537109375, 0.279205322265625, 0.2879180908203125, 0.296630859375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 8.0, 28.0, 68.0, 190.0, 276.0, 237.0, 84.0, 50.0, 23.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.147737503051758, -8.923267364501953, -8.698796272277832, -8.474326133728027, -8.249855041503906, -8.025384902954102, -7.8009138107299805, -7.576443672180176, -7.351973056793213, -7.12750244140625, -6.903031826019287, -6.678561210632324, -6.454090595245361, -6.229619979858398, -6.005149841308594, -5.780679225921631, -5.556208610534668, -5.331737995147705, -5.107267379760742, -4.882796764373779, -4.658326148986816, -4.433856010437012, -4.209384918212891, -3.984914779663086, -3.760443687438965, -3.535973072052002, -3.311502456665039, -3.087031841278076, -2.8625614643096924, -2.6380908489227295, -2.4136202335357666, -2.189149856567383, -1.96467924118042, -1.740208625793457, -1.5157381296157837, -1.2912675142288208, -1.0667970180511475, -0.8423264026641846, -0.6178557872772217, -0.39338529109954834, -0.16891467571258545, 0.05555589497089386, 0.28002646565437317, 0.5044970512390137, 0.7289676070213318, 0.9534381628036499, 1.1779087781906128, 1.4023792743682861, 1.626849889755249, 1.851320505142212, 2.075791120529175, 2.3002614974975586, 2.5247321128845215, 2.7492027282714844, 2.9736733436584473, 3.19814395904541, 3.422614574432373, 3.647085189819336, 3.871555805206299, 4.096026420593262, 4.320497035980225, 4.5449676513671875, 4.769437789916992, 4.993908405303955, 5.218379020690918]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 15.0, 10.0, 15.0, 12.0, 14.0, 17.0, 18.0, 30.0, 29.0, 33.0, 28.0, 37.0, 34.0, 37.0, 38.0, 44.0, 44.0, 54.0, 48.0, 57.0, 41.0, 44.0, 29.0, 35.0, 28.0, 35.0, 20.0, 25.0, 19.0, 20.0, 13.0, 12.0, 7.0, 13.0, 8.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.122389316558838, -2.054943799972534, -1.9874985218048096, -1.9200531244277954, -1.8526077270507812, -1.7851622104644775, -1.7177168130874634, -1.6502714157104492, -1.582826018333435, -1.515380620956421, -1.4479352235794067, -1.3804898262023926, -1.3130443096160889, -1.2455990314483643, -1.1781535148620605, -1.1107081174850464, -1.0432627201080322, -0.9758173227310181, -0.9083719253540039, -0.840926468372345, -0.7734810709953308, -0.7060356736183167, -0.6385902166366577, -0.5711448192596436, -0.5036994218826294, -0.43625402450561523, -0.3688085973262787, -0.30136317014694214, -0.23391777276992798, -0.16647237539291382, -0.09902694821357727, -0.03158152103424072, 0.03586411476135254, 0.1033095270395279, 0.17075493931770325, 0.2382003515958786, 0.30564576387405396, 0.3730911612510681, 0.44053658843040466, 0.5079820156097412, 0.5754274129867554, 0.6428728103637695, 0.7103182077407837, 0.7777636647224426, 0.8452090620994568, 0.912654459476471, 0.9800999164581299, 1.047545313835144, 1.1149907112121582, 1.1824361085891724, 1.2498815059661865, 1.3173269033432007, 1.3847723007202148, 1.4522178173065186, 1.5196632146835327, 1.5871086120605469, 1.654554009437561, 1.7219994068145752, 1.7894448041915894, 1.8568902015686035, 1.9243357181549072, 1.9917809963226318, 2.0592265129089355, 2.12667179107666, 2.194117307662964]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 10.0, 12.0, 28.0, 25.0, 35.0, 62.0, 76.0, 95.0, 177.0, 519.0, 2892.0, 69151.0, 4079888.0, 38139.0, 2159.0, 445.0, 155.0, 125.0, 78.0, 55.0, 33.0, 30.0, 19.0, 20.0, 9.0, 5.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.103515625, -1.0705108642578125, -1.037506103515625, -1.0045013427734375, -0.97149658203125, -0.9384918212890625, -0.905487060546875, -0.8724822998046875, -0.8394775390625, -0.8064727783203125, -0.773468017578125, -0.7404632568359375, -0.70745849609375, -0.6744537353515625, -0.641448974609375, -0.6084442138671875, -0.575439453125, -0.5424346923828125, -0.509429931640625, -0.4764251708984375, -0.44342041015625, -0.4104156494140625, -0.377410888671875, -0.3444061279296875, -0.3114013671875, -0.2783966064453125, -0.245391845703125, -0.2123870849609375, -0.17938232421875, -0.1463775634765625, -0.113372802734375, -0.0803680419921875, -0.04736328125, -0.0143585205078125, 0.018646240234375, 0.0516510009765625, 0.08465576171875, 0.1176605224609375, 0.150665283203125, 0.1836700439453125, 0.2166748046875, 0.2496795654296875, 0.282684326171875, 0.3156890869140625, 0.34869384765625, 0.3816986083984375, 0.414703369140625, 0.4477081298828125, 0.480712890625, 0.5137176513671875, 0.546722412109375, 0.5797271728515625, 0.61273193359375, 0.6457366943359375, 0.678741455078125, 0.7117462158203125, 0.7447509765625, 0.7777557373046875, 0.810760498046875, 0.8437652587890625, 0.87677001953125, 0.9097747802734375, 0.942779541015625, 0.9757843017578125, 1.0087890625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 9.0, 7.0, 8.0, 13.0, 9.0, 17.0, 19.0, 20.0, 27.0, 31.0, 34.0, 33.0, 32.0, 36.0, 54.0, 62.0, 55.0, 55.0, 56.0, 43.0, 52.0, 52.0, 36.0, 42.0, 32.0, 23.0, 29.0, 24.0, 16.0, 15.0, 18.0, 11.0, 5.0, 2.0, 8.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1422119140625, -0.1380901336669922, -0.13396835327148438, -0.12984657287597656, -0.12572479248046875, -0.12160301208496094, -0.11748123168945312, -0.11335945129394531, -0.1092376708984375, -0.10511589050292969, -0.10099411010742188, -0.09687232971191406, -0.09275054931640625, -0.08862876892089844, -0.08450698852539062, -0.08038520812988281, -0.076263427734375, -0.07214164733886719, -0.06801986694335938, -0.06389808654785156, -0.05977630615234375, -0.05565452575683594, -0.051532745361328125, -0.04741096496582031, -0.0432891845703125, -0.03916740417480469, -0.035045623779296875, -0.030923843383789062, -0.02680206298828125, -0.022680282592773438, -0.018558502197265625, -0.014436721801757812, -0.01031494140625, -0.0061931610107421875, -0.002071380615234375, 0.0020503997802734375, 0.00617218017578125, 0.010293960571289062, 0.014415740966796875, 0.018537521362304688, 0.0226593017578125, 0.026781082153320312, 0.030902862548828125, 0.03502464294433594, 0.03914642333984375, 0.04326820373535156, 0.047389984130859375, 0.05151176452636719, 0.055633544921875, 0.05975532531738281, 0.06387710571289062, 0.06799888610839844, 0.07212066650390625, 0.07624244689941406, 0.08036422729492188, 0.08448600769042969, 0.0886077880859375, 0.09272956848144531, 0.09685134887695312, 0.10097312927246094, 0.10509490966796875, 0.10921669006347656, 0.11333847045898438, 0.11746025085449219, 0.12158203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 9.0, 6.0, 18.0, 43.0, 70.0, 129.0, 318.0, 771.0, 1974.0, 6410.0, 25765.0, 151893.0, 3104354.0, 818125.0, 64437.0, 13795.0, 3902.0, 1296.0, 506.0, 222.0, 95.0, 49.0, 35.0, 24.0, 12.0, 6.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5447616577148438, -0.5299530029296875, -0.5151443481445312, -0.500335693359375, -0.48552703857421875, -0.4707183837890625, -0.45590972900390625, -0.44110107421875, -0.42629241943359375, -0.4114837646484375, -0.39667510986328125, -0.381866455078125, -0.36705780029296875, -0.3522491455078125, -0.33744049072265625, -0.3226318359375, -0.30782318115234375, -0.2930145263671875, -0.27820587158203125, -0.263397216796875, -0.24858856201171875, -0.2337799072265625, -0.21897125244140625, -0.20416259765625, -0.18935394287109375, -0.1745452880859375, -0.15973663330078125, -0.144927978515625, -0.13011932373046875, -0.1153106689453125, -0.10050201416015625, -0.085693359375, -0.07088470458984375, -0.0560760498046875, -0.04126739501953125, -0.026458740234375, -0.01165008544921875, 0.0031585693359375, 0.01796722412109375, 0.03277587890625, 0.04758453369140625, 0.0623931884765625, 0.07720184326171875, 0.092010498046875, 0.10681915283203125, 0.1216278076171875, 0.13643646240234375, 0.1512451171875, 0.16605377197265625, 0.1808624267578125, 0.19567108154296875, 0.210479736328125, 0.22528839111328125, 0.2400970458984375, 0.25490570068359375, 0.26971435546875, 0.28452301025390625, 0.2993316650390625, 0.31414031982421875, 0.328948974609375, 0.34375762939453125, 0.3585662841796875, 0.37337493896484375, 0.38818359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 10.0, 8.0, 6.0, 19.0, 18.0, 20.0, 22.0, 30.0, 39.0, 69.0, 89.0, 135.0, 220.0, 394.0, 676.0, 833.0, 536.0, 337.0, 177.0, 129.0, 72.0, 58.0, 38.0, 32.0, 20.0, 24.0, 19.0, 10.0, 6.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357666015625, -0.3459205627441406, -0.33417510986328125, -0.3224296569824219, -0.3106842041015625, -0.2989387512207031, -0.28719329833984375, -0.2754478454589844, -0.263702392578125, -0.2519569396972656, -0.24021148681640625, -0.22846603393554688, -0.2167205810546875, -0.20497512817382812, -0.19322967529296875, -0.18148422241210938, -0.16973876953125, -0.15799331665039062, -0.14624786376953125, -0.13450241088867188, -0.1227569580078125, -0.11101150512695312, -0.09926605224609375, -0.08752059936523438, -0.075775146484375, -0.06402969360351562, -0.05228424072265625, -0.040538787841796875, -0.0287933349609375, -0.017047882080078125, -0.00530242919921875, 0.006443023681640625, 0.0181884765625, 0.029933929443359375, 0.04167938232421875, 0.053424835205078125, 0.0651702880859375, 0.07691574096679688, 0.08866119384765625, 0.10040664672851562, 0.112152099609375, 0.12389755249023438, 0.13564300537109375, 0.14738845825195312, 0.1591339111328125, 0.17087936401367188, 0.18262481689453125, 0.19437026977539062, 0.20611572265625, 0.21786117553710938, 0.22960662841796875, 0.24135208129882812, 0.2530975341796875, 0.2648429870605469, 0.27658843994140625, 0.2883338928222656, 0.300079345703125, 0.3118247985839844, 0.32357025146484375, 0.3353157043457031, 0.3470611572265625, 0.3588066101074219, 0.37055206298828125, 0.3822975158691406, 0.39404296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 4.0, 12.0, 42.0, 92.0, 244.0, 294.0, 170.0, 87.0, 22.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.698622226715088, -3.516643762588501, -3.334665298461914, -3.152686595916748, -2.9707083702087402, -2.788729667663574, -2.6067512035369873, -2.4247727394104004, -2.2427942752838135, -2.0608158111572266, -1.8788373470306396, -1.6968587636947632, -1.5148802995681763, -1.3329018354415894, -1.150923252105713, -0.968944787979126, -0.7869663238525391, -0.6049878597259521, -0.42300933599472046, -0.24103081226348877, -0.059052348136901855, 0.12292611598968506, 0.3049046993255615, 0.48688316345214844, 0.6688616275787354, 0.8508400917053223, 1.0328185558319092, 1.2147971391677856, 1.3967756032943726, 1.5787540674209595, 1.760732650756836, 1.9427111148834229, 2.1246895790100098, 2.3066680431365967, 2.4886465072631836, 2.6706252098083496, 2.8526034355163574, 3.0345821380615234, 3.2165606021881104, 3.3985390663146973, 3.580517530441284, 3.762495994567871, 3.944474458694458, 4.126452922821045, 4.308431625366211, 4.490409851074219, 4.672388553619385, 4.854367256164551, 5.036345481872559, 5.218324184417725, 5.400302410125732, 5.582281112670898, 5.764259338378906, 5.946238040924072, 6.128216743469238, 6.310194969177246, 6.492173194885254, 6.67415189743042, 6.856130123138428, 7.038108825683594, 7.220087051391602, 7.402065753936768, 7.584044456481934, 7.766022682189941, 7.948001384735107]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 2.0, 3.0, 7.0, 4.0, 7.0, 9.0, 10.0, 11.0, 14.0, 18.0, 35.0, 29.0, 20.0, 25.0, 38.0, 37.0, 47.0, 37.0, 30.0, 44.0, 48.0, 46.0, 36.0, 40.0, 43.0, 41.0, 29.0, 29.0, 29.0, 22.0, 30.0, 33.0, 24.0, 17.0, 20.0, 17.0, 11.0, 8.0, 3.0, 12.0, 7.0, 7.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3740421533584595, -1.3269727230072021, -1.2799032926559448, -1.2328338623046875, -1.1857643127441406, -1.1386948823928833, -1.091625452041626, -1.0445560216903687, -0.9974865913391113, -0.950417160987854, -0.9033476710319519, -0.8562782406806946, -0.8092088103294373, -0.7621393203735352, -0.7150698900222778, -0.6680004596710205, -0.6209309697151184, -0.5738615393638611, -0.526792049407959, -0.47972261905670166, -0.43265318870544434, -0.3855837285518646, -0.3385142683982849, -0.2914448380470276, -0.24437537789344788, -0.19730593264102936, -0.15023648738861084, -0.10316702723503113, -0.05609758198261261, -0.009028136730194092, 0.03804132342338562, 0.08511075377464294, 0.13218021392822266, 0.17924965918064117, 0.2263191044330597, 0.2733885645866394, 0.32045799493789673, 0.36752745509147644, 0.41459691524505615, 0.4616663455963135, 0.5087357759475708, 0.5558052062988281, 0.6028746962547302, 0.6499441266059875, 0.6970135569572449, 0.744083046913147, 0.7911524772644043, 0.8382219076156616, 0.8852913975715637, 0.932360827922821, 0.9794303178787231, 1.0264997482299805, 1.0735691785812378, 1.1206386089324951, 1.167708158493042, 1.2147774696350098, 1.2618470191955566, 1.308916449546814, 1.3559858798980713, 1.4030554294586182, 1.4501248598098755, 1.4971942901611328, 1.5442637205123901, 1.5913331508636475, 1.6384025812149048]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 13.0, 23.0, 34.0, 66.0, 116.0, 196.0, 287.0, 617.0, 1182.0, 2383.0, 5627.0, 14155.0, 39442.0, 168804.0, 607360.0, 148532.0, 36454.0, 13041.0, 5359.0, 2418.0, 1129.0, 557.0, 324.0, 154.0, 103.0, 53.0, 42.0, 26.0, 12.0, 10.0, 3.0, 7.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3291168212890625, -0.316680908203125, -0.3042449951171875, -0.29180908203125, -0.2793731689453125, -0.266937255859375, -0.2545013427734375, -0.2420654296875, -0.2296295166015625, -0.217193603515625, -0.2047576904296875, -0.19232177734375, -0.1798858642578125, -0.167449951171875, -0.1550140380859375, -0.142578125, -0.1301422119140625, -0.117706298828125, -0.1052703857421875, -0.09283447265625, -0.0803985595703125, -0.067962646484375, -0.0555267333984375, -0.0430908203125, -0.0306549072265625, -0.018218994140625, -0.0057830810546875, 0.00665283203125, 0.0190887451171875, 0.031524658203125, 0.0439605712890625, 0.056396484375, 0.0688323974609375, 0.081268310546875, 0.0937042236328125, 0.10614013671875, 0.1185760498046875, 0.131011962890625, 0.1434478759765625, 0.1558837890625, 0.1683197021484375, 0.180755615234375, 0.1931915283203125, 0.20562744140625, 0.2180633544921875, 0.230499267578125, 0.2429351806640625, 0.25537109375, 0.2678070068359375, 0.280242919921875, 0.2926788330078125, 0.30511474609375, 0.3175506591796875, 0.329986572265625, 0.3424224853515625, 0.3548583984375, 0.3672943115234375, 0.379730224609375, 0.3921661376953125, 0.40460205078125, 0.4170379638671875, 0.429473876953125, 0.4419097900390625, 0.454345703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 8.0, 12.0, 10.0, 8.0, 12.0, 13.0, 25.0, 21.0, 28.0, 27.0, 35.0, 34.0, 43.0, 47.0, 58.0, 60.0, 52.0, 51.0, 43.0, 58.0, 33.0, 57.0, 31.0, 26.0, 40.0, 26.0, 19.0, 20.0, 16.0, 10.0, 15.0, 12.0, 9.0, 4.0, 7.0, 7.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1514892578125, -0.14700889587402344, -0.14252853393554688, -0.1380481719970703, -0.13356781005859375, -0.1290874481201172, -0.12460708618164062, -0.12012672424316406, -0.1156463623046875, -0.11116600036621094, -0.10668563842773438, -0.10220527648925781, -0.09772491455078125, -0.09324455261230469, -0.08876419067382812, -0.08428382873535156, -0.079803466796875, -0.07532310485839844, -0.07084274291992188, -0.06636238098144531, -0.06188201904296875, -0.05740165710449219, -0.052921295166015625, -0.04844093322753906, -0.0439605712890625, -0.03948020935058594, -0.034999847412109375, -0.030519485473632812, -0.02603912353515625, -0.021558761596679688, -0.017078399658203125, -0.012598037719726562, -0.00811767578125, -0.0036373138427734375, 0.000843048095703125, 0.0053234100341796875, 0.00980377197265625, 0.014284133911132812, 0.018764495849609375, 0.023244857788085938, 0.0277252197265625, 0.03220558166503906, 0.036685943603515625, 0.04116630554199219, 0.04564666748046875, 0.05012702941894531, 0.054607391357421875, 0.05908775329589844, 0.063568115234375, 0.06804847717285156, 0.07252883911132812, 0.07700920104980469, 0.08148956298828125, 0.08596992492675781, 0.09045028686523438, 0.09493064880371094, 0.0994110107421875, 0.10389137268066406, 0.10837173461914062, 0.11285209655761719, 0.11733245849609375, 0.12181282043457031, 0.12629318237304688, 0.13077354431152344, 0.13525390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 7.0, 9.0, 11.0, 8.0, 20.0, 23.0, 34.0, 38.0, 75.0, 102.0, 133.0, 208.0, 355.0, 617.0, 1276.0, 2723.0, 7653.0, 28806.0, 214613.0, 710266.0, 60156.0, 13232.0, 4168.0, 1827.0, 877.0, 492.0, 266.0, 166.0, 104.0, 82.0, 56.0, 40.0, 24.0, 23.0, 10.0, 16.0, 10.0, 10.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.48416900634765625, -0.4663848876953125, -0.44860076904296875, -0.430816650390625, -0.41303253173828125, -0.3952484130859375, -0.37746429443359375, -0.35968017578125, -0.34189605712890625, -0.3241119384765625, -0.30632781982421875, -0.288543701171875, -0.27075958251953125, -0.2529754638671875, -0.23519134521484375, -0.2174072265625, -0.19962310791015625, -0.1818389892578125, -0.16405487060546875, -0.146270751953125, -0.12848663330078125, -0.1107025146484375, -0.09291839599609375, -0.07513427734375, -0.05735015869140625, -0.0395660400390625, -0.02178192138671875, -0.003997802734375, 0.01378631591796875, 0.0315704345703125, 0.04935455322265625, 0.067138671875, 0.08492279052734375, 0.1027069091796875, 0.12049102783203125, 0.138275146484375, 0.15605926513671875, 0.1738433837890625, 0.19162750244140625, 0.20941162109375, 0.22719573974609375, 0.2449798583984375, 0.26276397705078125, 0.280548095703125, 0.29833221435546875, 0.3161163330078125, 0.33390045166015625, 0.3516845703125, 0.36946868896484375, 0.3872528076171875, 0.40503692626953125, 0.422821044921875, 0.44060516357421875, 0.4583892822265625, 0.47617340087890625, 0.49395751953125, 0.5117416381835938, 0.5295257568359375, 0.5473098754882812, 0.565093994140625, 0.5828781127929688, 0.6006622314453125, 0.6184463500976562, 0.63623046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 5.0, 10.0, 21.0, 22.0, 22.0, 34.0, 27.0, 38.0, 35.0, 50.0, 51.0, 61.0, 61.0, 56.0, 51.0, 52.0, 40.0, 44.0, 53.0, 46.0, 28.0, 27.0, 22.0, 24.0, 10.0, 24.0, 13.0, 11.0, 6.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.69091796875, -0.66864013671875, -0.6463623046875, -0.62408447265625, -0.601806640625, -0.57952880859375, -0.5572509765625, -0.53497314453125, -0.5126953125, -0.49041748046875, -0.4681396484375, -0.44586181640625, -0.423583984375, -0.40130615234375, -0.3790283203125, -0.35675048828125, -0.33447265625, -0.31219482421875, -0.2899169921875, -0.26763916015625, -0.245361328125, -0.22308349609375, -0.2008056640625, -0.17852783203125, -0.15625, -0.13397216796875, -0.1116943359375, -0.08941650390625, -0.067138671875, -0.04486083984375, -0.0225830078125, -0.00030517578125, 0.02197265625, 0.04425048828125, 0.0665283203125, 0.08880615234375, 0.111083984375, 0.13336181640625, 0.1556396484375, 0.17791748046875, 0.2001953125, 0.22247314453125, 0.2447509765625, 0.26702880859375, 0.289306640625, 0.31158447265625, 0.3338623046875, 0.35614013671875, 0.37841796875, 0.40069580078125, 0.4229736328125, 0.44525146484375, 0.467529296875, 0.48980712890625, 0.5120849609375, 0.53436279296875, 0.556640625, 0.57891845703125, 0.6011962890625, 0.62347412109375, 0.645751953125, 0.66802978515625, 0.6903076171875, 0.71258544921875, 0.73486328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 17.0, 13.0, 19.0, 41.0, 70.0, 162.0, 447.0, 1647.0, 9533.0, 148102.0, 856679.0, 27018.0, 3523.0, 781.0, 238.0, 102.0, 50.0, 37.0, 19.0, 12.0, 3.0, 5.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6396484375, -0.6229171752929688, -0.6061859130859375, -0.5894546508789062, -0.572723388671875, -0.5559921264648438, -0.5392608642578125, -0.5225296020507812, -0.50579833984375, -0.48906707763671875, -0.4723358154296875, -0.45560455322265625, -0.438873291015625, -0.42214202880859375, -0.4054107666015625, -0.38867950439453125, -0.3719482421875, -0.35521697998046875, -0.3384857177734375, -0.32175445556640625, -0.305023193359375, -0.28829193115234375, -0.2715606689453125, -0.25482940673828125, -0.23809814453125, -0.22136688232421875, -0.2046356201171875, -0.18790435791015625, -0.171173095703125, -0.15444183349609375, -0.1377105712890625, -0.12097930908203125, -0.104248046875, -0.08751678466796875, -0.0707855224609375, -0.05405426025390625, -0.037322998046875, -0.02059173583984375, -0.0038604736328125, 0.01287078857421875, 0.02960205078125, 0.04633331298828125, 0.0630645751953125, 0.07979583740234375, 0.096527099609375, 0.11325836181640625, 0.1299896240234375, 0.14672088623046875, 0.1634521484375, 0.18018341064453125, 0.1969146728515625, 0.21364593505859375, 0.230377197265625, 0.24710845947265625, 0.2638397216796875, 0.28057098388671875, 0.29730224609375, 0.31403350830078125, 0.3307647705078125, 0.34749603271484375, 0.364227294921875, 0.38095855712890625, 0.3976898193359375, 0.41442108154296875, 0.43115234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 7.0, 6.0, 8.0, 15.0, 11.0, 23.0, 21.0, 21.0, 40.0, 40.0, 82.0, 110.0, 134.0, 114.0, 108.0, 71.0, 46.0, 34.0, 15.0, 12.0, 15.0, 6.0, 8.0, 10.0, 3.0, 10.0, 11.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.237361907958984e-05, -8.000712841749191e-05, -7.764063775539398e-05, -7.527414709329605e-05, -7.290765643119812e-05, -7.054116576910019e-05, -6.817467510700226e-05, -6.580818444490433e-05, -6.34416937828064e-05, -6.107520312070847e-05, -5.8708712458610535e-05, -5.6342221796512604e-05, -5.397573113441467e-05, -5.160924047231674e-05, -4.924274981021881e-05, -4.687625914812088e-05, -4.450976848602295e-05, -4.214327782392502e-05, -3.977678716182709e-05, -3.7410296499729156e-05, -3.5043805837631226e-05, -3.2677315175533295e-05, -3.0310824513435364e-05, -2.7944333851337433e-05, -2.5577843189239502e-05, -2.321135252714157e-05, -2.084486186504364e-05, -1.847837120294571e-05, -1.611188054084778e-05, -1.3745389878749847e-05, -1.1378899216651917e-05, -9.012408554553986e-06, -6.645917892456055e-06, -4.279427230358124e-06, -1.912936568260193e-06, 4.5355409383773804e-07, 2.820044755935669e-06, 5.1865354180336e-06, 7.553026080131531e-06, 9.919516742229462e-06, 1.2286007404327393e-05, 1.4652498066425323e-05, 1.7018988728523254e-05, 1.9385479390621185e-05, 2.1751970052719116e-05, 2.4118460714817047e-05, 2.6484951376914978e-05, 2.885144203901291e-05, 3.121793270111084e-05, 3.358442336320877e-05, 3.59509140253067e-05, 3.831740468740463e-05, 4.0683895349502563e-05, 4.3050386011600494e-05, 4.5416876673698425e-05, 4.7783367335796356e-05, 5.014985799789429e-05, 5.251634865999222e-05, 5.488283932209015e-05, 5.724932998418808e-05, 5.961582064628601e-05, 6.198231130838394e-05, 6.434880197048187e-05, 6.67152926325798e-05, 6.908178329467773e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 12.0, 10.0, 11.0, 14.0, 18.0, 48.0, 55.0, 94.0, 169.0, 257.0, 454.0, 880.0, 1880.0, 5303.0, 25312.0, 594939.0, 388967.0, 21605.0, 4860.0, 1680.0, 840.0, 442.0, 228.0, 145.0, 107.0, 65.0, 44.0, 29.0, 22.0, 8.0, 9.0, 13.0, 9.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.4541015625, -0.4411125183105469, -0.42812347412109375, -0.4151344299316406, -0.4021453857421875, -0.3891563415527344, -0.37616729736328125, -0.3631782531738281, -0.350189208984375, -0.3372001647949219, -0.32421112060546875, -0.3112220764160156, -0.2982330322265625, -0.2852439880371094, -0.27225494384765625, -0.2592658996582031, -0.24627685546875, -0.23328781127929688, -0.22029876708984375, -0.20730972290039062, -0.1943206787109375, -0.18133163452148438, -0.16834259033203125, -0.15535354614257812, -0.142364501953125, -0.12937545776367188, -0.11638641357421875, -0.10339736938476562, -0.0904083251953125, -0.07741928100585938, -0.06443023681640625, -0.051441192626953125, -0.0384521484375, -0.025463104248046875, -0.01247406005859375, 0.000514984130859375, 0.0135040283203125, 0.026493072509765625, 0.03948211669921875, 0.052471160888671875, 0.065460205078125, 0.07844924926757812, 0.09143829345703125, 0.10442733764648438, 0.1174163818359375, 0.13040542602539062, 0.14339447021484375, 0.15638351440429688, 0.16937255859375, 0.18236160278320312, 0.19535064697265625, 0.20833969116210938, 0.2213287353515625, 0.23431777954101562, 0.24730682373046875, 0.2602958679199219, 0.273284912109375, 0.2862739562988281, 0.29926300048828125, 0.3122520446777344, 0.3252410888671875, 0.3382301330566406, 0.35121917724609375, 0.3642082214355469, 0.377197265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 6.0, 7.0, 13.0, 20.0, 23.0, 32.0, 55.0, 77.0, 105.0, 163.0, 131.0, 96.0, 78.0, 50.0, 32.0, 21.0, 15.0, 9.0, 13.0, 9.0, 5.0, 6.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3236885070800781, -0.31388092041015625, -0.3040733337402344, -0.2942657470703125, -0.2844581604003906, -0.27465057373046875, -0.2648429870605469, -0.255035400390625, -0.24522781372070312, -0.23542022705078125, -0.22561264038085938, -0.2158050537109375, -0.20599746704101562, -0.19618988037109375, -0.18638229370117188, -0.17657470703125, -0.16676712036132812, -0.15695953369140625, -0.14715194702148438, -0.1373443603515625, -0.12753677368164062, -0.11772918701171875, -0.10792160034179688, -0.098114013671875, -0.08830642700195312, -0.07849884033203125, -0.06869125366210938, -0.0588836669921875, -0.049076080322265625, -0.03926849365234375, -0.029460906982421875, -0.0196533203125, -0.009845733642578125, -3.814697265625e-05, 0.009769439697265625, 0.0195770263671875, 0.029384613037109375, 0.03919219970703125, 0.048999786376953125, 0.058807373046875, 0.06861495971679688, 0.07842254638671875, 0.08823013305664062, 0.0980377197265625, 0.10784530639648438, 0.11765289306640625, 0.12746047973632812, 0.13726806640625, 0.14707565307617188, 0.15688323974609375, 0.16669082641601562, 0.1764984130859375, 0.18630599975585938, 0.19611358642578125, 0.20592117309570312, 0.215728759765625, 0.22553634643554688, 0.23534393310546875, 0.24515151977539062, 0.2549591064453125, 0.2647666931152344, 0.27457427978515625, 0.2843818664550781, 0.294189453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 2.0, 0.0, 7.0, 5.0, 9.0, 20.0, 65.0, 128.0, 235.0, 235.0, 143.0, 73.0, 35.0, 17.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.129510402679443, -6.951709270477295, -6.773908615112305, -6.596107482910156, -6.418306350708008, -6.240505695343018, -6.062704563140869, -5.884903907775879, -5.7071027755737305, -5.529301643371582, -5.351500988006592, -5.173699855804443, -4.995899200439453, -4.818098068237305, -4.640296936035156, -4.462495803833008, -4.284695148468018, -4.106894016265869, -3.929093360900879, -3.7512922286987305, -3.573491334915161, -3.395690441131592, -3.2178893089294434, -3.040088415145874, -2.8622875213623047, -2.6844866275787354, -2.506685733795166, -2.3288846015930176, -2.1510837078094482, -1.973282814025879, -1.79548180103302, -1.6176807880401611, -1.4398798942565918, -1.2620790004730225, -1.0842779874801636, -0.9064770340919495, -0.7286760807037354, -0.5508751273155212, -0.37307417392730713, -0.19527316093444824, -0.017472267150878906, 0.1603286862373352, 0.3381296396255493, 0.5159305930137634, 0.6937315464019775, 0.8715324997901917, 1.0493334531784058, 1.2271344661712646, 1.404935359954834, 1.5827362537384033, 1.7605372667312622, 1.938338279724121, 2.1161391735076904, 2.2939400672912598, 2.471741199493408, 2.6495420932769775, 2.827342987060547, 3.005143880844116, 3.1829447746276855, 3.360745906829834, 3.5385468006134033, 3.7163476943969727, 3.894148826599121, 4.0719499588012695, 4.24975061416626]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 7.0, 13.0, 15.0, 16.0, 23.0, 18.0, 30.0, 35.0, 29.0, 35.0, 29.0, 47.0, 41.0, 57.0, 60.0, 62.0, 49.0, 39.0, 50.0, 31.0, 41.0, 36.0, 30.0, 30.0, 19.0, 21.0, 18.0, 20.0, 21.0, 12.0, 11.0, 6.0, 4.0, 2.0, 2.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5878243446350098, -2.5080506801605225, -2.428276777267456, -2.3485031127929688, -2.2687292098999023, -2.188955545425415, -2.1091816425323486, -2.0294079780578613, -1.9496341943740845, -1.8698604106903076, -1.7900866270065308, -1.710312843322754, -1.6305391788482666, -1.5507652759552002, -1.470991611480713, -1.391217827796936, -1.3114440441131592, -1.2316702604293823, -1.1518964767456055, -1.0721226930618286, -0.9923489689826965, -0.9125751852989197, -0.8328014612197876, -0.7530276775360107, -0.6732538938522339, -0.593480110168457, -0.5137063264846802, -0.4339326024055481, -0.35415881872177124, -0.2743850350379944, -0.19461128115653992, -0.11483752727508545, -0.035063743591308594, 0.04471002519130707, 0.12448379397392273, 0.2042575627565384, 0.28403133153915405, 0.3638051152229309, 0.4435788691043854, 0.5233526229858398, 0.6031264066696167, 0.6829001903533936, 0.7626739740371704, 0.8424476981163025, 0.9222214818000793, 1.001995325088501, 1.0817689895629883, 1.1615427732467651, 1.241316556930542, 1.3210903406143188, 1.4008641242980957, 1.4806379079818726, 1.5604116916656494, 1.6401853561401367, 1.7199591398239136, 1.7997329235076904, 1.8795067071914673, 1.9592804908752441, 2.0390541553497314, 2.118828058242798, 2.198601722717285, 2.2783756256103516, 2.358149290084839, 2.437922954559326, 2.5176968574523926]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 2.0, 3.0, 3.0, 5.0, 11.0, 15.0, 37.0, 45.0, 112.0, 223.0, 487.0, 1090.0, 3033.0, 8761.0, 30839.0, 158974.0, 1677587.0, 2069384.0, 193787.0, 35499.0, 9387.0, 3057.0, 1095.0, 423.0, 163.0, 92.0, 48.0, 36.0, 16.0, 8.0, 12.0, 4.0, 8.0, 10.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.1656970977783203, -0.15597915649414062, -0.14626121520996094, -0.13654327392578125, -0.12682533264160156, -0.11710739135742188, -0.10738945007324219, -0.0976715087890625, -0.08795356750488281, -0.07823562622070312, -0.06851768493652344, -0.05879974365234375, -0.04908180236816406, -0.039363861083984375, -0.029645919799804688, -0.019927978515625, -0.010210037231445312, -0.000492095947265625, 0.009225845336914062, 0.01894378662109375, 0.028661727905273438, 0.038379669189453125, 0.04809761047363281, 0.0578155517578125, 0.06753349304199219, 0.07725143432617188, 0.08696937561035156, 0.09668731689453125, 0.10640525817871094, 0.11612319946289062, 0.1258411407470703, 0.13555908203125, 0.1452770233154297, 0.15499496459960938, 0.16471290588378906, 0.17443084716796875, 0.18414878845214844, 0.19386672973632812, 0.2035846710205078, 0.2133026123046875, 0.2230205535888672, 0.23273849487304688, 0.24245643615722656, 0.25217437744140625, 0.26189231872558594, 0.2716102600097656, 0.2813282012939453, 0.291046142578125, 0.3007640838623047, 0.3104820251464844, 0.32019996643066406, 0.32991790771484375, 0.33963584899902344, 0.3493537902832031, 0.3590717315673828, 0.3687896728515625, 0.3785076141357422, 0.3882255554199219, 0.39794349670410156, 0.40766143798828125, 0.41737937927246094, 0.4270973205566406, 0.4368152618408203, 0.446533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 5.0, 10.0, 16.0, 17.0, 32.0, 29.0, 28.0, 28.0, 26.0, 38.0, 32.0, 34.0, 46.0, 57.0, 48.0, 58.0, 59.0, 43.0, 40.0, 37.0, 46.0, 35.0, 31.0, 31.0, 29.0, 27.0, 15.0, 17.0, 18.0, 15.0, 12.0, 8.0, 2.0, 6.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1275310516357422, -0.12334823608398438, -0.11916542053222656, -0.11498260498046875, -0.11079978942871094, -0.10661697387695312, -0.10243415832519531, -0.0982513427734375, -0.09406852722167969, -0.08988571166992188, -0.08570289611816406, -0.08152008056640625, -0.07733726501464844, -0.07315444946289062, -0.06897163391113281, -0.064788818359375, -0.06060600280761719, -0.056423187255859375, -0.05224037170410156, -0.04805755615234375, -0.04387474060058594, -0.039691925048828125, -0.03550910949707031, -0.0313262939453125, -0.027143478393554688, -0.022960662841796875, -0.018777847290039062, -0.01459503173828125, -0.010412216186523438, -0.006229400634765625, -0.0020465850830078125, 0.00213623046875, 0.0063190460205078125, 0.010501861572265625, 0.014684677124023438, 0.01886749267578125, 0.023050308227539062, 0.027233123779296875, 0.03141593933105469, 0.0355987548828125, 0.03978157043457031, 0.043964385986328125, 0.04814720153808594, 0.05233001708984375, 0.05651283264160156, 0.060695648193359375, 0.06487846374511719, 0.069061279296875, 0.07324409484863281, 0.07742691040039062, 0.08160972595214844, 0.08579254150390625, 0.08997535705566406, 0.09415817260742188, 0.09834098815917969, 0.1025238037109375, 0.10670661926269531, 0.11088943481445312, 0.11507225036621094, 0.11925506591796875, 0.12343788146972656, 0.12762069702148438, 0.1318035125732422, 0.135986328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 1.0, 5.0, 9.0, 9.0, 15.0, 19.0, 27.0, 42.0, 61.0, 69.0, 115.0, 215.0, 367.0, 691.0, 1543.0, 4045.0, 10888.0, 35553.0, 146818.0, 1239927.0, 2427193.0, 249546.0, 52540.0, 15167.0, 5136.0, 2012.0, 982.0, 554.0, 256.0, 163.0, 109.0, 61.0, 26.0, 28.0, 26.0, 15.0, 11.0, 8.0, 15.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.369873046875, -0.3587188720703125, -0.347564697265625, -0.3364105224609375, -0.32525634765625, -0.3141021728515625, -0.302947998046875, -0.2917938232421875, -0.2806396484375, -0.2694854736328125, -0.258331298828125, -0.2471771240234375, -0.23602294921875, -0.2248687744140625, -0.213714599609375, -0.2025604248046875, -0.19140625, -0.1802520751953125, -0.169097900390625, -0.1579437255859375, -0.14678955078125, -0.1356353759765625, -0.124481201171875, -0.1133270263671875, -0.1021728515625, -0.0910186767578125, -0.079864501953125, -0.0687103271484375, -0.05755615234375, -0.0464019775390625, -0.035247802734375, -0.0240936279296875, -0.012939453125, -0.0017852783203125, 0.009368896484375, 0.0205230712890625, 0.03167724609375, 0.0428314208984375, 0.053985595703125, 0.0651397705078125, 0.0762939453125, 0.0874481201171875, 0.098602294921875, 0.1097564697265625, 0.12091064453125, 0.1320648193359375, 0.143218994140625, 0.1543731689453125, 0.16552734375, 0.1766815185546875, 0.187835693359375, 0.1989898681640625, 0.21014404296875, 0.2212982177734375, 0.232452392578125, 0.2436065673828125, 0.2547607421875, 0.2659149169921875, 0.277069091796875, 0.2882232666015625, 0.29937744140625, 0.3105316162109375, 0.321685791015625, 0.3328399658203125, 0.343994140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 3.0, 0.0, 3.0, 5.0, 4.0, 5.0, 14.0, 14.0, 15.0, 17.0, 27.0, 34.0, 45.0, 56.0, 68.0, 90.0, 149.0, 187.0, 281.0, 451.0, 545.0, 598.0, 385.0, 306.0, 221.0, 137.0, 102.0, 62.0, 44.0, 55.0, 24.0, 36.0, 17.0, 14.0, 20.0, 11.0, 3.0, 11.0, 5.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36572265625, -0.3539886474609375, -0.342254638671875, -0.3305206298828125, -0.31878662109375, -0.3070526123046875, -0.295318603515625, -0.2835845947265625, -0.2718505859375, -0.2601165771484375, -0.248382568359375, -0.2366485595703125, -0.22491455078125, -0.2131805419921875, -0.201446533203125, -0.1897125244140625, -0.177978515625, -0.1662445068359375, -0.154510498046875, -0.1427764892578125, -0.13104248046875, -0.1193084716796875, -0.107574462890625, -0.0958404541015625, -0.0841064453125, -0.0723724365234375, -0.060638427734375, -0.0489044189453125, -0.03717041015625, -0.0254364013671875, -0.013702392578125, -0.0019683837890625, 0.009765625, 0.0214996337890625, 0.033233642578125, 0.0449676513671875, 0.05670166015625, 0.0684356689453125, 0.080169677734375, 0.0919036865234375, 0.1036376953125, 0.1153717041015625, 0.127105712890625, 0.1388397216796875, 0.15057373046875, 0.1623077392578125, 0.174041748046875, 0.1857757568359375, 0.197509765625, 0.2092437744140625, 0.220977783203125, 0.2327117919921875, 0.24444580078125, 0.2561798095703125, 0.267913818359375, 0.2796478271484375, 0.2913818359375, 0.3031158447265625, 0.314849853515625, 0.3265838623046875, 0.33831787109375, 0.3500518798828125, 0.361785888671875, 0.3735198974609375, 0.38525390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 6.0, 8.0, 15.0, 42.0, 95.0, 250.0, 272.0, 184.0, 84.0, 23.0, 13.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.496522426605225, -6.259895324707031, -6.02326774597168, -5.786640644073486, -5.550013065338135, -5.313385963439941, -5.07675838470459, -4.8401312828063965, -4.603504180908203, -4.36687707901001, -4.130249500274658, -3.893622398376465, -3.6569948196411133, -3.42036771774292, -3.1837403774261475, -2.947113037109375, -2.7104854583740234, -2.473858118057251, -2.2372307777404785, -2.000603675842285, -1.7639762163162231, -1.5273488759994507, -1.2907216548919678, -1.0540943145751953, -0.8174669742584229, -0.5808396339416504, -0.3442123532295227, -0.10758507251739502, 0.12904226779937744, 0.3656696081161499, 0.6022968292236328, 0.8389241695404053, 1.0755510330200195, 1.312178373336792, 1.5488057136535645, 1.7854329347610474, 2.0220603942871094, 2.2586874961853027, 2.495314836502075, 2.7319421768188477, 2.96856951713562, 3.2051968574523926, 3.441824197769165, 3.6784515380859375, 3.915078639984131, 4.151706218719482, 4.388333320617676, 4.624960899353027, 4.861588001251221, 5.098215103149414, 5.334842681884766, 5.571469783782959, 5.8080973625183105, 6.044724464416504, 6.2813520431518555, 6.517979145050049, 6.754606246948242, 6.9912333488464355, 7.227860927581787, 7.4644880294799805, 7.701115608215332, 7.937742710113525, 8.174369812011719, 8.41099739074707, 8.647624969482422]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 9.0, 7.0, 9.0, 2.0, 9.0, 11.0, 24.0, 26.0, 33.0, 43.0, 22.0, 39.0, 31.0, 50.0, 48.0, 47.0, 54.0, 51.0, 40.0, 50.0, 57.0, 38.0, 47.0, 30.0, 24.0, 31.0, 18.0, 20.0, 26.0, 20.0, 13.0, 12.0, 16.0, 3.0, 4.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.275489091873169, -2.2092456817626953, -2.1430022716522217, -2.076759099960327, -2.0105156898498535, -1.9442722797393799, -1.8780288696289062, -1.8117854595184326, -1.7455421686172485, -1.679298758506775, -1.6130554676055908, -1.5468120574951172, -1.4805686473846436, -1.4143253564834595, -1.3480819463729858, -1.2818386554718018, -1.2155952453613281, -1.1493518352508545, -1.0831085443496704, -1.0168651342391968, -0.9506217837333679, -0.8843784332275391, -0.8181350231170654, -0.7518916726112366, -0.6856483221054077, -0.6194049715995789, -0.55316162109375, -0.48691821098327637, -0.4206748604774475, -0.35443150997161865, -0.2881881296634674, -0.22194474935531616, -0.1557016372680664, -0.08945827186107635, -0.023214906454086304, 0.04302845895290375, 0.1092718243598938, 0.17551517486572266, 0.2417585551738739, 0.30800193548202515, 0.374245285987854, 0.44048863649368286, 0.5067319869995117, 0.5729753971099854, 0.6392187476158142, 0.7054620981216431, 0.7717055082321167, 0.8379488587379456, 0.9041922092437744, 0.9704355597496033, 1.0366789102554321, 1.1029223203659058, 1.1691656112670898, 1.2354090213775635, 1.301652431488037, 1.3678958415985107, 1.4341391324996948, 1.5003825426101685, 1.5666258335113525, 1.6328692436218262, 1.6991126537322998, 1.7653559446334839, 1.8315993547439575, 1.8978426456451416, 1.9640860557556152]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 0.0, 5.0, 10.0, 11.0, 19.0, 26.0, 47.0, 83.0, 155.0, 325.0, 794.0, 1899.0, 5153.0, 15083.0, 50401.0, 202273.0, 554192.0, 156787.0, 41492.0, 12581.0, 4342.0, 1617.0, 630.0, 287.0, 144.0, 76.0, 51.0, 32.0, 17.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.58740234375, -0.572113037109375, -0.55682373046875, -0.541534423828125, -0.5262451171875, -0.510955810546875, -0.49566650390625, -0.480377197265625, -0.465087890625, -0.449798583984375, -0.43450927734375, -0.419219970703125, -0.4039306640625, -0.388641357421875, -0.37335205078125, -0.358062744140625, -0.3427734375, -0.327484130859375, -0.31219482421875, -0.296905517578125, -0.2816162109375, -0.266326904296875, -0.25103759765625, -0.235748291015625, -0.220458984375, -0.205169677734375, -0.18988037109375, -0.174591064453125, -0.1593017578125, -0.144012451171875, -0.12872314453125, -0.113433837890625, -0.09814453125, -0.082855224609375, -0.06756591796875, -0.052276611328125, -0.0369873046875, -0.021697998046875, -0.00640869140625, 0.008880615234375, 0.024169921875, 0.039459228515625, 0.05474853515625, 0.070037841796875, 0.0853271484375, 0.100616455078125, 0.11590576171875, 0.131195068359375, 0.146484375, 0.161773681640625, 0.17706298828125, 0.192352294921875, 0.2076416015625, 0.222930908203125, 0.23822021484375, 0.253509521484375, 0.268798828125, 0.284088134765625, 0.29937744140625, 0.314666748046875, 0.3299560546875, 0.345245361328125, 0.36053466796875, 0.375823974609375, 0.39111328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 7.0, 17.0, 11.0, 13.0, 15.0, 12.0, 15.0, 23.0, 19.0, 25.0, 31.0, 36.0, 38.0, 40.0, 52.0, 47.0, 42.0, 40.0, 49.0, 35.0, 48.0, 51.0, 42.0, 46.0, 31.0, 36.0, 35.0, 33.0, 27.0, 20.0, 16.0, 9.0, 6.0, 7.0, 11.0, 6.0, 8.0, 3.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1510009765625, -0.14659690856933594, -0.14219284057617188, -0.1377887725830078, -0.13338470458984375, -0.1289806365966797, -0.12457656860351562, -0.12017250061035156, -0.1157684326171875, -0.11136436462402344, -0.10696029663085938, -0.10255622863769531, -0.09815216064453125, -0.09374809265136719, -0.08934402465820312, -0.08493995666503906, -0.080535888671875, -0.07613182067871094, -0.07172775268554688, -0.06732368469238281, -0.06291961669921875, -0.05851554870605469, -0.054111480712890625, -0.04970741271972656, -0.0453033447265625, -0.04089927673339844, -0.036495208740234375, -0.03209114074707031, -0.02768707275390625, -0.023283004760742188, -0.018878936767578125, -0.014474868774414062, -0.01007080078125, -0.0056667327880859375, -0.001262664794921875, 0.0031414031982421875, 0.00754547119140625, 0.011949539184570312, 0.016353607177734375, 0.020757675170898438, 0.0251617431640625, 0.029565811157226562, 0.033969879150390625, 0.03837394714355469, 0.04277801513671875, 0.04718208312988281, 0.051586151123046875, 0.05599021911621094, 0.060394287109375, 0.06479835510253906, 0.06920242309570312, 0.07360649108886719, 0.07801055908203125, 0.08241462707519531, 0.08681869506835938, 0.09122276306152344, 0.0956268310546875, 0.10003089904785156, 0.10443496704101562, 0.10883903503417969, 0.11324310302734375, 0.11764717102050781, 0.12205123901367188, 0.12645530700683594, 0.130859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 16.0, 32.0, 41.0, 60.0, 92.0, 143.0, 241.0, 449.0, 923.0, 2086.0, 6027.0, 34031.0, 797583.0, 185222.0, 14745.0, 3748.0, 1482.0, 706.0, 366.0, 208.0, 119.0, 72.0, 41.0, 30.0, 19.0, 18.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.314453125, -1.2787322998046875, -1.243011474609375, -1.2072906494140625, -1.17156982421875, -1.1358489990234375, -1.100128173828125, -1.0644073486328125, -1.0286865234375, -0.9929656982421875, -0.957244873046875, -0.9215240478515625, -0.88580322265625, -0.8500823974609375, -0.814361572265625, -0.7786407470703125, -0.742919921875, -0.7071990966796875, -0.671478271484375, -0.6357574462890625, -0.60003662109375, -0.5643157958984375, -0.528594970703125, -0.4928741455078125, -0.4571533203125, -0.4214324951171875, -0.385711669921875, -0.3499908447265625, -0.31427001953125, -0.2785491943359375, -0.242828369140625, -0.2071075439453125, -0.17138671875, -0.1356658935546875, -0.099945068359375, -0.0642242431640625, -0.02850341796875, 0.0072174072265625, 0.042938232421875, 0.0786590576171875, 0.1143798828125, 0.1501007080078125, 0.185821533203125, 0.2215423583984375, 0.25726318359375, 0.2929840087890625, 0.328704833984375, 0.3644256591796875, 0.400146484375, 0.4358673095703125, 0.471588134765625, 0.5073089599609375, 0.54302978515625, 0.5787506103515625, 0.614471435546875, 0.6501922607421875, 0.6859130859375, 0.7216339111328125, 0.757354736328125, 0.7930755615234375, 0.82879638671875, 0.8645172119140625, 0.900238037109375, 0.9359588623046875, 0.9716796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 1.0, 8.0, 4.0, 11.0, 13.0, 15.0, 17.0, 23.0, 16.0, 19.0, 17.0, 39.0, 50.0, 51.0, 51.0, 44.0, 59.0, 48.0, 56.0, 58.0, 58.0, 54.0, 38.0, 29.0, 37.0, 41.0, 28.0, 23.0, 16.0, 15.0, 10.0, 12.0, 7.0, 7.0, 7.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8336105346679688, -0.8088226318359375, -0.7840347290039062, -0.759246826171875, -0.7344589233398438, -0.7096710205078125, -0.6848831176757812, -0.66009521484375, -0.6353073120117188, -0.6105194091796875, -0.5857315063476562, -0.560943603515625, -0.5361557006835938, -0.5113677978515625, -0.48657989501953125, -0.4617919921875, -0.43700408935546875, -0.4122161865234375, -0.38742828369140625, -0.362640380859375, -0.33785247802734375, -0.3130645751953125, -0.28827667236328125, -0.26348876953125, -0.23870086669921875, -0.2139129638671875, -0.18912506103515625, -0.164337158203125, -0.13954925537109375, -0.1147613525390625, -0.08997344970703125, -0.065185546875, -0.04039764404296875, -0.0156097412109375, 0.00917816162109375, 0.033966064453125, 0.05875396728515625, 0.0835418701171875, 0.10832977294921875, 0.13311767578125, 0.15790557861328125, 0.1826934814453125, 0.20748138427734375, 0.232269287109375, 0.25705718994140625, 0.2818450927734375, 0.30663299560546875, 0.3314208984375, 0.35620880126953125, 0.3809967041015625, 0.40578460693359375, 0.430572509765625, 0.45536041259765625, 0.4801483154296875, 0.5049362182617188, 0.52972412109375, 0.5545120239257812, 0.5792999267578125, 0.6040878295898438, 0.628875732421875, 0.6536636352539062, 0.6784515380859375, 0.7032394409179688, 0.72802734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 5.0, 25.0, 28.0, 38.0, 68.0, 123.0, 209.0, 400.0, 942.0, 2725.0, 10547.0, 68983.0, 802373.0, 138581.0, 17144.0, 3965.0, 1264.0, 497.0, 218.0, 145.0, 75.0, 53.0, 22.0, 29.0, 16.0, 11.0, 10.0, 6.0, 1.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39453125, -0.3820648193359375, -0.369598388671875, -0.3571319580078125, -0.34466552734375, -0.3321990966796875, -0.319732666015625, -0.3072662353515625, -0.2947998046875, -0.2823333740234375, -0.269866943359375, -0.2574005126953125, -0.24493408203125, -0.2324676513671875, -0.220001220703125, -0.2075347900390625, -0.195068359375, -0.1826019287109375, -0.170135498046875, -0.1576690673828125, -0.14520263671875, -0.1327362060546875, -0.120269775390625, -0.1078033447265625, -0.0953369140625, -0.0828704833984375, -0.070404052734375, -0.0579376220703125, -0.04547119140625, -0.0330047607421875, -0.020538330078125, -0.0080718994140625, 0.00439453125, 0.0168609619140625, 0.029327392578125, 0.0417938232421875, 0.05426025390625, 0.0667266845703125, 0.079193115234375, 0.0916595458984375, 0.1041259765625, 0.1165924072265625, 0.129058837890625, 0.1415252685546875, 0.15399169921875, 0.1664581298828125, 0.178924560546875, 0.1913909912109375, 0.203857421875, 0.2163238525390625, 0.228790283203125, 0.2412567138671875, 0.25372314453125, 0.2661895751953125, 0.278656005859375, 0.2911224365234375, 0.3035888671875, 0.3160552978515625, 0.328521728515625, 0.3409881591796875, 0.35345458984375, 0.3659210205078125, 0.378387451171875, 0.3908538818359375, 0.4033203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 12.0, 7.0, 10.0, 6.0, 15.0, 12.0, 29.0, 23.0, 35.0, 21.0, 42.0, 55.0, 84.0, 122.0, 107.0, 93.0, 70.0, 51.0, 28.0, 33.0, 28.0, 22.0, 22.0, 18.0, 8.0, 8.0, 8.0, 6.0, 6.0, 4.0, 1.0, 6.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.914138793945312e-05, -6.629899144172668e-05, -6.345659494400024e-05, -6.0614198446273804e-05, -5.777180194854736e-05, -5.492940545082092e-05, -5.208700895309448e-05, -4.924461245536804e-05, -4.64022159576416e-05, -4.355981945991516e-05, -4.071742296218872e-05, -3.787502646446228e-05, -3.503262996673584e-05, -3.21902334690094e-05, -2.934783697128296e-05, -2.650544047355652e-05, -2.3663043975830078e-05, -2.0820647478103638e-05, -1.7978250980377197e-05, -1.5135854482650757e-05, -1.2293457984924316e-05, -9.451061487197876e-06, -6.6086649894714355e-06, -3.766268491744995e-06, -9.238719940185547e-07, 1.9185245037078857e-06, 4.760921001434326e-06, 7.603317499160767e-06, 1.0445713996887207e-05, 1.3288110494613647e-05, 1.6130506992340088e-05, 1.897290349006653e-05, 2.181529998779297e-05, 2.465769648551941e-05, 2.750009298324585e-05, 3.034248948097229e-05, 3.318488597869873e-05, 3.602728247642517e-05, 3.886967897415161e-05, 4.171207547187805e-05, 4.455447196960449e-05, 4.739686846733093e-05, 5.023926496505737e-05, 5.3081661462783813e-05, 5.5924057960510254e-05, 5.8766454458236694e-05, 6.160885095596313e-05, 6.445124745368958e-05, 6.729364395141602e-05, 7.013604044914246e-05, 7.29784369468689e-05, 7.582083344459534e-05, 7.866322994232178e-05, 8.150562644004822e-05, 8.434802293777466e-05, 8.71904194355011e-05, 9.003281593322754e-05, 9.287521243095398e-05, 9.571760892868042e-05, 9.856000542640686e-05, 0.0001014024019241333, 0.00010424479842185974, 0.00010708719491958618, 0.00010992959141731262, 0.00011277198791503906]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 13.0, 5.0, 12.0, 21.0, 28.0, 44.0, 70.0, 75.0, 142.0, 214.0, 394.0, 764.0, 1500.0, 3631.0, 11477.0, 73449.0, 806865.0, 125895.0, 15580.0, 4546.0, 1796.0, 897.0, 462.0, 239.0, 145.0, 91.0, 54.0, 30.0, 28.0, 26.0, 20.0, 8.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.339599609375, -0.3281288146972656, -0.31665802001953125, -0.3051872253417969, -0.2937164306640625, -0.2822456359863281, -0.27077484130859375, -0.2593040466308594, -0.247833251953125, -0.23636245727539062, -0.22489166259765625, -0.21342086791992188, -0.2019500732421875, -0.19047927856445312, -0.17900848388671875, -0.16753768920898438, -0.15606689453125, -0.14459609985351562, -0.13312530517578125, -0.12165451049804688, -0.1101837158203125, -0.09871292114257812, -0.08724212646484375, -0.07577133178710938, -0.064300537109375, -0.052829742431640625, -0.04135894775390625, -0.029888153076171875, -0.0184173583984375, -0.006946563720703125, 0.00452423095703125, 0.015995025634765625, 0.0274658203125, 0.038936614990234375, 0.05040740966796875, 0.061878204345703125, 0.0733489990234375, 0.08481979370117188, 0.09629058837890625, 0.10776138305664062, 0.119232177734375, 0.13070297241210938, 0.14217376708984375, 0.15364456176757812, 0.1651153564453125, 0.17658615112304688, 0.18805694580078125, 0.19952774047851562, 0.21099853515625, 0.22246932983398438, 0.23394012451171875, 0.24541091918945312, 0.2568817138671875, 0.2683525085449219, 0.27982330322265625, 0.2912940979003906, 0.302764892578125, 0.3142356872558594, 0.32570648193359375, 0.3371772766113281, 0.3486480712890625, 0.3601188659667969, 0.37158966064453125, 0.3830604553222656, 0.39453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 7.0, 2.0, 3.0, 7.0, 8.0, 15.0, 10.0, 13.0, 26.0, 16.0, 39.0, 39.0, 50.0, 64.0, 96.0, 109.0, 92.0, 77.0, 69.0, 59.0, 40.0, 28.0, 29.0, 18.0, 16.0, 16.0, 10.0, 9.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.278564453125, -0.27008056640625, -0.2615966796875, -0.25311279296875, -0.24462890625, -0.23614501953125, -0.2276611328125, -0.21917724609375, -0.210693359375, -0.20220947265625, -0.1937255859375, -0.18524169921875, -0.1767578125, -0.16827392578125, -0.1597900390625, -0.15130615234375, -0.142822265625, -0.13433837890625, -0.1258544921875, -0.11737060546875, -0.10888671875, -0.10040283203125, -0.0919189453125, -0.08343505859375, -0.074951171875, -0.06646728515625, -0.0579833984375, -0.04949951171875, -0.041015625, -0.03253173828125, -0.0240478515625, -0.01556396484375, -0.007080078125, 0.00140380859375, 0.0098876953125, 0.01837158203125, 0.02685546875, 0.03533935546875, 0.0438232421875, 0.05230712890625, 0.060791015625, 0.06927490234375, 0.0777587890625, 0.08624267578125, 0.0947265625, 0.10321044921875, 0.1116943359375, 0.12017822265625, 0.128662109375, 0.13714599609375, 0.1456298828125, 0.15411376953125, 0.16259765625, 0.17108154296875, 0.1795654296875, 0.18804931640625, 0.196533203125, 0.20501708984375, 0.2135009765625, 0.22198486328125, 0.23046875, 0.23895263671875, 0.2474365234375, 0.25592041015625, 0.264404296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 10.0, 12.0, 32.0, 120.0, 370.0, 301.0, 106.0, 27.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.280471801757812, -10.916205406188965, -10.5519380569458, -10.187671661376953, -9.823404312133789, -9.459137916564941, -9.094870567321777, -8.73060417175293, -8.366336822509766, -8.002070426940918, -7.637803077697754, -7.273536205291748, -6.909269332885742, -6.545002460479736, -6.1807355880737305, -5.816469192504883, -5.452202320098877, -5.087935447692871, -4.723668575286865, -4.359401702880859, -3.9951348304748535, -3.6308679580688477, -3.266601324081421, -2.902334451675415, -2.538067579269409, -2.1738007068634033, -1.8095338344573975, -1.4452670812606812, -1.0810002088546753, -0.7167333364486694, -0.3524665832519531, 0.011800289154052734, 0.3760671615600586, 0.7403340339660645, 1.1046009063720703, 1.4688676595687866, 1.8331345319747925, 2.197401523590088, 2.5616681575775146, 2.9259350299835205, 3.2902019023895264, 3.6544687747955322, 4.018735408782959, 4.383002281188965, 4.747269153594971, 5.111536026000977, 5.475802898406982, 5.840069770812988, 6.204336643218994, 6.568603515625, 6.932870388031006, 7.297137260437012, 7.661404132843018, 8.025671005249023, 8.389937400817871, 8.754204750061035, 9.118471145629883, 9.48273754119873, 9.847004890441895, 10.211271286010742, 10.575538635253906, 10.939805030822754, 11.304072380065918, 11.668338775634766, 12.03260612487793]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 8.0, 3.0, 10.0, 8.0, 2.0, 9.0, 16.0, 13.0, 11.0, 8.0, 28.0, 18.0, 23.0, 18.0, 28.0, 25.0, 30.0, 28.0, 34.0, 43.0, 40.0, 47.0, 63.0, 42.0, 50.0, 49.0, 37.0, 29.0, 35.0, 35.0, 28.0, 20.0, 23.0, 20.0, 19.0, 13.0, 11.0, 13.0, 9.0, 9.0, 10.0, 4.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2793970108032227, -2.205794095993042, -2.1321909427642822, -2.0585880279541016, -1.9849849939346313, -1.9113819599151611, -1.837778925895691, -1.7641758918762207, -1.69057297706604, -1.6169699430465698, -1.5433669090270996, -1.469763994216919, -1.3961609601974487, -1.3225579261779785, -1.2489548921585083, -1.175351858139038, -1.1017488241195679, -1.0281457901000977, -0.9545428156852722, -0.880939781665802, -0.8073368072509766, -0.7337337732315063, -0.6601307392120361, -0.5865277647972107, -0.5129247307777405, -0.43932172656059265, -0.3657187223434448, -0.2921156883239746, -0.21851268410682678, -0.14490967988967896, -0.07130664587020874, 0.0022963285446166992, 0.07589936256408691, 0.14950236678123474, 0.22310538589954376, 0.2967084050178528, 0.3703114092350006, 0.44391441345214844, 0.5175174474716187, 0.5911204218864441, 0.6647234559059143, 0.7383264899253845, 0.81192946434021, 0.8855324983596802, 0.9591355323791504, 1.032738447189331, 1.1063416004180908, 1.1799445152282715, 1.2535475492477417, 1.327150583267212, 1.4007536172866821, 1.4743566513061523, 1.547959566116333, 1.6215626001358032, 1.6951656341552734, 1.768768548965454, 1.8423717021942139, 1.915974736213684, 1.9895777702331543, 2.063180685043335, 2.1367838382720947, 2.2103867530822754, 2.283989906311035, 2.357592821121216, 2.4311957359313965]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 18.0, 26.0, 70.0, 181.0, 558.0, 2111.0, 12858.0, 232217.0, 3786273.0, 148121.0, 9522.0, 1588.0, 381.0, 161.0, 68.0, 31.0, 18.0, 20.0, 8.0, 6.0, 8.0, 9.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.327392578125, -0.3061943054199219, -0.28499603271484375, -0.2637977600097656, -0.2425994873046875, -0.22140121459960938, -0.20020294189453125, -0.17900466918945312, -0.157806396484375, -0.13660812377929688, -0.11540985107421875, -0.09421157836914062, -0.0730133056640625, -0.051815032958984375, -0.03061676025390625, -0.009418487548828125, 0.01177978515625, 0.032978057861328125, 0.05417633056640625, 0.07537460327148438, 0.0965728759765625, 0.11777114868164062, 0.13896942138671875, 0.16016769409179688, 0.181365966796875, 0.20256423950195312, 0.22376251220703125, 0.24496078491210938, 0.2661590576171875, 0.2873573303222656, 0.30855560302734375, 0.3297538757324219, 0.3509521484375, 0.3721504211425781, 0.39334869384765625, 0.4145469665527344, 0.4357452392578125, 0.4569435119628906, 0.47814178466796875, 0.4993400573730469, 0.520538330078125, 0.5417366027832031, 0.5629348754882812, 0.5841331481933594, 0.6053314208984375, 0.6265296936035156, 0.6477279663085938, 0.6689262390136719, 0.69012451171875, 0.7113227844238281, 0.7325210571289062, 0.7537193298339844, 0.7749176025390625, 0.7961158752441406, 0.8173141479492188, 0.8385124206542969, 0.859710693359375, 0.8809089660644531, 0.9021072387695312, 0.9233055114746094, 0.9445037841796875, 0.9657020568847656, 0.9869003295898438, 1.0080986022949219, 1.029296875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 13.0, 18.0, 24.0, 22.0, 29.0, 51.0, 57.0, 66.0, 71.0, 69.0, 82.0, 69.0, 69.0, 60.0, 59.0, 59.0, 51.0, 45.0, 26.0, 16.0, 18.0, 13.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.1355609893798828, -0.12842178344726562, -0.12128257751464844, -0.11414337158203125, -0.10700416564941406, -0.09986495971679688, -0.09272575378417969, -0.0855865478515625, -0.07844734191894531, -0.07130813598632812, -0.06416893005371094, -0.05702972412109375, -0.04989051818847656, -0.042751312255859375, -0.03561210632324219, -0.028472900390625, -0.021333694458007812, -0.014194488525390625, -0.0070552825927734375, 8.392333984375e-05, 0.0072231292724609375, 0.014362335205078125, 0.021501541137695312, 0.0286407470703125, 0.03577995300292969, 0.042919158935546875, 0.05005836486816406, 0.05719757080078125, 0.06433677673339844, 0.07147598266601562, 0.07861518859863281, 0.08575439453125, 0.09289360046386719, 0.10003280639648438, 0.10717201232910156, 0.11431121826171875, 0.12145042419433594, 0.12858963012695312, 0.1357288360595703, 0.1428680419921875, 0.1500072479248047, 0.15714645385742188, 0.16428565979003906, 0.17142486572265625, 0.17856407165527344, 0.18570327758789062, 0.1928424835205078, 0.199981689453125, 0.2071208953857422, 0.21426010131835938, 0.22139930725097656, 0.22853851318359375, 0.23567771911621094, 0.24281692504882812, 0.2499561309814453, 0.2570953369140625, 0.2642345428466797, 0.2713737487792969, 0.27851295471191406, 0.28565216064453125, 0.29279136657714844, 0.2999305725097656, 0.3070697784423828, 0.314208984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 6.0, 15.0, 15.0, 33.0, 66.0, 103.0, 160.0, 280.0, 587.0, 1265.0, 3535.0, 11796.0, 56801.0, 558943.0, 3251781.0, 262110.0, 34565.0, 7692.0, 2391.0, 923.0, 512.0, 279.0, 150.0, 90.0, 54.0, 40.0, 25.0, 17.0, 14.0, 13.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.66845703125, -0.6518974304199219, -0.6353378295898438, -0.6187782287597656, -0.6022186279296875, -0.5856590270996094, -0.5690994262695312, -0.5525398254394531, -0.535980224609375, -0.5194206237792969, -0.5028610229492188, -0.4863014221191406, -0.4697418212890625, -0.4531822204589844, -0.43662261962890625, -0.4200630187988281, -0.40350341796875, -0.3869438171386719, -0.37038421630859375, -0.3538246154785156, -0.3372650146484375, -0.3207054138183594, -0.30414581298828125, -0.2875862121582031, -0.271026611328125, -0.2544670104980469, -0.23790740966796875, -0.22134780883789062, -0.2047882080078125, -0.18822860717773438, -0.17166900634765625, -0.15510940551757812, -0.1385498046875, -0.12199020385742188, -0.10543060302734375, -0.08887100219726562, -0.0723114013671875, -0.055751800537109375, -0.03919219970703125, -0.022632598876953125, -0.006072998046875, 0.010486602783203125, 0.02704620361328125, 0.043605804443359375, 0.0601654052734375, 0.07672500610351562, 0.09328460693359375, 0.10984420776367188, 0.12640380859375, 0.14296340942382812, 0.15952301025390625, 0.17608261108398438, 0.1926422119140625, 0.20920181274414062, 0.22576141357421875, 0.24232101440429688, 0.258880615234375, 0.2754402160644531, 0.29199981689453125, 0.3085594177246094, 0.3251190185546875, 0.3416786193847656, 0.35823822021484375, 0.3747978210449219, 0.391357421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 15.0, 11.0, 14.0, 24.0, 26.0, 40.0, 44.0, 93.0, 121.0, 227.0, 346.0, 575.0, 767.0, 643.0, 401.0, 260.0, 159.0, 101.0, 58.0, 54.0, 25.0, 24.0, 12.0, 11.0, 5.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349365234375, -0.3316078186035156, -0.31385040283203125, -0.2960929870605469, -0.2783355712890625, -0.2605781555175781, -0.24282073974609375, -0.22506332397460938, -0.207305908203125, -0.18954849243164062, -0.17179107666015625, -0.15403366088867188, -0.1362762451171875, -0.11851882934570312, -0.10076141357421875, -0.08300399780273438, -0.06524658203125, -0.047489166259765625, -0.02973175048828125, -0.011974334716796875, 0.0057830810546875, 0.023540496826171875, 0.04129791259765625, 0.059055328369140625, 0.076812744140625, 0.09457015991210938, 0.11232757568359375, 0.13008499145507812, 0.1478424072265625, 0.16559982299804688, 0.18335723876953125, 0.20111465454101562, 0.2188720703125, 0.23662948608398438, 0.25438690185546875, 0.2721443176269531, 0.2899017333984375, 0.3076591491699219, 0.32541656494140625, 0.3431739807128906, 0.360931396484375, 0.3786888122558594, 0.39644622802734375, 0.4142036437988281, 0.4319610595703125, 0.4497184753417969, 0.46747589111328125, 0.4852333068847656, 0.50299072265625, 0.5207481384277344, 0.5385055541992188, 0.5562629699707031, 0.5740203857421875, 0.5917778015136719, 0.6095352172851562, 0.6272926330566406, 0.645050048828125, 0.6628074645996094, 0.6805648803710938, 0.6983222961425781, 0.7160797119140625, 0.7338371276855469, 0.7515945434570312, 0.7693519592285156, 0.787109375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 12.0, 25.0, 102.0, 233.0, 314.0, 196.0, 66.0, 30.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890057563781738, -11.616432189941406, -11.342806816101074, -11.069180488586426, -10.795555114746094, -10.521929740905762, -10.24830436706543, -9.974678039550781, -9.70105266571045, -9.427427291870117, -9.153801918029785, -8.880175590515137, -8.606550216674805, -8.332924842834473, -8.05929946899414, -7.78567361831665, -7.512048244476318, -7.238422870635986, -6.964797019958496, -6.691171646118164, -6.417545795440674, -6.143920421600342, -5.870294570922852, -5.5966691970825195, -5.3230438232421875, -5.0494184494018555, -4.775792598724365, -4.502167224884033, -4.228541374206543, -3.954916000366211, -3.6812903881073, -3.4076647758483887, -3.1340389251708984, -2.8604133129119873, -2.586787700653076, -2.313162326812744, -2.039536476135254, -1.7659109830856323, -1.4922854900360107, -1.2186598777770996, -0.9450342655181885, -0.6714086532592773, -0.397783100605011, -0.12415754795074463, 0.1494680643081665, 0.42309367656707764, 0.6967191696166992, 0.9703447818756104, 1.2439703941345215, 1.5175960063934326, 1.7912216186523438, 2.064846992492676, 2.338472843170166, 2.612098217010498, 2.885723829269409, 3.1593494415283203, 3.4329750537872314, 3.7066006660461426, 3.9802262783050537, 4.253851890563965, 4.527477264404297, 4.801103115081787, 5.074728488922119, 5.348354339599609, 5.621979713439941]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 7.0, 5.0, 11.0, 10.0, 7.0, 14.0, 22.0, 18.0, 18.0, 22.0, 38.0, 44.0, 37.0, 45.0, 60.0, 63.0, 61.0, 76.0, 57.0, 52.0, 39.0, 47.0, 49.0, 40.0, 41.0, 30.0, 18.0, 11.0, 18.0, 12.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2216415405273438, -3.1345574855804443, -3.047473430633545, -2.9603896141052246, -2.873305559158325, -2.786221504211426, -2.6991376876831055, -2.612053632736206, -2.5249695777893066, -2.4378855228424072, -2.350801467895508, -2.2637176513671875, -2.176633596420288, -2.0895495414733887, -2.0024657249450684, -1.915381669998169, -1.8282976150512695, -1.7412135601043701, -1.6541296243667603, -1.5670456886291504, -1.479961633682251, -1.3928775787353516, -1.3057936429977417, -1.2187097072601318, -1.1316256523132324, -1.044541597366333, -0.9574576616287231, -0.8703736662864685, -0.7832896709442139, -0.6962056756019592, -0.6091216802597046, -0.52203768491745, -0.4349536895751953, -0.3478696942329407, -0.26078569889068604, -0.1737017035484314, -0.08661770820617676, 0.00046628713607788086, 0.08755028247833252, 0.17463427782058716, 0.2617182731628418, 0.34880226850509644, 0.4358862638473511, 0.5229702591896057, 0.6100542545318604, 0.697138249874115, 0.7842222452163696, 0.8713062405586243, 0.9583902359008789, 1.0454742908477783, 1.1325582265853882, 1.219642162322998, 1.3067262172698975, 1.3938102722167969, 1.4808942079544067, 1.5679781436920166, 1.655062198638916, 1.7421462535858154, 1.8292301893234253, 1.9163141250610352, 2.0033981800079346, 2.090482234954834, 2.1775660514831543, 2.2646501064300537, 2.351734161376953]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 5.0, 8.0, 15.0, 25.0, 49.0, 73.0, 117.0, 238.0, 462.0, 932.0, 1953.0, 4339.0, 10561.0, 30138.0, 128568.0, 590304.0, 214991.0, 41786.0, 13783.0, 5619.0, 2323.0, 1073.0, 522.0, 294.0, 141.0, 86.0, 41.0, 26.0, 18.0, 14.0, 6.0, 7.0, 4.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47607421875, -0.4610252380371094, -0.44597625732421875, -0.4309272766113281, -0.4158782958984375, -0.4008293151855469, -0.38578033447265625, -0.3707313537597656, -0.355682373046875, -0.3406333923339844, -0.32558441162109375, -0.3105354309082031, -0.2954864501953125, -0.2804374694824219, -0.26538848876953125, -0.2503395080566406, -0.23529052734375, -0.22024154663085938, -0.20519256591796875, -0.19014358520507812, -0.1750946044921875, -0.16004562377929688, -0.14499664306640625, -0.12994766235351562, -0.114898681640625, -0.09984970092773438, -0.08480072021484375, -0.06975173950195312, -0.0547027587890625, -0.039653778076171875, -0.02460479736328125, -0.009555816650390625, 0.0054931640625, 0.020542144775390625, 0.03559112548828125, 0.050640106201171875, 0.0656890869140625, 0.08073806762695312, 0.09578704833984375, 0.11083602905273438, 0.125885009765625, 0.14093399047851562, 0.15598297119140625, 0.17103195190429688, 0.1860809326171875, 0.20112991333007812, 0.21617889404296875, 0.23122787475585938, 0.24627685546875, 0.2613258361816406, 0.27637481689453125, 0.2914237976074219, 0.3064727783203125, 0.3215217590332031, 0.33657073974609375, 0.3516197204589844, 0.366668701171875, 0.3817176818847656, 0.39676666259765625, 0.4118156433105469, 0.4268646240234375, 0.4419136047363281, 0.45696258544921875, 0.4720115661621094, 0.487060546875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 13.0, 14.0, 15.0, 20.0, 27.0, 29.0, 33.0, 37.0, 42.0, 41.0, 40.0, 42.0, 56.0, 61.0, 44.0, 47.0, 34.0, 53.0, 42.0, 33.0, 43.0, 43.0, 38.0, 27.0, 22.0, 18.0, 15.0, 15.0, 9.0, 12.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.12839889526367188, -0.12313079833984375, -0.11786270141601562, -0.1125946044921875, -0.10732650756835938, -0.10205841064453125, -0.09679031372070312, -0.091522216796875, -0.08625411987304688, -0.08098602294921875, -0.07571792602539062, -0.0704498291015625, -0.06518173217773438, -0.05991363525390625, -0.054645538330078125, -0.04937744140625, -0.044109344482421875, -0.03884124755859375, -0.033573150634765625, -0.0283050537109375, -0.023036956787109375, -0.01776885986328125, -0.012500762939453125, -0.007232666015625, -0.001964569091796875, 0.00330352783203125, 0.008571624755859375, 0.0138397216796875, 0.019107818603515625, 0.02437591552734375, 0.029644012451171875, 0.034912109375, 0.040180206298828125, 0.04544830322265625, 0.050716400146484375, 0.0559844970703125, 0.061252593994140625, 0.06652069091796875, 0.07178878784179688, 0.077056884765625, 0.08232498168945312, 0.08759307861328125, 0.09286117553710938, 0.0981292724609375, 0.10339736938476562, 0.10866546630859375, 0.11393356323242188, 0.11920166015625, 0.12446975708007812, 0.12973785400390625, 0.13500595092773438, 0.1402740478515625, 0.14554214477539062, 0.15081024169921875, 0.15607833862304688, 0.161346435546875, 0.16661453247070312, 0.17188262939453125, 0.17715072631835938, 0.1824188232421875, 0.18768692016601562, 0.19295501708984375, 0.19822311401367188, 0.2034912109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 12.0, 22.0, 17.0, 26.0, 27.0, 49.0, 77.0, 117.0, 216.0, 305.0, 533.0, 1065.0, 2517.0, 8331.0, 44185.0, 801582.0, 164207.0, 17391.0, 4388.0, 1604.0, 734.0, 395.0, 250.0, 148.0, 103.0, 55.0, 51.0, 39.0, 26.0, 15.0, 12.0, 8.0, 8.0, 6.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94287109375, -0.9140777587890625, -0.885284423828125, -0.8564910888671875, -0.82769775390625, -0.7989044189453125, -0.770111083984375, -0.7413177490234375, -0.7125244140625, -0.6837310791015625, -0.654937744140625, -0.6261444091796875, -0.59735107421875, -0.5685577392578125, -0.539764404296875, -0.5109710693359375, -0.482177734375, -0.4533843994140625, -0.424591064453125, -0.3957977294921875, -0.36700439453125, -0.3382110595703125, -0.309417724609375, -0.2806243896484375, -0.2518310546875, -0.2230377197265625, -0.194244384765625, -0.1654510498046875, -0.13665771484375, -0.1078643798828125, -0.079071044921875, -0.0502777099609375, -0.021484375, 0.0073089599609375, 0.036102294921875, 0.0648956298828125, 0.09368896484375, 0.1224822998046875, 0.151275634765625, 0.1800689697265625, 0.2088623046875, 0.2376556396484375, 0.266448974609375, 0.2952423095703125, 0.32403564453125, 0.3528289794921875, 0.381622314453125, 0.4104156494140625, 0.439208984375, 0.4680023193359375, 0.496795654296875, 0.5255889892578125, 0.55438232421875, 0.5831756591796875, 0.611968994140625, 0.6407623291015625, 0.6695556640625, 0.6983489990234375, 0.727142333984375, 0.7559356689453125, 0.78472900390625, 0.8135223388671875, 0.842315673828125, 0.8711090087890625, 0.89990234375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 7.0, 14.0, 11.0, 11.0, 29.0, 20.0, 35.0, 23.0, 38.0, 47.0, 36.0, 40.0, 53.0, 46.0, 56.0, 67.0, 51.0, 42.0, 39.0, 46.0, 38.0, 41.0, 31.0, 27.0, 26.0, 13.0, 18.0, 15.0, 11.0, 12.0, 7.0, 11.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72802734375, -0.7048187255859375, -0.681610107421875, -0.6584014892578125, -0.63519287109375, -0.6119842529296875, -0.588775634765625, -0.5655670166015625, -0.5423583984375, -0.5191497802734375, -0.495941162109375, -0.4727325439453125, -0.44952392578125, -0.4263153076171875, -0.403106689453125, -0.3798980712890625, -0.356689453125, -0.3334808349609375, -0.310272216796875, -0.2870635986328125, -0.26385498046875, -0.2406463623046875, -0.217437744140625, -0.1942291259765625, -0.1710205078125, -0.1478118896484375, -0.124603271484375, -0.1013946533203125, -0.07818603515625, -0.0549774169921875, -0.031768798828125, -0.0085601806640625, 0.0146484375, 0.0378570556640625, 0.061065673828125, 0.0842742919921875, 0.10748291015625, 0.1306915283203125, 0.153900146484375, 0.1771087646484375, 0.2003173828125, 0.2235260009765625, 0.246734619140625, 0.2699432373046875, 0.29315185546875, 0.3163604736328125, 0.339569091796875, 0.3627777099609375, 0.385986328125, 0.4091949462890625, 0.432403564453125, 0.4556121826171875, 0.47882080078125, 0.5020294189453125, 0.525238037109375, 0.5484466552734375, 0.5716552734375, 0.5948638916015625, 0.618072509765625, 0.6412811279296875, 0.66448974609375, 0.6876983642578125, 0.710906982421875, 0.7341156005859375, 0.75732421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 4.0, 6.0, 11.0, 12.0, 21.0, 33.0, 49.0, 110.0, 226.0, 545.0, 1527.0, 6226.0, 51562.0, 857772.0, 116211.0, 10781.0, 2102.0, 771.0, 301.0, 114.0, 64.0, 34.0, 13.0, 11.0, 7.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5523757934570312, -0.5368804931640625, -0.5213851928710938, -0.505889892578125, -0.49039459228515625, -0.4748992919921875, -0.45940399169921875, -0.44390869140625, -0.42841339111328125, -0.4129180908203125, -0.39742279052734375, -0.381927490234375, -0.36643218994140625, -0.3509368896484375, -0.33544158935546875, -0.3199462890625, -0.30445098876953125, -0.2889556884765625, -0.27346038818359375, -0.257965087890625, -0.24246978759765625, -0.2269744873046875, -0.21147918701171875, -0.19598388671875, -0.18048858642578125, -0.1649932861328125, -0.14949798583984375, -0.134002685546875, -0.11850738525390625, -0.1030120849609375, -0.08751678466796875, -0.072021484375, -0.05652618408203125, -0.0410308837890625, -0.02553558349609375, -0.010040283203125, 0.00545501708984375, 0.0209503173828125, 0.03644561767578125, 0.05194091796875, 0.06743621826171875, 0.0829315185546875, 0.09842681884765625, 0.113922119140625, 0.12941741943359375, 0.1449127197265625, 0.16040802001953125, 0.1759033203125, 0.19139862060546875, 0.2068939208984375, 0.22238922119140625, 0.237884521484375, 0.25337982177734375, 0.2688751220703125, 0.28437042236328125, 0.29986572265625, 0.31536102294921875, 0.3308563232421875, 0.34635162353515625, 0.361846923828125, 0.37734222412109375, 0.3928375244140625, 0.40833282470703125, 0.423828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 5.0, 5.0, 4.0, 6.0, 12.0, 13.0, 20.0, 20.0, 25.0, 27.0, 33.0, 43.0, 56.0, 68.0, 72.0, 84.0, 80.0, 78.0, 69.0, 43.0, 49.0, 24.0, 20.0, 15.0, 15.0, 11.0, 13.0, 5.0, 7.0, 7.0, 11.0, 4.0, 5.0, 4.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.371736526489258e-05, -6.15883618593216e-05, -5.945935845375061e-05, -5.7330355048179626e-05, -5.520135164260864e-05, -5.307234823703766e-05, -5.0943344831466675e-05, -4.881434142589569e-05, -4.668533802032471e-05, -4.455633461475372e-05, -4.242733120918274e-05, -4.0298327803611755e-05, -3.816932439804077e-05, -3.604032099246979e-05, -3.3911317586898804e-05, -3.178231418132782e-05, -2.9653310775756836e-05, -2.7524307370185852e-05, -2.5395303964614868e-05, -2.3266300559043884e-05, -2.11372971534729e-05, -1.9008293747901917e-05, -1.6879290342330933e-05, -1.4750286936759949e-05, -1.2621283531188965e-05, -1.0492280125617981e-05, -8.363276720046997e-06, -6.234273314476013e-06, -4.105269908905029e-06, -1.9762665033340454e-06, 1.5273690223693848e-07, 2.2817403078079224e-06, 4.410743713378906e-06, 6.53974711894989e-06, 8.668750524520874e-06, 1.0797753930091858e-05, 1.2926757335662842e-05, 1.5055760741233826e-05, 1.718476414680481e-05, 1.9313767552375793e-05, 2.1442770957946777e-05, 2.357177436351776e-05, 2.5700777769088745e-05, 2.782978117465973e-05, 2.9958784580230713e-05, 3.20877879858017e-05, 3.421679139137268e-05, 3.6345794796943665e-05, 3.847479820251465e-05, 4.060380160808563e-05, 4.2732805013656616e-05, 4.48618084192276e-05, 4.6990811824798584e-05, 4.911981523036957e-05, 5.124881863594055e-05, 5.3377822041511536e-05, 5.550682544708252e-05, 5.7635828852653503e-05, 5.976483225822449e-05, 6.189383566379547e-05, 6.402283906936646e-05, 6.615184247493744e-05, 6.828084588050842e-05, 7.04098492860794e-05, 7.253885269165039e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 7.0, 1.0, 6.0, 10.0, 10.0, 10.0, 24.0, 15.0, 37.0, 41.0, 66.0, 84.0, 148.0, 265.0, 451.0, 758.0, 1581.0, 4064.0, 12503.0, 66736.0, 760560.0, 167404.0, 22892.0, 6157.0, 2295.0, 1084.0, 509.0, 316.0, 143.0, 117.0, 69.0, 43.0, 38.0, 24.0, 19.0, 20.0, 12.0, 10.0, 10.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.3140106201171875, -0.303070068359375, -0.2921295166015625, -0.28118896484375, -0.2702484130859375, -0.259307861328125, -0.2483673095703125, -0.2374267578125, -0.2264862060546875, -0.215545654296875, -0.2046051025390625, -0.19366455078125, -0.1827239990234375, -0.171783447265625, -0.1608428955078125, -0.14990234375, -0.1389617919921875, -0.128021240234375, -0.1170806884765625, -0.10614013671875, -0.0951995849609375, -0.084259033203125, -0.0733184814453125, -0.0623779296875, -0.0514373779296875, -0.040496826171875, -0.0295562744140625, -0.01861572265625, -0.0076751708984375, 0.003265380859375, 0.0142059326171875, 0.025146484375, 0.0360870361328125, 0.047027587890625, 0.0579681396484375, 0.06890869140625, 0.0798492431640625, 0.090789794921875, 0.1017303466796875, 0.1126708984375, 0.1236114501953125, 0.134552001953125, 0.1454925537109375, 0.15643310546875, 0.1673736572265625, 0.178314208984375, 0.1892547607421875, 0.2001953125, 0.2111358642578125, 0.222076416015625, 0.2330169677734375, 0.24395751953125, 0.2548980712890625, 0.265838623046875, 0.2767791748046875, 0.2877197265625, 0.2986602783203125, 0.309600830078125, 0.3205413818359375, 0.33148193359375, 0.3424224853515625, 0.353363037109375, 0.3643035888671875, 0.375244140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 12.0, 15.0, 16.0, 12.0, 20.0, 23.0, 35.0, 57.0, 86.0, 90.0, 110.0, 118.0, 87.0, 73.0, 50.0, 30.0, 26.0, 21.0, 16.0, 15.0, 11.0, 12.0, 10.0, 6.0, 11.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2080078125, -0.19958877563476562, -0.19116973876953125, -0.18275070190429688, -0.1743316650390625, -0.16591262817382812, -0.15749359130859375, -0.14907455444335938, -0.140655517578125, -0.13223648071289062, -0.12381744384765625, -0.11539840698242188, -0.1069793701171875, -0.09856033325195312, -0.09014129638671875, -0.08172225952148438, -0.07330322265625, -0.06488418579101562, -0.05646514892578125, -0.048046112060546875, -0.0396270751953125, -0.031208038330078125, -0.02278900146484375, -0.014369964599609375, -0.005950927734375, 0.002468109130859375, 0.01088714599609375, 0.019306182861328125, 0.0277252197265625, 0.036144256591796875, 0.04456329345703125, 0.052982330322265625, 0.0614013671875, 0.06982040405273438, 0.07823944091796875, 0.08665847778320312, 0.0950775146484375, 0.10349655151367188, 0.11191558837890625, 0.12033462524414062, 0.128753662109375, 0.13717269897460938, 0.14559173583984375, 0.15401077270507812, 0.1624298095703125, 0.17084884643554688, 0.17926788330078125, 0.18768692016601562, 0.19610595703125, 0.20452499389648438, 0.21294403076171875, 0.22136306762695312, 0.2297821044921875, 0.23820114135742188, 0.24662017822265625, 0.2550392150878906, 0.263458251953125, 0.2718772888183594, 0.28029632568359375, 0.2887153625488281, 0.2971343994140625, 0.3055534362792969, 0.31397247314453125, 0.3223915100097656, 0.330810546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 10.0, 40.0, 66.0, 115.0, 286.0, 217.0, 96.0, 65.0, 30.0, 19.0, 8.0, 5.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.227154731750488, -4.062632083892822, -3.8981094360351562, -3.7335870265960693, -3.5690643787384033, -3.4045417308807373, -3.2400193214416504, -3.0754966735839844, -2.9109740257263184, -2.7464513778686523, -2.5819287300109863, -2.4174063205718994, -2.2528836727142334, -2.0883610248565674, -1.923838496208191, -1.7593159675598145, -1.5947933197021484, -1.4302706718444824, -1.265748143196106, -1.1012256145477295, -0.9367029666900635, -0.7721803784370422, -0.607657790184021, -0.44313526153564453, -0.2786126136779785, -0.11409002542495728, 0.050432562828063965, 0.2149551510810852, 0.37947773933410645, 0.5440003275871277, 0.7085229158401489, 0.8730454444885254, 1.0375676155090332, 1.2020902633666992, 1.3666127920150757, 1.5311353206634521, 1.6956579685211182, 1.8601806163787842, 2.024703025817871, 2.189225673675537, 2.353748321533203, 2.518270969390869, 2.682793617248535, 2.847316026687622, 3.011838674545288, 3.176361322402954, 3.340883731842041, 3.505406379699707, 3.669929027557373, 3.834451675415039, 3.998974323272705, 4.163496971130371, 4.328019142150879, 4.492541790008545, 4.657064437866211, 4.821587085723877, 4.986109733581543, 5.150632381439209, 5.315155029296875, 5.479677677154541, 5.644200325012207, 5.808722496032715, 5.973245143890381, 6.137767791748047, 6.302290439605713]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 7.0, 5.0, 8.0, 12.0, 16.0, 8.0, 14.0, 16.0, 20.0, 19.0, 19.0, 27.0, 37.0, 38.0, 33.0, 40.0, 48.0, 54.0, 65.0, 66.0, 57.0, 50.0, 31.0, 42.0, 35.0, 24.0, 26.0, 23.0, 21.0, 21.0, 21.0, 10.0, 15.0, 13.0, 9.0, 7.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5131168365478516, -2.4321579933166504, -2.351199150085449, -2.270240306854248, -2.189281463623047, -2.1083226203918457, -2.0273637771606445, -1.9464048147201538, -1.8654459714889526, -1.7844871282577515, -1.7035282850265503, -1.6225694417953491, -1.5416104793548584, -1.4606516361236572, -1.379692792892456, -1.2987339496612549, -1.2177751064300537, -1.1368162631988525, -1.0558574199676514, -0.9748985171318054, -0.8939396739006042, -0.8129808306694031, -0.7320219278335571, -0.651063084602356, -0.5701042413711548, -0.4891453981399536, -0.40818652510643005, -0.3272276520729065, -0.24626880884170532, -0.16530996561050415, -0.08435109257698059, -0.0033922195434570312, 0.07756686210632324, 0.1585257202386856, 0.23948457837104797, 0.32044345140457153, 0.4014022946357727, 0.4823611378669739, 0.5633200407028198, 0.644278883934021, 0.7252377271652222, 0.8061965703964233, 0.8871554136276245, 0.9681143164634705, 1.0490732192993164, 1.1300320625305176, 1.2109909057617188, 1.29194974899292, 1.372908592224121, 1.4538674354553223, 1.5348262786865234, 1.6157851219177246, 1.6967439651489258, 1.777702808380127, 1.8586617708206177, 1.9396206140518188, 2.0205793380737305, 2.1015381813049316, 2.182497024536133, 2.263455867767334, 2.344414710998535, 2.4253735542297363, 2.5063323974609375, 2.5872912406921387, 2.668250322341919]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 19.0, 29.0, 60.0, 124.0, 255.0, 612.0, 1838.0, 8210.0, 65676.0, 3139621.0, 942284.0, 29159.0, 4500.0, 1106.0, 349.0, 157.0, 90.0, 61.0, 24.0, 26.0, 15.0, 15.0, 4.0, 7.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.36815643310546875, -0.3486175537109375, -0.32907867431640625, -0.309539794921875, -0.29000091552734375, -0.2704620361328125, -0.25092315673828125, -0.23138427734375, -0.21184539794921875, -0.1923065185546875, -0.17276763916015625, -0.153228759765625, -0.13368988037109375, -0.1141510009765625, -0.09461212158203125, -0.0750732421875, -0.05553436279296875, -0.0359954833984375, -0.01645660400390625, 0.003082275390625, 0.02262115478515625, 0.0421600341796875, 0.06169891357421875, 0.08123779296875, 0.10077667236328125, 0.1203155517578125, 0.13985443115234375, 0.159393310546875, 0.17893218994140625, 0.1984710693359375, 0.21800994873046875, 0.237548828125, 0.25708770751953125, 0.2766265869140625, 0.29616546630859375, 0.315704345703125, 0.33524322509765625, 0.3547821044921875, 0.37432098388671875, 0.39385986328125, 0.41339874267578125, 0.4329376220703125, 0.45247650146484375, 0.472015380859375, 0.49155426025390625, 0.5110931396484375, 0.5306320190429688, 0.5501708984375, 0.5697097778320312, 0.5892486572265625, 0.6087875366210938, 0.628326416015625, 0.6478652954101562, 0.6674041748046875, 0.6869430541992188, 0.70648193359375, 0.7260208129882812, 0.7455596923828125, 0.7650985717773438, 0.784637451171875, 0.8041763305664062, 0.8237152099609375, 0.8432540893554688, 0.86279296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 8.0, 13.0, 16.0, 27.0, 34.0, 36.0, 58.0, 45.0, 66.0, 83.0, 87.0, 73.0, 62.0, 73.0, 68.0, 53.0, 55.0, 34.0, 24.0, 23.0, 22.0, 11.0, 7.0, 4.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2071533203125, -0.1992969512939453, -0.19144058227539062, -0.18358421325683594, -0.17572784423828125, -0.16787147521972656, -0.16001510620117188, -0.1521587371826172, -0.1443023681640625, -0.1364459991455078, -0.12858963012695312, -0.12073326110839844, -0.11287689208984375, -0.10502052307128906, -0.09716415405273438, -0.08930778503417969, -0.081451416015625, -0.07359504699707031, -0.06573867797851562, -0.05788230895996094, -0.05002593994140625, -0.04216957092285156, -0.034313201904296875, -0.026456832885742188, -0.0186004638671875, -0.010744094848632812, -0.002887725830078125, 0.0049686431884765625, 0.01282501220703125, 0.020681381225585938, 0.028537750244140625, 0.03639411926269531, 0.04425048828125, 0.05210685729980469, 0.059963226318359375, 0.06781959533691406, 0.07567596435546875, 0.08353233337402344, 0.09138870239257812, 0.09924507141113281, 0.1071014404296875, 0.11495780944824219, 0.12281417846679688, 0.13067054748535156, 0.13852691650390625, 0.14638328552246094, 0.15423965454101562, 0.1620960235595703, 0.169952392578125, 0.1778087615966797, 0.18566513061523438, 0.19352149963378906, 0.20137786865234375, 0.20923423767089844, 0.21709060668945312, 0.2249469757080078, 0.2328033447265625, 0.2406597137451172, 0.24851608276367188, 0.25637245178222656, 0.26422882080078125, 0.27208518981933594, 0.2799415588378906, 0.2877979278564453, 0.295654296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 14.0, 23.0, 38.0, 48.0, 64.0, 129.0, 240.0, 471.0, 1249.0, 5493.0, 115938.0, 3997849.0, 66905.0, 4126.0, 975.0, 365.0, 166.0, 72.0, 46.0, 33.0, 16.0, 11.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4873046875, -1.4486083984375, -1.409912109375, -1.3712158203125, -1.33251953125, -1.2938232421875, -1.255126953125, -1.2164306640625, -1.177734375, -1.1390380859375, -1.100341796875, -1.0616455078125, -1.02294921875, -0.9842529296875, -0.945556640625, -0.9068603515625, -0.8681640625, -0.8294677734375, -0.790771484375, -0.7520751953125, -0.71337890625, -0.6746826171875, -0.635986328125, -0.5972900390625, -0.55859375, -0.5198974609375, -0.481201171875, -0.4425048828125, -0.40380859375, -0.3651123046875, -0.326416015625, -0.2877197265625, -0.2490234375, -0.2103271484375, -0.171630859375, -0.1329345703125, -0.09423828125, -0.0555419921875, -0.016845703125, 0.0218505859375, 0.060546875, 0.0992431640625, 0.137939453125, 0.1766357421875, 0.21533203125, 0.2540283203125, 0.292724609375, 0.3314208984375, 0.3701171875, 0.4088134765625, 0.447509765625, 0.4862060546875, 0.52490234375, 0.5635986328125, 0.602294921875, 0.6409912109375, 0.6796875, 0.7183837890625, 0.757080078125, 0.7957763671875, 0.83447265625, 0.8731689453125, 0.911865234375, 0.9505615234375, 0.9892578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 6.0, 8.0, 32.0, 43.0, 119.0, 223.0, 553.0, 1379.0, 1046.0, 360.0, 142.0, 72.0, 40.0, 23.0, 13.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3285598754882812, -1.2967681884765625, -1.2649765014648438, -1.233184814453125, -1.2013931274414062, -1.1696014404296875, -1.1378097534179688, -1.10601806640625, -1.0742263793945312, -1.0424346923828125, -1.0106430053710938, -0.978851318359375, -0.9470596313476562, -0.9152679443359375, -0.8834762573242188, -0.8516845703125, -0.8198928833007812, -0.7881011962890625, -0.7563095092773438, -0.724517822265625, -0.6927261352539062, -0.6609344482421875, -0.6291427612304688, -0.59735107421875, -0.5655593872070312, -0.5337677001953125, -0.5019760131835938, -0.470184326171875, -0.43839263916015625, -0.4066009521484375, -0.37480926513671875, -0.343017578125, -0.31122589111328125, -0.2794342041015625, -0.24764251708984375, -0.215850830078125, -0.18405914306640625, -0.1522674560546875, -0.12047576904296875, -0.08868408203125, -0.05689239501953125, -0.0251007080078125, 0.00669097900390625, 0.038482666015625, 0.07027435302734375, 0.1020660400390625, 0.13385772705078125, 0.1656494140625, 0.19744110107421875, 0.2292327880859375, 0.26102447509765625, 0.292816162109375, 0.32460784912109375, 0.3563995361328125, 0.38819122314453125, 0.41998291015625, 0.45177459716796875, 0.4835662841796875, 0.5153579711914062, 0.547149658203125, 0.5789413452148438, 0.6107330322265625, 0.6425247192382812, 0.67431640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 8.0, 17.0, 106.0, 286.0, 327.0, 174.0, 44.0, 17.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.782081604003906, -10.484752655029297, -10.187422752380371, -9.890093803405762, -9.592763900756836, -9.295434951782227, -8.9981050491333, -8.700776100158691, -8.403446197509766, -8.106117248535156, -7.8087873458862305, -7.511457920074463, -7.214128494262695, -6.916799545288086, -6.619470119476318, -6.322140693664551, -6.024811744689941, -5.727482318878174, -5.430152893066406, -5.132823467254639, -4.835494041442871, -4.538165092468262, -4.240835666656494, -3.9435062408447266, -3.646176815032959, -3.3488473892211914, -3.051517963409424, -2.7541887760162354, -2.4568593502044678, -2.1595299243927, -1.8622006177902222, -1.5648713111877441, -1.2675418853759766, -0.9702125191688538, -0.672883152961731, -0.37555378675460815, -0.07822442054748535, 0.21910500526428223, 0.5164343118667603, 0.8137636184692383, 1.1110930442810059, 1.4084224700927734, 1.7057517766952515, 2.0030810832977295, 2.300410509109497, 2.5977399349212646, 2.895069122314453, 3.1923985481262207, 3.4897279739379883, 3.787057399749756, 4.084386825561523, 4.381716251373291, 4.679045677185059, 4.976374626159668, 5.2737040519714355, 5.571033477783203, 5.868362903594971, 6.165692329406738, 6.463021755218506, 6.760351181030273, 7.057680130004883, 7.355010032653809, 7.652338981628418, 7.9496684074401855, 8.246997833251953]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 22.0, 28.0, 45.0, 80.0, 103.0, 100.0, 125.0, 136.0, 118.0, 84.0, 65.0, 36.0, 30.0, 10.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.117218494415283, -6.930070400238037, -6.742922782897949, -6.555774688720703, -6.368626594543457, -6.181478500366211, -5.994330883026123, -5.807182788848877, -5.620035171508789, -5.432887077331543, -5.245739459991455, -5.058591365814209, -4.871443271636963, -4.684295654296875, -4.497147560119629, -4.309999465942383, -4.122851371765137, -3.9357035160064697, -3.7485554218292236, -3.5614075660705566, -3.3742594718933105, -3.1871116161346436, -2.9999637603759766, -2.8128156661987305, -2.6256678104400635, -2.4385199546813965, -2.2513718605041504, -2.0642240047454834, -1.8770760297775269, -1.6899280548095703, -1.5027801990509033, -1.3156322240829468, -1.128483772277832, -0.9413357973098755, -0.7541878819465637, -0.567039966583252, -0.3798919916152954, -0.19274401664733887, -0.005596160888671875, 0.18155181407928467, 0.3686997890472412, 0.5558477640151978, 0.7429956793785095, 0.9301435947418213, 1.1172915697097778, 1.3044395446777344, 1.4915874004364014, 1.678735375404358, 1.8658833503723145, 2.0530312061309814, 2.2401793003082275, 2.4273271560668945, 2.6144752502441406, 2.8016231060028076, 2.9887709617614746, 3.1759190559387207, 3.3630669116973877, 3.5502147674560547, 3.737362861633301, 3.9245107173919678, 4.111658573150635, 4.298806667327881, 4.485954284667969, 4.673102378845215, 4.860250473022461]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 10.0, 17.0, 45.0, 119.0, 542.0, 4076.0, 136287.0, 890706.0, 15062.0, 1286.0, 253.0, 78.0, 35.0, 13.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.39794921875, -1.359375, -1.32080078125, -1.2822265625, -1.24365234375, -1.205078125, -1.16650390625, -1.1279296875, -1.08935546875, -1.05078125, -1.01220703125, -0.9736328125, -0.93505859375, -0.896484375, -0.85791015625, -0.8193359375, -0.78076171875, -0.7421875, -0.70361328125, -0.6650390625, -0.62646484375, -0.587890625, -0.54931640625, -0.5107421875, -0.47216796875, -0.43359375, -0.39501953125, -0.3564453125, -0.31787109375, -0.279296875, -0.24072265625, -0.2021484375, -0.16357421875, -0.125, -0.08642578125, -0.0478515625, -0.00927734375, 0.029296875, 0.06787109375, 0.1064453125, 0.14501953125, 0.18359375, 0.22216796875, 0.2607421875, 0.29931640625, 0.337890625, 0.37646484375, 0.4150390625, 0.45361328125, 0.4921875, 0.53076171875, 0.5693359375, 0.60791015625, 0.646484375, 0.68505859375, 0.7236328125, 0.76220703125, 0.80078125, 0.83935546875, 0.8779296875, 0.91650390625, 0.955078125, 0.99365234375, 1.0322265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 8.0, 10.0, 12.0, 22.0, 28.0, 21.0, 22.0, 31.0, 43.0, 42.0, 46.0, 53.0, 54.0, 65.0, 72.0, 59.0, 58.0, 51.0, 54.0, 41.0, 36.0, 39.0, 31.0, 17.0, 28.0, 12.0, 11.0, 5.0, 6.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.184326171875, -0.1776294708251953, -0.17093276977539062, -0.16423606872558594, -0.15753936767578125, -0.15084266662597656, -0.14414596557617188, -0.1374492645263672, -0.1307525634765625, -0.12405586242675781, -0.11735916137695312, -0.11066246032714844, -0.10396575927734375, -0.09726905822753906, -0.09057235717773438, -0.08387565612792969, -0.077178955078125, -0.07048225402832031, -0.06378555297851562, -0.05708885192871094, -0.05039215087890625, -0.04369544982910156, -0.036998748779296875, -0.030302047729492188, -0.0236053466796875, -0.016908645629882812, -0.010211944580078125, -0.0035152435302734375, 0.00318145751953125, 0.009878158569335938, 0.016574859619140625, 0.023271560668945312, 0.02996826171875, 0.03666496276855469, 0.043361663818359375, 0.05005836486816406, 0.05675506591796875, 0.06345176696777344, 0.07014846801757812, 0.07684516906738281, 0.0835418701171875, 0.09023857116699219, 0.09693527221679688, 0.10363197326660156, 0.11032867431640625, 0.11702537536621094, 0.12372207641601562, 0.1304187774658203, 0.137115478515625, 0.1438121795654297, 0.15050888061523438, 0.15720558166503906, 0.16390228271484375, 0.17059898376464844, 0.17729568481445312, 0.1839923858642578, 0.1906890869140625, 0.1973857879638672, 0.20408248901367188, 0.21077919006347656, 0.21747589111328125, 0.22417259216308594, 0.23086929321289062, 0.2375659942626953, 0.2442626953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 9.0, 8.0, 9.0, 14.0, 19.0, 30.0, 32.0, 73.0, 114.0, 200.0, 389.0, 777.0, 1837.0, 5694.0, 29231.0, 368408.0, 595822.0, 35664.0, 6379.0, 2048.0, 831.0, 412.0, 204.0, 119.0, 74.0, 53.0, 29.0, 21.0, 14.0, 14.0, 5.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5888671875, -0.5715713500976562, -0.5542755126953125, -0.5369796752929688, -0.519683837890625, -0.5023880004882812, -0.4850921630859375, -0.46779632568359375, -0.45050048828125, -0.43320465087890625, -0.4159088134765625, -0.39861297607421875, -0.381317138671875, -0.36402130126953125, -0.3467254638671875, -0.32942962646484375, -0.3121337890625, -0.29483795166015625, -0.2775421142578125, -0.26024627685546875, -0.242950439453125, -0.22565460205078125, -0.2083587646484375, -0.19106292724609375, -0.17376708984375, -0.15647125244140625, -0.1391754150390625, -0.12187957763671875, -0.104583740234375, -0.08728790283203125, -0.0699920654296875, -0.05269622802734375, -0.035400390625, -0.01810455322265625, -0.0008087158203125, 0.01648712158203125, 0.033782958984375, 0.05107879638671875, 0.0683746337890625, 0.08567047119140625, 0.10296630859375, 0.12026214599609375, 0.1375579833984375, 0.15485382080078125, 0.172149658203125, 0.18944549560546875, 0.2067413330078125, 0.22403717041015625, 0.2413330078125, 0.25862884521484375, 0.2759246826171875, 0.29322052001953125, 0.310516357421875, 0.32781219482421875, 0.3451080322265625, 0.36240386962890625, 0.37969970703125, 0.39699554443359375, 0.4142913818359375, 0.43158721923828125, 0.448883056640625, 0.46617889404296875, 0.4834747314453125, 0.5007705688476562, 0.51806640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 3.0, 9.0, 8.0, 11.0, 12.0, 13.0, 14.0, 21.0, 20.0, 33.0, 34.0, 40.0, 41.0, 29.0, 44.0, 65.0, 51.0, 62.0, 52.0, 56.0, 36.0, 45.0, 55.0, 40.0, 46.0, 26.0, 26.0, 13.0, 21.0, 14.0, 16.0, 8.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6982421875, -0.6750259399414062, -0.6518096923828125, -0.6285934448242188, -0.605377197265625, -0.5821609497070312, -0.5589447021484375, -0.5357284545898438, -0.51251220703125, -0.48929595947265625, -0.4660797119140625, -0.44286346435546875, -0.419647216796875, -0.39643096923828125, -0.3732147216796875, -0.34999847412109375, -0.3267822265625, -0.30356597900390625, -0.2803497314453125, -0.25713348388671875, -0.233917236328125, -0.21070098876953125, -0.1874847412109375, -0.16426849365234375, -0.14105224609375, -0.11783599853515625, -0.0946197509765625, -0.07140350341796875, -0.048187255859375, -0.02497100830078125, -0.0017547607421875, 0.02146148681640625, 0.044677734375, 0.06789398193359375, 0.0911102294921875, 0.11432647705078125, 0.137542724609375, 0.16075897216796875, 0.1839752197265625, 0.20719146728515625, 0.23040771484375, 0.25362396240234375, 0.2768402099609375, 0.30005645751953125, 0.323272705078125, 0.34648895263671875, 0.3697052001953125, 0.39292144775390625, 0.4161376953125, 0.43935394287109375, 0.4625701904296875, 0.48578643798828125, 0.509002685546875, 0.5322189331054688, 0.5554351806640625, 0.5786514282226562, 0.60186767578125, 0.6250839233398438, 0.6483001708984375, 0.6715164184570312, 0.694732666015625, 0.7179489135742188, 0.7411651611328125, 0.7643814086914062, 0.78759765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 4.0, 7.0, 11.0, 10.0, 21.0, 27.0, 50.0, 83.0, 150.0, 355.0, 988.0, 3209.0, 14064.0, 137069.0, 829250.0, 51851.0, 8042.0, 2082.0, 701.0, 261.0, 124.0, 58.0, 38.0, 26.0, 14.0, 12.0, 6.0, 4.0, 4.0, 2.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.38916015625, -0.378143310546875, -0.36712646484375, -0.356109619140625, -0.3450927734375, -0.334075927734375, -0.32305908203125, -0.312042236328125, -0.301025390625, -0.290008544921875, -0.27899169921875, -0.267974853515625, -0.2569580078125, -0.245941162109375, -0.23492431640625, -0.223907470703125, -0.212890625, -0.201873779296875, -0.19085693359375, -0.179840087890625, -0.1688232421875, -0.157806396484375, -0.14678955078125, -0.135772705078125, -0.124755859375, -0.113739013671875, -0.10272216796875, -0.091705322265625, -0.0806884765625, -0.069671630859375, -0.05865478515625, -0.047637939453125, -0.03662109375, -0.025604248046875, -0.01458740234375, -0.003570556640625, 0.0074462890625, 0.018463134765625, 0.02947998046875, 0.040496826171875, 0.051513671875, 0.062530517578125, 0.07354736328125, 0.084564208984375, 0.0955810546875, 0.106597900390625, 0.11761474609375, 0.128631591796875, 0.1396484375, 0.150665283203125, 0.16168212890625, 0.172698974609375, 0.1837158203125, 0.194732666015625, 0.20574951171875, 0.216766357421875, 0.227783203125, 0.238800048828125, 0.24981689453125, 0.260833740234375, 0.2718505859375, 0.282867431640625, 0.29388427734375, 0.304901123046875, 0.31591796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 5.0, 2.0, 6.0, 16.0, 9.0, 15.0, 16.0, 26.0, 34.0, 51.0, 48.0, 86.0, 96.0, 102.0, 94.0, 94.0, 85.0, 49.0, 44.0, 26.0, 20.0, 14.0, 14.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.461143493652344e-05, -6.275344640016556e-05, -6.089545786380768e-05, -5.90374693274498e-05, -5.717948079109192e-05, -5.532149225473404e-05, -5.346350371837616e-05, -5.160551518201828e-05, -4.97475266456604e-05, -4.788953810930252e-05, -4.603154957294464e-05, -4.417356103658676e-05, -4.231557250022888e-05, -4.0457583963871e-05, -3.859959542751312e-05, -3.674160689115524e-05, -3.488361835479736e-05, -3.3025629818439484e-05, -3.1167641282081604e-05, -2.9309652745723724e-05, -2.7451664209365845e-05, -2.5593675673007965e-05, -2.3735687136650085e-05, -2.1877698600292206e-05, -2.0019710063934326e-05, -1.8161721527576447e-05, -1.6303732991218567e-05, -1.4445744454860687e-05, -1.2587755918502808e-05, -1.0729767382144928e-05, -8.871778845787048e-06, -7.013790309429169e-06, -5.155801773071289e-06, -3.2978132367134094e-06, -1.4398247003555298e-06, 4.1816383600234985e-07, 2.2761523723602295e-06, 4.134140908718109e-06, 5.992129445075989e-06, 7.850117981433868e-06, 9.708106517791748e-06, 1.1566095054149628e-05, 1.3424083590507507e-05, 1.5282072126865387e-05, 1.7140060663223267e-05, 1.8998049199581146e-05, 2.0856037735939026e-05, 2.2714026272296906e-05, 2.4572014808654785e-05, 2.6430003345012665e-05, 2.8287991881370544e-05, 3.0145980417728424e-05, 3.2003968954086304e-05, 3.386195749044418e-05, 3.571994602680206e-05, 3.757793456315994e-05, 3.943592309951782e-05, 4.12939116358757e-05, 4.315190017223358e-05, 4.500988870859146e-05, 4.686787724494934e-05, 4.872586578130722e-05, 5.05838543176651e-05, 5.244184285402298e-05, 5.429983139038086e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 10.0, 14.0, 18.0, 38.0, 58.0, 118.0, 197.0, 418.0, 1162.0, 4251.0, 22322.0, 372065.0, 615290.0, 25582.0, 4626.0, 1309.0, 530.0, 225.0, 134.0, 74.0, 41.0, 21.0, 16.0, 8.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4251213073730469, -0.41298675537109375, -0.4008522033691406, -0.3887176513671875, -0.3765830993652344, -0.36444854736328125, -0.3523139953613281, -0.340179443359375, -0.3280448913574219, -0.31591033935546875, -0.3037757873535156, -0.2916412353515625, -0.2795066833496094, -0.26737213134765625, -0.2552375793457031, -0.24310302734375, -0.23096847534179688, -0.21883392333984375, -0.20669937133789062, -0.1945648193359375, -0.18243026733398438, -0.17029571533203125, -0.15816116333007812, -0.146026611328125, -0.13389205932617188, -0.12175750732421875, -0.10962295532226562, -0.0974884033203125, -0.08535385131835938, -0.07321929931640625, -0.061084747314453125, -0.0489501953125, -0.036815643310546875, -0.02468109130859375, -0.012546539306640625, -0.0004119873046875, 0.011722564697265625, 0.02385711669921875, 0.035991668701171875, 0.048126220703125, 0.060260772705078125, 0.07239532470703125, 0.08452987670898438, 0.0966644287109375, 0.10879898071289062, 0.12093353271484375, 0.13306808471679688, 0.14520263671875, 0.15733718872070312, 0.16947174072265625, 0.18160629272460938, 0.1937408447265625, 0.20587539672851562, 0.21800994873046875, 0.23014450073242188, 0.242279052734375, 0.2544136047363281, 0.26654815673828125, 0.2786827087402344, 0.2908172607421875, 0.3029518127441406, 0.31508636474609375, 0.3272209167480469, 0.33935546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 10.0, 6.0, 12.0, 17.0, 40.0, 60.0, 112.0, 152.0, 176.0, 133.0, 112.0, 58.0, 35.0, 24.0, 16.0, 13.0, 7.0, 6.0, 6.0, 0.0, 5.0, 5.0, 3.0, 4.0], "bins": [-0.5380859375, -0.5270023345947266, -0.5159187316894531, -0.5048351287841797, -0.49375152587890625, -0.4826679229736328, -0.4715843200683594, -0.46050071716308594, -0.4494171142578125, -0.43833351135253906, -0.4272499084472656, -0.4161663055419922, -0.40508270263671875, -0.3939990997314453, -0.3829154968261719, -0.37183189392089844, -0.360748291015625, -0.34966468811035156, -0.3385810852050781, -0.3274974822998047, -0.31641387939453125, -0.3053302764892578, -0.2942466735839844, -0.28316307067871094, -0.2720794677734375, -0.26099586486816406, -0.24991226196289062, -0.2388286590576172, -0.22774505615234375, -0.2166614532470703, -0.20557785034179688, -0.19449424743652344, -0.18341064453125, -0.17232704162597656, -0.16124343872070312, -0.1501598358154297, -0.13907623291015625, -0.1279926300048828, -0.11690902709960938, -0.10582542419433594, -0.0947418212890625, -0.08365821838378906, -0.07257461547851562, -0.06149101257324219, -0.05040740966796875, -0.03932380676269531, -0.028240203857421875, -0.017156600952148438, -0.006072998046875, 0.0050106048583984375, 0.016094207763671875, 0.027177810668945312, 0.03826141357421875, 0.04934501647949219, 0.060428619384765625, 0.07151222229003906, 0.0825958251953125, 0.09367942810058594, 0.10476303100585938, 0.11584663391113281, 0.12693023681640625, 0.1380138397216797, 0.14909744262695312, 0.16018104553222656, 0.1712646484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 10.0, 41.0, 181.0, 552.0, 166.0, 33.0, 15.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33070182800293, -4.985713958740234, -4.640725612640381, -4.2957377433776855, -3.9507498741149902, -3.605761766433716, -3.2607736587524414, -2.915785789489746, -2.5707976818084717, -2.2258095741271973, -1.880821704864502, -1.5358335971832275, -1.1908456087112427, -0.8458576202392578, -0.5008695125579834, -0.15588164329528809, 0.18910646438598633, 0.5340944528579712, 0.8790825009346008, 1.2240705490112305, 1.5690585374832153, 1.9140465259552002, 2.2590346336364746, 2.60402250289917, 2.9490106105804443, 3.2939987182617188, 3.638986587524414, 3.9839746952056885, 4.328962802886963, 4.673950672149658, 5.018939018249512, 5.363926887512207, 5.708914756774902, 6.053902626037598, 6.398890972137451, 6.7438788414001465, 7.088866710662842, 7.433855056762695, 7.778842926025391, 8.123830795288086, 8.468818664550781, 8.813806533813477, 9.158794403076172, 9.503782272338867, 9.848771095275879, 10.193758964538574, 10.53874683380127, 10.883734703063965, 11.228723526000977, 11.573711395263672, 11.918699264526367, 12.263687133789062, 12.608675956726074, 12.95366382598877, 13.298651695251465, 13.64363956451416, 13.988627433776855, 14.33361530303955, 14.678603172302246, 15.023591995239258, 15.368579864501953, 15.713567733764648, 16.058555603027344, 16.40354347229004, 16.748531341552734]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 8.0, 9.0, 10.0, 8.0, 11.0, 14.0, 14.0, 27.0, 19.0, 30.0, 22.0, 32.0, 27.0, 31.0, 44.0, 58.0, 54.0, 66.0, 83.0, 79.0, 45.0, 45.0, 36.0, 33.0, 32.0, 27.0, 16.0, 15.0, 24.0, 18.0, 11.0, 11.0, 4.0, 8.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.987886428833008, -2.9050605297088623, -2.8222343921661377, -2.739408493041992, -2.6565823554992676, -2.573756456375122, -2.4909305572509766, -2.408104419708252, -2.3252785205841064, -2.242452621459961, -2.1596264839172363, -2.076800584793091, -1.9939745664596558, -1.9111485481262207, -1.8283226490020752, -1.7454966306686401, -1.662670612335205, -1.57984459400177, -1.497018575668335, -1.4141926765441895, -1.3313666582107544, -1.2485406398773193, -1.1657147407531738, -1.0828887224197388, -1.0000627040863037, -0.9172366857528687, -0.8344107270240784, -0.7515847682952881, -0.668758749961853, -0.585932731628418, -0.5031067728996277, -0.4202808141708374, -0.33745479583740234, -0.2546288073062897, -0.171802818775177, -0.08897683024406433, -0.00615084171295166, 0.07667514681816101, 0.15950113534927368, 0.24232709407806396, 0.325153112411499, 0.4079791009426117, 0.49080508947372437, 0.5736310482025146, 0.6564570665359497, 0.7392830848693848, 0.822109043598175, 0.9049350023269653, 0.9877610206604004, 1.0705870389938354, 1.1534130573272705, 1.236238956451416, 1.319064974784851, 1.4018909931182861, 1.4847168922424316, 1.5675429105758667, 1.6503689289093018, 1.7331949472427368, 1.8160209655761719, 1.8988468647003174, 1.9816728830337524, 2.0644989013671875, 2.147324800491333, 2.2301506996154785, 2.312976837158203]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 10.0, 8.0, 33.0, 53.0, 93.0, 174.0, 431.0, 1372.0, 5195.0, 25227.0, 370052.0, 3573447.0, 195782.0, 16998.0, 3585.0, 1046.0, 379.0, 158.0, 75.0, 45.0, 28.0, 19.0, 15.0, 8.0, 3.0, 2.0, 7.0, 5.0, 0.0, 1.0, 8.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.331298828125, -0.3150672912597656, -0.29883575439453125, -0.2826042175292969, -0.2663726806640625, -0.2501411437988281, -0.23390960693359375, -0.21767807006835938, -0.201446533203125, -0.18521499633789062, -0.16898345947265625, -0.15275192260742188, -0.1365203857421875, -0.12028884887695312, -0.10405731201171875, -0.08782577514648438, -0.07159423828125, -0.055362701416015625, -0.03913116455078125, -0.022899627685546875, -0.0066680908203125, 0.009563446044921875, 0.02579498291015625, 0.042026519775390625, 0.058258056640625, 0.07448959350585938, 0.09072113037109375, 0.10695266723632812, 0.1231842041015625, 0.13941574096679688, 0.15564727783203125, 0.17187881469726562, 0.1881103515625, 0.20434188842773438, 0.22057342529296875, 0.23680496215820312, 0.2530364990234375, 0.2692680358886719, 0.28549957275390625, 0.3017311096191406, 0.317962646484375, 0.3341941833496094, 0.35042572021484375, 0.3666572570800781, 0.3828887939453125, 0.3991203308105469, 0.41535186767578125, 0.4315834045410156, 0.44781494140625, 0.4640464782714844, 0.48027801513671875, 0.4965095520019531, 0.5127410888671875, 0.5289726257324219, 0.5452041625976562, 0.5614356994628906, 0.577667236328125, 0.5938987731933594, 0.6101303100585938, 0.6263618469238281, 0.6425933837890625, 0.6588249206542969, 0.6750564575195312, 0.6912879943847656, 0.70751953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 13.0, 8.0, 12.0, 20.0, 20.0, 16.0, 19.0, 39.0, 43.0, 52.0, 60.0, 61.0, 61.0, 67.0, 79.0, 70.0, 59.0, 48.0, 51.0, 40.0, 38.0, 32.0, 25.0, 22.0, 13.0, 12.0, 7.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17041015625, -0.16330337524414062, -0.15619659423828125, -0.14908981323242188, -0.1419830322265625, -0.13487625122070312, -0.12776947021484375, -0.12066268920898438, -0.113555908203125, -0.10644912719726562, -0.09934234619140625, -0.09223556518554688, -0.0851287841796875, -0.07802200317382812, -0.07091522216796875, -0.06380844116210938, -0.05670166015625, -0.049594879150390625, -0.04248809814453125, -0.035381317138671875, -0.0282745361328125, -0.021167755126953125, -0.01406097412109375, -0.006954193115234375, 0.000152587890625, 0.007259368896484375, 0.01436614990234375, 0.021472930908203125, 0.0285797119140625, 0.035686492919921875, 0.04279327392578125, 0.049900054931640625, 0.0570068359375, 0.06411361694335938, 0.07122039794921875, 0.07832717895507812, 0.0854339599609375, 0.09254074096679688, 0.09964752197265625, 0.10675430297851562, 0.113861083984375, 0.12096786499023438, 0.12807464599609375, 0.13518142700195312, 0.1422882080078125, 0.14939498901367188, 0.15650177001953125, 0.16360855102539062, 0.17071533203125, 0.17782211303710938, 0.18492889404296875, 0.19203567504882812, 0.1991424560546875, 0.20624923706054688, 0.21335601806640625, 0.22046279907226562, 0.227569580078125, 0.23467636108398438, 0.24178314208984375, 0.24888992309570312, 0.2559967041015625, 0.2631034851074219, 0.27021026611328125, 0.2773170471191406, 0.284423828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 9.0, 10.0, 10.0, 9.0, 17.0, 20.0, 32.0, 50.0, 63.0, 143.0, 217.0, 555.0, 1463.0, 5210.0, 26203.0, 251568.0, 3610045.0, 263645.0, 26863.0, 5386.0, 1512.0, 588.0, 261.0, 146.0, 91.0, 43.0, 24.0, 19.0, 17.0, 11.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4599609375, -0.441192626953125, -0.42242431640625, -0.403656005859375, -0.3848876953125, -0.366119384765625, -0.34735107421875, -0.328582763671875, -0.309814453125, -0.291046142578125, -0.27227783203125, -0.253509521484375, -0.2347412109375, -0.215972900390625, -0.19720458984375, -0.178436279296875, -0.15966796875, -0.140899658203125, -0.12213134765625, -0.103363037109375, -0.0845947265625, -0.065826416015625, -0.04705810546875, -0.028289794921875, -0.009521484375, 0.009246826171875, 0.02801513671875, 0.046783447265625, 0.0655517578125, 0.084320068359375, 0.10308837890625, 0.121856689453125, 0.140625, 0.159393310546875, 0.17816162109375, 0.196929931640625, 0.2156982421875, 0.234466552734375, 0.25323486328125, 0.272003173828125, 0.290771484375, 0.309539794921875, 0.32830810546875, 0.347076416015625, 0.3658447265625, 0.384613037109375, 0.40338134765625, 0.422149658203125, 0.44091796875, 0.459686279296875, 0.47845458984375, 0.497222900390625, 0.5159912109375, 0.534759521484375, 0.55352783203125, 0.572296142578125, 0.591064453125, 0.609832763671875, 0.62860107421875, 0.647369384765625, 0.6661376953125, 0.684906005859375, 0.70367431640625, 0.722442626953125, 0.7412109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 10.0, 9.0, 19.0, 9.0, 17.0, 30.0, 27.0, 37.0, 58.0, 97.0, 152.0, 214.0, 358.0, 552.0, 743.0, 579.0, 392.0, 235.0, 153.0, 113.0, 65.0, 52.0, 33.0, 18.0, 27.0, 12.0, 11.0, 13.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.45654296875, -0.4429473876953125, -0.429351806640625, -0.4157562255859375, -0.40216064453125, -0.3885650634765625, -0.374969482421875, -0.3613739013671875, -0.3477783203125, -0.3341827392578125, -0.320587158203125, -0.3069915771484375, -0.29339599609375, -0.2798004150390625, -0.266204833984375, -0.2526092529296875, -0.239013671875, -0.2254180908203125, -0.211822509765625, -0.1982269287109375, -0.18463134765625, -0.1710357666015625, -0.157440185546875, -0.1438446044921875, -0.1302490234375, -0.1166534423828125, -0.103057861328125, -0.0894622802734375, -0.07586669921875, -0.0622711181640625, -0.048675537109375, -0.0350799560546875, -0.021484375, -0.0078887939453125, 0.005706787109375, 0.0193023681640625, 0.03289794921875, 0.0464935302734375, 0.060089111328125, 0.0736846923828125, 0.0872802734375, 0.1008758544921875, 0.114471435546875, 0.1280670166015625, 0.14166259765625, 0.1552581787109375, 0.168853759765625, 0.1824493408203125, 0.196044921875, 0.2096405029296875, 0.223236083984375, 0.2368316650390625, 0.25042724609375, 0.2640228271484375, 0.277618408203125, 0.2912139892578125, 0.3048095703125, 0.3184051513671875, 0.332000732421875, 0.3455963134765625, 0.35919189453125, 0.3727874755859375, 0.386383056640625, 0.3999786376953125, 0.41357421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 9.0, 16.0, 84.0, 244.0, 342.0, 206.0, 76.0, 19.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.545073509216309, -5.284889221191406, -5.024704933166504, -4.764520168304443, -4.504335880279541, -4.244151592254639, -3.9839670658111572, -3.723782539367676, -3.4635982513427734, -3.203413963317871, -2.9432294368743896, -2.683044910430908, -2.422860622406006, -2.1626763343811035, -1.902491807937622, -1.6423074007034302, -1.3821229934692383, -1.1219385862350464, -0.8617541790008545, -0.6015697717666626, -0.3413853645324707, -0.08120095729827881, 0.17898344993591309, 0.439167857170105, 0.6993522644042969, 0.9595366716384888, 1.2197210788726807, 1.4799054861068726, 1.7400898933410645, 2.000274181365967, 2.2604587078094482, 2.5206432342529297, 2.7808265686035156, 3.041010856628418, 3.3011953830718994, 3.561379909515381, 3.821564197540283, 4.0817484855651855, 4.341933250427246, 4.602117538452148, 4.862301826477051, 5.122486114501953, 5.3826704025268555, 5.642855167388916, 5.903039455413818, 6.163223743438721, 6.423408508300781, 6.683592796325684, 6.943777084350586, 7.203961372375488, 7.464145660400391, 7.724330425262451, 7.9845147132873535, 8.244699478149414, 8.504883766174316, 8.765068054199219, 9.025252342224121, 9.285436630249023, 9.545620918273926, 9.805805206298828, 10.065990447998047, 10.32617473602295, 10.586359024047852, 10.846543312072754, 11.106727600097656]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 9.0, 12.0, 17.0, 23.0, 29.0, 35.0, 35.0, 35.0, 30.0, 46.0, 51.0, 57.0, 73.0, 75.0, 57.0, 58.0, 53.0, 48.0, 43.0, 32.0, 25.0, 31.0, 27.0, 21.0, 14.0, 16.0, 9.0, 12.0, 7.0, 8.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.832974433898926, -2.758089065551758, -2.683203935623169, -2.608318567276001, -2.533433437347412, -2.458548069000244, -2.3836629390716553, -2.3087775707244873, -2.2338924407958984, -2.1590070724487305, -2.0841219425201416, -2.0092365741729736, -1.9343514442443848, -1.8594660758972168, -1.7845808267593384, -1.70969557762146, -1.634810209274292, -1.5599249601364136, -1.4850397109985352, -1.4101544618606567, -1.3352692127227783, -1.2603838443756104, -1.185498595237732, -1.1106133460998535, -1.035728096961975, -0.9608428478240967, -0.8859575986862183, -0.8110722899436951, -0.7361870408058167, -0.6613017916679382, -0.586416482925415, -0.5115312337875366, -0.43664586544036865, -0.36176061630249023, -0.28687533736228943, -0.21199007332324982, -0.1371048092842102, -0.06221956014633179, 0.012665718793869019, 0.08755099773406982, 0.16243624687194824, 0.23732151091098785, 0.31220677495002747, 0.38709205389022827, 0.4619773030281067, 0.5368625521659851, 0.6117478609085083, 0.6866331100463867, 0.7615183591842651, 0.8364036083221436, 0.911288857460022, 0.9861741662025452, 1.0610594749450684, 1.1359446048736572, 1.2108299732208252, 1.2857152223587036, 1.360600471496582, 1.4354857206344604, 1.5103709697723389, 1.5852562189102173, 1.6601414680480957, 1.7350268363952637, 1.809912085533142, 1.8847973346710205, 1.959682583808899]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 9.0, 5.0, 22.0, 18.0, 24.0, 64.0, 121.0, 175.0, 369.0, 842.0, 2305.0, 8068.0, 42953.0, 424856.0, 503614.0, 51631.0, 9085.0, 2568.0, 964.0, 410.0, 203.0, 101.0, 53.0, 24.0, 28.0, 13.0, 10.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5028457641601562, -0.4866485595703125, -0.47045135498046875, -0.454254150390625, -0.43805694580078125, -0.4218597412109375, -0.40566253662109375, -0.38946533203125, -0.37326812744140625, -0.3570709228515625, -0.34087371826171875, -0.324676513671875, -0.30847930908203125, -0.2922821044921875, -0.27608489990234375, -0.2598876953125, -0.24369049072265625, -0.2274932861328125, -0.21129608154296875, -0.195098876953125, -0.17890167236328125, -0.1627044677734375, -0.14650726318359375, -0.13031005859375, -0.11411285400390625, -0.0979156494140625, -0.08171844482421875, -0.065521240234375, -0.04932403564453125, -0.0331268310546875, -0.01692962646484375, -0.000732421875, 0.01546478271484375, 0.0316619873046875, 0.04785919189453125, 0.064056396484375, 0.08025360107421875, 0.0964508056640625, 0.11264801025390625, 0.12884521484375, 0.14504241943359375, 0.1612396240234375, 0.17743682861328125, 0.193634033203125, 0.20983123779296875, 0.2260284423828125, 0.24222564697265625, 0.2584228515625, 0.27462005615234375, 0.2908172607421875, 0.30701446533203125, 0.323211669921875, 0.33940887451171875, 0.3556060791015625, 0.37180328369140625, 0.38800048828125, 0.40419769287109375, 0.4203948974609375, 0.43659210205078125, 0.452789306640625, 0.46898651123046875, 0.4851837158203125, 0.5013809204101562, 0.517578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 7.0, 14.0, 22.0, 30.0, 47.0, 67.0, 70.0, 100.0, 110.0, 104.0, 104.0, 85.0, 84.0, 57.0, 43.0, 25.0, 18.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56298828125, -0.5496978759765625, -0.536407470703125, -0.5231170654296875, -0.50982666015625, -0.4965362548828125, -0.483245849609375, -0.4699554443359375, -0.4566650390625, -0.4433746337890625, -0.430084228515625, -0.4167938232421875, -0.40350341796875, -0.3902130126953125, -0.376922607421875, -0.3636322021484375, -0.350341796875, -0.3370513916015625, -0.323760986328125, -0.3104705810546875, -0.29718017578125, -0.2838897705078125, -0.270599365234375, -0.2573089599609375, -0.2440185546875, -0.2307281494140625, -0.217437744140625, -0.2041473388671875, -0.19085693359375, -0.1775665283203125, -0.164276123046875, -0.1509857177734375, -0.1376953125, -0.1244049072265625, -0.111114501953125, -0.0978240966796875, -0.08453369140625, -0.0712432861328125, -0.057952880859375, -0.0446624755859375, -0.0313720703125, -0.0180816650390625, -0.004791259765625, 0.0084991455078125, 0.02178955078125, 0.0350799560546875, 0.048370361328125, 0.0616607666015625, 0.074951171875, 0.0882415771484375, 0.101531982421875, 0.1148223876953125, 0.12811279296875, 0.1414031982421875, 0.154693603515625, 0.1679840087890625, 0.1812744140625, 0.1945648193359375, 0.207855224609375, 0.2211456298828125, 0.23443603515625, 0.2477264404296875, 0.261016845703125, 0.2743072509765625, 0.28759765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 17.0, 20.0, 24.0, 46.0, 55.0, 93.0, 141.0, 217.0, 393.0, 841.0, 2147.0, 6925.0, 35218.0, 524960.0, 432216.0, 34549.0, 6797.0, 2034.0, 825.0, 395.0, 222.0, 151.0, 73.0, 50.0, 36.0, 24.0, 20.0, 17.0, 8.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50830078125, -0.4907684326171875, -0.473236083984375, -0.4557037353515625, -0.43817138671875, -0.4206390380859375, -0.403106689453125, -0.3855743408203125, -0.3680419921875, -0.3505096435546875, -0.332977294921875, -0.3154449462890625, -0.29791259765625, -0.2803802490234375, -0.262847900390625, -0.2453155517578125, -0.227783203125, -0.2102508544921875, -0.192718505859375, -0.1751861572265625, -0.15765380859375, -0.1401214599609375, -0.122589111328125, -0.1050567626953125, -0.0875244140625, -0.0699920654296875, -0.052459716796875, -0.0349273681640625, -0.01739501953125, 0.0001373291015625, 0.017669677734375, 0.0352020263671875, 0.052734375, 0.0702667236328125, 0.087799072265625, 0.1053314208984375, 0.12286376953125, 0.1403961181640625, 0.157928466796875, 0.1754608154296875, 0.1929931640625, 0.2105255126953125, 0.228057861328125, 0.2455902099609375, 0.26312255859375, 0.2806549072265625, 0.298187255859375, 0.3157196044921875, 0.333251953125, 0.3507843017578125, 0.368316650390625, 0.3858489990234375, 0.40338134765625, 0.4209136962890625, 0.438446044921875, 0.4559783935546875, 0.4735107421875, 0.4910430908203125, 0.508575439453125, 0.5261077880859375, 0.54364013671875, 0.5611724853515625, 0.578704833984375, 0.5962371826171875, 0.61376953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 4.0, 10.0, 16.0, 7.0, 15.0, 13.0, 19.0, 21.0, 37.0, 17.0, 32.0, 36.0, 41.0, 43.0, 43.0, 41.0, 52.0, 46.0, 52.0, 62.0, 51.0, 42.0, 45.0, 32.0, 34.0, 31.0, 20.0, 22.0, 15.0, 12.0, 11.0, 7.0, 9.0, 7.0, 8.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7470703125, -0.7223129272460938, -0.6975555419921875, -0.6727981567382812, -0.648040771484375, -0.6232833862304688, -0.5985260009765625, -0.5737686157226562, -0.54901123046875, -0.5242538452148438, -0.4994964599609375, -0.47473907470703125, -0.449981689453125, -0.42522430419921875, -0.4004669189453125, -0.37570953369140625, -0.3509521484375, -0.32619476318359375, -0.3014373779296875, -0.27667999267578125, -0.251922607421875, -0.22716522216796875, -0.2024078369140625, -0.17765045166015625, -0.15289306640625, -0.12813568115234375, -0.1033782958984375, -0.07862091064453125, -0.053863525390625, -0.02910614013671875, -0.0043487548828125, 0.02040863037109375, 0.045166015625, 0.06992340087890625, 0.0946807861328125, 0.11943817138671875, 0.144195556640625, 0.16895294189453125, 0.1937103271484375, 0.21846771240234375, 0.24322509765625, 0.26798248291015625, 0.2927398681640625, 0.31749725341796875, 0.342254638671875, 0.36701202392578125, 0.3917694091796875, 0.41652679443359375, 0.4412841796875, 0.46604156494140625, 0.4907989501953125, 0.5155563354492188, 0.540313720703125, 0.5650711059570312, 0.5898284912109375, 0.6145858764648438, 0.63934326171875, 0.6641006469726562, 0.6888580322265625, 0.7136154174804688, 0.738372802734375, 0.7631301879882812, 0.7878875732421875, 0.8126449584960938, 0.83740234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 11.0, 14.0, 36.0, 54.0, 99.0, 192.0, 473.0, 1188.0, 3844.0, 15656.0, 119047.0, 824771.0, 67804.0, 10742.0, 2908.0, 992.0, 354.0, 164.0, 81.0, 49.0, 22.0, 10.0, 12.0, 11.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30810546875, -0.2998638153076172, -0.2916221618652344, -0.28338050842285156, -0.27513885498046875, -0.26689720153808594, -0.2586555480957031, -0.2504138946533203, -0.2421722412109375, -0.2339305877685547, -0.22568893432617188, -0.21744728088378906, -0.20920562744140625, -0.20096397399902344, -0.19272232055664062, -0.1844806671142578, -0.176239013671875, -0.1679973602294922, -0.15975570678710938, -0.15151405334472656, -0.14327239990234375, -0.13503074645996094, -0.12678909301757812, -0.11854743957519531, -0.1103057861328125, -0.10206413269042969, -0.09382247924804688, -0.08558082580566406, -0.07733917236328125, -0.06909751892089844, -0.060855865478515625, -0.05261421203613281, -0.04437255859375, -0.03613090515136719, -0.027889251708984375, -0.019647598266601562, -0.01140594482421875, -0.0031642913818359375, 0.005077362060546875, 0.013319015502929688, 0.0215606689453125, 0.029802322387695312, 0.038043975830078125, 0.04628562927246094, 0.05452728271484375, 0.06276893615722656, 0.07101058959960938, 0.07925224304199219, 0.087493896484375, 0.09573554992675781, 0.10397720336914062, 0.11221885681152344, 0.12046051025390625, 0.12870216369628906, 0.13694381713867188, 0.1451854705810547, 0.1534271240234375, 0.1616687774658203, 0.16991043090820312, 0.17815208435058594, 0.18639373779296875, 0.19463539123535156, 0.20287704467773438, 0.2111186981201172, 0.2193603515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 7.0, 6.0, 11.0, 16.0, 25.0, 35.0, 34.0, 45.0, 66.0, 93.0, 105.0, 91.0, 90.0, 90.0, 90.0, 56.0, 50.0, 20.0, 16.0, 15.0, 4.0, 6.0, 5.0, 1.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.942583084106445e-05, -5.7647936046123505e-05, -5.5870041251182556e-05, -5.409214645624161e-05, -5.231425166130066e-05, -5.053635686635971e-05, -4.875846207141876e-05, -4.6980567276477814e-05, -4.5202672481536865e-05, -4.342477768659592e-05, -4.164688289165497e-05, -3.986898809671402e-05, -3.809109330177307e-05, -3.631319850683212e-05, -3.4535303711891174e-05, -3.2757408916950226e-05, -3.097951412200928e-05, -2.920161932706833e-05, -2.742372453212738e-05, -2.5645829737186432e-05, -2.3867934942245483e-05, -2.2090040147304535e-05, -2.0312145352363586e-05, -1.8534250557422638e-05, -1.675635576248169e-05, -1.4978460967540741e-05, -1.3200566172599792e-05, -1.1422671377658844e-05, -9.644776582717896e-06, -7.866881787776947e-06, -6.0889869928359985e-06, -4.31109219789505e-06, -2.5331974029541016e-06, -7.553026080131531e-07, 1.0225921869277954e-06, 2.800486981868744e-06, 4.578381776809692e-06, 6.356276571750641e-06, 8.13417136669159e-06, 9.912066161632538e-06, 1.1689960956573486e-05, 1.3467855751514435e-05, 1.5245750546455383e-05, 1.7023645341396332e-05, 1.880154013633728e-05, 2.057943493127823e-05, 2.2357329726219177e-05, 2.4135224521160126e-05, 2.5913119316101074e-05, 2.7691014111042023e-05, 2.946890890598297e-05, 3.124680370092392e-05, 3.302469849586487e-05, 3.480259329080582e-05, 3.6580488085746765e-05, 3.8358382880687714e-05, 4.013627767562866e-05, 4.191417247056961e-05, 4.369206726551056e-05, 4.546996206045151e-05, 4.7247856855392456e-05, 4.9025751650333405e-05, 5.080364644527435e-05, 5.25815412402153e-05, 5.435943603515625e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 3.0, 6.0, 13.0, 20.0, 22.0, 44.0, 53.0, 123.0, 234.0, 498.0, 1185.0, 3037.0, 11005.0, 59805.0, 757559.0, 183030.0, 23200.0, 5436.0, 1815.0, 766.0, 300.0, 150.0, 83.0, 52.0, 31.0, 23.0, 16.0, 9.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21875, -0.21113967895507812, -0.20352935791015625, -0.19591903686523438, -0.1883087158203125, -0.18069839477539062, -0.17308807373046875, -0.16547775268554688, -0.157867431640625, -0.15025711059570312, -0.14264678955078125, -0.13503646850585938, -0.1274261474609375, -0.11981582641601562, -0.11220550537109375, -0.10459518432617188, -0.09698486328125, -0.08937454223632812, -0.08176422119140625, -0.07415390014648438, -0.0665435791015625, -0.058933258056640625, -0.05132293701171875, -0.043712615966796875, -0.036102294921875, -0.028491973876953125, -0.02088165283203125, -0.013271331787109375, -0.0056610107421875, 0.001949310302734375, 0.00955963134765625, 0.017169952392578125, 0.0247802734375, 0.032390594482421875, 0.04000091552734375, 0.047611236572265625, 0.0552215576171875, 0.06283187866210938, 0.07044219970703125, 0.07805252075195312, 0.085662841796875, 0.09327316284179688, 0.10088348388671875, 0.10849380493164062, 0.1161041259765625, 0.12371444702148438, 0.13132476806640625, 0.13893508911132812, 0.14654541015625, 0.15415573120117188, 0.16176605224609375, 0.16937637329101562, 0.1769866943359375, 0.18459701538085938, 0.19220733642578125, 0.19981765747070312, 0.207427978515625, 0.21503829956054688, 0.22264862060546875, 0.23025894165039062, 0.2378692626953125, 0.24547958374023438, 0.25308990478515625, 0.2607002258300781, 0.268310546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 4.0, 3.0, 8.0, 12.0, 14.0, 13.0, 20.0, 30.0, 36.0, 51.0, 83.0, 112.0, 126.0, 94.0, 110.0, 80.0, 53.0, 30.0, 19.0, 19.0, 18.0, 13.0, 13.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2108154296875, -0.2044219970703125, -0.198028564453125, -0.1916351318359375, -0.18524169921875, -0.1788482666015625, -0.172454833984375, -0.1660614013671875, -0.15966796875, -0.1532745361328125, -0.146881103515625, -0.1404876708984375, -0.13409423828125, -0.1277008056640625, -0.121307373046875, -0.1149139404296875, -0.1085205078125, -0.1021270751953125, -0.095733642578125, -0.0893402099609375, -0.08294677734375, -0.0765533447265625, -0.070159912109375, -0.0637664794921875, -0.057373046875, -0.0509796142578125, -0.044586181640625, -0.0381927490234375, -0.03179931640625, -0.0254058837890625, -0.019012451171875, -0.0126190185546875, -0.0062255859375, 0.0001678466796875, 0.006561279296875, 0.0129547119140625, 0.01934814453125, 0.0257415771484375, 0.032135009765625, 0.0385284423828125, 0.044921875, 0.0513153076171875, 0.057708740234375, 0.0641021728515625, 0.07049560546875, 0.0768890380859375, 0.083282470703125, 0.0896759033203125, 0.0960693359375, 0.1024627685546875, 0.108856201171875, 0.1152496337890625, 0.12164306640625, 0.1280364990234375, 0.134429931640625, 0.1408233642578125, 0.147216796875, 0.1536102294921875, 0.160003662109375, 0.1663970947265625, 0.17279052734375, 0.1791839599609375, 0.185577392578125, 0.1919708251953125, 0.1983642578125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 11.0, 17.0, 28.0, 71.0, 156.0, 331.0, 178.0, 87.0, 57.0, 19.0, 8.0, 12.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.112656593322754, -3.968852996826172, -3.82504940032959, -3.681245803833008, -3.537442207336426, -3.3936386108398438, -3.2498350143432617, -3.1060314178466797, -2.9622278213500977, -2.8184242248535156, -2.6746206283569336, -2.5308170318603516, -2.3870134353637695, -2.2432098388671875, -2.0994062423706055, -1.9556026458740234, -1.8117990493774414, -1.6679954528808594, -1.5241918563842773, -1.3803882598876953, -1.2365846633911133, -1.0927810668945312, -0.9489774703979492, -0.8051738739013672, -0.6613702774047852, -0.5175666809082031, -0.3737630844116211, -0.22995948791503906, -0.08615589141845703, 0.057647705078125, 0.20145130157470703, 0.34525489807128906, 0.4890580177307129, 0.6328616142272949, 0.776665210723877, 0.920468807220459, 1.064272403717041, 1.208076000213623, 1.351879596710205, 1.495683193206787, 1.6394867897033691, 1.7832903861999512, 1.9270939826965332, 2.0708975791931152, 2.2147011756896973, 2.3585047721862793, 2.5023083686828613, 2.6461119651794434, 2.7899155616760254, 2.9337191581726074, 3.0775227546691895, 3.2213263511657715, 3.3651299476623535, 3.5089335441589355, 3.6527371406555176, 3.7965407371520996, 3.9403443336486816, 4.084147930145264, 4.227951526641846, 4.371755123138428, 4.51555871963501, 4.659362316131592, 4.803165912628174, 4.946969509124756, 5.090773105621338]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 13.0, 8.0, 18.0, 19.0, 25.0, 32.0, 27.0, 51.0, 53.0, 70.0, 142.0, 129.0, 91.0, 56.0, 58.0, 52.0, 40.0, 30.0, 21.0, 25.0, 11.0, 7.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8590455055236816, -3.70625901222229, -3.5534725189208984, -3.400686264038086, -3.2478997707366943, -3.0951132774353027, -2.9423270225524902, -2.7895405292510986, -2.636754035949707, -2.4839675426483154, -2.331181049346924, -2.1783947944641113, -2.0256083011627197, -1.8728218078613281, -1.720035433769226, -1.567249059677124, -1.4144625663757324, -1.2616760730743408, -1.1088896989822388, -0.9561032652854919, -0.8033168315887451, -0.6505303978919983, -0.49774396419525146, -0.3449575901031494, -0.1921710968017578, -0.039384663105010986, 0.11340177059173584, 0.26618820428848267, 0.4189746379852295, 0.5717610716819763, 0.7245475053787231, 0.8773338794708252, 1.030120849609375, 1.1829073429107666, 1.3356937170028687, 1.4884800910949707, 1.6412665843963623, 1.794053077697754, 1.946839451789856, 2.099625825881958, 2.2524123191833496, 2.405198812484741, 2.557985305786133, 2.7107715606689453, 2.863558053970337, 3.0163445472717285, 3.169130802154541, 3.3219172954559326, 3.474703788757324, 3.627490282058716, 3.7802767753601074, 3.93306303024292, 4.085849761962891, 4.238636016845703, 4.391422271728516, 4.544208526611328, 4.696995258331299, 4.849781513214111, 5.002568244934082, 5.1553544998168945, 5.308140754699707, 5.460927486419678, 5.61371374130249, 5.766500473022461, 5.919286727905273]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 10.0, 5.0, 10.0, 10.0, 20.0, 31.0, 39.0, 82.0, 178.0, 394.0, 991.0, 2910.0, 10070.0, 52964.0, 874221.0, 3045130.0, 178665.0, 20379.0, 5053.0, 1666.0, 697.0, 330.0, 174.0, 81.0, 61.0, 26.0, 18.0, 19.0, 9.0, 12.0, 7.0, 10.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432861328125, -0.4185523986816406, -0.40424346923828125, -0.3899345397949219, -0.3756256103515625, -0.3613166809082031, -0.34700775146484375, -0.3326988220214844, -0.318389892578125, -0.3040809631347656, -0.28977203369140625, -0.2754631042480469, -0.2611541748046875, -0.24684524536132812, -0.23253631591796875, -0.21822738647460938, -0.20391845703125, -0.18960952758789062, -0.17530059814453125, -0.16099166870117188, -0.1466827392578125, -0.13237380981445312, -0.11806488037109375, -0.10375595092773438, -0.089447021484375, -0.07513809204101562, -0.06082916259765625, -0.046520233154296875, -0.0322113037109375, -0.017902374267578125, -0.00359344482421875, 0.010715484619140625, 0.0250244140625, 0.039333343505859375, 0.05364227294921875, 0.06795120239257812, 0.0822601318359375, 0.09656906127929688, 0.11087799072265625, 0.12518692016601562, 0.139495849609375, 0.15380477905273438, 0.16811370849609375, 0.18242263793945312, 0.1967315673828125, 0.21104049682617188, 0.22534942626953125, 0.23965835571289062, 0.25396728515625, 0.2682762145996094, 0.28258514404296875, 0.2968940734863281, 0.3112030029296875, 0.3255119323730469, 0.33982086181640625, 0.3541297912597656, 0.368438720703125, 0.3827476501464844, 0.39705657958984375, 0.4113655090332031, 0.4256744384765625, 0.4399833679199219, 0.45429229736328125, 0.4686012268066406, 0.48291015625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 7.0, 2.0, 5.0, 7.0, 11.0, 7.0, 11.0, 10.0, 17.0, 18.0, 17.0, 20.0, 25.0, 29.0, 34.0, 32.0, 46.0, 53.0, 46.0, 45.0, 55.0, 45.0, 34.0, 64.0, 48.0, 44.0, 43.0, 33.0, 29.0, 28.0, 28.0, 26.0, 19.0, 19.0, 17.0, 11.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.153076171875, -0.146759033203125, -0.14044189453125, -0.134124755859375, -0.1278076171875, -0.121490478515625, -0.11517333984375, -0.108856201171875, -0.1025390625, -0.096221923828125, -0.08990478515625, -0.083587646484375, -0.0772705078125, -0.070953369140625, -0.06463623046875, -0.058319091796875, -0.052001953125, -0.045684814453125, -0.03936767578125, -0.033050537109375, -0.0267333984375, -0.020416259765625, -0.01409912109375, -0.007781982421875, -0.00146484375, 0.004852294921875, 0.01116943359375, 0.017486572265625, 0.0238037109375, 0.030120849609375, 0.03643798828125, 0.042755126953125, 0.049072265625, 0.055389404296875, 0.06170654296875, 0.068023681640625, 0.0743408203125, 0.080657958984375, 0.08697509765625, 0.093292236328125, 0.099609375, 0.105926513671875, 0.11224365234375, 0.118560791015625, 0.1248779296875, 0.131195068359375, 0.13751220703125, 0.143829345703125, 0.150146484375, 0.156463623046875, 0.16278076171875, 0.169097900390625, 0.1754150390625, 0.181732177734375, 0.18804931640625, 0.194366455078125, 0.20068359375, 0.207000732421875, 0.21331787109375, 0.219635009765625, 0.2259521484375, 0.232269287109375, 0.23858642578125, 0.244903564453125, 0.251220703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 1.0, 6.0, 11.0, 9.0, 11.0, 10.0, 14.0, 18.0, 28.0, 52.0, 74.0, 113.0, 228.0, 533.0, 1295.0, 4869.0, 24514.0, 266100.0, 3596181.0, 268847.0, 24246.0, 4783.0, 1281.0, 493.0, 220.0, 121.0, 67.0, 40.0, 28.0, 19.0, 28.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.507110595703125, -0.48931884765625, -0.471527099609375, -0.4537353515625, -0.435943603515625, -0.41815185546875, -0.400360107421875, -0.382568359375, -0.364776611328125, -0.34698486328125, -0.329193115234375, -0.3114013671875, -0.293609619140625, -0.27581787109375, -0.258026123046875, -0.240234375, -0.222442626953125, -0.20465087890625, -0.186859130859375, -0.1690673828125, -0.151275634765625, -0.13348388671875, -0.115692138671875, -0.097900390625, -0.080108642578125, -0.06231689453125, -0.044525146484375, -0.0267333984375, -0.008941650390625, 0.00885009765625, 0.026641845703125, 0.04443359375, 0.062225341796875, 0.08001708984375, 0.097808837890625, 0.1156005859375, 0.133392333984375, 0.15118408203125, 0.168975830078125, 0.186767578125, 0.204559326171875, 0.22235107421875, 0.240142822265625, 0.2579345703125, 0.275726318359375, 0.29351806640625, 0.311309814453125, 0.3291015625, 0.346893310546875, 0.36468505859375, 0.382476806640625, 0.4002685546875, 0.418060302734375, 0.43585205078125, 0.453643798828125, 0.471435546875, 0.489227294921875, 0.50701904296875, 0.524810791015625, 0.5426025390625, 0.560394287109375, 0.57818603515625, 0.595977783203125, 0.61376953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 12.0, 17.0, 27.0, 34.0, 33.0, 59.0, 77.0, 145.0, 203.0, 309.0, 483.0, 703.0, 680.0, 456.0, 267.0, 167.0, 121.0, 85.0, 42.0, 33.0, 20.0, 22.0, 14.0, 13.0, 14.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5455322265625, -0.531494140625, -0.5174560546875, -0.50341796875, -0.4893798828125, -0.475341796875, -0.4613037109375, -0.447265625, -0.4332275390625, -0.419189453125, -0.4051513671875, -0.39111328125, -0.3770751953125, -0.363037109375, -0.3489990234375, -0.3349609375, -0.3209228515625, -0.306884765625, -0.2928466796875, -0.27880859375, -0.2647705078125, -0.250732421875, -0.2366943359375, -0.22265625, -0.2086181640625, -0.194580078125, -0.1805419921875, -0.16650390625, -0.1524658203125, -0.138427734375, -0.1243896484375, -0.1103515625, -0.0963134765625, -0.082275390625, -0.0682373046875, -0.05419921875, -0.0401611328125, -0.026123046875, -0.0120849609375, 0.001953125, 0.0159912109375, 0.030029296875, 0.0440673828125, 0.05810546875, 0.0721435546875, 0.086181640625, 0.1002197265625, 0.1142578125, 0.1282958984375, 0.142333984375, 0.1563720703125, 0.17041015625, 0.1844482421875, 0.198486328125, 0.2125244140625, 0.2265625, 0.2406005859375, 0.254638671875, 0.2686767578125, 0.28271484375, 0.2967529296875, 0.310791015625, 0.3248291015625, 0.3388671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 12.0, 20.0, 40.0, 112.0, 229.0, 293.0, 196.0, 65.0, 19.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.145954132080078, -8.940030097961426, -8.734106063842773, -8.528182983398438, -8.322258949279785, -8.116334915161133, -7.9104108810424805, -7.704486846923828, -7.498563289642334, -7.292639255523682, -7.0867156982421875, -6.880791664123535, -6.674867630004883, -6.468944072723389, -6.263020038604736, -6.057096481323242, -5.85117244720459, -5.6452484130859375, -5.439324855804443, -5.233400821685791, -5.027477264404297, -4.8215532302856445, -4.615629196166992, -4.40970516204834, -4.203781604766846, -3.9978578090667725, -3.791934013366699, -3.586009979248047, -3.3800861835479736, -3.1741623878479004, -2.968238353729248, -2.762314558029175, -2.5563902854919434, -2.35046648979187, -2.144542694091797, -1.9386186599731445, -1.7326948642730713, -1.526771068572998, -1.3208471536636353, -1.1149232387542725, -0.9089994430541992, -0.7030755877494812, -0.4971517324447632, -0.29122787714004517, -0.08530402183532715, 0.1206197738647461, 0.3265436887741089, 0.5324676036834717, 0.7383913993835449, 0.9443152546882629, 1.150239109992981, 1.3561630249023438, 1.562086820602417, 1.7680106163024902, 1.973934531211853, 2.179858446121216, 2.385782241821289, 2.5917060375213623, 2.7976298332214355, 3.003553867340088, 3.209477663040161, 3.4154014587402344, 3.6213254928588867, 3.82724928855896, 4.033173084259033]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 6.0, 4.0, 6.0, 8.0, 16.0, 15.0, 21.0, 18.0, 18.0, 21.0, 16.0, 31.0, 33.0, 45.0, 38.0, 27.0, 42.0, 62.0, 55.0, 43.0, 43.0, 39.0, 50.0, 34.0, 29.0, 28.0, 34.0, 39.0, 17.0, 15.0, 19.0, 22.0, 12.0, 12.0, 17.0, 8.0, 11.0, 4.0, 3.0, 8.0, 7.0, 4.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0], "bins": [-1.8004441261291504, -1.749172568321228, -1.6979010105133057, -1.6466294527053833, -1.595357894897461, -1.5440863370895386, -1.4928147792816162, -1.4415431022644043, -1.3902716636657715, -1.3390001058578491, -1.2877285480499268, -1.2364569902420044, -1.185185432434082, -1.1339138746261597, -1.0826423168182373, -1.0313706398010254, -0.980099081993103, -0.9288275241851807, -0.8775559663772583, -0.8262844085693359, -0.7750128507614136, -0.7237412929534912, -0.6724696755409241, -0.6211981177330017, -0.5699265599250793, -0.518655002117157, -0.4673834443092346, -0.41611185669898987, -0.3648402988910675, -0.31356874108314514, -0.2622971534729004, -0.21102559566497803, -0.15975403785705566, -0.1084824725985527, -0.057210907340049744, -0.0059393346309661865, 0.04533222317695618, 0.09660378098487854, 0.1478753685951233, 0.19914692640304565, 0.250418484210968, 0.3016900420188904, 0.35296159982681274, 0.4042331874370575, 0.45550474524497986, 0.5067763328552246, 0.558047890663147, 0.6093194484710693, 0.6605910062789917, 0.7118625640869141, 0.7631341218948364, 0.8144056797027588, 0.8656772375106812, 0.9169487953186035, 0.9682204127311707, 1.0194919109344482, 1.0707635879516602, 1.1220351457595825, 1.1733067035675049, 1.2245782613754272, 1.2758498191833496, 1.327121376991272, 1.3783929347991943, 1.4296646118164062, 1.480936050415039]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 5.0, 14.0, 8.0, 19.0, 24.0, 49.0, 57.0, 125.0, 230.0, 387.0, 762.0, 1763.0, 4183.0, 10806.0, 33274.0, 132735.0, 532262.0, 250238.0, 54700.0, 16416.0, 5759.0, 2426.0, 1102.0, 536.0, 257.0, 146.0, 100.0, 57.0, 42.0, 18.0, 12.0, 15.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38134765625, -0.3700294494628906, -0.35871124267578125, -0.3473930358886719, -0.3360748291015625, -0.3247566223144531, -0.31343841552734375, -0.3021202087402344, -0.290802001953125, -0.2794837951660156, -0.26816558837890625, -0.2568473815917969, -0.2455291748046875, -0.23421096801757812, -0.22289276123046875, -0.21157455444335938, -0.20025634765625, -0.18893814086914062, -0.17761993408203125, -0.16630172729492188, -0.1549835205078125, -0.14366531372070312, -0.13234710693359375, -0.12102890014648438, -0.109710693359375, -0.09839248657226562, -0.08707427978515625, -0.07575607299804688, -0.0644378662109375, -0.053119659423828125, -0.04180145263671875, -0.030483245849609375, -0.0191650390625, -0.007846832275390625, 0.00347137451171875, 0.014789581298828125, 0.0261077880859375, 0.037425994873046875, 0.04874420166015625, 0.060062408447265625, 0.071380615234375, 0.08269882202148438, 0.09401702880859375, 0.10533523559570312, 0.1166534423828125, 0.12797164916992188, 0.13928985595703125, 0.15060806274414062, 0.16192626953125, 0.17324447631835938, 0.18456268310546875, 0.19588088989257812, 0.2071990966796875, 0.21851730346679688, 0.22983551025390625, 0.24115371704101562, 0.252471923828125, 0.2637901306152344, 0.27510833740234375, 0.2864265441894531, 0.2977447509765625, 0.3090629577636719, 0.32038116455078125, 0.3316993713378906, 0.343017578125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 13.0, 12.0, 12.0, 17.0, 20.0, 37.0, 43.0, 40.0, 49.0, 51.0, 66.0, 72.0, 77.0, 54.0, 69.0, 57.0, 58.0, 50.0, 42.0, 27.0, 32.0, 22.0, 22.0, 18.0, 5.0, 6.0, 3.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256103515625, -0.24726486206054688, -0.23842620849609375, -0.22958755493164062, -0.2207489013671875, -0.21191024780273438, -0.20307159423828125, -0.19423294067382812, -0.185394287109375, -0.17655563354492188, -0.16771697998046875, -0.15887832641601562, -0.1500396728515625, -0.14120101928710938, -0.13236236572265625, -0.12352371215820312, -0.11468505859375, -0.10584640502929688, -0.09700775146484375, -0.08816909790039062, -0.0793304443359375, -0.07049179077148438, -0.06165313720703125, -0.052814483642578125, -0.043975830078125, -0.035137176513671875, -0.02629852294921875, -0.017459869384765625, -0.0086212158203125, 0.000217437744140625, 0.00905609130859375, 0.017894744873046875, 0.0267333984375, 0.035572052001953125, 0.04441070556640625, 0.053249359130859375, 0.0620880126953125, 0.07092666625976562, 0.07976531982421875, 0.08860397338867188, 0.097442626953125, 0.10628128051757812, 0.11511993408203125, 0.12395858764648438, 0.1327972412109375, 0.14163589477539062, 0.15047454833984375, 0.15931320190429688, 0.16815185546875, 0.17699050903320312, 0.18582916259765625, 0.19466781616210938, 0.2035064697265625, 0.21234512329101562, 0.22118377685546875, 0.23002243041992188, 0.238861083984375, 0.24769973754882812, 0.25653839111328125, 0.2653770446777344, 0.2742156982421875, 0.2830543518066406, 0.29189300537109375, 0.3007316589355469, 0.3095703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 5.0, 15.0, 10.0, 23.0, 21.0, 32.0, 48.0, 87.0, 131.0, 227.0, 396.0, 835.0, 2280.0, 9054.0, 71674.0, 862494.0, 86928.0, 10043.0, 2363.0, 873.0, 413.0, 230.0, 139.0, 74.0, 50.0, 37.0, 23.0, 10.0, 10.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.67626953125, -0.6541213989257812, -0.6319732666015625, -0.6098251342773438, -0.587677001953125, -0.5655288696289062, -0.5433807373046875, -0.5212326049804688, -0.49908447265625, -0.47693634033203125, -0.4547882080078125, -0.43264007568359375, -0.410491943359375, -0.38834381103515625, -0.3661956787109375, -0.34404754638671875, -0.3218994140625, -0.29975128173828125, -0.2776031494140625, -0.25545501708984375, -0.233306884765625, -0.21115875244140625, -0.1890106201171875, -0.16686248779296875, -0.14471435546875, -0.12256622314453125, -0.1004180908203125, -0.07826995849609375, -0.056121826171875, -0.03397369384765625, -0.0118255615234375, 0.01032257080078125, 0.032470703125, 0.05461883544921875, 0.0767669677734375, 0.09891510009765625, 0.121063232421875, 0.14321136474609375, 0.1653594970703125, 0.18750762939453125, 0.20965576171875, 0.23180389404296875, 0.2539520263671875, 0.27610015869140625, 0.298248291015625, 0.32039642333984375, 0.3425445556640625, 0.36469268798828125, 0.3868408203125, 0.40898895263671875, 0.4311370849609375, 0.45328521728515625, 0.475433349609375, 0.49758148193359375, 0.5197296142578125, 0.5418777465820312, 0.56402587890625, 0.5861740112304688, 0.6083221435546875, 0.6304702758789062, 0.652618408203125, 0.6747665405273438, 0.6969146728515625, 0.7190628051757812, 0.7412109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 8.0, 7.0, 14.0, 12.0, 12.0, 21.0, 25.0, 32.0, 30.0, 34.0, 45.0, 46.0, 60.0, 56.0, 64.0, 56.0, 61.0, 70.0, 55.0, 61.0, 38.0, 34.0, 26.0, 16.0, 20.0, 21.0, 14.0, 10.0, 11.0, 7.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -1.002838134765625, -0.97149658203125, -0.940155029296875, -0.9088134765625, -0.877471923828125, -0.84613037109375, -0.814788818359375, -0.783447265625, -0.752105712890625, -0.72076416015625, -0.689422607421875, -0.6580810546875, -0.626739501953125, -0.59539794921875, -0.564056396484375, -0.53271484375, -0.501373291015625, -0.47003173828125, -0.438690185546875, -0.4073486328125, -0.376007080078125, -0.34466552734375, -0.313323974609375, -0.281982421875, -0.250640869140625, -0.21929931640625, -0.187957763671875, -0.1566162109375, -0.125274658203125, -0.09393310546875, -0.062591552734375, -0.03125, 9.1552734375e-05, 0.03143310546875, 0.062774658203125, 0.0941162109375, 0.125457763671875, 0.15679931640625, 0.188140869140625, 0.219482421875, 0.250823974609375, 0.28216552734375, 0.313507080078125, 0.3448486328125, 0.376190185546875, 0.40753173828125, 0.438873291015625, 0.47021484375, 0.501556396484375, 0.53289794921875, 0.564239501953125, 0.5955810546875, 0.626922607421875, 0.65826416015625, 0.689605712890625, 0.720947265625, 0.752288818359375, 0.78363037109375, 0.814971923828125, 0.8463134765625, 0.877655029296875, 0.90899658203125, 0.940338134765625, 0.9716796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 16.0, 40.0, 83.0, 359.0, 2095.0, 31506.0, 969011.0, 42320.0, 2538.0, 392.0, 100.0, 35.0, 19.0, 12.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337890625, -0.32562255859375, -0.3133544921875, -0.30108642578125, -0.288818359375, -0.27655029296875, -0.2642822265625, -0.25201416015625, -0.23974609375, -0.22747802734375, -0.2152099609375, -0.20294189453125, -0.190673828125, -0.17840576171875, -0.1661376953125, -0.15386962890625, -0.1416015625, -0.12933349609375, -0.1170654296875, -0.10479736328125, -0.092529296875, -0.08026123046875, -0.0679931640625, -0.05572509765625, -0.04345703125, -0.03118896484375, -0.0189208984375, -0.00665283203125, 0.005615234375, 0.01788330078125, 0.0301513671875, 0.04241943359375, 0.0546875, 0.06695556640625, 0.0792236328125, 0.09149169921875, 0.103759765625, 0.11602783203125, 0.1282958984375, 0.14056396484375, 0.15283203125, 0.16510009765625, 0.1773681640625, 0.18963623046875, 0.201904296875, 0.21417236328125, 0.2264404296875, 0.23870849609375, 0.2509765625, 0.26324462890625, 0.2755126953125, 0.28778076171875, 0.300048828125, 0.31231689453125, 0.3245849609375, 0.33685302734375, 0.34912109375, 0.36138916015625, 0.3736572265625, 0.38592529296875, 0.398193359375, 0.41046142578125, 0.4227294921875, 0.43499755859375, 0.447265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 16.0, 17.0, 23.0, 41.0, 51.0, 73.0, 98.0, 143.0, 117.0, 113.0, 83.0, 62.0, 41.0, 27.0, 26.0, 14.0, 6.0, 4.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.175041198730469e-05, -5.983468145132065e-05, -5.791895091533661e-05, -5.600322037935257e-05, -5.408748984336853e-05, -5.217175930738449e-05, -5.025602877140045e-05, -4.834029823541641e-05, -4.642456769943237e-05, -4.4508837163448334e-05, -4.2593106627464294e-05, -4.0677376091480255e-05, -3.8761645555496216e-05, -3.6845915019512177e-05, -3.493018448352814e-05, -3.30144539475441e-05, -3.109872341156006e-05, -2.918299287557602e-05, -2.726726233959198e-05, -2.535153180360794e-05, -2.34358012676239e-05, -2.1520070731639862e-05, -1.9604340195655823e-05, -1.7688609659671783e-05, -1.5772879123687744e-05, -1.3857148587703705e-05, -1.1941418051719666e-05, -1.0025687515735626e-05, -8.109956979751587e-06, -6.194226443767548e-06, -4.278495907783508e-06, -2.362765371799469e-06, -4.470348358154297e-07, 1.4686957001686096e-06, 3.384426236152649e-06, 5.300156772136688e-06, 7.2158873081207275e-06, 9.131617844104767e-06, 1.1047348380088806e-05, 1.2963078916072845e-05, 1.4878809452056885e-05, 1.6794539988040924e-05, 1.8710270524024963e-05, 2.0626001060009003e-05, 2.2541731595993042e-05, 2.445746213197708e-05, 2.637319266796112e-05, 2.828892320394516e-05, 3.02046537399292e-05, 3.212038427591324e-05, 3.403611481189728e-05, 3.595184534788132e-05, 3.7867575883865356e-05, 3.9783306419849396e-05, 4.1699036955833435e-05, 4.3614767491817474e-05, 4.5530498027801514e-05, 4.744622856378555e-05, 4.936195909976959e-05, 5.127768963575363e-05, 5.319342017173767e-05, 5.510915070772171e-05, 5.702488124370575e-05, 5.894061177968979e-05, 6.085634231567383e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 7.0, 13.0, 25.0, 30.0, 48.0, 77.0, 142.0, 210.0, 471.0, 957.0, 2511.0, 7756.0, 32119.0, 224713.0, 704162.0, 57134.0, 12022.0, 3580.0, 1287.0, 576.0, 283.0, 151.0, 101.0, 54.0, 29.0, 24.0, 16.0, 9.0, 8.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.15860748291015625, -0.1535186767578125, -0.14842987060546875, -0.143341064453125, -0.13825225830078125, -0.1331634521484375, -0.12807464599609375, -0.12298583984375, -0.11789703369140625, -0.1128082275390625, -0.10771942138671875, -0.102630615234375, -0.09754180908203125, -0.0924530029296875, -0.08736419677734375, -0.082275390625, -0.07718658447265625, -0.0720977783203125, -0.06700897216796875, -0.061920166015625, -0.05683135986328125, -0.0517425537109375, -0.04665374755859375, -0.04156494140625, -0.03647613525390625, -0.0313873291015625, -0.02629852294921875, -0.021209716796875, -0.01612091064453125, -0.0110321044921875, -0.00594329833984375, -0.0008544921875, 0.00423431396484375, 0.0093231201171875, 0.01441192626953125, 0.019500732421875, 0.02458953857421875, 0.0296783447265625, 0.03476715087890625, 0.03985595703125, 0.04494476318359375, 0.0500335693359375, 0.05512237548828125, 0.060211181640625, 0.06529998779296875, 0.0703887939453125, 0.07547760009765625, 0.08056640625, 0.08565521240234375, 0.0907440185546875, 0.09583282470703125, 0.100921630859375, 0.10601043701171875, 0.1110992431640625, 0.11618804931640625, 0.12127685546875, 0.12636566162109375, 0.1314544677734375, 0.13654327392578125, 0.141632080078125, 0.14672088623046875, 0.1518096923828125, 0.15689849853515625, 0.1619873046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 8.0, 11.0, 14.0, 24.0, 18.0, 39.0, 48.0, 63.0, 76.0, 84.0, 102.0, 120.0, 100.0, 80.0, 38.0, 44.0, 25.0, 26.0, 17.0, 13.0, 10.0, 6.0, 3.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1817626953125, -0.17656517028808594, -0.17136764526367188, -0.1661701202392578, -0.16097259521484375, -0.1557750701904297, -0.15057754516601562, -0.14538002014160156, -0.1401824951171875, -0.13498497009277344, -0.12978744506835938, -0.12458992004394531, -0.11939239501953125, -0.11419486999511719, -0.10899734497070312, -0.10379981994628906, -0.098602294921875, -0.09340476989746094, -0.08820724487304688, -0.08300971984863281, -0.07781219482421875, -0.07261466979980469, -0.06741714477539062, -0.06221961975097656, -0.0570220947265625, -0.05182456970214844, -0.046627044677734375, -0.04142951965332031, -0.03623199462890625, -0.031034469604492188, -0.025836944580078125, -0.020639419555664062, -0.01544189453125, -0.010244369506835938, -0.005046844482421875, 0.0001506805419921875, 0.00534820556640625, 0.010545730590820312, 0.015743255615234375, 0.020940780639648438, 0.0261383056640625, 0.03133583068847656, 0.036533355712890625, 0.04173088073730469, 0.04692840576171875, 0.05212593078613281, 0.057323455810546875, 0.06252098083496094, 0.067718505859375, 0.07291603088378906, 0.07811355590820312, 0.08331108093261719, 0.08850860595703125, 0.09370613098144531, 0.09890365600585938, 0.10410118103027344, 0.1092987060546875, 0.11449623107910156, 0.11969375610351562, 0.12489128112792969, 0.13008880615234375, 0.1352863311767578, 0.14048385620117188, 0.14568138122558594, 0.15087890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 9.0, 18.0, 42.0, 96.0, 236.0, 331.0, 143.0, 54.0, 33.0, 10.0, 11.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.313342094421387, -4.154363632202148, -3.9953854084014893, -3.836406946182251, -3.677428722381592, -3.5184502601623535, -3.3594717979431152, -3.200493335723877, -3.0415151119232178, -2.8825366497039795, -2.7235584259033203, -2.564579963684082, -2.4056015014648438, -2.2466232776641846, -2.0876448154449463, -1.9286664724349976, -1.7696881294250488, -1.6107097864151, -1.4517314434051514, -1.292752981185913, -1.1337746381759644, -0.9747962951660156, -0.8158178925514221, -0.6568394899368286, -0.4978611469268799, -0.33888277411460876, -0.17990440130233765, -0.02092602849006653, 0.1380523443222046, 0.2970306873321533, 0.4560090899467468, 0.6149874925613403, 0.7739663124084473, 0.932944655418396, 1.0919229984283447, 1.250901460647583, 1.4098798036575317, 1.5688581466674805, 1.7278366088867188, 1.8868149518966675, 2.045793294906616, 2.2047717571258545, 2.3637499809265137, 2.522728443145752, 2.6817069053649902, 2.8406851291656494, 2.9996635913848877, 3.158641815185547, 3.317620277404785, 3.4765987396240234, 3.6355769634246826, 3.794555425643921, 3.95353364944458, 4.112512111663818, 4.271490573883057, 4.430469036102295, 4.589447021484375, 4.748425483703613, 4.907403945922852, 5.066381931304932, 5.22536039352417, 5.384338855743408, 5.5433173179626465, 5.702295780181885, 5.861274242401123]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 13.0, 5.0, 18.0, 19.0, 19.0, 22.0, 23.0, 19.0, 37.0, 23.0, 44.0, 68.0, 124.0, 157.0, 70.0, 46.0, 35.0, 44.0, 37.0, 30.0, 31.0, 20.0, 16.0, 13.0, 19.0, 14.0, 4.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.04792594909668, -4.915694713592529, -4.783463478088379, -4.6512322425842285, -4.519001007080078, -4.386769771575928, -4.254538536071777, -4.122307777404785, -3.9900763034820557, -3.8578450679779053, -3.725613832473755, -3.5933825969696045, -3.461151599884033, -3.328920364379883, -3.1966891288757324, -3.064457893371582, -2.9322266578674316, -2.7999954223632812, -2.667764186859131, -2.5355329513549805, -2.40330171585083, -2.2710704803466797, -2.1388394832611084, -2.006608247756958, -1.8743770122528076, -1.7421457767486572, -1.6099145412445068, -1.477683424949646, -1.3454521894454956, -1.2132209539413452, -1.0809898376464844, -0.948758602142334, -0.8165268898010254, -0.684295654296875, -0.5520644783973694, -0.4198332726955414, -0.2876020669937134, -0.155370831489563, -0.023139655590057373, 0.10909152030944824, 0.24132275581359863, 0.37355396151542664, 0.5057851672172546, 0.6380163431167603, 0.7702475786209106, 0.902478814125061, 1.0347099304199219, 1.1669411659240723, 1.2991724014282227, 1.431403636932373, 1.5636348724365234, 1.6958659887313843, 1.8280972242355347, 1.960328459739685, 2.092559576034546, 2.2247908115386963, 2.3570220470428467, 2.489253282546997, 2.6214845180511475, 2.753715753555298, 2.885946750640869, 3.0181779861450195, 3.15040922164917, 3.2826404571533203, 3.4148716926574707]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 7.0, 12.0, 22.0, 46.0, 80.0, 157.0, 352.0, 851.0, 2632.0, 8705.0, 37362.0, 248228.0, 2368085.0, 1370554.0, 125400.0, 22180.0, 5931.0, 1992.0, 754.0, 315.0, 186.0, 114.0, 83.0, 51.0, 45.0, 28.0, 22.0, 17.0, 10.0, 9.0, 10.0, 8.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35791015625, -0.33988189697265625, -0.3218536376953125, -0.30382537841796875, -0.285797119140625, -0.26776885986328125, -0.2497406005859375, -0.23171234130859375, -0.21368408203125, -0.19565582275390625, -0.1776275634765625, -0.15959930419921875, -0.141571044921875, -0.12354278564453125, -0.1055145263671875, -0.08748626708984375, -0.0694580078125, -0.05142974853515625, -0.0334014892578125, -0.01537322998046875, 0.002655029296875, 0.02068328857421875, 0.0387115478515625, 0.05673980712890625, 0.07476806640625, 0.09279632568359375, 0.1108245849609375, 0.12885284423828125, 0.146881103515625, 0.16490936279296875, 0.1829376220703125, 0.20096588134765625, 0.218994140625, 0.23702239990234375, 0.2550506591796875, 0.27307891845703125, 0.291107177734375, 0.30913543701171875, 0.3271636962890625, 0.34519195556640625, 0.36322021484375, 0.38124847412109375, 0.3992767333984375, 0.41730499267578125, 0.435333251953125, 0.45336151123046875, 0.4713897705078125, 0.48941802978515625, 0.5074462890625, 0.5254745483398438, 0.5435028076171875, 0.5615310668945312, 0.579559326171875, 0.5975875854492188, 0.6156158447265625, 0.6336441040039062, 0.65167236328125, 0.6697006225585938, 0.6877288818359375, 0.7057571411132812, 0.723785400390625, 0.7418136596679688, 0.7598419189453125, 0.7778701782226562, 0.7958984375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 11.0, 8.0, 9.0, 20.0, 17.0, 21.0, 22.0, 36.0, 38.0, 49.0, 46.0, 49.0, 55.0, 67.0, 53.0, 59.0, 57.0, 57.0, 36.0, 48.0, 44.0, 36.0, 34.0, 30.0, 15.0, 18.0, 15.0, 13.0, 15.0, 12.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213134765625, -0.205810546875, -0.198486328125, -0.191162109375, -0.183837890625, -0.176513671875, -0.169189453125, -0.161865234375, -0.154541015625, -0.147216796875, -0.139892578125, -0.132568359375, -0.125244140625, -0.117919921875, -0.110595703125, -0.103271484375, -0.095947265625, -0.088623046875, -0.081298828125, -0.073974609375, -0.066650390625, -0.059326171875, -0.052001953125, -0.044677734375, -0.037353515625, -0.030029296875, -0.022705078125, -0.015380859375, -0.008056640625, -0.000732421875, 0.006591796875, 0.013916015625, 0.021240234375, 0.028564453125, 0.035888671875, 0.043212890625, 0.050537109375, 0.057861328125, 0.065185546875, 0.072509765625, 0.079833984375, 0.087158203125, 0.094482421875, 0.101806640625, 0.109130859375, 0.116455078125, 0.123779296875, 0.131103515625, 0.138427734375, 0.145751953125, 0.153076171875, 0.160400390625, 0.167724609375, 0.175048828125, 0.182373046875, 0.189697265625, 0.197021484375, 0.204345703125, 0.211669921875, 0.218994140625, 0.226318359375, 0.233642578125, 0.240966796875, 0.248291015625, 0.255615234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 5.0, 5.0, 25.0, 18.0, 26.0, 34.0, 73.0, 119.0, 206.0, 368.0, 815.0, 2282.0, 13530.0, 1027285.0, 3124570.0, 20046.0, 2872.0, 989.0, 445.0, 216.0, 130.0, 90.0, 42.0, 26.0, 26.0, 14.0, 8.0, 7.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.61407470703125, -1.5621337890625, -1.51019287109375, -1.458251953125, -1.40631103515625, -1.3543701171875, -1.30242919921875, -1.25048828125, -1.19854736328125, -1.1466064453125, -1.09466552734375, -1.042724609375, -0.99078369140625, -0.9388427734375, -0.88690185546875, -0.8349609375, -0.78302001953125, -0.7310791015625, -0.67913818359375, -0.627197265625, -0.57525634765625, -0.5233154296875, -0.47137451171875, -0.41943359375, -0.36749267578125, -0.3155517578125, -0.26361083984375, -0.211669921875, -0.15972900390625, -0.1077880859375, -0.05584716796875, -0.00390625, 0.04803466796875, 0.0999755859375, 0.15191650390625, 0.203857421875, 0.25579833984375, 0.3077392578125, 0.35968017578125, 0.41162109375, 0.46356201171875, 0.5155029296875, 0.56744384765625, 0.619384765625, 0.67132568359375, 0.7232666015625, 0.77520751953125, 0.8271484375, 0.87908935546875, 0.9310302734375, 0.98297119140625, 1.034912109375, 1.08685302734375, 1.1387939453125, 1.19073486328125, 1.24267578125, 1.29461669921875, 1.3465576171875, 1.39849853515625, 1.450439453125, 1.50238037109375, 1.5543212890625, 1.60626220703125, 1.658203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 7.0, 21.0, 9.0, 22.0, 28.0, 34.0, 44.0, 60.0, 71.0, 102.0, 139.0, 196.0, 247.0, 316.0, 451.0, 481.0, 445.0, 340.0, 242.0, 200.0, 135.0, 126.0, 90.0, 71.0, 38.0, 38.0, 22.0, 26.0, 12.0, 11.0, 7.0, 9.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.68310546875, -0.6644744873046875, -0.645843505859375, -0.6272125244140625, -0.60858154296875, -0.5899505615234375, -0.571319580078125, -0.5526885986328125, -0.5340576171875, -0.5154266357421875, -0.496795654296875, -0.4781646728515625, -0.45953369140625, -0.4409027099609375, -0.422271728515625, -0.4036407470703125, -0.385009765625, -0.3663787841796875, -0.347747802734375, -0.3291168212890625, -0.31048583984375, -0.2918548583984375, -0.273223876953125, -0.2545928955078125, -0.2359619140625, -0.2173309326171875, -0.198699951171875, -0.1800689697265625, -0.16143798828125, -0.1428070068359375, -0.124176025390625, -0.1055450439453125, -0.0869140625, -0.0682830810546875, -0.049652099609375, -0.0310211181640625, -0.01239013671875, 0.0062408447265625, 0.024871826171875, 0.0435028076171875, 0.0621337890625, 0.0807647705078125, 0.099395751953125, 0.1180267333984375, 0.13665771484375, 0.1552886962890625, 0.173919677734375, 0.1925506591796875, 0.211181640625, 0.2298126220703125, 0.248443603515625, 0.2670745849609375, 0.28570556640625, 0.3043365478515625, 0.322967529296875, 0.3415985107421875, 0.3602294921875, 0.3788604736328125, 0.397491455078125, 0.4161224365234375, 0.43475341796875, 0.4533843994140625, 0.472015380859375, 0.4906463623046875, 0.50927734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 10.0, 14.0, 28.0, 48.0, 105.0, 181.0, 210.0, 157.0, 98.0, 44.0, 35.0, 20.0, 14.0, 13.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.362655639648438, -10.053583145141602, -9.744510650634766, -9.43543815612793, -9.126365661621094, -8.817293167114258, -8.508220672607422, -8.199148178100586, -7.890076160430908, -7.581003665924072, -7.271931171417236, -6.9628586769104, -6.653786659240723, -6.344714164733887, -6.035641670227051, -5.726569175720215, -5.417496681213379, -5.108424186706543, -4.799351692199707, -4.490279197692871, -4.181206703186035, -3.8721344470977783, -3.5630621910095215, -3.2539896965026855, -2.9449172019958496, -2.6358447074890137, -2.3267722129821777, -2.017699956893921, -1.708627462387085, -1.399554967880249, -1.0904825925827026, -0.7814102172851562, -0.4723367691040039, -0.16326433420181274, 0.14580810070037842, 0.4548805356025696, 0.7639529705047607, 1.0730254650115967, 1.382097840309143, 1.6911702156066895, 2.0002427101135254, 2.3093152046203613, 2.6183876991271973, 2.927459955215454, 3.23653244972229, 3.545604944229126, 3.854677200317383, 4.163749694824219, 4.472822189331055, 4.781894683837891, 5.090967178344727, 5.4000396728515625, 5.709112167358398, 6.018184661865234, 6.327256679534912, 6.636329174041748, 6.945401668548584, 7.25447416305542, 7.563546657562256, 7.872619152069092, 8.18169116973877, 8.490763664245605, 8.799836158752441, 9.108908653259277, 9.417981147766113]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 4.0, 10.0, 9.0, 8.0, 12.0, 11.0, 10.0, 21.0, 17.0, 24.0, 27.0, 32.0, 38.0, 33.0, 40.0, 40.0, 52.0, 50.0, 50.0, 53.0, 45.0, 52.0, 46.0, 45.0, 32.0, 39.0, 25.0, 18.0, 20.0, 25.0, 6.0, 16.0, 17.0, 8.0, 9.0, 12.0, 9.0, 3.0, 10.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.583139419555664, -3.4764435291290283, -3.3697476387023926, -3.263051986694336, -3.1563560962677, -3.0496602058410645, -2.9429643154144287, -2.836268424987793, -2.7295725345611572, -2.6228766441345215, -2.5161807537078857, -2.40948486328125, -2.3027892112731934, -2.1960933208465576, -2.089397430419922, -1.9827015399932861, -1.87600576877594, -1.7693098783493042, -1.662614107131958, -1.5559182167053223, -1.4492223262786865, -1.3425264358520508, -1.2358306646347046, -1.1291347742080688, -1.0224390029907227, -0.9157431721687317, -0.809047281742096, -0.702351450920105, -0.5956555604934692, -0.48895972967147827, -0.3822638988494873, -0.27556800842285156, -0.16887211799621582, -0.06217626482248306, 0.044519588351249695, 0.15121543407440186, 0.2579112946987152, 0.36460715532302856, 0.47130298614501953, 0.5779988765716553, 0.6846947073936462, 0.7913905382156372, 0.898086428642273, 1.0047821998596191, 1.1114780902862549, 1.2181739807128906, 1.3248698711395264, 1.431565761566162, 1.5382615327835083, 1.644957423210144, 1.7516531944274902, 1.858349084854126, 1.9650449752807617, 2.0717408657073975, 2.178436756134033, 2.28513240814209, 2.3918282985687256, 2.4985241889953613, 2.605220079421997, 2.711915969848633, 2.8186116218566895, 2.925307512283325, 3.032003402709961, 3.1386992931365967, 3.2453951835632324]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 11.0, 17.0, 23.0, 37.0, 43.0, 72.0, 123.0, 155.0, 247.0, 416.0, 730.0, 1356.0, 2628.0, 5793.0, 13900.0, 42591.0, 179135.0, 606905.0, 136839.0, 34918.0, 12131.0, 5153.0, 2364.0, 1179.0, 674.0, 386.0, 241.0, 176.0, 99.0, 55.0, 43.0, 21.0, 27.0, 16.0, 9.0, 11.0, 7.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.36556243896484375, -0.3539276123046875, -0.34229278564453125, -0.330657958984375, -0.31902313232421875, -0.3073883056640625, -0.29575347900390625, -0.28411865234375, -0.27248382568359375, -0.2608489990234375, -0.24921417236328125, -0.237579345703125, -0.22594451904296875, -0.2143096923828125, -0.20267486572265625, -0.1910400390625, -0.17940521240234375, -0.1677703857421875, -0.15613555908203125, -0.144500732421875, -0.13286590576171875, -0.1212310791015625, -0.10959625244140625, -0.09796142578125, -0.08632659912109375, -0.0746917724609375, -0.06305694580078125, -0.051422119140625, -0.03978729248046875, -0.0281524658203125, -0.01651763916015625, -0.0048828125, 0.00675201416015625, 0.0183868408203125, 0.03002166748046875, 0.041656494140625, 0.05329132080078125, 0.0649261474609375, 0.07656097412109375, 0.08819580078125, 0.09983062744140625, 0.1114654541015625, 0.12310028076171875, 0.134735107421875, 0.14636993408203125, 0.1580047607421875, 0.16963958740234375, 0.1812744140625, 0.19290924072265625, 0.2045440673828125, 0.21617889404296875, 0.227813720703125, 0.23944854736328125, 0.2510833740234375, 0.26271820068359375, 0.27435302734375, 0.28598785400390625, 0.2976226806640625, 0.30925750732421875, 0.320892333984375, 0.33252716064453125, 0.3441619873046875, 0.35579681396484375, 0.367431640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 16.0, 21.0, 24.0, 25.0, 28.0, 38.0, 40.0, 40.0, 53.0, 54.0, 67.0, 60.0, 80.0, 59.0, 46.0, 47.0, 46.0, 42.0, 36.0, 36.0, 29.0, 24.0, 21.0, 16.0, 10.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.403564453125, -0.39208984375, -0.380615234375, -0.369140625, -0.357666015625, -0.34619140625, -0.334716796875, -0.3232421875, -0.311767578125, -0.30029296875, -0.288818359375, -0.27734375, -0.265869140625, -0.25439453125, -0.242919921875, -0.2314453125, -0.219970703125, -0.20849609375, -0.197021484375, -0.185546875, -0.174072265625, -0.16259765625, -0.151123046875, -0.1396484375, -0.128173828125, -0.11669921875, -0.105224609375, -0.09375, -0.082275390625, -0.07080078125, -0.059326171875, -0.0478515625, -0.036376953125, -0.02490234375, -0.013427734375, -0.001953125, 0.009521484375, 0.02099609375, 0.032470703125, 0.0439453125, 0.055419921875, 0.06689453125, 0.078369140625, 0.08984375, 0.101318359375, 0.11279296875, 0.124267578125, 0.1357421875, 0.147216796875, 0.15869140625, 0.170166015625, 0.181640625, 0.193115234375, 0.20458984375, 0.216064453125, 0.2275390625, 0.239013671875, 0.25048828125, 0.261962890625, 0.2734375, 0.284912109375, 0.29638671875, 0.307861328125, 0.3193359375, 0.330810546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 14.0, 19.0, 19.0, 35.0, 49.0, 98.0, 122.0, 235.0, 397.0, 866.0, 2148.0, 7630.0, 46927.0, 874408.0, 97309.0, 12731.0, 3153.0, 1158.0, 497.0, 253.0, 163.0, 96.0, 63.0, 43.0, 31.0, 26.0, 13.0, 9.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56689453125, -0.54840087890625, -0.5299072265625, -0.51141357421875, -0.492919921875, -0.47442626953125, -0.4559326171875, -0.43743896484375, -0.4189453125, -0.40045166015625, -0.3819580078125, -0.36346435546875, -0.344970703125, -0.32647705078125, -0.3079833984375, -0.28948974609375, -0.27099609375, -0.25250244140625, -0.2340087890625, -0.21551513671875, -0.197021484375, -0.17852783203125, -0.1600341796875, -0.14154052734375, -0.123046875, -0.10455322265625, -0.0860595703125, -0.06756591796875, -0.049072265625, -0.03057861328125, -0.0120849609375, 0.00640869140625, 0.02490234375, 0.04339599609375, 0.0618896484375, 0.08038330078125, 0.098876953125, 0.11737060546875, 0.1358642578125, 0.15435791015625, 0.1728515625, 0.19134521484375, 0.2098388671875, 0.22833251953125, 0.246826171875, 0.26531982421875, 0.2838134765625, 0.30230712890625, 0.32080078125, 0.33929443359375, 0.3577880859375, 0.37628173828125, 0.394775390625, 0.41326904296875, 0.4317626953125, 0.45025634765625, 0.46875, 0.48724365234375, 0.5057373046875, 0.52423095703125, 0.542724609375, 0.56121826171875, 0.5797119140625, 0.59820556640625, 0.61669921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 12.0, 13.0, 6.0, 15.0, 17.0, 17.0, 21.0, 35.0, 25.0, 38.0, 38.0, 52.0, 83.0, 90.0, 89.0, 72.0, 55.0, 52.0, 39.0, 41.0, 32.0, 19.0, 20.0, 19.0, 14.0, 16.0, 10.0, 7.0, 15.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3564453125, -1.3155364990234375, -1.274627685546875, -1.2337188720703125, -1.19281005859375, -1.1519012451171875, -1.110992431640625, -1.0700836181640625, -1.0291748046875, -0.9882659912109375, -0.947357177734375, -0.9064483642578125, -0.86553955078125, -0.8246307373046875, -0.783721923828125, -0.7428131103515625, -0.701904296875, -0.6609954833984375, -0.620086669921875, -0.5791778564453125, -0.53826904296875, -0.4973602294921875, -0.456451416015625, -0.4155426025390625, -0.3746337890625, -0.3337249755859375, -0.292816162109375, -0.2519073486328125, -0.21099853515625, -0.1700897216796875, -0.129180908203125, -0.0882720947265625, -0.04736328125, -0.0064544677734375, 0.034454345703125, 0.0753631591796875, 0.11627197265625, 0.1571807861328125, 0.198089599609375, 0.2389984130859375, 0.2799072265625, 0.3208160400390625, 0.361724853515625, 0.4026336669921875, 0.44354248046875, 0.4844512939453125, 0.525360107421875, 0.5662689208984375, 0.607177734375, 0.6480865478515625, 0.688995361328125, 0.7299041748046875, 0.77081298828125, 0.8117218017578125, 0.852630615234375, 0.8935394287109375, 0.9344482421875, 0.9753570556640625, 1.016265869140625, 1.0571746826171875, 1.09808349609375, 1.1389923095703125, 1.179901123046875, 1.2208099365234375, 1.26171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 14.0, 24.0, 18.0, 36.0, 59.0, 99.0, 158.0, 247.0, 445.0, 1062.0, 2515.0, 8113.0, 34419.0, 753326.0, 211347.0, 26255.0, 6438.0, 2089.0, 843.0, 400.0, 185.0, 146.0, 93.0, 57.0, 41.0, 27.0, 17.0, 11.0, 17.0, 10.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09893798828125, -0.09573745727539062, -0.09253692626953125, -0.08933639526367188, -0.0861358642578125, -0.08293533325195312, -0.07973480224609375, -0.07653427124023438, -0.073333740234375, -0.07013320922851562, -0.06693267822265625, -0.06373214721679688, -0.0605316162109375, -0.057331085205078125, -0.05413055419921875, -0.050930023193359375, -0.0477294921875, -0.044528961181640625, -0.04132843017578125, -0.038127899169921875, -0.0349273681640625, -0.031726837158203125, -0.02852630615234375, -0.025325775146484375, -0.022125244140625, -0.018924713134765625, -0.01572418212890625, -0.012523651123046875, -0.0093231201171875, -0.006122589111328125, -0.00292205810546875, 0.000278472900390625, 0.00347900390625, 0.006679534912109375, 0.00988006591796875, 0.013080596923828125, 0.0162811279296875, 0.019481658935546875, 0.02268218994140625, 0.025882720947265625, 0.029083251953125, 0.032283782958984375, 0.03548431396484375, 0.038684844970703125, 0.0418853759765625, 0.045085906982421875, 0.04828643798828125, 0.051486968994140625, 0.0546875, 0.057888031005859375, 0.06108856201171875, 0.06428909301757812, 0.0674896240234375, 0.07069015502929688, 0.07389068603515625, 0.07709121704101562, 0.080291748046875, 0.08349227905273438, 0.08669281005859375, 0.08989334106445312, 0.0930938720703125, 0.09629440307617188, 0.09949493408203125, 0.10269546508789062, 0.10589599609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 16.0, 9.0, 7.0, 8.0, 21.0, 15.0, 17.0, 17.0, 20.0, 36.0, 43.0, 58.0, 59.0, 66.0, 79.0, 87.0, 66.0, 59.0, 54.0, 43.0, 35.0, 24.0, 26.0, 18.0, 10.0, 6.0, 11.0, 8.0, 10.0, 6.0, 9.0, 10.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.5987625122070312e-05, -2.519134432077408e-05, -2.4395063519477844e-05, -2.359878271818161e-05, -2.2802501916885376e-05, -2.2006221115589142e-05, -2.1209940314292908e-05, -2.0413659512996674e-05, -1.961737871170044e-05, -1.8821097910404205e-05, -1.802481710910797e-05, -1.7228536307811737e-05, -1.6432255506515503e-05, -1.563597470521927e-05, -1.4839693903923035e-05, -1.40434131026268e-05, -1.3247132301330566e-05, -1.2450851500034332e-05, -1.1654570698738098e-05, -1.0858289897441864e-05, -1.006200909614563e-05, -9.265728294849396e-06, -8.469447493553162e-06, -7.673166692256927e-06, -6.876885890960693e-06, -6.080605089664459e-06, -5.284324288368225e-06, -4.488043487071991e-06, -3.691762685775757e-06, -2.8954818844795227e-06, -2.0992010831832886e-06, -1.3029202818870544e-06, -5.066394805908203e-07, 2.896413207054138e-07, 1.085922122001648e-06, 1.882202923297882e-06, 2.678483724594116e-06, 3.4747645258903503e-06, 4.2710453271865845e-06, 5.067326128482819e-06, 5.863606929779053e-06, 6.659887731075287e-06, 7.456168532371521e-06, 8.252449333667755e-06, 9.04873013496399e-06, 9.845010936260223e-06, 1.0641291737556458e-05, 1.1437572538852692e-05, 1.2233853340148926e-05, 1.303013414144516e-05, 1.3826414942741394e-05, 1.4622695744037628e-05, 1.5418976545333862e-05, 1.6215257346630096e-05, 1.701153814792633e-05, 1.7807818949222565e-05, 1.86040997505188e-05, 1.9400380551815033e-05, 2.0196661353111267e-05, 2.09929421544075e-05, 2.1789222955703735e-05, 2.258550375699997e-05, 2.3381784558296204e-05, 2.4178065359592438e-05, 2.4974346160888672e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 10.0, 18.0, 28.0, 44.0, 89.0, 172.0, 429.0, 1247.0, 4028.0, 20827.0, 830424.0, 173531.0, 13125.0, 2954.0, 967.0, 340.0, 124.0, 75.0, 35.0, 25.0, 19.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173095703125, -0.166656494140625, -0.16021728515625, -0.153778076171875, -0.1473388671875, -0.140899658203125, -0.13446044921875, -0.128021240234375, -0.12158203125, -0.115142822265625, -0.10870361328125, -0.102264404296875, -0.0958251953125, -0.089385986328125, -0.08294677734375, -0.076507568359375, -0.070068359375, -0.063629150390625, -0.05718994140625, -0.050750732421875, -0.0443115234375, -0.037872314453125, -0.03143310546875, -0.024993896484375, -0.0185546875, -0.012115478515625, -0.00567626953125, 0.000762939453125, 0.0072021484375, 0.013641357421875, 0.02008056640625, 0.026519775390625, 0.032958984375, 0.039398193359375, 0.04583740234375, 0.052276611328125, 0.0587158203125, 0.065155029296875, 0.07159423828125, 0.078033447265625, 0.08447265625, 0.090911865234375, 0.09735107421875, 0.103790283203125, 0.1102294921875, 0.116668701171875, 0.12310791015625, 0.129547119140625, 0.135986328125, 0.142425537109375, 0.14886474609375, 0.155303955078125, 0.1617431640625, 0.168182373046875, 0.17462158203125, 0.181060791015625, 0.1875, 0.193939208984375, 0.20037841796875, 0.206817626953125, 0.2132568359375, 0.219696044921875, 0.22613525390625, 0.232574462890625, 0.239013671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 10.0, 17.0, 17.0, 27.0, 27.0, 37.0, 30.0, 38.0, 65.0, 66.0, 71.0, 93.0, 81.0, 55.0, 54.0, 48.0, 50.0, 38.0, 34.0, 18.0, 14.0, 10.0, 8.0, 13.0, 4.0, 6.0, 6.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08740234375, -0.08473014831542969, -0.08205795288085938, -0.07938575744628906, -0.07671356201171875, -0.07404136657714844, -0.07136917114257812, -0.06869697570800781, -0.0660247802734375, -0.06335258483886719, -0.060680389404296875, -0.05800819396972656, -0.05533599853515625, -0.05266380310058594, -0.049991607666015625, -0.04731941223144531, -0.044647216796875, -0.04197502136230469, -0.039302825927734375, -0.03663063049316406, -0.03395843505859375, -0.03128623962402344, -0.028614044189453125, -0.025941848754882812, -0.0232696533203125, -0.020597457885742188, -0.017925262451171875, -0.015253067016601562, -0.01258087158203125, -0.009908676147460938, -0.007236480712890625, -0.0045642852783203125, -0.00189208984375, 0.0007801055908203125, 0.003452301025390625, 0.0061244964599609375, 0.00879669189453125, 0.011468887329101562, 0.014141082763671875, 0.016813278198242188, 0.0194854736328125, 0.022157669067382812, 0.024829864501953125, 0.027502059936523438, 0.03017425537109375, 0.03284645080566406, 0.035518646240234375, 0.03819084167480469, 0.040863037109375, 0.04353523254394531, 0.046207427978515625, 0.04887962341308594, 0.05155181884765625, 0.05422401428222656, 0.056896209716796875, 0.05956840515136719, 0.0622406005859375, 0.06491279602050781, 0.06758499145507812, 0.07025718688964844, 0.07292938232421875, 0.07560157775878906, 0.07827377319335938, 0.08094596862792969, 0.0836181640625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 9.0, 13.0, 31.0, 72.0, 189.0, 442.0, 120.0, 49.0, 40.0, 17.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.835155963897705, -5.654603481292725, -5.474050521850586, -5.2934980392456055, -5.112945556640625, -4.9323930740356445, -4.751840114593506, -4.571287631988525, -4.390734672546387, -4.210182189941406, -4.029629230499268, -3.849076747894287, -3.6685242652893066, -3.487971544265747, -3.3074188232421875, -3.126866340637207, -2.9463138580322266, -2.765761137008667, -2.5852086544036865, -2.404655933380127, -2.2241034507751465, -2.043550729751587, -1.8629980087280273, -1.6824454069137573, -1.5018928050994873, -1.3213402032852173, -1.1407876014709473, -0.9602348804473877, -0.7796822786331177, -0.5991296768188477, -0.4185769557952881, -0.23802435398101807, -0.05747222900390625, 0.12308040261268616, 0.30363303422927856, 0.48418569564819336, 0.6647382974624634, 0.8452908992767334, 1.025843620300293, 1.206396222114563, 1.386948823928833, 1.567501425743103, 1.748054027557373, 1.9286067485809326, 2.109159469604492, 2.2897119522094727, 2.4702646732330322, 2.650817394256592, 2.8313698768615723, 3.011922597885132, 3.1924750804901123, 3.373027801513672, 3.5535802841186523, 3.734133005142212, 3.9146857261657715, 4.095238208770752, 4.275791168212891, 4.456343650817871, 4.63689661026001, 4.81744909286499, 4.998001575469971, 5.178554534912109, 5.35910701751709, 5.53965950012207, 5.720211982727051]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 5.0, 13.0, 12.0, 9.0, 18.0, 15.0, 16.0, 11.0, 15.0, 19.0, 21.0, 32.0, 40.0, 72.0, 88.0, 114.0, 126.0, 76.0, 58.0, 32.0, 19.0, 17.0, 21.0, 15.0, 13.0, 13.0, 18.0, 12.0, 7.0, 17.0, 2.0, 9.0, 4.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.700096845626831, -2.6126434803009033, -2.5251901149749756, -2.437736749649048, -2.35028338432312, -2.2628297805786133, -2.1753764152526855, -2.087923049926758, -2.00046968460083, -1.9130163192749023, -1.8255629539489746, -1.7381095886230469, -1.6506561040878296, -1.5632027387619019, -1.4757493734359741, -1.3882958889007568, -1.3008426427841187, -1.213389277458191, -1.1259359121322632, -1.038482427597046, -0.9510290622711182, -0.8635756969451904, -0.7761223316192627, -0.6886689066886902, -0.6012155413627625, -0.5137621760368347, -0.4263087511062622, -0.3388553857803345, -0.25140199065208435, -0.16394859552383423, -0.0764952301979065, 0.010958194732666016, 0.09841156005859375, 0.18586495518684387, 0.273318350315094, 0.36077171564102173, 0.44822511076927185, 0.535678505897522, 0.6231318712234497, 0.7105852961540222, 0.79803866147995, 0.8854920268058777, 0.9729454517364502, 1.060398817062378, 1.1478521823883057, 1.2353055477142334, 1.3227589130401611, 1.4102123975753784, 1.4976657629013062, 1.5851191282272339, 1.6725724935531616, 1.760025978088379, 1.8474793434143066, 1.9349327087402344, 2.022386074066162, 2.10983943939209, 2.1972928047180176, 2.2847461700439453, 2.372199535369873, 2.459652900695801, 2.5471062660217285, 2.6345596313476562, 2.722012996673584, 2.809466600418091, 2.8969199657440186]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 12.0, 10.0, 16.0, 12.0, 16.0, 27.0, 25.0, 26.0, 34.0, 33.0, 41.0, 75.0, 173.0, 135.0, 64.0, 50.0, 22.0, 25.0, 22.0, 22.0, 16.0, 14.0, 18.0, 17.0, 17.0, 7.0, 8.0, 10.0, 2.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.34130859375, -0.3315086364746094, -0.32170867919921875, -0.3119087219238281, -0.3021087646484375, -0.2923088073730469, -0.28250885009765625, -0.2727088928222656, -0.262908935546875, -0.2531089782714844, -0.24330902099609375, -0.23350906372070312, -0.2237091064453125, -0.21390914916992188, -0.20410919189453125, -0.19430923461914062, -0.18450927734375, -0.17470932006835938, -0.16490936279296875, -0.15510940551757812, -0.1453094482421875, -0.13550949096679688, -0.12570953369140625, -0.11590957641601562, -0.106109619140625, -0.09630966186523438, -0.08650970458984375, -0.07670974731445312, -0.0669097900390625, -0.057109832763671875, -0.04730987548828125, -0.037509918212890625, -0.0277099609375, -0.017910003662109375, -0.00811004638671875, 0.001689910888671875, 0.0114898681640625, 0.021289825439453125, 0.03108978271484375, 0.040889739990234375, 0.050689697265625, 0.060489654541015625, 0.07028961181640625, 0.08008956909179688, 0.0898895263671875, 0.09968948364257812, 0.10948944091796875, 0.11928939819335938, 0.12908935546875, 0.13888931274414062, 0.14868927001953125, 0.15848922729492188, 0.1682891845703125, 0.17808914184570312, 0.18788909912109375, 0.19768905639648438, 0.207489013671875, 0.21728897094726562, 0.22708892822265625, 0.23688888549804688, 0.2466888427734375, 0.2564888000488281, 0.26628875732421875, 0.2760887145996094, 0.285888671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 13.0, 30.0, 27.0, 43.0, 86.0, 163.0, 309.0, 920.0, 3025.0, 16804.0, 8334188.0, 27081.0, 4050.0, 1034.0, 366.0, 189.0, 81.0, 39.0, 42.0, 24.0, 12.0, 11.0, 5.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.7938287258148193, -2.723268508911133, -2.6527082920074463, -2.5821480751037598, -2.5115878582000732, -2.4410276412963867, -2.3704674243927, -2.2999072074890137, -2.229346752166748, -2.1587865352630615, -2.088226318359375, -2.0176661014556885, -1.947105884552002, -1.8765456676483154, -1.8059853315353394, -1.7354251146316528, -1.6648650169372559, -1.5943048000335693, -1.5237445831298828, -1.4531843662261963, -1.3826241493225098, -1.3120639324188232, -1.2415035963058472, -1.1709433794021606, -1.1003831624984741, -1.0298229455947876, -0.9592627286911011, -0.8887024521827698, -0.8181422352790833, -0.7475820183753967, -0.6770217418670654, -0.6064615249633789, -0.5359013080596924, -0.46534109115600586, -0.39478084444999695, -0.32422059774398804, -0.2536603808403015, -0.183100163936615, -0.11253991723060608, -0.04197967052459717, 0.028580546379089355, 0.09914077818393707, 0.1697010099887848, 0.2402612417936325, 0.3108214735984802, 0.38138169050216675, 0.45194193720817566, 0.5225021839141846, 0.5930624008178711, 0.6636226177215576, 0.7341828346252441, 0.8047431111335754, 0.875303328037262, 0.9458635449409485, 1.0164238214492798, 1.0869840383529663, 1.1575442552566528, 1.2281044721603394, 1.2986646890640259, 1.3692249059677124, 1.4397852420806885, 1.510345458984375, 1.5809056758880615, 1.651465892791748, 1.7220261096954346]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.462428092956543, -2.3887715339660645, -2.315114974975586, -2.2414584159851074, -2.167801856994629, -2.0941450595855713, -2.0204885005950928, -1.9468319416046143, -1.8731753826141357, -1.7995188236236572, -1.7258622646331787, -1.6522055864334106, -1.5785490274429321, -1.5048924684524536, -1.4312357902526855, -1.357579231262207, -1.2839226722717285, -1.21026611328125, -1.1366095542907715, -1.0629528760910034, -0.9892963171005249, -0.9156397581100464, -0.8419831395149231, -0.7683265209197998, -0.6946699619293213, -0.6210134029388428, -0.5473567843437195, -0.4737001955509186, -0.4000436067581177, -0.3263870179653168, -0.25273042917251587, -0.17907381057739258, -0.10541725158691406, -0.03176066279411316, 0.041895925998687744, 0.11555251479148865, 0.18920910358428955, 0.26286569237709045, 0.33652228116989136, 0.41017889976501465, 0.48383545875549316, 0.5574920177459717, 0.631148636341095, 0.7048052549362183, 0.7784618139266968, 0.8521183729171753, 0.9257749915122986, 0.9994316101074219, 1.0730881690979004, 1.146744728088379, 1.2204012870788574, 1.2940579652786255, 1.367714524269104, 1.4413710832595825, 1.5150277614593506, 1.588684320449829, 1.6623408794403076, 1.7359974384307861, 1.8096539974212646, 1.8833106756210327, 1.9569672346115112, 2.0306239128112793, 2.104280471801758, 2.1779370307922363, 2.251593589782715]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 6.0, 17.0, 17.0, 21.0, 21.0, 28.0, 30.0, 40.0, 51.0, 40.0, 45.0, 56.0, 57.0, 73.0, 64.0, 53.0, 39.0, 61.0, 45.0, 43.0, 35.0, 23.0, 18.0, 17.0, 21.0, 13.0, 14.0, 7.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.282958984375, -0.27495574951171875, -0.2669525146484375, -0.25894927978515625, -0.250946044921875, -0.24294281005859375, -0.2349395751953125, -0.22693634033203125, -0.21893310546875, -0.21092987060546875, -0.2029266357421875, -0.19492340087890625, -0.186920166015625, -0.17891693115234375, -0.1709136962890625, -0.16291046142578125, -0.1549072265625, -0.14690399169921875, -0.1389007568359375, -0.13089752197265625, -0.122894287109375, -0.11489105224609375, -0.1068878173828125, -0.09888458251953125, -0.09088134765625, -0.08287811279296875, -0.0748748779296875, -0.06687164306640625, -0.058868408203125, -0.05086517333984375, -0.0428619384765625, -0.03485870361328125, -0.02685546875, -0.01885223388671875, -0.0108489990234375, -0.00284576416015625, 0.005157470703125, 0.01316070556640625, 0.0211639404296875, 0.02916717529296875, 0.03717041015625, 0.04517364501953125, 0.0531768798828125, 0.06118011474609375, 0.069183349609375, 0.07718658447265625, 0.0851898193359375, 0.09319305419921875, 0.1011962890625, 0.10919952392578125, 0.1172027587890625, 0.12520599365234375, 0.133209228515625, 0.14121246337890625, 0.1492156982421875, 0.15721893310546875, 0.16522216796875, 0.17322540283203125, 0.1812286376953125, 0.18923187255859375, 0.197235107421875, 0.20523834228515625, 0.2132415771484375, 0.22124481201171875, 0.229248046875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 17.0, 15.0, 26.0, 35.0, 41.0, 86.0, 157.0, 281.0, 501.0, 963.0, 2150.0, 5533.0, 14922.0, 45060.0, 139478.0, 197741.0, 77454.0, 24908.0, 8830.0, 3283.0, 1305.0, 661.0, 329.0, 185.0, 110.0, 54.0, 41.0, 26.0, 17.0, 11.0, 15.0, 3.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.291015625, -2.227783203125, -2.16455078125, -2.101318359375, -2.0380859375, -1.974853515625, -1.91162109375, -1.848388671875, -1.78515625, -1.721923828125, -1.65869140625, -1.595458984375, -1.5322265625, -1.468994140625, -1.40576171875, -1.342529296875, -1.279296875, -1.216064453125, -1.15283203125, -1.089599609375, -1.0263671875, -0.963134765625, -0.89990234375, -0.836669921875, -0.7734375, -0.710205078125, -0.64697265625, -0.583740234375, -0.5205078125, -0.457275390625, -0.39404296875, -0.330810546875, -0.267578125, -0.204345703125, -0.14111328125, -0.077880859375, -0.0146484375, 0.048583984375, 0.11181640625, 0.175048828125, 0.23828125, 0.301513671875, 0.36474609375, 0.427978515625, 0.4912109375, 0.554443359375, 0.61767578125, 0.680908203125, 0.744140625, 0.807373046875, 0.87060546875, 0.933837890625, 0.9970703125, 1.060302734375, 1.12353515625, 1.186767578125, 1.25, 1.313232421875, 1.37646484375, 1.439697265625, 1.5029296875, 1.566162109375, 1.62939453125, 1.692626953125, 1.755859375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 2.0, 12.0, 6.0, 9.0, 11.0, 22.0, 18.0, 18.0, 18.0, 19.0, 29.0, 25.0, 37.0, 42.0, 47.0, 58.0, 46.0, 45.0, 43.0, 52.0, 45.0, 45.0, 41.0, 39.0, 33.0, 24.0, 32.0, 34.0, 25.0, 18.0, 19.0, 18.0, 12.0, 7.0, 12.0, 4.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2279052734375, -0.22067832946777344, -0.21345138549804688, -0.2062244415283203, -0.19899749755859375, -0.1917705535888672, -0.18454360961914062, -0.17731666564941406, -0.1700897216796875, -0.16286277770996094, -0.15563583374023438, -0.1484088897705078, -0.14118194580078125, -0.1339550018310547, -0.12672805786132812, -0.11950111389160156, -0.112274169921875, -0.10504722595214844, -0.09782028198242188, -0.09059333801269531, -0.08336639404296875, -0.07613945007324219, -0.06891250610351562, -0.06168556213378906, -0.0544586181640625, -0.04723167419433594, -0.040004730224609375, -0.03277778625488281, -0.02555084228515625, -0.018323898315429688, -0.011096954345703125, -0.0038700103759765625, 0.00335693359375, 0.010583877563476562, 0.017810821533203125, 0.025037765502929688, 0.03226470947265625, 0.03949165344238281, 0.046718597412109375, 0.05394554138183594, 0.0611724853515625, 0.06839942932128906, 0.07562637329101562, 0.08285331726074219, 0.09008026123046875, 0.09730720520019531, 0.10453414916992188, 0.11176109313964844, 0.118988037109375, 0.12621498107910156, 0.13344192504882812, 0.1406688690185547, 0.14789581298828125, 0.1551227569580078, 0.16234970092773438, 0.16957664489746094, 0.1768035888671875, 0.18403053283691406, 0.19125747680664062, 0.1984844207763672, 0.20571136474609375, 0.2129383087158203, 0.22016525268554688, 0.22739219665527344, 0.234619140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 6.0, 8.0, 10.0, 21.0, 39.0, 75.0, 86.0, 83.0, 52.0, 36.0, 7.0, 11.0, 10.0, 3.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4071333408355713, -2.3411073684692383, -2.275081157684326, -2.209055185317993, -2.14302921295166, -2.077003240585327, -2.010977268218994, -1.944951057434082, -1.878925085067749, -1.812899112701416, -1.7468730211257935, -1.680846929550171, -1.614820957183838, -1.5487949848175049, -1.4827688932418823, -1.4167428016662598, -1.3507168292999268, -1.2846908569335938, -1.2186647653579712, -1.1526386737823486, -1.0866127014160156, -1.0205867290496826, -0.9545606374740601, -0.8885346055030823, -0.8225085735321045, -0.7564825415611267, -0.6904565095901489, -0.6244304776191711, -0.5584044456481934, -0.4923784136772156, -0.4263523817062378, -0.36032634973526, -0.29430055618286133, -0.22827452421188354, -0.16224849224090576, -0.09622246026992798, -0.030196428298950195, 0.03582960367202759, 0.10185563564300537, 0.16788166761398315, 0.23390769958496094, 0.2999337315559387, 0.3659597635269165, 0.4319857954978943, 0.49801182746887207, 0.5640378594398499, 0.6300638914108276, 0.6960899233818054, 0.7621159553527832, 0.828141987323761, 0.8941680192947388, 0.9601940512657166, 1.0262200832366943, 1.0922460556030273, 1.15827214717865, 1.2242982387542725, 1.2903242111206055, 1.3563501834869385, 1.422376275062561, 1.4884023666381836, 1.5544283390045166, 1.6204543113708496, 1.6864804029464722, 1.7525064945220947, 1.8185324668884277]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 2.0, 9.0, 21.0, 40.0, 51.0, 83.0, 79.0, 58.0, 31.0, 20.0, 9.0, 11.0, 5.0, 5.0, 1.0, 8.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.291684627532959, -2.2347826957702637, -2.1778810024261475, -2.120979070663452, -2.064077138900757, -2.0071754455566406, -1.9502735137939453, -1.89337158203125, -1.8364697694778442, -1.7795679569244385, -1.7226660251617432, -1.6657642126083374, -1.6088624000549316, -1.5519604682922363, -1.4950586557388306, -1.4381568431854248, -1.3812549114227295, -1.3243530988693237, -1.2674511671066284, -1.2105493545532227, -1.1536474227905273, -1.0967456102371216, -1.0398437976837158, -0.9829419255256653, -0.9260400533676147, -0.8691381812095642, -0.8122363090515137, -0.7553344964981079, -0.6984326243400574, -0.6415307521820068, -0.5846289396286011, -0.5277270674705505, -0.47082507610321045, -0.4139232039451599, -0.35702136158943176, -0.3001195192337036, -0.24321764707565308, -0.18631577491760254, -0.1294139325618744, -0.07251209020614624, -0.015610218048095703, 0.04129163920879364, 0.09819349646568298, 0.15509535372257233, 0.21199721097946167, 0.2688990831375122, 0.32580092549324036, 0.3827027678489685, 0.43960464000701904, 0.4965065121650696, 0.5534083843231201, 0.6103101968765259, 0.6672120690345764, 0.724113941192627, 0.7810157537460327, 0.8379176259040833, 0.8948194980621338, 0.9517213702201843, 1.0086232423782349, 1.0655250549316406, 1.122426986694336, 1.1793287992477417, 1.2362306118011475, 1.2931325435638428, 1.3500343561172485]}, "eval/loss": 0.32974740862846375, "eval/wer": 0.09492264974216581, "eval/runtime": 555.2371, "eval/samples_per_second": 4.758, "eval/steps_per_second": 0.596} \ No newline at end of file +{"train/loss": 0.0607, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 5.0, "train/global_step": 2230, "_runtime": 26664, "_timestamp": 1648081418, "_step": 2234, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 68.0, 378.0, 461.0, 73.0, 23.0, 5.0], "bins": [-18.02739143371582, -17.72731590270996, -17.4272403717041, -17.127166748046875, -16.827091217041016, -16.527015686035156, -16.226940155029297, -15.926865577697754, -15.626791000366211, -15.326715469360352, -15.026640892028809, -14.72656536102295, -14.426490783691406, -14.126415252685547, -13.826340675354004, -13.526265144348145, -13.226189613342285, -12.926114082336426, -12.626039505004883, -12.325963973999023, -12.02588939666748, -11.725813865661621, -11.425739288330078, -11.125663757324219, -10.82558822631836, -10.5255126953125, -10.225438117980957, -9.925362586975098, -9.625288009643555, -9.325212478637695, -9.025137901306152, -8.725062370300293, -8.42498779296875, -8.12491226196289, -7.824837684631348, -7.5247626304626465, -7.224687576293945, -6.924612045288086, -6.624536991119385, -6.324461936950684, -6.024386882781982, -5.724311828613281, -5.42423677444458, -5.124161720275879, -4.8240861892700195, -4.524011611938477, -4.223936080932617, -3.923861026763916, -3.623785972595215, -3.3237109184265137, -3.0236358642578125, -2.7235605716705322, -2.423485517501831, -2.12341046333313, -1.8233352899551392, -1.5232601165771484, -1.2231850624084473, -0.9231099486351013, -0.6230348348617554, -0.3229597210884094, -0.022884607315063477, 0.2771904468536377, 0.5772656202316284, 0.8773407936096191, 1.1774158477783203]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 11.0, 14.0, 14.0, 20.0, 26.0, 20.0, 29.0, 30.0, 47.0, 41.0, 36.0, 27.0, 36.0, 39.0, 42.0, 64.0, 43.0, 57.0, 43.0, 37.0, 54.0, 40.0, 31.0, 31.0, 27.0, 24.0, 22.0, 22.0, 21.0, 7.0, 10.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5585064888000488, -1.5144308805465698, -1.4703552722930908, -1.4262796640396118, -1.3822040557861328, -1.3381283283233643, -1.2940528392791748, -1.2499771118164062, -1.2059015035629272, -1.1618258953094482, -1.1177502870559692, -1.0736746788024902, -1.0295990705490112, -0.9855234026908875, -0.9414477944374084, -0.8973721265792847, -0.8532965779304504, -0.8092209696769714, -0.7651453614234924, -0.7210696935653687, -0.6769940853118896, -0.6329184770584106, -0.5888428688049316, -0.5447672605514526, -0.5006916522979736, -0.45661604404449463, -0.41254040598869324, -0.36846479773521423, -0.32438915967941284, -0.28031355142593384, -0.23623794317245483, -0.19216230511665344, -0.14808666706085205, -0.10401104390621185, -0.05993542820215225, -0.01585981249809265, 0.028215810656547546, 0.07229143381118774, 0.11636704206466675, 0.16044268012046814, 0.20451828837394714, 0.24859391152858734, 0.29266953468322754, 0.33674514293670654, 0.38082075119018555, 0.42489638924598694, 0.46897199749946594, 0.5130476355552673, 0.5571232438087463, 0.6011988520622253, 0.6452744603157043, 0.6893501281738281, 0.7334257364273071, 0.7775013446807861, 0.8215769529342651, 0.8656525611877441, 0.9097281694412231, 0.9538037776947021, 0.9978793859481812, 1.0419549942016602, 1.0860306024551392, 1.1301062107086182, 1.1741819381713867, 1.2182575464248657, 1.2623331546783447]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 15.0, 18.0, 25.0, 39.0, 64.0, 77.0, 122.0, 168.0, 265.0, 409.0, 597.0, 977.0, 1516.0, 2377.0, 3912.0, 7508.0, 26892.0, 350221.0, 3272449.0, 467680.0, 39875.0, 8556.0, 4066.0, 2386.0, 1466.0, 911.0, 571.0, 376.0, 238.0, 168.0, 115.0, 81.0, 39.0, 27.0, 22.0, 20.0, 7.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.497314453125, -4.35009765625, -4.202880859375, -4.0556640625, -3.908447265625, -3.76123046875, -3.614013671875, -3.466796875, -3.319580078125, -3.17236328125, -3.025146484375, -2.8779296875, -2.730712890625, -2.58349609375, -2.436279296875, -2.2890625, -2.141845703125, -1.99462890625, -1.847412109375, -1.7001953125, -1.552978515625, -1.40576171875, -1.258544921875, -1.111328125, -0.964111328125, -0.81689453125, -0.669677734375, -0.5224609375, -0.375244140625, -0.22802734375, -0.080810546875, 0.06640625, 0.213623046875, 0.36083984375, 0.508056640625, 0.6552734375, 0.802490234375, 0.94970703125, 1.096923828125, 1.244140625, 1.391357421875, 1.53857421875, 1.685791015625, 1.8330078125, 1.980224609375, 2.12744140625, 2.274658203125, 2.421875, 2.569091796875, 2.71630859375, 2.863525390625, 3.0107421875, 3.157958984375, 3.30517578125, 3.452392578125, 3.599609375, 3.746826171875, 3.89404296875, 4.041259765625, 4.1884765625, 4.335693359375, 4.48291015625, 4.630126953125, 4.77734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 8.0, 8.0, 12.0, 9.0, 15.0, 17.0, 23.0, 21.0, 27.0, 31.0, 29.0, 33.0, 34.0, 27.0, 40.0, 35.0, 35.0, 55.0, 54.0, 52.0, 42.0, 45.0, 38.0, 34.0, 50.0, 24.0, 26.0, 26.0, 29.0, 12.0, 17.0, 22.0, 13.0, 6.0, 10.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0], "bins": [-2.458984375, -2.390777587890625, -2.32257080078125, -2.254364013671875, -2.1861572265625, -2.117950439453125, -2.04974365234375, -1.981536865234375, -1.913330078125, -1.845123291015625, -1.77691650390625, -1.708709716796875, -1.6405029296875, -1.572296142578125, -1.50408935546875, -1.435882568359375, -1.36767578125, -1.299468994140625, -1.23126220703125, -1.163055419921875, -1.0948486328125, -1.026641845703125, -0.95843505859375, -0.890228271484375, -0.822021484375, -0.753814697265625, -0.68560791015625, -0.617401123046875, -0.5491943359375, -0.480987548828125, -0.41278076171875, -0.344573974609375, -0.2763671875, -0.208160400390625, -0.13995361328125, -0.071746826171875, -0.0035400390625, 0.064666748046875, 0.13287353515625, 0.201080322265625, 0.269287109375, 0.337493896484375, 0.40570068359375, 0.473907470703125, 0.5421142578125, 0.610321044921875, 0.67852783203125, 0.746734619140625, 0.81494140625, 0.883148193359375, 0.95135498046875, 1.019561767578125, 1.0877685546875, 1.155975341796875, 1.22418212890625, 1.292388916015625, 1.360595703125, 1.428802490234375, 1.49700927734375, 1.565216064453125, 1.6334228515625, 1.701629638671875, 1.76983642578125, 1.838043212890625, 1.90625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 10.0, 21.0, 21.0, 29.0, 86.0, 312.0, 6910.0, 4183939.0, 2593.0, 203.0, 59.0, 28.0, 21.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.5, -50.001953125, -48.50390625, -47.005859375, -45.5078125, -44.009765625, -42.51171875, -41.013671875, -39.515625, -38.017578125, -36.51953125, -35.021484375, -33.5234375, -32.025390625, -30.52734375, -29.029296875, -27.53125, -26.033203125, -24.53515625, -23.037109375, -21.5390625, -20.041015625, -18.54296875, -17.044921875, -15.546875, -14.048828125, -12.55078125, -11.052734375, -9.5546875, -8.056640625, -6.55859375, -5.060546875, -3.5625, -2.064453125, -0.56640625, 0.931640625, 2.4296875, 3.927734375, 5.42578125, 6.923828125, 8.421875, 9.919921875, 11.41796875, 12.916015625, 14.4140625, 15.912109375, 17.41015625, 18.908203125, 20.40625, 21.904296875, 23.40234375, 24.900390625, 26.3984375, 27.896484375, 29.39453125, 30.892578125, 32.390625, 33.888671875, 35.38671875, 36.884765625, 38.3828125, 39.880859375, 41.37890625, 42.876953125, 44.375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 20.0, 16.0, 29.0, 66.0, 144.0, 864.0, 2344.0, 370.0, 80.0, 45.0, 16.0, 23.0, 14.0, 7.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.607421875, -2.533538818359375, -2.45965576171875, -2.385772705078125, -2.3118896484375, -2.238006591796875, -2.16412353515625, -2.090240478515625, -2.016357421875, -1.942474365234375, -1.86859130859375, -1.794708251953125, -1.7208251953125, -1.646942138671875, -1.57305908203125, -1.499176025390625, -1.42529296875, -1.351409912109375, -1.27752685546875, -1.203643798828125, -1.1297607421875, -1.055877685546875, -0.98199462890625, -0.908111572265625, -0.834228515625, -0.760345458984375, -0.68646240234375, -0.612579345703125, -0.5386962890625, -0.464813232421875, -0.39093017578125, -0.317047119140625, -0.2431640625, -0.169281005859375, -0.09539794921875, -0.021514892578125, 0.0523681640625, 0.126251220703125, 0.20013427734375, 0.274017333984375, 0.347900390625, 0.421783447265625, 0.49566650390625, 0.569549560546875, 0.6434326171875, 0.717315673828125, 0.79119873046875, 0.865081787109375, 0.93896484375, 1.012847900390625, 1.08673095703125, 1.160614013671875, 1.2344970703125, 1.308380126953125, 1.38226318359375, 1.456146240234375, 1.530029296875, 1.603912353515625, 1.67779541015625, 1.751678466796875, 1.8255615234375, 1.899444580078125, 1.97332763671875, 2.047210693359375, 2.12109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 2.0, 4.0, 8.0, 13.0, 14.0, 20.0, 23.0, 24.0, 29.0, 54.0, 62.0, 87.0, 85.0, 102.0, 96.0, 86.0, 60.0, 49.0, 35.0, 28.0, 20.0, 25.0, 10.0, 12.0, 6.0, 5.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.95149827003479, -2.8608500957489014, -2.7702019214630127, -2.679553985595703, -2.5889058113098145, -2.498257637023926, -2.407609462738037, -2.3169612884521484, -2.2263131141662598, -2.135664939880371, -2.0450167655944824, -1.9543687105178833, -1.8637206554412842, -1.7730724811553955, -1.6824243068695068, -1.5917761325836182, -1.5011281967163086, -1.41048002243042, -1.3198319673538208, -1.2291837930679321, -1.138535737991333, -1.0478875637054443, -0.9572393894195557, -0.8665912747383118, -0.7759431600570679, -0.685295045375824, -0.5946469306945801, -0.5039987564086914, -0.4133506417274475, -0.3227025270462036, -0.23205435276031494, -0.14140623807907104, -0.05075812339782715, 0.03989000618457794, 0.13053813576698303, 0.22118628025054932, 0.3118343949317932, 0.4024825096130371, 0.4931306838989258, 0.5837787985801697, 0.6744269132614136, 0.7650750279426575, 0.8557231426239014, 0.94637131690979, 1.0370194911956787, 1.1276675462722778, 1.2183157205581665, 1.3089637756347656, 1.3996119499206543, 1.490260124206543, 1.580908179283142, 1.6715563535690308, 1.7622044086456299, 1.8528525829315186, 1.9435007572174072, 2.034148931503296, 2.1247968673706055, 2.215445041656494, 2.306093215942383, 2.3967413902282715, 2.487389326095581, 2.5780375003814697, 2.6686856746673584, 2.759333848953247, 2.8499820232391357]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 1.0, 5.0, 9.0, 6.0, 12.0, 13.0, 15.0, 19.0, 20.0, 22.0, 32.0, 32.0, 28.0, 35.0, 31.0, 33.0, 36.0, 44.0, 40.0, 29.0, 58.0, 43.0, 46.0, 36.0, 34.0, 40.0, 33.0, 30.0, 26.0, 21.0, 26.0, 20.0, 18.0, 20.0, 18.0, 9.0, 15.0, 8.0, 10.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.039533853530884, -1.9769076108932495, -1.9142814874649048, -1.8516552448272705, -1.7890291213989258, -1.7264028787612915, -1.6637766361236572, -1.6011505126953125, -1.5385242700576782, -1.475898027420044, -1.4132719039916992, -1.350645661354065, -1.2880194187164307, -1.225393295288086, -1.1627670526504517, -1.1001408100128174, -1.0375146865844727, -0.9748885035514832, -0.9122623205184937, -0.8496360778808594, -0.7870098948478699, -0.7243837118148804, -0.6617574691772461, -0.5991312861442566, -0.5365051031112671, -0.4738789200782776, -0.4112527072429657, -0.3486264944076538, -0.2860003113746643, -0.2233741283416748, -0.16074791550636292, -0.09812170267105103, -0.03549528121948242, 0.027130916714668274, 0.08975711464881897, 0.15238331258296967, 0.21500951051712036, 0.27763569355010986, 0.34026190638542175, 0.40288811922073364, 0.46551430225372314, 0.5281404852867126, 0.5907666683197021, 0.6533929109573364, 0.7160190939903259, 0.7786452770233154, 0.8412715196609497, 0.9038977026939392, 0.9665238857269287, 1.029150128364563, 1.0917762517929077, 1.154402494430542, 1.2170286178588867, 1.279654860496521, 1.3422811031341553, 1.4049072265625, 1.4675334692001343, 1.5301597118377686, 1.5927858352661133, 1.6554120779037476, 1.7180383205413818, 1.7806644439697266, 1.8432906866073608, 1.9059169292449951, 1.9685430526733398]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 8.0, 13.0, 12.0, 19.0, 36.0, 41.0, 56.0, 86.0, 116.0, 169.0, 263.0, 363.0, 556.0, 840.0, 1318.0, 2252.0, 3521.0, 6272.0, 11190.0, 21637.0, 44246.0, 99651.0, 244308.0, 335984.0, 148025.0, 63239.0, 29368.0, 14888.0, 8000.0, 4501.0, 2753.0, 1727.0, 1051.0, 682.0, 442.0, 298.0, 176.0, 135.0, 94.0, 63.0, 46.0, 39.0, 23.0, 16.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.708984375, -0.6876449584960938, -0.6663055419921875, -0.6449661254882812, -0.623626708984375, -0.6022872924804688, -0.5809478759765625, -0.5596084594726562, -0.53826904296875, -0.5169296264648438, -0.4955902099609375, -0.47425079345703125, -0.452911376953125, -0.43157196044921875, -0.4102325439453125, -0.38889312744140625, -0.3675537109375, -0.34621429443359375, -0.3248748779296875, -0.30353546142578125, -0.282196044921875, -0.26085662841796875, -0.2395172119140625, -0.21817779541015625, -0.19683837890625, -0.17549896240234375, -0.1541595458984375, -0.13282012939453125, -0.111480712890625, -0.09014129638671875, -0.0688018798828125, -0.04746246337890625, -0.026123046875, -0.00478363037109375, 0.0165557861328125, 0.03789520263671875, 0.059234619140625, 0.08057403564453125, 0.1019134521484375, 0.12325286865234375, 0.14459228515625, 0.16593170166015625, 0.1872711181640625, 0.20861053466796875, 0.229949951171875, 0.25128936767578125, 0.2726287841796875, 0.29396820068359375, 0.3153076171875, 0.33664703369140625, 0.3579864501953125, 0.37932586669921875, 0.400665283203125, 0.42200469970703125, 0.4433441162109375, 0.46468353271484375, 0.48602294921875, 0.5073623657226562, 0.5287017822265625, 0.5500411987304688, 0.571380615234375, 0.5927200317382812, 0.6140594482421875, 0.6353988647460938, 0.65673828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 2.0, 4.0, 6.0, 7.0, 22.0, 9.0, 18.0, 14.0, 19.0, 39.0, 32.0, 31.0, 30.0, 41.0, 42.0, 52.0, 53.0, 45.0, 48.0, 65.0, 56.0, 41.0, 54.0, 32.0, 40.0, 24.0, 37.0, 10.0, 19.0, 18.0, 17.0, 16.0, 18.0, 12.0, 5.0, 9.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8525390625, -1.7936248779296875, -1.734710693359375, -1.6757965087890625, -1.61688232421875, -1.5579681396484375, -1.499053955078125, -1.4401397705078125, -1.3812255859375, -1.3223114013671875, -1.263397216796875, -1.2044830322265625, -1.14556884765625, -1.0866546630859375, -1.027740478515625, -0.9688262939453125, -0.909912109375, -0.8509979248046875, -0.792083740234375, -0.7331695556640625, -0.67425537109375, -0.6153411865234375, -0.556427001953125, -0.4975128173828125, -0.4385986328125, -0.3796844482421875, -0.320770263671875, -0.2618560791015625, -0.20294189453125, -0.1440277099609375, -0.085113525390625, -0.0261993408203125, 0.03271484375, 0.0916290283203125, 0.150543212890625, 0.2094573974609375, 0.26837158203125, 0.3272857666015625, 0.386199951171875, 0.4451141357421875, 0.5040283203125, 0.5629425048828125, 0.621856689453125, 0.6807708740234375, 0.73968505859375, 0.7985992431640625, 0.857513427734375, 0.9164276123046875, 0.975341796875, 1.0342559814453125, 1.093170166015625, 1.1520843505859375, 1.21099853515625, 1.2699127197265625, 1.328826904296875, 1.3877410888671875, 1.4466552734375, 1.5055694580078125, 1.564483642578125, 1.6233978271484375, 1.68231201171875, 1.7412261962890625, 1.800140380859375, 1.8590545654296875, 1.91796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 8.0, 14.0, 16.0, 34.0, 42.0, 48.0, 80.0, 104.0, 115.0, 207.0, 283.0, 366.0, 585.0, 890.0, 1314.0, 2122.0, 3317.0, 5547.0, 10256.0, 21772.0, 56196.0, 187567.0, 465487.0, 187973.0, 56884.0, 21818.0, 10281.0, 5666.0, 3281.0, 2050.0, 1350.0, 884.0, 591.0, 455.0, 271.0, 169.0, 132.0, 92.0, 66.0, 57.0, 36.0, 26.0, 27.0, 22.0, 8.0, 7.0, 8.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70849609375, -0.6852645874023438, -0.6620330810546875, -0.6388015747070312, -0.615570068359375, -0.5923385620117188, -0.5691070556640625, -0.5458755493164062, -0.52264404296875, -0.49941253662109375, -0.4761810302734375, -0.45294952392578125, -0.429718017578125, -0.40648651123046875, -0.3832550048828125, -0.36002349853515625, -0.3367919921875, -0.31356048583984375, -0.2903289794921875, -0.26709747314453125, -0.243865966796875, -0.22063446044921875, -0.1974029541015625, -0.17417144775390625, -0.15093994140625, -0.12770843505859375, -0.1044769287109375, -0.08124542236328125, -0.058013916015625, -0.03478240966796875, -0.0115509033203125, 0.01168060302734375, 0.034912109375, 0.05814361572265625, 0.0813751220703125, 0.10460662841796875, 0.127838134765625, 0.15106964111328125, 0.1743011474609375, 0.19753265380859375, 0.22076416015625, 0.24399566650390625, 0.2672271728515625, 0.29045867919921875, 0.313690185546875, 0.33692169189453125, 0.3601531982421875, 0.38338470458984375, 0.4066162109375, 0.42984771728515625, 0.4530792236328125, 0.47631072998046875, 0.499542236328125, 0.5227737426757812, 0.5460052490234375, 0.5692367553710938, 0.59246826171875, 0.6156997680664062, 0.6389312744140625, 0.6621627807617188, 0.685394287109375, 0.7086257934570312, 0.7318572998046875, 0.7550888061523438, 0.7783203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 6.0, 12.0, 12.0, 20.0, 16.0, 7.0, 22.0, 28.0, 39.0, 35.0, 30.0, 56.0, 34.0, 43.0, 49.0, 45.0, 39.0, 41.0, 43.0, 51.0, 32.0, 50.0, 40.0, 23.0, 25.0, 24.0, 27.0, 18.0, 9.0, 19.0, 11.0, 14.0, 12.0, 12.0, 4.0, 5.0, 7.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.44921875, -3.3392333984375, -3.229248046875, -3.1192626953125, -3.00927734375, -2.8992919921875, -2.789306640625, -2.6793212890625, -2.5693359375, -2.4593505859375, -2.349365234375, -2.2393798828125, -2.12939453125, -2.0194091796875, -1.909423828125, -1.7994384765625, -1.689453125, -1.5794677734375, -1.469482421875, -1.3594970703125, -1.24951171875, -1.1395263671875, -1.029541015625, -0.9195556640625, -0.8095703125, -0.6995849609375, -0.589599609375, -0.4796142578125, -0.36962890625, -0.2596435546875, -0.149658203125, -0.0396728515625, 0.0703125, 0.1802978515625, 0.290283203125, 0.4002685546875, 0.51025390625, 0.6202392578125, 0.730224609375, 0.8402099609375, 0.9501953125, 1.0601806640625, 1.170166015625, 1.2801513671875, 1.39013671875, 1.5001220703125, 1.610107421875, 1.7200927734375, 1.830078125, 1.9400634765625, 2.050048828125, 2.1600341796875, 2.27001953125, 2.3800048828125, 2.489990234375, 2.5999755859375, 2.7099609375, 2.8199462890625, 2.929931640625, 3.0399169921875, 3.14990234375, 3.2598876953125, 3.369873046875, 3.4798583984375, 3.58984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 18.0, 23.0, 37.0, 57.0, 74.0, 125.0, 217.0, 385.0, 715.0, 1460.0, 3476.0, 10271.0, 44002.0, 572482.0, 365937.0, 34546.0, 8662.0, 3029.0, 1363.0, 666.0, 366.0, 205.0, 133.0, 82.0, 61.0, 39.0, 29.0, 21.0, 17.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.326446533203125, -0.31475830078125, -0.303070068359375, -0.2913818359375, -0.279693603515625, -0.26800537109375, -0.256317138671875, -0.24462890625, -0.232940673828125, -0.22125244140625, -0.209564208984375, -0.1978759765625, -0.186187744140625, -0.17449951171875, -0.162811279296875, -0.151123046875, -0.139434814453125, -0.12774658203125, -0.116058349609375, -0.1043701171875, -0.092681884765625, -0.08099365234375, -0.069305419921875, -0.0576171875, -0.045928955078125, -0.03424072265625, -0.022552490234375, -0.0108642578125, 0.000823974609375, 0.01251220703125, 0.024200439453125, 0.035888671875, 0.047576904296875, 0.05926513671875, 0.070953369140625, 0.0826416015625, 0.094329833984375, 0.10601806640625, 0.117706298828125, 0.12939453125, 0.141082763671875, 0.15277099609375, 0.164459228515625, 0.1761474609375, 0.187835693359375, 0.19952392578125, 0.211212158203125, 0.222900390625, 0.234588623046875, 0.24627685546875, 0.257965087890625, 0.2696533203125, 0.281341552734375, 0.29302978515625, 0.304718017578125, 0.31640625, 0.328094482421875, 0.33978271484375, 0.351470947265625, 0.3631591796875, 0.374847412109375, 0.38653564453125, 0.398223876953125, 0.409912109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 6.0, 10.0, 17.0, 14.0, 41.0, 69.0, 100.0, 209.0, 223.0, 124.0, 60.0, 39.0, 24.0, 12.0, 10.0, 10.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002739429473876953, -0.0002659037709236145, -0.0002578645944595337, -0.0002498254179954529, -0.00024178624153137207, -0.00023374706506729126, -0.00022570788860321045, -0.00021766871213912964, -0.00020962953567504883, -0.00020159035921096802, -0.0001935511827468872, -0.0001855120062828064, -0.00017747282981872559, -0.00016943365335464478, -0.00016139447689056396, -0.00015335530042648315, -0.00014531612396240234, -0.00013727694749832153, -0.00012923777103424072, -0.00012119859457015991, -0.0001131594181060791, -0.00010512024164199829, -9.708106517791748e-05, -8.904188871383667e-05, -8.100271224975586e-05, -7.296353578567505e-05, -6.492435932159424e-05, -5.688518285751343e-05, -4.884600639343262e-05, -4.080682992935181e-05, -3.2767653465270996e-05, -2.4728477001190186e-05, -1.6689300537109375e-05, -8.650124073028564e-06, -6.109476089477539e-07, 7.428228855133057e-06, 1.5467405319213867e-05, 2.3506581783294678e-05, 3.154575824737549e-05, 3.95849347114563e-05, 4.762411117553711e-05, 5.566328763961792e-05, 6.370246410369873e-05, 7.174164056777954e-05, 7.978081703186035e-05, 8.781999349594116e-05, 9.585916996002197e-05, 0.00010389834642410278, 0.0001119375228881836, 0.0001199766993522644, 0.00012801587581634521, 0.00013605505228042603, 0.00014409422874450684, 0.00015213340520858765, 0.00016017258167266846, 0.00016821175813674927, 0.00017625093460083008, 0.0001842901110649109, 0.0001923292875289917, 0.0002003684639930725, 0.00020840764045715332, 0.00021644681692123413, 0.00022448599338531494, 0.00023252516984939575, 0.00024056434631347656]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 6.0, 12.0, 27.0, 44.0, 101.0, 160.0, 367.0, 973.0, 2628.0, 9675.0, 47184.0, 656701.0, 291334.0, 29329.0, 6594.0, 2026.0, 759.0, 324.0, 131.0, 66.0, 35.0, 11.0, 12.0, 12.0, 10.0, 3.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67333984375, -0.6534576416015625, -0.633575439453125, -0.6136932373046875, -0.59381103515625, -0.5739288330078125, -0.554046630859375, -0.5341644287109375, -0.5142822265625, -0.4944000244140625, -0.474517822265625, -0.4546356201171875, -0.43475341796875, -0.4148712158203125, -0.394989013671875, -0.3751068115234375, -0.355224609375, -0.3353424072265625, -0.315460205078125, -0.2955780029296875, -0.27569580078125, -0.2558135986328125, -0.235931396484375, -0.2160491943359375, -0.1961669921875, -0.1762847900390625, -0.156402587890625, -0.1365203857421875, -0.11663818359375, -0.0967559814453125, -0.076873779296875, -0.0569915771484375, -0.037109375, -0.0172271728515625, 0.002655029296875, 0.0225372314453125, 0.04241943359375, 0.0623016357421875, 0.082183837890625, 0.1020660400390625, 0.1219482421875, 0.1418304443359375, 0.161712646484375, 0.1815948486328125, 0.20147705078125, 0.2213592529296875, 0.241241455078125, 0.2611236572265625, 0.281005859375, 0.3008880615234375, 0.320770263671875, 0.3406524658203125, 0.36053466796875, 0.3804168701171875, 0.400299072265625, 0.4201812744140625, 0.4400634765625, 0.4599456787109375, 0.479827880859375, 0.4997100830078125, 0.51959228515625, 0.5394744873046875, 0.559356689453125, 0.5792388916015625, 0.59912109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 7.0, 5.0, 2.0, 4.0, 13.0, 18.0, 20.0, 29.0, 28.0, 34.0, 47.0, 67.0, 99.0, 104.0, 140.0, 93.0, 73.0, 52.0, 45.0, 26.0, 28.0, 10.0, 13.0, 8.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.137939453125, -0.13399505615234375, -0.1300506591796875, -0.12610626220703125, -0.122161865234375, -0.11821746826171875, -0.1142730712890625, -0.11032867431640625, -0.10638427734375, -0.10243988037109375, -0.0984954833984375, -0.09455108642578125, -0.090606689453125, -0.08666229248046875, -0.0827178955078125, -0.07877349853515625, -0.0748291015625, -0.07088470458984375, -0.0669403076171875, -0.06299591064453125, -0.059051513671875, -0.05510711669921875, -0.0511627197265625, -0.04721832275390625, -0.04327392578125, -0.03932952880859375, -0.0353851318359375, -0.03144073486328125, -0.027496337890625, -0.02355194091796875, -0.0196075439453125, -0.01566314697265625, -0.01171875, -0.00777435302734375, -0.0038299560546875, 0.00011444091796875, 0.004058837890625, 0.00800323486328125, 0.0119476318359375, 0.01589202880859375, 0.01983642578125, 0.02378082275390625, 0.0277252197265625, 0.03166961669921875, 0.035614013671875, 0.03955841064453125, 0.0435028076171875, 0.04744720458984375, 0.0513916015625, 0.05533599853515625, 0.0592803955078125, 0.06322479248046875, 0.067169189453125, 0.07111358642578125, 0.0750579833984375, 0.07900238037109375, 0.08294677734375, 0.08689117431640625, 0.0908355712890625, 0.09477996826171875, 0.098724365234375, 0.10266876220703125, 0.1066131591796875, 0.11055755615234375, 0.114501953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 11.0, 11.0, 9.0, 12.0, 26.0, 34.0, 40.0, 72.0, 86.0, 120.0, 145.0, 113.0, 87.0, 56.0, 42.0, 36.0, 20.0, 17.0, 12.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.930957317352295, -2.8432822227478027, -2.7556071281433105, -2.6679320335388184, -2.580256938934326, -2.492581844329834, -2.404906749725342, -2.3172316551208496, -2.2295565605163574, -2.1418814659118652, -2.054206371307373, -1.9665312767028809, -1.8788561820983887, -1.7911810874938965, -1.7035058736801147, -1.6158307790756226, -1.5281555652618408, -1.4404804706573486, -1.3528053760528564, -1.2651302814483643, -1.177455186843872, -1.0897800922393799, -1.0021048784255981, -0.914429783821106, -0.8267546892166138, -0.7390795946121216, -0.6514045000076294, -0.5637293457984924, -0.47605425119400024, -0.38837915658950806, -0.3007040023803711, -0.2130289077758789, -0.12535405158996582, -0.03767894208431244, 0.04999616742134094, 0.13767129182815552, 0.2253463864326477, 0.3130214810371399, 0.40069663524627686, 0.48837172985076904, 0.5760468244552612, 0.6637219190597534, 0.7513970136642456, 0.8390721678733826, 0.9267472624778748, 1.0144224166870117, 1.102097511291504, 1.189772605895996, 1.2774477005004883, 1.3651227951049805, 1.4527978897094727, 1.5404729843139648, 1.628148078918457, 1.7158231735229492, 1.803498387336731, 1.8911734819412231, 1.9788485765457153, 2.066523790359497, 2.1541988849639893, 2.2418739795684814, 2.3295490741729736, 2.417224168777466, 2.504899263381958, 2.59257435798645, 2.6802494525909424]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 0.0, 1.0, 10.0, 3.0, 7.0, 14.0, 15.0, 20.0, 16.0, 24.0, 33.0, 26.0, 43.0, 31.0, 44.0, 41.0, 38.0, 47.0, 45.0, 64.0, 50.0, 49.0, 47.0, 42.0, 40.0, 38.0, 23.0, 31.0, 19.0, 18.0, 27.0, 22.0, 23.0, 13.0, 8.0, 5.0, 10.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7804385423660278, -1.7255982160568237, -1.67075777053833, -1.615917444229126, -1.5610769987106323, -1.5062366724014282, -1.4513962268829346, -1.3965559005737305, -1.3417155742645264, -1.2868752479553223, -1.2320348024368286, -1.1771944761276245, -1.1223540306091309, -1.0675137042999268, -1.0126733779907227, -0.957832932472229, -0.9029924869537354, -0.8481521010398865, -0.7933117151260376, -0.7384713888168335, -0.6836309432983398, -0.6287906169891357, -0.5739502310752869, -0.519109845161438, -0.4642694592475891, -0.40942907333374023, -0.35458868741989136, -0.29974833130836487, -0.244907945394516, -0.19006755948066711, -0.13522720336914062, -0.08038681745529175, -0.02554631233215332, 0.02929406613111496, 0.08413444459438324, 0.13897481560707092, 0.1938152015209198, 0.24865558743476868, 0.30349594354629517, 0.35833632946014404, 0.4131767153739929, 0.4680171012878418, 0.5228574872016907, 0.5776978731155396, 0.6325381994247437, 0.6873786449432373, 0.7422189712524414, 0.7970593571662903, 0.8518997430801392, 0.906740128993988, 0.9615805149078369, 1.016420841217041, 1.0712612867355347, 1.1261016130447388, 1.1809420585632324, 1.2357823848724365, 1.2906227111816406, 1.3454630374908447, 1.4003034830093384, 1.4551438093185425, 1.5099842548370361, 1.5648245811462402, 1.6196649074554443, 1.674505352973938, 1.7293457984924316]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 17.0, 20.0, 28.0, 56.0, 58.0, 104.0, 147.0, 251.0, 434.0, 601.0, 1047.0, 1671.0, 2732.0, 4621.0, 7970.0, 15159.0, 34077.0, 167967.0, 690710.0, 69267.0, 24022.0, 11784.0, 6347.0, 3722.0, 2156.0, 1356.0, 808.0, 493.0, 323.0, 174.0, 141.0, 101.0, 47.0, 30.0, 22.0, 12.0, 14.0, 10.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.21875, -2.152099609375, -2.08544921875, -2.018798828125, -1.9521484375, -1.885498046875, -1.81884765625, -1.752197265625, -1.685546875, -1.618896484375, -1.55224609375, -1.485595703125, -1.4189453125, -1.352294921875, -1.28564453125, -1.218994140625, -1.15234375, -1.085693359375, -1.01904296875, -0.952392578125, -0.8857421875, -0.819091796875, -0.75244140625, -0.685791015625, -0.619140625, -0.552490234375, -0.48583984375, -0.419189453125, -0.3525390625, -0.285888671875, -0.21923828125, -0.152587890625, -0.0859375, -0.019287109375, 0.04736328125, 0.114013671875, 0.1806640625, 0.247314453125, 0.31396484375, 0.380615234375, 0.447265625, 0.513916015625, 0.58056640625, 0.647216796875, 0.7138671875, 0.780517578125, 0.84716796875, 0.913818359375, 0.98046875, 1.047119140625, 1.11376953125, 1.180419921875, 1.2470703125, 1.313720703125, 1.38037109375, 1.447021484375, 1.513671875, 1.580322265625, 1.64697265625, 1.713623046875, 1.7802734375, 1.846923828125, 1.91357421875, 1.980224609375, 2.046875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 5.0, 4.0, 2.0, 7.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 15.0, 23.0, 23.0, 24.0, 17.0, 33.0, 40.0, 25.0, 27.0, 31.0, 54.0, 42.0, 51.0, 41.0, 51.0, 45.0, 37.0, 39.0, 40.0, 28.0, 26.0, 25.0, 24.0, 21.0, 22.0, 13.0, 28.0, 18.0, 16.0, 15.0, 6.0, 11.0, 2.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-3.05859375, -2.9703369140625, -2.882080078125, -2.7938232421875, -2.70556640625, -2.6173095703125, -2.529052734375, -2.4407958984375, -2.3525390625, -2.2642822265625, -2.176025390625, -2.0877685546875, -1.99951171875, -1.9112548828125, -1.822998046875, -1.7347412109375, -1.646484375, -1.5582275390625, -1.469970703125, -1.3817138671875, -1.29345703125, -1.2052001953125, -1.116943359375, -1.0286865234375, -0.9404296875, -0.8521728515625, -0.763916015625, -0.6756591796875, -0.58740234375, -0.4991455078125, -0.410888671875, -0.3226318359375, -0.234375, -0.1461181640625, -0.057861328125, 0.0303955078125, 0.11865234375, 0.2069091796875, 0.295166015625, 0.3834228515625, 0.4716796875, 0.5599365234375, 0.648193359375, 0.7364501953125, 0.82470703125, 0.9129638671875, 1.001220703125, 1.0894775390625, 1.177734375, 1.2659912109375, 1.354248046875, 1.4425048828125, 1.53076171875, 1.6190185546875, 1.707275390625, 1.7955322265625, 1.8837890625, 1.9720458984375, 2.060302734375, 2.1485595703125, 2.23681640625, 2.3250732421875, 2.413330078125, 2.5015869140625, 2.58984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 20.0, 16.0, 17.0, 25.0, 38.0, 56.0, 72.0, 100.0, 123.0, 210.0, 323.0, 536.0, 907.0, 1728.0, 3448.0, 7046.0, 16164.0, 47933.0, 506600.0, 390783.0, 43192.0, 15279.0, 6607.0, 3126.0, 1684.0, 955.0, 544.0, 324.0, 219.0, 114.0, 88.0, 68.0, 49.0, 41.0, 23.0, 19.0, 13.0, 11.0, 11.0, 7.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.1470947265625, -2.075439453125, -2.0037841796875, -1.93212890625, -1.8604736328125, -1.788818359375, -1.7171630859375, -1.6455078125, -1.5738525390625, -1.502197265625, -1.4305419921875, -1.35888671875, -1.2872314453125, -1.215576171875, -1.1439208984375, -1.072265625, -1.0006103515625, -0.928955078125, -0.8572998046875, -0.78564453125, -0.7139892578125, -0.642333984375, -0.5706787109375, -0.4990234375, -0.4273681640625, -0.355712890625, -0.2840576171875, -0.21240234375, -0.1407470703125, -0.069091796875, 0.0025634765625, 0.07421875, 0.1458740234375, 0.217529296875, 0.2891845703125, 0.36083984375, 0.4324951171875, 0.504150390625, 0.5758056640625, 0.6474609375, 0.7191162109375, 0.790771484375, 0.8624267578125, 0.93408203125, 1.0057373046875, 1.077392578125, 1.1490478515625, 1.220703125, 1.2923583984375, 1.364013671875, 1.4356689453125, 1.50732421875, 1.5789794921875, 1.650634765625, 1.7222900390625, 1.7939453125, 1.8656005859375, 1.937255859375, 2.0089111328125, 2.08056640625, 2.1522216796875, 2.223876953125, 2.2955322265625, 2.3671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 4.0, 5.0, 7.0, 12.0, 8.0, 13.0, 19.0, 9.0, 20.0, 15.0, 25.0, 37.0, 32.0, 30.0, 30.0, 45.0, 51.0, 35.0, 43.0, 42.0, 41.0, 53.0, 30.0, 36.0, 45.0, 33.0, 32.0, 25.0, 33.0, 22.0, 28.0, 25.0, 24.0, 16.0, 9.0, 7.0, 11.0, 15.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -3.03497314453125, -2.9410400390625, -2.84710693359375, -2.753173828125, -2.65924072265625, -2.5653076171875, -2.47137451171875, -2.37744140625, -2.28350830078125, -2.1895751953125, -2.09564208984375, -2.001708984375, -1.90777587890625, -1.8138427734375, -1.71990966796875, -1.6259765625, -1.53204345703125, -1.4381103515625, -1.34417724609375, -1.250244140625, -1.15631103515625, -1.0623779296875, -0.96844482421875, -0.87451171875, -0.78057861328125, -0.6866455078125, -0.59271240234375, -0.498779296875, -0.40484619140625, -0.3109130859375, -0.21697998046875, -0.123046875, -0.02911376953125, 0.0648193359375, 0.15875244140625, 0.252685546875, 0.34661865234375, 0.4405517578125, 0.53448486328125, 0.62841796875, 0.72235107421875, 0.8162841796875, 0.91021728515625, 1.004150390625, 1.09808349609375, 1.1920166015625, 1.28594970703125, 1.3798828125, 1.47381591796875, 1.5677490234375, 1.66168212890625, 1.755615234375, 1.84954833984375, 1.9434814453125, 2.03741455078125, 2.13134765625, 2.22528076171875, 2.3192138671875, 2.41314697265625, 2.507080078125, 2.60101318359375, 2.6949462890625, 2.78887939453125, 2.8828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 15.0, 18.0, 14.0, 24.0, 38.0, 58.0, 59.0, 97.0, 151.0, 253.0, 451.0, 800.0, 1596.0, 2942.0, 6542.0, 21353.0, 933773.0, 60981.0, 10562.0, 4107.0, 2112.0, 1085.0, 590.0, 333.0, 187.0, 114.0, 76.0, 54.0, 50.0, 36.0, 23.0, 15.0, 7.0, 7.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.130859375, -2.065765380859375, -2.00067138671875, -1.935577392578125, -1.8704833984375, -1.805389404296875, -1.74029541015625, -1.675201416015625, -1.610107421875, -1.545013427734375, -1.47991943359375, -1.414825439453125, -1.3497314453125, -1.284637451171875, -1.21954345703125, -1.154449462890625, -1.08935546875, -1.024261474609375, -0.95916748046875, -0.894073486328125, -0.8289794921875, -0.763885498046875, -0.69879150390625, -0.633697509765625, -0.568603515625, -0.503509521484375, -0.43841552734375, -0.373321533203125, -0.3082275390625, -0.243133544921875, -0.17803955078125, -0.112945556640625, -0.0478515625, 0.017242431640625, 0.08233642578125, 0.147430419921875, 0.2125244140625, 0.277618408203125, 0.34271240234375, 0.407806396484375, 0.472900390625, 0.537994384765625, 0.60308837890625, 0.668182373046875, 0.7332763671875, 0.798370361328125, 0.86346435546875, 0.928558349609375, 0.99365234375, 1.058746337890625, 1.12384033203125, 1.188934326171875, 1.2540283203125, 1.319122314453125, 1.38421630859375, 1.449310302734375, 1.514404296875, 1.579498291015625, 1.64459228515625, 1.709686279296875, 1.7747802734375, 1.839874267578125, 1.90496826171875, 1.970062255859375, 2.03515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 3.0, 2.0, 8.0, 12.0, 46.0, 333.0, 500.0, 33.0, 16.0, 11.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331878662109375, -0.00031444430351257324, -0.0002970099449157715, -0.0002795755863189697, -0.00026214122772216797, -0.0002447068691253662, -0.00022727251052856445, -0.0002098381519317627, -0.00019240379333496094, -0.00017496943473815918, -0.00015753507614135742, -0.00014010071754455566, -0.0001226663589477539, -0.00010523200035095215, -8.779764175415039e-05, -7.036328315734863e-05, -5.2928924560546875e-05, -3.549456596374512e-05, -1.806020736694336e-05, -6.258487701416016e-07, 1.6808509826660156e-05, 3.4242868423461914e-05, 5.167722702026367e-05, 6.911158561706543e-05, 8.654594421386719e-05, 0.00010398030281066895, 0.0001214146614074707, 0.00013884902000427246, 0.00015628337860107422, 0.00017371773719787598, 0.00019115209579467773, 0.0002085864543914795, 0.00022602081298828125, 0.000243455171585083, 0.00026088953018188477, 0.0002783238887786865, 0.0002957582473754883, 0.00031319260597229004, 0.0003306269645690918, 0.00034806132316589355, 0.0003654956817626953, 0.00038293004035949707, 0.00040036439895629883, 0.0004177987575531006, 0.00043523311614990234, 0.0004526674747467041, 0.00047010183334350586, 0.0004875361919403076, 0.0005049705505371094, 0.0005224049091339111, 0.0005398392677307129, 0.0005572736263275146, 0.0005747079849243164, 0.0005921423435211182, 0.0006095767021179199, 0.0006270110607147217, 0.0006444454193115234, 0.0006618797779083252, 0.000679314136505127, 0.0006967484951019287, 0.0007141828536987305, 0.0007316172122955322, 0.000749051570892334, 0.0007664859294891357, 0.0007839202880859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 13.0, 12.0, 21.0, 28.0, 47.0, 70.0, 81.0, 141.0, 182.0, 267.0, 414.0, 679.0, 1077.0, 1869.0, 3831.0, 10748.0, 126518.0, 876760.0, 15522.0, 4696.0, 2179.0, 1199.0, 746.0, 488.0, 293.0, 199.0, 145.0, 103.0, 62.0, 55.0, 34.0, 25.0, 20.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.79364013671875, -1.7298583984375, -1.66607666015625, -1.602294921875, -1.53851318359375, -1.4747314453125, -1.41094970703125, -1.34716796875, -1.28338623046875, -1.2196044921875, -1.15582275390625, -1.092041015625, -1.02825927734375, -0.9644775390625, -0.90069580078125, -0.8369140625, -0.77313232421875, -0.7093505859375, -0.64556884765625, -0.581787109375, -0.51800537109375, -0.4542236328125, -0.39044189453125, -0.32666015625, -0.26287841796875, -0.1990966796875, -0.13531494140625, -0.071533203125, -0.00775146484375, 0.0560302734375, 0.11981201171875, 0.18359375, 0.24737548828125, 0.3111572265625, 0.37493896484375, 0.438720703125, 0.50250244140625, 0.5662841796875, 0.63006591796875, 0.69384765625, 0.75762939453125, 0.8214111328125, 0.88519287109375, 0.948974609375, 1.01275634765625, 1.0765380859375, 1.14031982421875, 1.2041015625, 1.26788330078125, 1.3316650390625, 1.39544677734375, 1.459228515625, 1.52301025390625, 1.5867919921875, 1.65057373046875, 1.71435546875, 1.77813720703125, 1.8419189453125, 1.90570068359375, 1.969482421875, 2.03326416015625, 2.0970458984375, 2.16082763671875, 2.224609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 24.0, 41.0, 286.0, 473.0, 72.0, 25.0, 16.0, 7.0, 8.0, 6.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.941131591796875, -0.90765380859375, -0.874176025390625, -0.8406982421875, -0.807220458984375, -0.77374267578125, -0.740264892578125, -0.706787109375, -0.673309326171875, -0.63983154296875, -0.606353759765625, -0.5728759765625, -0.539398193359375, -0.50592041015625, -0.472442626953125, -0.43896484375, -0.405487060546875, -0.37200927734375, -0.338531494140625, -0.3050537109375, -0.271575927734375, -0.23809814453125, -0.204620361328125, -0.171142578125, -0.137664794921875, -0.10418701171875, -0.070709228515625, -0.0372314453125, -0.003753662109375, 0.02972412109375, 0.063201904296875, 0.0966796875, 0.130157470703125, 0.16363525390625, 0.197113037109375, 0.2305908203125, 0.264068603515625, 0.29754638671875, 0.331024169921875, 0.364501953125, 0.397979736328125, 0.43145751953125, 0.464935302734375, 0.4984130859375, 0.531890869140625, 0.56536865234375, 0.598846435546875, 0.63232421875, 0.665802001953125, 0.69927978515625, 0.732757568359375, 0.7662353515625, 0.799713134765625, 0.83319091796875, 0.866668701171875, 0.900146484375, 0.933624267578125, 0.96710205078125, 1.000579833984375, 1.0340576171875, 1.067535400390625, 1.10101318359375, 1.134490966796875, 1.16796875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 31.0, 811.0, 173.0, 7.0], "bins": [-150.4115753173828, -147.9746856689453, -145.5377960205078, -143.1009063720703, -140.6640167236328, -138.2271270751953, -135.7902374267578, -133.3533477783203, -130.9164581298828, -128.4795684814453, -126.04267883300781, -123.60578918457031, -121.16889953613281, -118.73200988769531, -116.29512023925781, -113.85823059082031, -111.42134094238281, -108.98445129394531, -106.54756164550781, -104.11067199707031, -101.67378234863281, -99.23689270019531, -96.80000305175781, -94.36311340332031, -91.92621612548828, -89.48932647705078, -87.05243682861328, -84.61554718017578, -82.17865753173828, -79.74176788330078, -77.30487823486328, -74.86798858642578, -72.43109130859375, -69.99420166015625, -67.55731201171875, -65.12042236328125, -62.68353271484375, -60.24664306640625, -57.80975341796875, -55.37286376953125, -52.93597412109375, -50.49908447265625, -48.06219482421875, -45.62530517578125, -43.18841552734375, -40.75152587890625, -38.31463623046875, -35.87774658203125, -33.440853118896484, -31.003963470458984, -28.567073822021484, -26.130184173583984, -23.693294525146484, -21.256404876708984, -18.81951332092285, -16.38262367248535, -13.945734977722168, -11.508845329284668, -9.071954727172852, -6.635065078735352, -4.198175430297852, -1.7612857818603516, 0.6756048202514648, 3.112494468688965, 5.549384117126465]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 0.0, 8.0, 7.0, 12.0, 16.0, 15.0, 20.0, 23.0, 21.0, 25.0, 31.0, 30.0, 33.0, 21.0, 29.0, 40.0, 35.0, 39.0, 46.0, 34.0, 39.0, 51.0, 37.0, 33.0, 34.0, 35.0, 29.0, 39.0, 34.0, 22.0, 25.0, 18.0, 21.0, 15.0, 19.0, 9.0, 18.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3116960525512695, -5.159384727478027, -5.007073402404785, -4.854762554168701, -4.702451229095459, -4.550139904022217, -4.397828578948975, -4.245517253875732, -4.093206405639648, -3.9408950805664062, -3.788583993911743, -3.636272668838501, -3.483961582183838, -3.3316502571105957, -3.1793389320373535, -3.0270276069641113, -2.874716281890869, -2.722404956817627, -2.570093870162964, -2.4177825450897217, -2.2654714584350586, -2.1131601333618164, -1.9608488082885742, -1.8085376024246216, -1.656226396560669, -1.5039151906967163, -1.3516039848327637, -1.1992926597595215, -1.0469814538955688, -0.8946702480316162, -0.7423589825630188, -0.5900477170944214, -0.43773651123046875, -0.2854252755641937, -0.1331140398979187, 0.019197195768356323, 0.17150843143463135, 0.323819637298584, 0.4761309027671814, 0.6284421682357788, 0.7807533740997314, 0.9330645799636841, 1.0853757858276367, 1.237687110900879, 1.3899983167648315, 1.5423095226287842, 1.6946208477020264, 1.846932053565979, 1.9992432594299316, 2.151554584503174, 2.303865671157837, 2.456176996231079, 2.608488082885742, 2.7607994079589844, 2.9131107330322266, 3.0654220581054688, 3.217733144760132, 3.370044469833374, 3.522355556488037, 3.6746668815612793, 3.8269782066345215, 3.9792892932891846, 4.131600379943848, 4.28391170501709, 4.436223030090332]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 3.0, 14.0, 31.0, 27.0, 37.0, 66.0, 118.0, 232.0, 558.0, 2089.0, 10890.0, 3698554.0, 472496.0, 6517.0, 1563.0, 561.0, 205.0, 119.0, 65.0, 32.0, 29.0, 23.0, 9.0, 15.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.02490234375, -12.5888671875, -12.15283203125, -11.716796875, -11.28076171875, -10.8447265625, -10.40869140625, -9.97265625, -9.53662109375, -9.1005859375, -8.66455078125, -8.228515625, -7.79248046875, -7.3564453125, -6.92041015625, -6.484375, -6.04833984375, -5.6123046875, -5.17626953125, -4.740234375, -4.30419921875, -3.8681640625, -3.43212890625, -2.99609375, -2.56005859375, -2.1240234375, -1.68798828125, -1.251953125, -0.81591796875, -0.3798828125, 0.05615234375, 0.4921875, 0.92822265625, 1.3642578125, 1.80029296875, 2.236328125, 2.67236328125, 3.1083984375, 3.54443359375, 3.98046875, 4.41650390625, 4.8525390625, 5.28857421875, 5.724609375, 6.16064453125, 6.5966796875, 7.03271484375, 7.46875, 7.90478515625, 8.3408203125, 8.77685546875, 9.212890625, 9.64892578125, 10.0849609375, 10.52099609375, 10.95703125, 11.39306640625, 11.8291015625, 12.26513671875, 12.701171875, 13.13720703125, 13.5732421875, 14.00927734375, 14.4453125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 14.0, 18.0, 13.0, 25.0, 44.0, 47.0, 44.0, 69.0, 57.0, 58.0, 66.0, 83.0, 83.0, 55.0, 66.0, 45.0, 38.0, 37.0, 46.0, 16.0, 16.0, 19.0, 14.0, 8.0, 3.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.57354736328125, -2.4888916015625, -2.40423583984375, -2.319580078125, -2.23492431640625, -2.1502685546875, -2.06561279296875, -1.98095703125, -1.89630126953125, -1.8116455078125, -1.72698974609375, -1.642333984375, -1.55767822265625, -1.4730224609375, -1.38836669921875, -1.3037109375, -1.21905517578125, -1.1343994140625, -1.04974365234375, -0.965087890625, -0.88043212890625, -0.7957763671875, -0.71112060546875, -0.62646484375, -0.54180908203125, -0.4571533203125, -0.37249755859375, -0.287841796875, -0.20318603515625, -0.1185302734375, -0.03387451171875, 0.05078125, 0.13543701171875, 0.2200927734375, 0.30474853515625, 0.389404296875, 0.47406005859375, 0.5587158203125, 0.64337158203125, 0.72802734375, 0.81268310546875, 0.8973388671875, 0.98199462890625, 1.066650390625, 1.15130615234375, 1.2359619140625, 1.32061767578125, 1.4052734375, 1.48992919921875, 1.5745849609375, 1.65924072265625, 1.743896484375, 1.82855224609375, 1.9132080078125, 1.99786376953125, 2.08251953125, 2.16717529296875, 2.2518310546875, 2.33648681640625, 2.421142578125, 2.50579833984375, 2.5904541015625, 2.67510986328125, 2.759765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 11.0, 19.0, 28.0, 52.0, 115.0, 481.0, 7503.0, 4175189.0, 10101.0, 490.0, 128.0, 46.0, 32.0, 18.0, 13.0, 10.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.7724609375, -18.966796875, -18.1611328125, -17.35546875, -16.5498046875, -15.744140625, -14.9384765625, -14.1328125, -13.3271484375, -12.521484375, -11.7158203125, -10.91015625, -10.1044921875, -9.298828125, -8.4931640625, -7.6875, -6.8818359375, -6.076171875, -5.2705078125, -4.46484375, -3.6591796875, -2.853515625, -2.0478515625, -1.2421875, -0.4365234375, 0.369140625, 1.1748046875, 1.98046875, 2.7861328125, 3.591796875, 4.3974609375, 5.203125, 6.0087890625, 6.814453125, 7.6201171875, 8.42578125, 9.2314453125, 10.037109375, 10.8427734375, 11.6484375, 12.4541015625, 13.259765625, 14.0654296875, 14.87109375, 15.6767578125, 16.482421875, 17.2880859375, 18.09375, 18.8994140625, 19.705078125, 20.5107421875, 21.31640625, 22.1220703125, 22.927734375, 23.7333984375, 24.5390625, 25.3447265625, 26.150390625, 26.9560546875, 27.76171875, 28.5673828125, 29.373046875, 30.1787109375, 30.984375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 11.0, 15.0, 32.0, 46.0, 82.0, 292.0, 1887.0, 1341.0, 195.0, 61.0, 28.0, 19.0, 19.0, 5.0, 9.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8271484375, -1.7616729736328125, -1.696197509765625, -1.6307220458984375, -1.56524658203125, -1.4997711181640625, -1.434295654296875, -1.3688201904296875, -1.3033447265625, -1.2378692626953125, -1.172393798828125, -1.1069183349609375, -1.04144287109375, -0.9759674072265625, -0.910491943359375, -0.8450164794921875, -0.779541015625, -0.7140655517578125, -0.648590087890625, -0.5831146240234375, -0.51763916015625, -0.4521636962890625, -0.386688232421875, -0.3212127685546875, -0.2557373046875, -0.1902618408203125, -0.124786376953125, -0.0593109130859375, 0.00616455078125, 0.0716400146484375, 0.137115478515625, 0.2025909423828125, 0.26806640625, 0.3335418701171875, 0.399017333984375, 0.4644927978515625, 0.52996826171875, 0.5954437255859375, 0.660919189453125, 0.7263946533203125, 0.7918701171875, 0.8573455810546875, 0.922821044921875, 0.9882965087890625, 1.05377197265625, 1.1192474365234375, 1.184722900390625, 1.2501983642578125, 1.315673828125, 1.3811492919921875, 1.446624755859375, 1.5121002197265625, 1.57757568359375, 1.6430511474609375, 1.708526611328125, 1.7740020751953125, 1.8394775390625, 1.9049530029296875, 1.970428466796875, 2.0359039306640625, 2.10137939453125, 2.1668548583984375, 2.232330322265625, 2.2978057861328125, 2.36328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 3.0, 14.0, 19.0, 17.0, 15.0, 34.0, 49.0, 62.0, 73.0, 86.0, 102.0, 92.0, 96.0, 89.0, 53.0, 34.0, 30.0, 29.0, 20.0, 17.0, 13.0, 6.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7544424533843994, -2.671036958694458, -2.5876314640045166, -2.504225969314575, -2.420820713043213, -2.3374152183532715, -2.25400972366333, -2.1706042289733887, -2.0871987342834473, -2.003793239593506, -1.9203877449035645, -1.8369823694229126, -1.7535768747329712, -1.6701713800430298, -1.586766004562378, -1.5033605098724365, -1.4199550151824951, -1.3365495204925537, -1.2531440258026123, -1.1697386503219604, -1.086333155632019, -1.0029276609420776, -0.919522225856781, -0.8361167907714844, -0.752711296081543, -0.6693058013916016, -0.5859003663063049, -0.5024949312210083, -0.4190894365310669, -0.3356839716434479, -0.25227850675582886, -0.16887307167053223, -0.08546781539916992, -0.0020623505115509033, 0.08134311437606812, 0.16474857926368713, 0.24815404415130615, 0.33155950903892517, 0.4149649739265442, 0.4983704090118408, 0.5817759037017822, 0.6651813983917236, 0.7485868334770203, 0.8319922685623169, 0.9153977632522583, 0.9988032579421997, 1.0822086334228516, 1.165614128112793, 1.2490196228027344, 1.3324251174926758, 1.4158306121826172, 1.499235987663269, 1.5826414823532104, 1.6660469770431519, 1.7494523525238037, 1.8328578472137451, 1.9162633419036865, 1.999668836593628, 2.0830743312835693, 2.1664798259735107, 2.249885082244873, 2.3332905769348145, 2.416696071624756, 2.5001015663146973, 2.5835070610046387]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 11.0, 7.0, 10.0, 11.0, 21.0, 19.0, 16.0, 27.0, 24.0, 32.0, 32.0, 36.0, 32.0, 42.0, 40.0, 56.0, 36.0, 52.0, 44.0, 47.0, 49.0, 35.0, 27.0, 35.0, 32.0, 36.0, 25.0, 29.0, 15.0, 23.0, 13.0, 21.0, 10.0, 6.0, 6.0, 10.0, 5.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1681621074676514, -2.1113107204437256, -2.054459571838379, -1.9976081848144531, -1.9407567977905273, -1.8839055299758911, -1.8270541429519653, -1.770202875137329, -1.7133514881134033, -1.656500220298767, -1.5996488332748413, -1.542797565460205, -1.4859461784362793, -1.429094910621643, -1.3722435235977173, -1.315392255783081, -1.2585408687591553, -1.201689600944519, -1.1448382139205933, -1.087986946105957, -1.0311355590820312, -0.974284291267395, -0.9174329042434692, -0.860581636428833, -0.8037303686141968, -0.7468790411949158, -0.6900277137756348, -0.6331763863563538, -0.5763250589370728, -0.5194737911224365, -0.46262243390083313, -0.4057711064815521, -0.34891974925994873, -0.2920684218406677, -0.23521709442138672, -0.1783657819032669, -0.1215144544839859, -0.06466314196586609, -0.007811814546585083, 0.04903951287269592, 0.10589084029197693, 0.16274216771125793, 0.21959349513053894, 0.27644479274749756, 0.33329612016677856, 0.39014744758605957, 0.4469987750053406, 0.5038501024246216, 0.5607014298439026, 0.6175527572631836, 0.6744040846824646, 0.7312554121017456, 0.7881067395210266, 0.8449580669403076, 0.9018093347549438, 0.9586607217788696, 1.0155119895935059, 1.072363257408142, 1.1292146444320679, 1.186065912246704, 1.2429172992706299, 1.2997685670852661, 1.356619954109192, 1.4134712219238281, 1.470322608947754]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 8.0, 10.0, 19.0, 28.0, 39.0, 61.0, 153.0, 363.0, 977.0, 2735.0, 9230.0, 40653.0, 384261.0, 541903.0, 51936.0, 11016.0, 3297.0, 1079.0, 405.0, 177.0, 69.0, 37.0, 19.0, 19.0, 10.0, 10.0, 5.0, 8.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3151092529296875, -1.269866943359375, -1.2246246337890625, -1.17938232421875, -1.1341400146484375, -1.088897705078125, -1.0436553955078125, -0.9984130859375, -0.9531707763671875, -0.907928466796875, -0.8626861572265625, -0.81744384765625, -0.7722015380859375, -0.726959228515625, -0.6817169189453125, -0.636474609375, -0.5912322998046875, -0.545989990234375, -0.5007476806640625, -0.45550537109375, -0.4102630615234375, -0.365020751953125, -0.3197784423828125, -0.2745361328125, -0.2292938232421875, -0.184051513671875, -0.1388092041015625, -0.09356689453125, -0.0483245849609375, -0.003082275390625, 0.0421600341796875, 0.08740234375, 0.1326446533203125, 0.177886962890625, 0.2231292724609375, 0.26837158203125, 0.3136138916015625, 0.358856201171875, 0.4040985107421875, 0.4493408203125, 0.4945831298828125, 0.539825439453125, 0.5850677490234375, 0.63031005859375, 0.6755523681640625, 0.720794677734375, 0.7660369873046875, 0.811279296875, 0.8565216064453125, 0.901763916015625, 0.9470062255859375, 0.99224853515625, 1.0374908447265625, 1.082733154296875, 1.1279754638671875, 1.1732177734375, 1.2184600830078125, 1.263702392578125, 1.3089447021484375, 1.35418701171875, 1.3994293212890625, 1.444671630859375, 1.4899139404296875, 1.53515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 17.0, 14.0, 19.0, 50.0, 29.0, 62.0, 71.0, 92.0, 97.0, 106.0, 102.0, 73.0, 81.0, 61.0, 36.0, 30.0, 26.0, 11.0, 15.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.5949554443359375, -1.513153076171875, -1.4313507080078125, -1.34954833984375, -1.2677459716796875, -1.185943603515625, -1.1041412353515625, -1.0223388671875, -0.9405364990234375, -0.858734130859375, -0.7769317626953125, -0.69512939453125, -0.6133270263671875, -0.531524658203125, -0.4497222900390625, -0.367919921875, -0.2861175537109375, -0.204315185546875, -0.1225128173828125, -0.04071044921875, 0.0410919189453125, 0.122894287109375, 0.2046966552734375, 0.2864990234375, 0.3683013916015625, 0.450103759765625, 0.5319061279296875, 0.61370849609375, 0.6955108642578125, 0.777313232421875, 0.8591156005859375, 0.94091796875, 1.0227203369140625, 1.104522705078125, 1.1863250732421875, 1.26812744140625, 1.3499298095703125, 1.431732177734375, 1.5135345458984375, 1.5953369140625, 1.6771392822265625, 1.758941650390625, 1.8407440185546875, 1.92254638671875, 2.0043487548828125, 2.086151123046875, 2.1679534912109375, 2.249755859375, 2.3315582275390625, 2.413360595703125, 2.4951629638671875, 2.57696533203125, 2.6587677001953125, 2.740570068359375, 2.8223724365234375, 2.9041748046875, 2.9859771728515625, 3.067779541015625, 3.1495819091796875, 3.23138427734375, 3.3131866455078125, 3.394989013671875, 3.4767913818359375, 3.55859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 10.0, 21.0, 25.0, 32.0, 43.0, 74.0, 105.0, 176.0, 224.0, 399.0, 642.0, 1000.0, 1943.0, 3658.0, 7585.0, 17788.0, 50204.0, 198266.0, 542977.0, 152395.0, 41458.0, 15293.0, 6662.0, 3343.0, 1669.0, 951.0, 568.0, 336.0, 236.0, 145.0, 95.0, 67.0, 41.0, 29.0, 17.0, 13.0, 19.0, 6.0, 5.0, 1.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.6484375, -0.6284332275390625, -0.608428955078125, -0.5884246826171875, -0.56842041015625, -0.5484161376953125, -0.528411865234375, -0.5084075927734375, -0.4884033203125, -0.4683990478515625, -0.448394775390625, -0.4283905029296875, -0.40838623046875, -0.3883819580078125, -0.368377685546875, -0.3483734130859375, -0.328369140625, -0.3083648681640625, -0.288360595703125, -0.2683563232421875, -0.24835205078125, -0.2283477783203125, -0.208343505859375, -0.1883392333984375, -0.1683349609375, -0.1483306884765625, -0.128326416015625, -0.1083221435546875, -0.08831787109375, -0.0683135986328125, -0.048309326171875, -0.0283050537109375, -0.00830078125, 0.0117034912109375, 0.031707763671875, 0.0517120361328125, 0.07171630859375, 0.0917205810546875, 0.111724853515625, 0.1317291259765625, 0.1517333984375, 0.1717376708984375, 0.191741943359375, 0.2117462158203125, 0.23175048828125, 0.2517547607421875, 0.271759033203125, 0.2917633056640625, 0.311767578125, 0.3317718505859375, 0.351776123046875, 0.3717803955078125, 0.39178466796875, 0.4117889404296875, 0.431793212890625, 0.4517974853515625, 0.4718017578125, 0.4918060302734375, 0.511810302734375, 0.5318145751953125, 0.55181884765625, 0.5718231201171875, 0.591827392578125, 0.6118316650390625, 0.6318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 20.0, 10.0, 12.0, 11.0, 15.0, 19.0, 20.0, 21.0, 27.0, 35.0, 45.0, 36.0, 44.0, 46.0, 55.0, 48.0, 56.0, 45.0, 42.0, 58.0, 47.0, 45.0, 32.0, 26.0, 27.0, 21.0, 28.0, 22.0, 12.0, 9.0, 8.0, 8.0, 12.0, 5.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4453125, -2.367218017578125, -2.28912353515625, -2.211029052734375, -2.1329345703125, -2.054840087890625, -1.97674560546875, -1.898651123046875, -1.820556640625, -1.742462158203125, -1.66436767578125, -1.586273193359375, -1.5081787109375, -1.430084228515625, -1.35198974609375, -1.273895263671875, -1.19580078125, -1.117706298828125, -1.03961181640625, -0.961517333984375, -0.8834228515625, -0.805328369140625, -0.72723388671875, -0.649139404296875, -0.571044921875, -0.492950439453125, -0.41485595703125, -0.336761474609375, -0.2586669921875, -0.180572509765625, -0.10247802734375, -0.024383544921875, 0.0537109375, 0.131805419921875, 0.20989990234375, 0.287994384765625, 0.3660888671875, 0.444183349609375, 0.52227783203125, 0.600372314453125, 0.678466796875, 0.756561279296875, 0.83465576171875, 0.912750244140625, 0.9908447265625, 1.068939208984375, 1.14703369140625, 1.225128173828125, 1.30322265625, 1.381317138671875, 1.45941162109375, 1.537506103515625, 1.6156005859375, 1.693695068359375, 1.77178955078125, 1.849884033203125, 1.927978515625, 2.006072998046875, 2.08416748046875, 2.162261962890625, 2.2403564453125, 2.318450927734375, 2.39654541015625, 2.474639892578125, 2.552734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 13.0, 23.0, 18.0, 38.0, 53.0, 121.0, 167.0, 276.0, 484.0, 1047.0, 2168.0, 4957.0, 13092.0, 46912.0, 423910.0, 480812.0, 50976.0, 13783.0, 5216.0, 2168.0, 1028.0, 544.0, 298.0, 157.0, 105.0, 58.0, 39.0, 27.0, 13.0, 9.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.1552448272705078, -0.14850234985351562, -0.14175987243652344, -0.13501739501953125, -0.12827491760253906, -0.12153244018554688, -0.11478996276855469, -0.1080474853515625, -0.10130500793457031, -0.09456253051757812, -0.08782005310058594, -0.08107757568359375, -0.07433509826660156, -0.06759262084960938, -0.06085014343261719, -0.054107666015625, -0.04736518859863281, -0.040622711181640625, -0.03388023376464844, -0.02713775634765625, -0.020395278930664062, -0.013652801513671875, -0.0069103240966796875, -0.0001678466796875, 0.0065746307373046875, 0.013317108154296875, 0.020059585571289062, 0.02680206298828125, 0.03354454040527344, 0.040287017822265625, 0.04702949523925781, 0.05377197265625, 0.06051445007324219, 0.06725692749023438, 0.07399940490722656, 0.08074188232421875, 0.08748435974121094, 0.09422683715820312, 0.10096931457519531, 0.1077117919921875, 0.11445426940917969, 0.12119674682617188, 0.12793922424316406, 0.13468170166015625, 0.14142417907714844, 0.14816665649414062, 0.1549091339111328, 0.161651611328125, 0.1683940887451172, 0.17513656616210938, 0.18187904357910156, 0.18862152099609375, 0.19536399841308594, 0.20210647583007812, 0.2088489532470703, 0.2155914306640625, 0.2223339080810547, 0.22907638549804688, 0.23581886291503906, 0.24256134033203125, 0.24930381774902344, 0.2560462951660156, 0.2627887725830078, 0.26953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 5.0, 5.0, 6.0, 15.0, 19.0, 13.0, 16.0, 35.0, 54.0, 66.0, 115.0, 160.0, 156.0, 116.0, 64.0, 37.0, 39.0, 22.0, 11.0, 7.0, 7.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00017189979553222656, -0.0001672450453042984, -0.00016259029507637024, -0.00015793554484844208, -0.00015328079462051392, -0.00014862604439258575, -0.0001439712941646576, -0.00013931654393672943, -0.00013466179370880127, -0.0001300070434808731, -0.00012535229325294495, -0.00012069754302501678, -0.00011604279279708862, -0.00011138804256916046, -0.0001067332923412323, -0.00010207854211330414, -9.742379188537598e-05, -9.276904165744781e-05, -8.811429142951965e-05, -8.345954120159149e-05, -7.880479097366333e-05, -7.415004074573517e-05, -6.949529051780701e-05, -6.484054028987885e-05, -6.0185790061950684e-05, -5.553103983402252e-05, -5.087628960609436e-05, -4.62215393781662e-05, -4.156678915023804e-05, -3.6912038922309875e-05, -3.2257288694381714e-05, -2.7602538466453552e-05, -2.294778823852539e-05, -1.829303801059723e-05, -1.3638287782669067e-05, -8.983537554740906e-06, -4.328787326812744e-06, 3.259629011154175e-07, 4.980713129043579e-06, 9.63546335697174e-06, 1.4290213584899902e-05, 1.8944963812828064e-05, 2.3599714040756226e-05, 2.8254464268684387e-05, 3.290921449661255e-05, 3.756396472454071e-05, 4.221871495246887e-05, 4.6873465180397034e-05, 5.1528215408325195e-05, 5.618296563625336e-05, 6.083771586418152e-05, 6.549246609210968e-05, 7.014721632003784e-05, 7.4801966547966e-05, 7.945671677589417e-05, 8.411146700382233e-05, 8.876621723175049e-05, 9.342096745967865e-05, 9.807571768760681e-05, 0.00010273046791553497, 0.00010738521814346313, 0.0001120399683713913, 0.00011669471859931946, 0.00012134946882724762, 0.00012600421905517578]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 17.0, 33.0, 120.0, 533.0, 4067.0, 129270.0, 901820.0, 11190.0, 1136.0, 222.0, 67.0, 27.0, 14.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6297378540039062, -0.6037139892578125, -0.5776901245117188, -0.551666259765625, -0.5256423950195312, -0.4996185302734375, -0.47359466552734375, -0.44757080078125, -0.42154693603515625, -0.3955230712890625, -0.36949920654296875, -0.343475341796875, -0.31745147705078125, -0.2914276123046875, -0.26540374755859375, -0.2393798828125, -0.21335601806640625, -0.1873321533203125, -0.16130828857421875, -0.135284423828125, -0.10926055908203125, -0.0832366943359375, -0.05721282958984375, -0.03118896484375, -0.00516510009765625, 0.0208587646484375, 0.04688262939453125, 0.072906494140625, 0.09893035888671875, 0.1249542236328125, 0.15097808837890625, 0.177001953125, 0.20302581787109375, 0.2290496826171875, 0.25507354736328125, 0.281097412109375, 0.30712127685546875, 0.3331451416015625, 0.35916900634765625, 0.38519287109375, 0.41121673583984375, 0.4372406005859375, 0.46326446533203125, 0.489288330078125, 0.5153121948242188, 0.5413360595703125, 0.5673599243164062, 0.5933837890625, 0.6194076538085938, 0.6454315185546875, 0.6714553833007812, 0.697479248046875, 0.7235031127929688, 0.7495269775390625, 0.7755508422851562, 0.80157470703125, 0.8275985717773438, 0.8536224365234375, 0.8796463012695312, 0.905670166015625, 0.9316940307617188, 0.9577178955078125, 0.9837417602539062, 1.009765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 10.0, 19.0, 17.0, 24.0, 37.0, 41.0, 52.0, 78.0, 85.0, 114.0, 114.0, 78.0, 74.0, 53.0, 41.0, 35.0, 24.0, 21.0, 9.0, 12.0, 11.0, 7.0, 8.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06536865234375, -0.06344318389892578, -0.06151771545410156, -0.059592247009277344, -0.057666778564453125, -0.055741310119628906, -0.05381584167480469, -0.05189037322998047, -0.04996490478515625, -0.04803943634033203, -0.04611396789550781, -0.044188499450683594, -0.042263031005859375, -0.040337562561035156, -0.03841209411621094, -0.03648662567138672, -0.0345611572265625, -0.03263568878173828, -0.030710220336914062, -0.028784751892089844, -0.026859283447265625, -0.024933815002441406, -0.023008346557617188, -0.02108287811279297, -0.01915740966796875, -0.01723194122314453, -0.015306472778320312, -0.013381004333496094, -0.011455535888671875, -0.009530067443847656, -0.0076045989990234375, -0.005679130554199219, -0.003753662109375, -0.0018281936645507812, 9.72747802734375e-05, 0.0020227432250976562, 0.003948211669921875, 0.005873680114746094, 0.0077991485595703125, 0.009724617004394531, 0.01165008544921875, 0.013575553894042969, 0.015501022338867188, 0.017426490783691406, 0.019351959228515625, 0.021277427673339844, 0.023202896118164062, 0.02512836456298828, 0.0270538330078125, 0.02897930145263672, 0.030904769897460938, 0.032830238342285156, 0.034755706787109375, 0.036681175231933594, 0.03860664367675781, 0.04053211212158203, 0.04245758056640625, 0.04438304901123047, 0.04630851745605469, 0.048233985900878906, 0.050159454345703125, 0.052084922790527344, 0.05401039123535156, 0.05593585968017578, 0.057861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 14.0, 17.0, 24.0, 60.0, 95.0, 237.0, 215.0, 154.0, 82.0, 47.0, 22.0, 14.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4313602447509766, -2.3174726963043213, -2.203585147857666, -2.0896973609924316, -1.975809931755066, -1.861922264099121, -1.7480347156524658, -1.6341471672058105, -1.5202596187591553, -1.4063720703125, -1.2924844026565552, -1.1785968542099, -1.0647093057632446, -0.9508216977119446, -0.8369340896606445, -0.7230465412139893, -0.6091588735580444, -0.4952712953090668, -0.3813837170600891, -0.26749610900878906, -0.1536085307598114, -0.03972095251083374, 0.07416665554046631, 0.18805420398712158, 0.30194181203842163, 0.4158293902873993, 0.529716968536377, 0.643604576587677, 0.757492184638977, 0.8713797330856323, 0.9852673411369324, 1.0991549491882324, 1.2130424976348877, 1.326930046081543, 1.4408177137374878, 1.554705262184143, 1.6685928106307983, 1.7824804782867432, 1.8963680267333984, 2.0102555751800537, 2.124143123626709, 2.2380306720733643, 2.3519182205200195, 2.465806007385254, 2.579693555831909, 2.6935811042785645, 2.8074686527252197, 2.921356201171875, 3.0352439880371094, 3.1491315364837646, 3.26301908493042, 3.3769068717956543, 3.4907944202423096, 3.604681968688965, 3.71856951713562, 3.8324570655822754, 3.9463446140289307, 4.060232162475586, 4.17411994934082, 4.2880072593688965, 4.401895046234131, 4.515782356262207, 4.629670143127441, 4.743557929992676, 4.857445240020752]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 14.0, 22.0, 18.0, 35.0, 42.0, 54.0, 61.0, 75.0, 83.0, 106.0, 115.0, 71.0, 77.0, 60.0, 52.0, 40.0, 26.0, 28.0, 12.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.684027075767517, -1.607417106628418, -1.5308072566986084, -1.4541972875595093, -1.3775873184204102, -1.3009774684906006, -1.2243674993515015, -1.1477575302124023, -1.0711476802825928, -0.9945377707481384, -0.9179278016090393, -0.841317892074585, -0.7647079229354858, -0.6880980134010315, -0.6114881038665771, -0.534878134727478, -0.4582681655883789, -0.3816582262516022, -0.30504828691482544, -0.2284383773803711, -0.15182843804359436, -0.07521849870681763, 0.0013914108276367188, 0.07800137996673584, 0.15461128950119019, 0.23122122883796692, 0.30783116817474365, 0.384441077709198, 0.46105101704597473, 0.5376609563827515, 0.6142708659172058, 0.6908808350563049, 0.7674908638000488, 0.8441007733345032, 0.9207107424736023, 0.9973206520080566, 1.0739306211471558, 1.1505405902862549, 1.2271504402160645, 1.3037604093551636, 1.3803703784942627, 1.4569803476333618, 1.5335901975631714, 1.6102001667022705, 1.6868101358413696, 1.7634201049804688, 1.8400299549102783, 1.9166399240493774, 1.993249773979187, 2.069859743118286, 2.1464695930480957, 2.2230796813964844, 2.299689531326294, 2.3762993812561035, 2.452909469604492, 2.5295193195343018, 2.6061291694641113, 2.682739019393921, 2.7593491077423096, 2.835958957672119, 2.9125688076019287, 2.9891788959503174, 3.065788745880127, 3.1423988342285156, 3.219008684158325]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 6.0, 15.0, 32.0, 85.0, 270.0, 739.0, 2174.0, 14801.0, 1011544.0, 15497.0, 2189.0, 765.0, 263.0, 97.0, 41.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.2578125, -8.9970703125, -8.736328125, -8.4755859375, -8.21484375, -7.9541015625, -7.693359375, -7.4326171875, -7.171875, -6.9111328125, -6.650390625, -6.3896484375, -6.12890625, -5.8681640625, -5.607421875, -5.3466796875, -5.0859375, -4.8251953125, -4.564453125, -4.3037109375, -4.04296875, -3.7822265625, -3.521484375, -3.2607421875, -3.0, -2.7392578125, -2.478515625, -2.2177734375, -1.95703125, -1.6962890625, -1.435546875, -1.1748046875, -0.9140625, -0.6533203125, -0.392578125, -0.1318359375, 0.12890625, 0.3896484375, 0.650390625, 0.9111328125, 1.171875, 1.4326171875, 1.693359375, 1.9541015625, 2.21484375, 2.4755859375, 2.736328125, 2.9970703125, 3.2578125, 3.5185546875, 3.779296875, 4.0400390625, 4.30078125, 4.5615234375, 4.822265625, 5.0830078125, 5.34375, 5.6044921875, 5.865234375, 6.1259765625, 6.38671875, 6.6474609375, 6.908203125, 7.1689453125, 7.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 17.0, 26.0, 35.0, 35.0, 55.0, 76.0, 108.0, 117.0, 104.0, 101.0, 94.0, 69.0, 55.0, 27.0, 37.0, 25.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.53021240234375, -2.3533935546875, -2.17657470703125, -1.999755859375, -1.82293701171875, -1.6461181640625, -1.46929931640625, -1.29248046875, -1.11566162109375, -0.9388427734375, -0.76202392578125, -0.585205078125, -0.40838623046875, -0.2315673828125, -0.05474853515625, 0.1220703125, 0.29888916015625, 0.4757080078125, 0.65252685546875, 0.829345703125, 1.00616455078125, 1.1829833984375, 1.35980224609375, 1.53662109375, 1.71343994140625, 1.8902587890625, 2.06707763671875, 2.243896484375, 2.42071533203125, 2.5975341796875, 2.77435302734375, 2.951171875, 3.12799072265625, 3.3048095703125, 3.48162841796875, 3.658447265625, 3.83526611328125, 4.0120849609375, 4.18890380859375, 4.36572265625, 4.54254150390625, 4.7193603515625, 4.89617919921875, 5.072998046875, 5.24981689453125, 5.4266357421875, 5.60345458984375, 5.7802734375, 5.95709228515625, 6.1339111328125, 6.31072998046875, 6.487548828125, 6.66436767578125, 6.8411865234375, 7.01800537109375, 7.19482421875, 7.37164306640625, 7.5484619140625, 7.72528076171875, 7.902099609375, 8.07891845703125, 8.2557373046875, 8.43255615234375, 8.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 11.0, 12.0, 14.0, 31.0, 51.0, 51.0, 92.0, 182.0, 423.0, 1178.0, 4959.0, 971537.0, 65308.0, 3168.0, 821.0, 304.0, 119.0, 70.0, 45.0, 34.0, 24.0, 25.0, 11.0, 14.0, 9.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.8861083984375, -7.592529296875, -7.2989501953125, -7.00537109375, -6.7117919921875, -6.418212890625, -6.1246337890625, -5.8310546875, -5.5374755859375, -5.243896484375, -4.9503173828125, -4.65673828125, -4.3631591796875, -4.069580078125, -3.7760009765625, -3.482421875, -3.1888427734375, -2.895263671875, -2.6016845703125, -2.30810546875, -2.0145263671875, -1.720947265625, -1.4273681640625, -1.1337890625, -0.8402099609375, -0.546630859375, -0.2530517578125, 0.04052734375, 0.3341064453125, 0.627685546875, 0.9212646484375, 1.21484375, 1.5084228515625, 1.802001953125, 2.0955810546875, 2.38916015625, 2.6827392578125, 2.976318359375, 3.2698974609375, 3.5634765625, 3.8570556640625, 4.150634765625, 4.4442138671875, 4.73779296875, 5.0313720703125, 5.324951171875, 5.6185302734375, 5.912109375, 6.2056884765625, 6.499267578125, 6.7928466796875, 7.08642578125, 7.3800048828125, 7.673583984375, 7.9671630859375, 8.2607421875, 8.5543212890625, 8.847900390625, 9.1414794921875, 9.43505859375, 9.7286376953125, 10.022216796875, 10.3157958984375, 10.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 9.0, 6.0, 9.0, 9.0, 12.0, 15.0, 31.0, 23.0, 36.0, 44.0, 46.0, 53.0, 62.0, 54.0, 66.0, 53.0, 57.0, 58.0, 48.0, 53.0, 55.0, 34.0, 28.0, 25.0, 21.0, 13.0, 21.0, 7.0, 14.0, 8.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.658416748046875, -2.55316162109375, -2.447906494140625, -2.3426513671875, -2.237396240234375, -2.13214111328125, -2.026885986328125, -1.921630859375, -1.816375732421875, -1.71112060546875, -1.605865478515625, -1.5006103515625, -1.395355224609375, -1.29010009765625, -1.184844970703125, -1.07958984375, -0.974334716796875, -0.86907958984375, -0.763824462890625, -0.6585693359375, -0.553314208984375, -0.44805908203125, -0.342803955078125, -0.237548828125, -0.132293701171875, -0.02703857421875, 0.078216552734375, 0.1834716796875, 0.288726806640625, 0.39398193359375, 0.499237060546875, 0.6044921875, 0.709747314453125, 0.81500244140625, 0.920257568359375, 1.0255126953125, 1.130767822265625, 1.23602294921875, 1.341278076171875, 1.446533203125, 1.551788330078125, 1.65704345703125, 1.762298583984375, 1.8675537109375, 1.972808837890625, 2.07806396484375, 2.183319091796875, 2.28857421875, 2.393829345703125, 2.49908447265625, 2.604339599609375, 2.7095947265625, 2.814849853515625, 2.92010498046875, 3.025360107421875, 3.130615234375, 3.235870361328125, 3.34112548828125, 3.446380615234375, 3.5516357421875, 3.656890869140625, 3.76214599609375, 3.867401123046875, 3.97265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 8.0, 5.0, 12.0, 7.0, 15.0, 20.0, 40.0, 74.0, 244.0, 1425.0, 13914.0, 981718.0, 47442.0, 2943.0, 429.0, 99.0, 47.0, 21.0, 20.0, 8.0, 13.0, 4.0, 5.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9833984375, -1.9278106689453125, -1.872222900390625, -1.8166351318359375, -1.76104736328125, -1.7054595947265625, -1.649871826171875, -1.5942840576171875, -1.5386962890625, -1.4831085205078125, -1.427520751953125, -1.3719329833984375, -1.31634521484375, -1.2607574462890625, -1.205169677734375, -1.1495819091796875, -1.093994140625, -1.0384063720703125, -0.982818603515625, -0.9272308349609375, -0.87164306640625, -0.8160552978515625, -0.760467529296875, -0.7048797607421875, -0.6492919921875, -0.5937042236328125, -0.538116455078125, -0.4825286865234375, -0.42694091796875, -0.3713531494140625, -0.315765380859375, -0.2601776123046875, -0.20458984375, -0.1490020751953125, -0.093414306640625, -0.0378265380859375, 0.01776123046875, 0.0733489990234375, 0.128936767578125, 0.1845245361328125, 0.2401123046875, 0.2957000732421875, 0.351287841796875, 0.4068756103515625, 0.46246337890625, 0.5180511474609375, 0.573638916015625, 0.6292266845703125, 0.684814453125, 0.7404022216796875, 0.795989990234375, 0.8515777587890625, 0.90716552734375, 0.9627532958984375, 1.018341064453125, 1.0739288330078125, 1.1295166015625, 1.1851043701171875, 1.240692138671875, 1.2962799072265625, 1.35186767578125, 1.4074554443359375, 1.463043212890625, 1.5186309814453125, 1.57421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 9.0, 12.0, 10.0, 12.0, 16.0, 23.0, 40.0, 66.0, 210.0, 321.0, 121.0, 57.0, 31.0, 18.0, 14.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.465217590332031e-05, -9.140651673078537e-05, -8.816085755825043e-05, -8.491519838571548e-05, -8.166953921318054e-05, -7.84238800406456e-05, -7.517822086811066e-05, -7.193256169557571e-05, -6.868690252304077e-05, -6.544124335050583e-05, -6.219558417797089e-05, -5.8949925005435944e-05, -5.5704265832901e-05, -5.245860666036606e-05, -4.9212947487831116e-05, -4.596728831529617e-05, -4.272162914276123e-05, -3.947596997022629e-05, -3.6230310797691345e-05, -3.29846516251564e-05, -2.973899245262146e-05, -2.6493333280086517e-05, -2.3247674107551575e-05, -2.0002014935016632e-05, -1.675635576248169e-05, -1.3510696589946747e-05, -1.0265037417411804e-05, -7.0193782448768616e-06, -3.773719072341919e-06, -5.280598998069763e-07, 2.7175992727279663e-06, 5.963258445262909e-06, 9.208917617797852e-06, 1.2454576790332794e-05, 1.5700235962867737e-05, 1.894589513540268e-05, 2.2191554307937622e-05, 2.5437213480472565e-05, 2.8682872653007507e-05, 3.192853182554245e-05, 3.517419099807739e-05, 3.8419850170612335e-05, 4.166550934314728e-05, 4.491116851568222e-05, 4.815682768821716e-05, 5.1402486860752106e-05, 5.464814603328705e-05, 5.789380520582199e-05, 6.113946437835693e-05, 6.438512355089188e-05, 6.763078272342682e-05, 7.087644189596176e-05, 7.41221010684967e-05, 7.736776024103165e-05, 8.061341941356659e-05, 8.385907858610153e-05, 8.710473775863647e-05, 9.035039693117142e-05, 9.359605610370636e-05, 9.68417152762413e-05, 0.00010008737444877625, 0.00010333303362131119, 0.00010657869279384613, 0.00010982435196638107, 0.00011307001113891602]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 12.0, 8.0, 15.0, 20.0, 32.0, 65.0, 150.0, 404.0, 1385.0, 8625.0, 258555.0, 765219.0, 11493.0, 1784.0, 454.0, 137.0, 60.0, 39.0, 23.0, 19.0, 8.0, 6.0, 3.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.989166259765625, -0.94805908203125, -0.906951904296875, -0.8658447265625, -0.824737548828125, -0.78363037109375, -0.742523193359375, -0.701416015625, -0.660308837890625, -0.61920166015625, -0.578094482421875, -0.5369873046875, -0.495880126953125, -0.45477294921875, -0.413665771484375, -0.37255859375, -0.331451416015625, -0.29034423828125, -0.249237060546875, -0.2081298828125, -0.167022705078125, -0.12591552734375, -0.084808349609375, -0.043701171875, -0.002593994140625, 0.03851318359375, 0.079620361328125, 0.1207275390625, 0.161834716796875, 0.20294189453125, 0.244049072265625, 0.28515625, 0.326263427734375, 0.36737060546875, 0.408477783203125, 0.4495849609375, 0.490692138671875, 0.53179931640625, 0.572906494140625, 0.614013671875, 0.655120849609375, 0.69622802734375, 0.737335205078125, 0.7784423828125, 0.819549560546875, 0.86065673828125, 0.901763916015625, 0.94287109375, 0.983978271484375, 1.02508544921875, 1.066192626953125, 1.1072998046875, 1.148406982421875, 1.18951416015625, 1.230621337890625, 1.271728515625, 1.312835693359375, 1.35394287109375, 1.395050048828125, 1.4361572265625, 1.477264404296875, 1.51837158203125, 1.559478759765625, 1.6005859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 12.0, 18.0, 19.0, 22.0, 31.0, 32.0, 53.0, 95.0, 179.0, 201.0, 97.0, 54.0, 31.0, 34.0, 20.0, 18.0, 9.0, 13.0, 7.0, 11.0, 2.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.267822265625, -0.2609672546386719, -0.25411224365234375, -0.24725723266601562, -0.2404022216796875, -0.23354721069335938, -0.22669219970703125, -0.21983718872070312, -0.212982177734375, -0.20612716674804688, -0.19927215576171875, -0.19241714477539062, -0.1855621337890625, -0.17870712280273438, -0.17185211181640625, -0.16499710083007812, -0.15814208984375, -0.15128707885742188, -0.14443206787109375, -0.13757705688476562, -0.1307220458984375, -0.12386703491210938, -0.11701202392578125, -0.11015701293945312, -0.103302001953125, -0.09644699096679688, -0.08959197998046875, -0.08273696899414062, -0.0758819580078125, -0.06902694702148438, -0.06217193603515625, -0.055316925048828125, -0.0484619140625, -0.041606903076171875, -0.03475189208984375, -0.027896881103515625, -0.0210418701171875, -0.014186859130859375, -0.00733184814453125, -0.000476837158203125, 0.006378173828125, 0.013233184814453125, 0.02008819580078125, 0.026943206787109375, 0.0337982177734375, 0.040653228759765625, 0.04750823974609375, 0.054363250732421875, 0.06121826171875, 0.06807327270507812, 0.07492828369140625, 0.08178329467773438, 0.0886383056640625, 0.09549331665039062, 0.10234832763671875, 0.10920333862304688, 0.116058349609375, 0.12291336059570312, 0.12976837158203125, 0.13662338256835938, 0.1434783935546875, 0.15033340454101562, 0.15718841552734375, 0.16404342651367188, 0.1708984375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 34.0, 186.0, 633.0, 135.0, 22.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.469989061355591, -1.7525253295898438, -1.0350614786148071, -0.3175976276397705, 0.39986610412597656, 1.1173298358917236, 1.8347938060760498, 2.5522572994232178, 3.269721269607544, 3.987185001373291, 4.704648971557617, 5.422112464904785, 6.139576435089111, 6.8570404052734375, 7.5745038986206055, 8.291967391967773, 9.009431838989258, 9.726895332336426, 10.44435977935791, 11.161823272705078, 11.879286766052246, 12.596750259399414, 13.314214706420898, 14.031678199768066, 14.749141693115234, 15.466605186462402, 16.18406867980957, 16.901533126831055, 17.61899757385254, 18.33646011352539, 19.053924560546875, 19.77138900756836, 20.48885154724121, 21.206315994262695, 21.923778533935547, 22.64124298095703, 23.358707427978516, 24.076169967651367, 24.79363441467285, 25.511096954345703, 26.228561401367188, 26.946025848388672, 27.663488388061523, 28.380952835083008, 29.098417282104492, 29.815879821777344, 30.533344268798828, 31.250808715820312, 31.968273162841797, 32.68573760986328, 33.403202056884766, 34.12066650390625, 34.83812713623047, 35.55559158325195, 36.27305603027344, 36.99052047729492, 37.70798110961914, 38.425445556640625, 39.14291000366211, 39.860374450683594, 40.57783508300781, 41.2952995300293, 42.01276397705078, 42.730228424072266, 43.44769287109375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 13.0, 17.0, 16.0, 27.0, 39.0, 42.0, 50.0, 56.0, 41.0, 78.0, 65.0, 58.0, 49.0, 49.0, 56.0, 48.0, 43.0, 46.0, 31.0, 36.0, 43.0, 23.0, 19.0, 14.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7473456859588623, -3.5792205333709717, -3.411095142364502, -3.2429699897766113, -3.0748448371887207, -2.90671968460083, -2.7385945320129395, -2.5704691410064697, -2.402343988418579, -2.2342188358306885, -2.0660934448242188, -1.8979682922363281, -1.7298431396484375, -1.5617179870605469, -1.3935927152633667, -1.2254674434661865, -1.057342290878296, -0.8892170786857605, -0.7210918664932251, -0.5529666543006897, -0.3848414421081543, -0.2167162299156189, -0.048591017723083496, 0.11953425407409668, 0.2876594066619873, 0.4557846188545227, 0.6239098310470581, 0.7920350432395935, 0.9601602554321289, 1.1282854080200195, 1.2964106798171997, 1.4645359516143799, 1.6326613426208496, 1.8007864952087402, 1.9689117670059204, 2.1370370388031006, 2.305162191390991, 2.473287343978882, 2.6414127349853516, 2.809537887573242, 2.977663040161133, 3.1457881927490234, 3.313913345336914, 3.482038736343384, 3.6501638889312744, 3.818289041519165, 3.9864144325256348, 4.154539585113525, 4.322664737701416, 4.490789890289307, 4.658915042877197, 4.827040195465088, 4.995165824890137, 5.163290977478027, 5.331416130065918, 5.499541282653809, 5.667666435241699, 5.83579158782959, 6.0039167404174805, 6.172041893005371, 6.340167045593262, 6.5082926750183105, 6.676417827606201, 6.844542980194092, 7.012668132781982]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 5.0, 8.0, 11.0, 20.0, 31.0, 46.0, 56.0, 83.0, 84.0, 143.0, 220.0, 369.0, 588.0, 1142.0, 3074.0, 12078.0, 847305.0, 3294529.0, 26550.0, 4348.0, 1555.0, 774.0, 394.0, 253.0, 173.0, 129.0, 83.0, 63.0, 41.0, 26.0, 17.0, 18.0, 15.0, 13.0, 6.0, 11.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.29608154296875, -6.1116943359375, -5.92730712890625, -5.742919921875, -5.55853271484375, -5.3741455078125, -5.18975830078125, -5.00537109375, -4.82098388671875, -4.6365966796875, -4.45220947265625, -4.267822265625, -4.08343505859375, -3.8990478515625, -3.71466064453125, -3.5302734375, -3.34588623046875, -3.1614990234375, -2.97711181640625, -2.792724609375, -2.60833740234375, -2.4239501953125, -2.23956298828125, -2.05517578125, -1.87078857421875, -1.6864013671875, -1.50201416015625, -1.317626953125, -1.13323974609375, -0.9488525390625, -0.76446533203125, -0.580078125, -0.39569091796875, -0.2113037109375, -0.02691650390625, 0.157470703125, 0.34185791015625, 0.5262451171875, 0.71063232421875, 0.89501953125, 1.07940673828125, 1.2637939453125, 1.44818115234375, 1.632568359375, 1.81695556640625, 2.0013427734375, 2.18572998046875, 2.3701171875, 2.55450439453125, 2.7388916015625, 2.92327880859375, 3.107666015625, 3.29205322265625, 3.4764404296875, 3.66082763671875, 3.84521484375, 4.02960205078125, 4.2139892578125, 4.39837646484375, 4.582763671875, 4.76715087890625, 4.9515380859375, 5.13592529296875, 5.3203125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 6.0, 12.0, 10.0, 10.0, 30.0, 13.0, 27.0, 31.0, 34.0, 26.0, 40.0, 55.0, 58.0, 55.0, 60.0, 62.0, 67.0, 43.0, 54.0, 47.0, 47.0, 33.0, 25.0, 31.0, 22.0, 28.0, 11.0, 8.0, 12.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9716796875, -1.9201812744140625, -1.868682861328125, -1.8171844482421875, -1.76568603515625, -1.7141876220703125, -1.662689208984375, -1.6111907958984375, -1.5596923828125, -1.5081939697265625, -1.456695556640625, -1.4051971435546875, -1.35369873046875, -1.3022003173828125, -1.250701904296875, -1.1992034912109375, -1.147705078125, -1.0962066650390625, -1.044708251953125, -0.9932098388671875, -0.94171142578125, -0.8902130126953125, -0.838714599609375, -0.7872161865234375, -0.7357177734375, -0.6842193603515625, -0.632720947265625, -0.5812225341796875, -0.52972412109375, -0.4782257080078125, -0.426727294921875, -0.3752288818359375, -0.32373046875, -0.2722320556640625, -0.220733642578125, -0.1692352294921875, -0.11773681640625, -0.0662384033203125, -0.014739990234375, 0.0367584228515625, 0.0882568359375, 0.1397552490234375, 0.191253662109375, 0.2427520751953125, 0.29425048828125, 0.3457489013671875, 0.397247314453125, 0.4487457275390625, 0.500244140625, 0.5517425537109375, 0.603240966796875, 0.6547393798828125, 0.70623779296875, 0.7577362060546875, 0.809234619140625, 0.8607330322265625, 0.9122314453125, 0.9637298583984375, 1.015228271484375, 1.0667266845703125, 1.11822509765625, 1.1697235107421875, 1.221221923828125, 1.2727203369140625, 1.32421875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 10.0, 6.0, 15.0, 9.0, 22.0, 28.0, 43.0, 77.0, 162.0, 302.0, 941.0, 3852.0, 35359.0, 4094043.0, 52897.0, 4643.0, 1094.0, 339.0, 158.0, 93.0, 36.0, 34.0, 24.0, 19.0, 15.0, 6.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.96484375, -7.7408447265625, -7.516845703125, -7.2928466796875, -7.06884765625, -6.8448486328125, -6.620849609375, -6.3968505859375, -6.1728515625, -5.9488525390625, -5.724853515625, -5.5008544921875, -5.27685546875, -5.0528564453125, -4.828857421875, -4.6048583984375, -4.380859375, -4.1568603515625, -3.932861328125, -3.7088623046875, -3.48486328125, -3.2608642578125, -3.036865234375, -2.8128662109375, -2.5888671875, -2.3648681640625, -2.140869140625, -1.9168701171875, -1.69287109375, -1.4688720703125, -1.244873046875, -1.0208740234375, -0.796875, -0.5728759765625, -0.348876953125, -0.1248779296875, 0.09912109375, 0.3231201171875, 0.547119140625, 0.7711181640625, 0.9951171875, 1.2191162109375, 1.443115234375, 1.6671142578125, 1.89111328125, 2.1151123046875, 2.339111328125, 2.5631103515625, 2.787109375, 3.0111083984375, 3.235107421875, 3.4591064453125, 3.68310546875, 3.9071044921875, 4.131103515625, 4.3551025390625, 4.5791015625, 4.8031005859375, 5.027099609375, 5.2510986328125, 5.47509765625, 5.6990966796875, 5.923095703125, 6.1470947265625, 6.37109375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 4.0, 10.0, 13.0, 15.0, 16.0, 33.0, 51.0, 91.0, 182.0, 491.0, 1129.0, 1121.0, 487.0, 174.0, 87.0, 37.0, 33.0, 21.0, 13.0, 8.0, 14.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9853515625, -0.9563369750976562, -0.9273223876953125, -0.8983078002929688, -0.869293212890625, -0.8402786254882812, -0.8112640380859375, -0.7822494506835938, -0.75323486328125, -0.7242202758789062, -0.6952056884765625, -0.6661911010742188, -0.637176513671875, -0.6081619262695312, -0.5791473388671875, -0.5501327514648438, -0.5211181640625, -0.49210357666015625, -0.4630889892578125, -0.43407440185546875, -0.405059814453125, -0.37604522705078125, -0.3470306396484375, -0.31801605224609375, -0.28900146484375, -0.25998687744140625, -0.2309722900390625, -0.20195770263671875, -0.172943115234375, -0.14392852783203125, -0.1149139404296875, -0.08589935302734375, -0.056884765625, -0.02787017822265625, 0.0011444091796875, 0.03015899658203125, 0.059173583984375, 0.08818817138671875, 0.1172027587890625, 0.14621734619140625, 0.17523193359375, 0.20424652099609375, 0.2332611083984375, 0.26227569580078125, 0.291290283203125, 0.32030487060546875, 0.3493194580078125, 0.37833404541015625, 0.4073486328125, 0.43636322021484375, 0.4653778076171875, 0.49439239501953125, 0.523406982421875, 0.5524215698242188, 0.5814361572265625, 0.6104507446289062, 0.63946533203125, 0.6684799194335938, 0.6974945068359375, 0.7265090942382812, 0.755523681640625, 0.7845382690429688, 0.8135528564453125, 0.8425674438476562, 0.87158203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 7.0, 22.0, 29.0, 52.0, 91.0, 107.0, 120.0, 165.0, 132.0, 77.0, 62.0, 39.0, 24.0, 18.0, 7.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.905581474304199, -3.803659677505493, -3.701737880706787, -3.59981632232666, -3.497894525527954, -3.395972728729248, -3.294050931930542, -3.192129135131836, -3.090207576751709, -2.988285779953003, -2.886363983154297, -2.78444242477417, -2.682520627975464, -2.580598831176758, -2.4786770343780518, -2.3767552375793457, -2.2748334407806396, -2.1729116439819336, -2.0709898471832275, -1.969068169593811, -1.8671464920043945, -1.7652246952056885, -1.6633028984069824, -1.5613811016082764, -1.4594594240188599, -1.3575376272201538, -1.2556159496307373, -1.1536941528320312, -1.0517723560333252, -0.9498506784439087, -0.8479288816452026, -0.7460071444511414, -0.6440856456756592, -0.5421639084815979, -0.44024214148521423, -0.33832037448883057, -0.2363986372947693, -0.134476900100708, -0.03255510330200195, 0.06936663389205933, 0.1712883710861206, 0.2732101082801819, 0.37513187527656555, 0.4770536422729492, 0.5789753794670105, 0.6808971166610718, 0.7828189134597778, 0.8847406506538391, 0.9866623878479004, 1.0885841846466064, 1.190505862236023, 1.292427659034729, 1.3943493366241455, 1.4962711334228516, 1.5981929302215576, 1.7001147270202637, 1.8020364046096802, 1.9039582014083862, 2.0058798789978027, 2.107801675796509, 2.209723472595215, 2.311645030975342, 2.413567066192627, 2.515488624572754, 2.61741042137146]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 1.0, 6.0, 14.0, 23.0, 18.0, 22.0, 28.0, 30.0, 38.0, 45.0, 41.0, 51.0, 57.0, 51.0, 62.0, 59.0, 53.0, 61.0, 51.0, 59.0, 42.0, 31.0, 26.0, 28.0, 26.0, 13.0, 9.0, 14.0, 9.0, 8.0, 8.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.178774833679199, -2.117802858352661, -2.056831121444702, -1.9958592653274536, -1.934887409210205, -1.873915433883667, -1.8129435777664185, -1.75197172164917, -1.6909998655319214, -1.6300280094146729, -1.5690561532974243, -1.5080842971801758, -1.4471123218536377, -1.3861405849456787, -1.3251686096191406, -1.264196753501892, -1.2032248973846436, -1.142253041267395, -1.0812811851501465, -1.020309329032898, -0.9593374133110046, -0.8983655571937561, -0.8373936414718628, -0.7764217853546143, -0.7154499292373657, -0.6544780731201172, -0.5935062170028687, -0.5325343012809753, -0.4715624451637268, -0.41059058904647827, -0.34961870312690735, -0.2886468172073364, -0.22767508029937744, -0.1667032092809677, -0.10573133826255798, -0.044759467244148254, 0.016212403774261475, 0.07718425989151001, 0.13815614581108093, 0.19912803173065186, 0.2600998878479004, 0.3210717439651489, 0.38204362988471985, 0.44301551580429077, 0.5039873719215393, 0.5649592280387878, 0.6259311437606812, 0.6869029998779297, 0.7478748559951782, 0.8088467121124268, 0.8698185682296753, 0.9307904839515686, 0.9917623400688171, 1.052734136581421, 1.113706111907959, 1.1746779680252075, 1.235649824142456, 1.2966216802597046, 1.3575935363769531, 1.4185653924942017, 1.4795372486114502, 1.5405092239379883, 1.6014810800552368, 1.6624529361724854, 1.7234247922897339]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 13.0, 8.0, 7.0, 12.0, 9.0, 14.0, 22.0, 27.0, 61.0, 150.0, 373.0, 1375.0, 6529.0, 45116.0, 869081.0, 110698.0, 11702.0, 2314.0, 575.0, 206.0, 81.0, 34.0, 27.0, 19.0, 19.0, 9.0, 5.0, 13.0, 4.0, 6.0, 4.0, 5.0, 0.0, 1.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.10546875, -2.041015625, -1.9765625, -1.912109375, -1.84765625, -1.783203125, -1.71875, -1.654296875, -1.58984375, -1.525390625, -1.4609375, -1.396484375, -1.33203125, -1.267578125, -1.203125, -1.138671875, -1.07421875, -1.009765625, -0.9453125, -0.880859375, -0.81640625, -0.751953125, -0.6875, -0.623046875, -0.55859375, -0.494140625, -0.4296875, -0.365234375, -0.30078125, -0.236328125, -0.171875, -0.107421875, -0.04296875, 0.021484375, 0.0859375, 0.150390625, 0.21484375, 0.279296875, 0.34375, 0.408203125, 0.47265625, 0.537109375, 0.6015625, 0.666015625, 0.73046875, 0.794921875, 0.859375, 0.923828125, 0.98828125, 1.052734375, 1.1171875, 1.181640625, 1.24609375, 1.310546875, 1.375, 1.439453125, 1.50390625, 1.568359375, 1.6328125, 1.697265625, 1.76171875, 1.826171875, 1.890625, 1.955078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 21.0, 50.0, 69.0, 83.0, 109.0, 147.0, 121.0, 139.0, 106.0, 67.0, 32.0, 20.0, 13.0, 11.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6845703125, -1.6005096435546875, -1.516448974609375, -1.4323883056640625, -1.34832763671875, -1.2642669677734375, -1.180206298828125, -1.0961456298828125, -1.0120849609375, -0.9280242919921875, -0.843963623046875, -0.7599029541015625, -0.67584228515625, -0.5917816162109375, -0.507720947265625, -0.4236602783203125, -0.339599609375, -0.2555389404296875, -0.171478271484375, -0.0874176025390625, -0.00335693359375, 0.0807037353515625, 0.164764404296875, 0.2488250732421875, 0.3328857421875, 0.4169464111328125, 0.501007080078125, 0.5850677490234375, 0.66912841796875, 0.7531890869140625, 0.837249755859375, 0.9213104248046875, 1.00537109375, 1.0894317626953125, 1.173492431640625, 1.2575531005859375, 1.34161376953125, 1.4256744384765625, 1.509735107421875, 1.5937957763671875, 1.6778564453125, 1.7619171142578125, 1.845977783203125, 1.9300384521484375, 2.01409912109375, 2.0981597900390625, 2.182220458984375, 2.2662811279296875, 2.350341796875, 2.4344024658203125, 2.518463134765625, 2.6025238037109375, 2.68658447265625, 2.7706451416015625, 2.854705810546875, 2.9387664794921875, 3.0228271484375, 3.1068878173828125, 3.190948486328125, 3.2750091552734375, 3.35906982421875, 3.4431304931640625, 3.527191162109375, 3.6112518310546875, 3.6953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 6.0, 13.0, 26.0, 33.0, 55.0, 108.0, 194.0, 283.0, 467.0, 888.0, 1692.0, 3450.0, 7705.0, 18884.0, 57623.0, 342602.0, 499653.0, 74893.0, 22619.0, 8974.0, 4054.0, 1952.0, 1006.0, 555.0, 311.0, 178.0, 123.0, 76.0, 48.0, 30.0, 14.0, 12.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.49554443359375, -0.4779052734375, -0.46026611328125, -0.442626953125, -0.42498779296875, -0.4073486328125, -0.38970947265625, -0.3720703125, -0.35443115234375, -0.3367919921875, -0.31915283203125, -0.301513671875, -0.28387451171875, -0.2662353515625, -0.24859619140625, -0.23095703125, -0.21331787109375, -0.1956787109375, -0.17803955078125, -0.160400390625, -0.14276123046875, -0.1251220703125, -0.10748291015625, -0.08984375, -0.07220458984375, -0.0545654296875, -0.03692626953125, -0.019287109375, -0.00164794921875, 0.0159912109375, 0.03363037109375, 0.05126953125, 0.06890869140625, 0.0865478515625, 0.10418701171875, 0.121826171875, 0.13946533203125, 0.1571044921875, 0.17474365234375, 0.1923828125, 0.21002197265625, 0.2276611328125, 0.24530029296875, 0.262939453125, 0.28057861328125, 0.2982177734375, 0.31585693359375, 0.33349609375, 0.35113525390625, 0.3687744140625, 0.38641357421875, 0.404052734375, 0.42169189453125, 0.4393310546875, 0.45697021484375, 0.474609375, 0.49224853515625, 0.5098876953125, 0.52752685546875, 0.545166015625, 0.56280517578125, 0.5804443359375, 0.59808349609375, 0.61572265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 14.0, 6.0, 8.0, 17.0, 17.0, 20.0, 15.0, 32.0, 40.0, 28.0, 38.0, 41.0, 46.0, 56.0, 48.0, 59.0, 53.0, 63.0, 52.0, 50.0, 44.0, 32.0, 49.0, 35.0, 20.0, 14.0, 19.0, 16.0, 9.0, 13.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8896484375, -1.8306121826171875, -1.771575927734375, -1.7125396728515625, -1.65350341796875, -1.5944671630859375, -1.535430908203125, -1.4763946533203125, -1.4173583984375, -1.3583221435546875, -1.299285888671875, -1.2402496337890625, -1.18121337890625, -1.1221771240234375, -1.063140869140625, -1.0041046142578125, -0.945068359375, -0.8860321044921875, -0.826995849609375, -0.7679595947265625, -0.70892333984375, -0.6498870849609375, -0.590850830078125, -0.5318145751953125, -0.4727783203125, -0.4137420654296875, -0.354705810546875, -0.2956695556640625, -0.23663330078125, -0.1775970458984375, -0.118560791015625, -0.0595245361328125, -0.00048828125, 0.0585479736328125, 0.117584228515625, 0.1766204833984375, 0.23565673828125, 0.2946929931640625, 0.353729248046875, 0.4127655029296875, 0.4718017578125, 0.5308380126953125, 0.589874267578125, 0.6489105224609375, 0.70794677734375, 0.7669830322265625, 0.826019287109375, 0.8850555419921875, 0.944091796875, 1.0031280517578125, 1.062164306640625, 1.1212005615234375, 1.18023681640625, 1.2392730712890625, 1.298309326171875, 1.3573455810546875, 1.4163818359375, 1.4754180908203125, 1.534454345703125, 1.5934906005859375, 1.65252685546875, 1.7115631103515625, 1.770599365234375, 1.8296356201171875, 1.888671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 8.0, 16.0, 31.0, 37.0, 63.0, 106.0, 156.0, 286.0, 596.0, 1201.0, 2601.0, 7436.0, 25906.0, 168115.0, 743987.0, 73165.0, 15769.0, 5096.0, 1961.0, 868.0, 465.0, 243.0, 163.0, 83.0, 53.0, 39.0, 23.0, 23.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.149505615234375, -0.14422607421875, -0.138946533203125, -0.1336669921875, -0.128387451171875, -0.12310791015625, -0.117828369140625, -0.112548828125, -0.107269287109375, -0.10198974609375, -0.096710205078125, -0.0914306640625, -0.086151123046875, -0.08087158203125, -0.075592041015625, -0.0703125, -0.065032958984375, -0.05975341796875, -0.054473876953125, -0.0491943359375, -0.043914794921875, -0.03863525390625, -0.033355712890625, -0.028076171875, -0.022796630859375, -0.01751708984375, -0.012237548828125, -0.0069580078125, -0.001678466796875, 0.00360107421875, 0.008880615234375, 0.01416015625, 0.019439697265625, 0.02471923828125, 0.029998779296875, 0.0352783203125, 0.040557861328125, 0.04583740234375, 0.051116943359375, 0.056396484375, 0.061676025390625, 0.06695556640625, 0.072235107421875, 0.0775146484375, 0.082794189453125, 0.08807373046875, 0.093353271484375, 0.0986328125, 0.103912353515625, 0.10919189453125, 0.114471435546875, 0.1197509765625, 0.125030517578125, 0.13031005859375, 0.135589599609375, 0.140869140625, 0.146148681640625, 0.15142822265625, 0.156707763671875, 0.1619873046875, 0.167266845703125, 0.17254638671875, 0.177825927734375, 0.18310546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 8.0, 9.0, 24.0, 36.0, 54.0, 91.0, 203.0, 250.0, 110.0, 73.0, 39.0, 22.0, 17.0, 13.0, 11.0, 4.0, 4.0, 7.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001537799835205078, -0.00014941394329071045, -0.00014504790306091309, -0.00014068186283111572, -0.00013631582260131836, -0.000131949782371521, -0.00012758374214172363, -0.00012321770191192627, -0.0001188516616821289, -0.00011448562145233154, -0.00011011958122253418, -0.00010575354099273682, -0.00010138750076293945, -9.702146053314209e-05, -9.265542030334473e-05, -8.828938007354736e-05, -8.392333984375e-05, -7.955729961395264e-05, -7.519125938415527e-05, -7.082521915435791e-05, -6.645917892456055e-05, -6.209313869476318e-05, -5.772709846496582e-05, -5.336105823516846e-05, -4.8995018005371094e-05, -4.462897777557373e-05, -4.026293754577637e-05, -3.5896897315979004e-05, -3.153085708618164e-05, -2.7164816856384277e-05, -2.2798776626586914e-05, -1.843273639678955e-05, -1.4066696166992188e-05, -9.700655937194824e-06, -5.334615707397461e-06, -9.685754776000977e-07, 3.3974647521972656e-06, 7.763504981994629e-06, 1.2129545211791992e-05, 1.6495585441589355e-05, 2.086162567138672e-05, 2.5227665901184082e-05, 2.9593706130981445e-05, 3.395974636077881e-05, 3.832578659057617e-05, 4.2691826820373535e-05, 4.70578670501709e-05, 5.142390727996826e-05, 5.5789947509765625e-05, 6.015598773956299e-05, 6.452202796936035e-05, 6.888806819915771e-05, 7.325410842895508e-05, 7.762014865875244e-05, 8.19861888885498e-05, 8.635222911834717e-05, 9.071826934814453e-05, 9.50843095779419e-05, 9.945034980773926e-05, 0.00010381639003753662, 0.00010818243026733398, 0.00011254847049713135, 0.00011691451072692871, 0.00012128055095672607, 0.00012564659118652344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 9.0, 2.0, 10.0, 17.0, 18.0, 24.0, 41.0, 55.0, 102.0, 195.0, 371.0, 846.0, 1875.0, 4724.0, 14013.0, 60315.0, 637229.0, 279206.0, 33879.0, 9400.0, 3490.0, 1362.0, 650.0, 323.0, 156.0, 74.0, 66.0, 32.0, 16.0, 18.0, 12.0, 8.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1912841796875, -0.1859455108642578, -0.18060684204101562, -0.17526817321777344, -0.16992950439453125, -0.16459083557128906, -0.15925216674804688, -0.1539134979248047, -0.1485748291015625, -0.1432361602783203, -0.13789749145507812, -0.13255882263183594, -0.12722015380859375, -0.12188148498535156, -0.11654281616210938, -0.11120414733886719, -0.105865478515625, -0.10052680969238281, -0.09518814086914062, -0.08984947204589844, -0.08451080322265625, -0.07917213439941406, -0.07383346557617188, -0.06849479675292969, -0.0631561279296875, -0.05781745910644531, -0.052478790283203125, -0.04714012145996094, -0.04180145263671875, -0.03646278381347656, -0.031124114990234375, -0.025785446166992188, -0.02044677734375, -0.015108108520507812, -0.009769439697265625, -0.0044307708740234375, 0.00090789794921875, 0.0062465667724609375, 0.011585235595703125, 0.016923904418945312, 0.0222625732421875, 0.027601242065429688, 0.032939910888671875, 0.03827857971191406, 0.04361724853515625, 0.04895591735839844, 0.054294586181640625, 0.05963325500488281, 0.064971923828125, 0.07031059265136719, 0.07564926147460938, 0.08098793029785156, 0.08632659912109375, 0.09166526794433594, 0.09700393676757812, 0.10234260559082031, 0.1076812744140625, 0.11301994323730469, 0.11835861206054688, 0.12369728088378906, 0.12903594970703125, 0.13437461853027344, 0.13971328735351562, 0.1450519561767578, 0.150390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 1.0, 7.0, 10.0, 5.0, 20.0, 24.0, 41.0, 36.0, 57.0, 67.0, 70.0, 116.0, 144.0, 95.0, 60.0, 61.0, 37.0, 29.0, 18.0, 17.0, 15.0, 9.0, 7.0, 8.0, 7.0, 5.0, 5.0, 4.0, 6.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290069580078125, -0.028013944625854492, -0.027020931243896484, -0.026027917861938477, -0.02503490447998047, -0.02404189109802246, -0.023048877716064453, -0.022055864334106445, -0.021062850952148438, -0.02006983757019043, -0.019076824188232422, -0.018083810806274414, -0.017090797424316406, -0.0160977840423584, -0.01510477066040039, -0.014111757278442383, -0.013118743896484375, -0.012125730514526367, -0.01113271713256836, -0.010139703750610352, -0.009146690368652344, -0.008153676986694336, -0.007160663604736328, -0.00616765022277832, -0.0051746368408203125, -0.004181623458862305, -0.003188610076904297, -0.002195596694946289, -0.0012025833129882812, -0.00020956993103027344, 0.0007834434509277344, 0.0017764568328857422, 0.00276947021484375, 0.003762483596801758, 0.004755496978759766, 0.0057485103607177734, 0.006741523742675781, 0.007734537124633789, 0.008727550506591797, 0.009720563888549805, 0.010713577270507812, 0.01170659065246582, 0.012699604034423828, 0.013692617416381836, 0.014685630798339844, 0.01567864418029785, 0.01667165756225586, 0.017664670944213867, 0.018657684326171875, 0.019650697708129883, 0.02064371109008789, 0.0216367244720459, 0.022629737854003906, 0.023622751235961914, 0.024615764617919922, 0.02560877799987793, 0.026601791381835938, 0.027594804763793945, 0.028587818145751953, 0.02958083152770996, 0.03057384490966797, 0.03156685829162598, 0.032559871673583984, 0.03355288505554199, 0.0345458984375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 16.0, 23.0, 63.0, 137.0, 276.0, 243.0, 123.0, 58.0, 29.0, 13.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.240875244140625, -4.134738445281982, -4.02860164642334, -3.922464609146118, -3.8163275718688965, -3.710190773010254, -3.6040539741516113, -3.4979169368743896, -3.391779899597168, -3.2856431007385254, -3.1795060634613037, -3.073369264602661, -2.9672322273254395, -2.861095428466797, -2.7549586296081543, -2.6488215923309326, -2.54268479347229, -2.4365479946136475, -2.330410957336426, -2.224274158477783, -2.1181371212005615, -2.012000322341919, -1.9058634042739868, -1.7997264862060547, -1.6935895681381226, -1.5874526500701904, -1.4813157320022583, -1.3751788139343262, -1.2690420150756836, -1.162904977798462, -1.0567681789398193, -0.9506312608718872, -0.8444943428039551, -0.738357424736023, -0.6322205066680908, -0.5260836482048035, -0.41994673013687134, -0.3138098120689392, -0.20767295360565186, -0.10153603553771973, 0.004600882530212402, 0.11073778569698334, 0.21687468886375427, 0.323011577129364, 0.42914849519729614, 0.5352854132652283, 0.6414222717285156, 0.7475591897964478, 0.8536961078643799, 0.959833025932312, 1.0659699440002441, 1.1721067428588867, 1.2782437801361084, 1.384380578994751, 1.490517497062683, 1.5966544151306152, 1.7027913331985474, 1.8089282512664795, 1.9150651693344116, 2.0212020874023438, 2.1273388862609863, 2.233475923538208, 2.3396127223968506, 2.4457497596740723, 2.551886558532715]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 12.0, 14.0, 47.0, 55.0, 80.0, 107.0, 117.0, 125.0, 130.0, 111.0, 79.0, 50.0, 28.0, 20.0, 14.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5628656148910522, -1.4866338968276978, -1.4104021787643433, -1.3341704607009888, -1.2579387426376343, -1.1817070245742798, -1.1054753065109253, -1.0292435884475708, -0.9530118703842163, -0.8767801523208618, -0.8005484342575073, -0.7243167161941528, -0.6480849981307983, -0.5718532800674438, -0.49562156200408936, -0.41938984394073486, -0.34315812587738037, -0.2669264078140259, -0.1906946897506714, -0.1144629716873169, -0.0382312536239624, 0.03800046443939209, 0.11423218250274658, 0.19046390056610107, 0.26669561862945557, 0.34292733669281006, 0.41915905475616455, 0.49539077281951904, 0.5716224908828735, 0.647854208946228, 0.7240859270095825, 0.800317645072937, 0.876549243927002, 0.9527809619903564, 1.029012680053711, 1.1052443981170654, 1.18147611618042, 1.2577078342437744, 1.333939552307129, 1.4101712703704834, 1.486402988433838, 1.5626347064971924, 1.6388664245605469, 1.7150981426239014, 1.7913298606872559, 1.8675615787506104, 1.9437932968139648, 2.0200250148773193, 2.096256732940674, 2.1724884510040283, 2.248720169067383, 2.3249518871307373, 2.401183605194092, 2.4774153232574463, 2.553647041320801, 2.6298787593841553, 2.7061104774475098, 2.7823421955108643, 2.8585739135742188, 2.9348056316375732, 3.0110373497009277, 3.0872690677642822, 3.1635007858276367, 3.239732503890991, 3.3159642219543457]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 5.0, 8.0, 16.0, 32.0, 118.0, 469.0, 1653.0, 7448.0, 112744.0, 908152.0, 14005.0, 2856.0, 703.0, 209.0, 54.0, 16.0, 14.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.7916259765625, -4.637939453125, -4.4842529296875, -4.33056640625, -4.1768798828125, -4.023193359375, -3.8695068359375, -3.7158203125, -3.5621337890625, -3.408447265625, -3.2547607421875, -3.10107421875, -2.9473876953125, -2.793701171875, -2.6400146484375, -2.486328125, -2.3326416015625, -2.178955078125, -2.0252685546875, -1.87158203125, -1.7178955078125, -1.564208984375, -1.4105224609375, -1.2568359375, -1.1031494140625, -0.949462890625, -0.7957763671875, -0.64208984375, -0.4884033203125, -0.334716796875, -0.1810302734375, -0.02734375, 0.1263427734375, 0.280029296875, 0.4337158203125, 0.58740234375, 0.7410888671875, 0.894775390625, 1.0484619140625, 1.2021484375, 1.3558349609375, 1.509521484375, 1.6632080078125, 1.81689453125, 1.9705810546875, 2.124267578125, 2.2779541015625, 2.431640625, 2.5853271484375, 2.739013671875, 2.8927001953125, 3.04638671875, 3.2000732421875, 3.353759765625, 3.5074462890625, 3.6611328125, 3.8148193359375, 3.968505859375, 4.1221923828125, 4.27587890625, 4.4295654296875, 4.583251953125, 4.7369384765625, 4.890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [7.0, 4.0, 6.0, 9.0, 8.0, 9.0, 29.0, 22.0, 44.0, 58.0, 58.0, 78.0, 90.0, 94.0, 94.0, 88.0, 64.0, 73.0, 55.0, 37.0, 28.0, 19.0, 14.0, 12.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.532684326171875, -1.41497802734375, -1.297271728515625, -1.1795654296875, -1.061859130859375, -0.94415283203125, -0.826446533203125, -0.708740234375, -0.591033935546875, -0.47332763671875, -0.355621337890625, -0.2379150390625, -0.120208740234375, -0.00250244140625, 0.115203857421875, 0.23291015625, 0.350616455078125, 0.46832275390625, 0.586029052734375, 0.7037353515625, 0.821441650390625, 0.93914794921875, 1.056854248046875, 1.174560546875, 1.292266845703125, 1.40997314453125, 1.527679443359375, 1.6453857421875, 1.763092041015625, 1.88079833984375, 1.998504638671875, 2.1162109375, 2.233917236328125, 2.35162353515625, 2.469329833984375, 2.5870361328125, 2.704742431640625, 2.82244873046875, 2.940155029296875, 3.057861328125, 3.175567626953125, 3.29327392578125, 3.410980224609375, 3.5286865234375, 3.646392822265625, 3.76409912109375, 3.881805419921875, 3.99951171875, 4.117218017578125, 4.23492431640625, 4.352630615234375, 4.4703369140625, 4.588043212890625, 4.70574951171875, 4.823455810546875, 4.941162109375, 5.058868408203125, 5.17657470703125, 5.294281005859375, 5.4119873046875, 5.529693603515625, 5.64739990234375, 5.765106201171875, 5.8828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 1.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 6.0, 9.0, 13.0, 17.0, 11.0, 20.0, 27.0, 27.0, 32.0, 46.0, 41.0, 55.0, 71.0, 189.0, 754.0, 11338.0, 1022694.0, 11897.0, 708.0, 140.0, 76.0, 38.0, 46.0, 38.0, 33.0, 20.0, 30.0, 29.0, 12.0, 16.0, 15.0, 15.0, 12.0, 11.0, 13.0, 4.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.8839111328125, -6.650634765625, -6.4173583984375, -6.18408203125, -5.9508056640625, -5.717529296875, -5.4842529296875, -5.2509765625, -5.0177001953125, -4.784423828125, -4.5511474609375, -4.31787109375, -4.0845947265625, -3.851318359375, -3.6180419921875, -3.384765625, -3.1514892578125, -2.918212890625, -2.6849365234375, -2.45166015625, -2.2183837890625, -1.985107421875, -1.7518310546875, -1.5185546875, -1.2852783203125, -1.052001953125, -0.8187255859375, -0.58544921875, -0.3521728515625, -0.118896484375, 0.1143798828125, 0.34765625, 0.5809326171875, 0.814208984375, 1.0474853515625, 1.28076171875, 1.5140380859375, 1.747314453125, 1.9805908203125, 2.2138671875, 2.4471435546875, 2.680419921875, 2.9136962890625, 3.14697265625, 3.3802490234375, 3.613525390625, 3.8468017578125, 4.080078125, 4.3133544921875, 4.546630859375, 4.7799072265625, 5.01318359375, 5.2464599609375, 5.479736328125, 5.7130126953125, 5.9462890625, 6.1795654296875, 6.412841796875, 6.6461181640625, 6.87939453125, 7.1126708984375, 7.345947265625, 7.5792236328125, 7.8125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 8.0, 7.0, 1.0, 10.0, 4.0, 9.0, 14.0, 18.0, 24.0, 15.0, 17.0, 16.0, 22.0, 44.0, 35.0, 25.0, 41.0, 34.0, 32.0, 32.0, 41.0, 39.0, 50.0, 40.0, 35.0, 37.0, 37.0, 28.0, 34.0, 29.0, 22.0, 29.0, 29.0, 17.0, 15.0, 15.0, 14.0, 9.0, 14.0, 16.0, 11.0, 5.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.615234375, -1.5607757568359375, -1.506317138671875, -1.4518585205078125, -1.39739990234375, -1.3429412841796875, -1.288482666015625, -1.2340240478515625, -1.1795654296875, -1.1251068115234375, -1.070648193359375, -1.0161895751953125, -0.96173095703125, -0.9072723388671875, -0.852813720703125, -0.7983551025390625, -0.743896484375, -0.6894378662109375, -0.634979248046875, -0.5805206298828125, -0.52606201171875, -0.4716033935546875, -0.417144775390625, -0.3626861572265625, -0.3082275390625, -0.2537689208984375, -0.199310302734375, -0.1448516845703125, -0.09039306640625, -0.0359344482421875, 0.018524169921875, 0.0729827880859375, 0.12744140625, 0.1819000244140625, 0.236358642578125, 0.2908172607421875, 0.34527587890625, 0.3997344970703125, 0.454193115234375, 0.5086517333984375, 0.5631103515625, 0.6175689697265625, 0.672027587890625, 0.7264862060546875, 0.78094482421875, 0.8354034423828125, 0.889862060546875, 0.9443206787109375, 0.998779296875, 1.0532379150390625, 1.107696533203125, 1.1621551513671875, 1.21661376953125, 1.2710723876953125, 1.325531005859375, 1.3799896240234375, 1.4344482421875, 1.4889068603515625, 1.543365478515625, 1.5978240966796875, 1.65228271484375, 1.7067413330078125, 1.761199951171875, 1.8156585693359375, 1.8701171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 10.0, 12.0, 19.0, 24.0, 26.0, 36.0, 52.0, 58.0, 134.0, 245.0, 435.0, 959.0, 2551.0, 8551.0, 53586.0, 910460.0, 57741.0, 8911.0, 2646.0, 1007.0, 468.0, 220.0, 132.0, 74.0, 46.0, 31.0, 32.0, 17.0, 14.0, 12.0, 5.0, 6.0, 13.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.6025390625, -0.5860366821289062, -0.5695343017578125, -0.5530319213867188, -0.536529541015625, -0.5200271606445312, -0.5035247802734375, -0.48702239990234375, -0.47052001953125, -0.45401763916015625, -0.4375152587890625, -0.42101287841796875, -0.404510498046875, -0.38800811767578125, -0.3715057373046875, -0.35500335693359375, -0.3385009765625, -0.32199859619140625, -0.3054962158203125, -0.28899383544921875, -0.272491455078125, -0.25598907470703125, -0.2394866943359375, -0.22298431396484375, -0.20648193359375, -0.18997955322265625, -0.1734771728515625, -0.15697479248046875, -0.140472412109375, -0.12397003173828125, -0.1074676513671875, -0.09096527099609375, -0.074462890625, -0.05796051025390625, -0.0414581298828125, -0.02495574951171875, -0.008453369140625, 0.00804901123046875, 0.0245513916015625, 0.04105377197265625, 0.05755615234375, 0.07405853271484375, 0.0905609130859375, 0.10706329345703125, 0.123565673828125, 0.14006805419921875, 0.1565704345703125, 0.17307281494140625, 0.1895751953125, 0.20607757568359375, 0.2225799560546875, 0.23908233642578125, 0.255584716796875, 0.27208709716796875, 0.2885894775390625, 0.30509185791015625, 0.32159423828125, 0.33809661865234375, 0.3545989990234375, 0.37110137939453125, 0.387603759765625, 0.40410614013671875, 0.4206085205078125, 0.43711090087890625, 0.45361328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 13.0, 12.0, 15.0, 21.0, 44.0, 95.0, 194.0, 307.0, 100.0, 63.0, 29.0, 14.0, 18.0, 17.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.296966552734375e-05, -8.079409599304199e-05, -7.861852645874023e-05, -7.644295692443848e-05, -7.426738739013672e-05, -7.209181785583496e-05, -6.99162483215332e-05, -6.774067878723145e-05, -6.556510925292969e-05, -6.338953971862793e-05, -6.121397018432617e-05, -5.9038400650024414e-05, -5.6862831115722656e-05, -5.46872615814209e-05, -5.251169204711914e-05, -5.033612251281738e-05, -4.8160552978515625e-05, -4.598498344421387e-05, -4.380941390991211e-05, -4.163384437561035e-05, -3.9458274841308594e-05, -3.7282705307006836e-05, -3.510713577270508e-05, -3.293156623840332e-05, -3.075599670410156e-05, -2.8580427169799805e-05, -2.6404857635498047e-05, -2.422928810119629e-05, -2.205371856689453e-05, -1.9878149032592773e-05, -1.7702579498291016e-05, -1.5527009963989258e-05, -1.33514404296875e-05, -1.1175870895385742e-05, -9.000301361083984e-06, -6.8247318267822266e-06, -4.649162292480469e-06, -2.473592758178711e-06, -2.980232238769531e-07, 1.8775463104248047e-06, 4.0531158447265625e-06, 6.22868537902832e-06, 8.404254913330078e-06, 1.0579824447631836e-05, 1.2755393981933594e-05, 1.4930963516235352e-05, 1.710653305053711e-05, 1.9282102584838867e-05, 2.1457672119140625e-05, 2.3633241653442383e-05, 2.580881118774414e-05, 2.79843807220459e-05, 3.0159950256347656e-05, 3.2335519790649414e-05, 3.451108932495117e-05, 3.668665885925293e-05, 3.886222839355469e-05, 4.1037797927856445e-05, 4.32133674621582e-05, 4.538893699645996e-05, 4.756450653076172e-05, 4.9740076065063477e-05, 5.1915645599365234e-05, 5.409121513366699e-05, 5.626678466796875e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 3.0, 13.0, 10.0, 10.0, 22.0, 24.0, 46.0, 77.0, 175.0, 375.0, 972.0, 3599.0, 20136.0, 871043.0, 138548.0, 10056.0, 2186.0, 690.0, 271.0, 129.0, 64.0, 41.0, 16.0, 9.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.63671875, -0.6153640747070312, -0.5940093994140625, -0.5726547241210938, -0.551300048828125, -0.5299453735351562, -0.5085906982421875, -0.48723602294921875, -0.46588134765625, -0.44452667236328125, -0.4231719970703125, -0.40181732177734375, -0.380462646484375, -0.35910797119140625, -0.3377532958984375, -0.31639862060546875, -0.2950439453125, -0.27368927001953125, -0.2523345947265625, -0.23097991943359375, -0.209625244140625, -0.18827056884765625, -0.1669158935546875, -0.14556121826171875, -0.12420654296875, -0.10285186767578125, -0.0814971923828125, -0.06014251708984375, -0.038787841796875, -0.01743316650390625, 0.0039215087890625, 0.02527618408203125, 0.046630859375, 0.06798553466796875, 0.0893402099609375, 0.11069488525390625, 0.132049560546875, 0.15340423583984375, 0.1747589111328125, 0.19611358642578125, 0.21746826171875, 0.23882293701171875, 0.2601776123046875, 0.28153228759765625, 0.302886962890625, 0.32424163818359375, 0.3455963134765625, 0.36695098876953125, 0.3883056640625, 0.40966033935546875, 0.4310150146484375, 0.45236968994140625, 0.473724365234375, 0.49507904052734375, 0.5164337158203125, 0.5377883911132812, 0.55914306640625, 0.5804977416992188, 0.6018524169921875, 0.6232070922851562, 0.644561767578125, 0.6659164428710938, 0.6872711181640625, 0.7086257934570312, 0.72998046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 18.0, 15.0, 18.0, 42.0, 75.0, 156.0, 255.0, 138.0, 76.0, 44.0, 30.0, 22.0, 26.0, 13.0, 7.0, 7.0, 6.0, 6.0, 8.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.2054290771484375, -0.199310302734375, -0.1931915283203125, -0.18707275390625, -0.1809539794921875, -0.174835205078125, -0.1687164306640625, -0.16259765625, -0.1564788818359375, -0.150360107421875, -0.1442413330078125, -0.13812255859375, -0.1320037841796875, -0.125885009765625, -0.1197662353515625, -0.1136474609375, -0.1075286865234375, -0.101409912109375, -0.0952911376953125, -0.08917236328125, -0.0830535888671875, -0.076934814453125, -0.0708160400390625, -0.064697265625, -0.0585784912109375, -0.052459716796875, -0.0463409423828125, -0.04022216796875, -0.0341033935546875, -0.027984619140625, -0.0218658447265625, -0.0157470703125, -0.0096282958984375, -0.003509521484375, 0.0026092529296875, 0.00872802734375, 0.0148468017578125, 0.020965576171875, 0.0270843505859375, 0.033203125, 0.0393218994140625, 0.045440673828125, 0.0515594482421875, 0.05767822265625, 0.0637969970703125, 0.069915771484375, 0.0760345458984375, 0.0821533203125, 0.0882720947265625, 0.094390869140625, 0.1005096435546875, 0.10662841796875, 0.1127471923828125, 0.118865966796875, 0.1249847412109375, 0.131103515625, 0.1372222900390625, 0.143341064453125, 0.1494598388671875, 0.15557861328125, 0.1616973876953125, 0.167816162109375, 0.1739349365234375, 0.1800537109375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 16.0, 13.0, 30.0, 45.0, 75.0, 168.0, 215.0, 163.0, 91.0, 64.0, 42.0, 20.0, 11.0, 9.0, 9.0, 8.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.364039421081543, -5.232263565063477, -5.10048770904541, -4.9687113761901855, -4.836935520172119, -4.705159664154053, -4.573383808135986, -4.44160795211792, -4.309831619262695, -4.178055763244629, -4.0462799072265625, -3.914503812789917, -3.7827277183532715, -3.650951862335205, -3.5191760063171387, -3.3874001502990723, -3.255624294281006, -3.1238484382629395, -2.992072343826294, -2.8602964878082275, -2.728520393371582, -2.5967445373535156, -2.464968681335449, -2.333192825317383, -2.2014167308807373, -2.069640874862671, -1.9378647804260254, -1.806088924407959, -1.674312949180603, -1.542536973953247, -1.4107611179351807, -1.2789851427078247, -1.1472094058990479, -1.015433430671692, -0.8836575150489807, -0.7518815994262695, -0.6201056241989136, -0.4883296489715576, -0.35655373334884644, -0.22477781772613525, -0.0930018424987793, 0.03877410292625427, 0.17055004835128784, 0.3023259937763214, 0.434101939201355, 0.5658779144287109, 0.6976538300514221, 0.8294297456741333, 0.9612057209014893, 1.0929816961288452, 1.2247576713562012, 1.3565335273742676, 1.4883095026016235, 1.6200854778289795, 1.751861333847046, 1.8836373090744019, 2.015413284301758, 2.147189140319824, 2.2789652347564697, 2.410741090774536, 2.5425171852111816, 2.674293041229248, 2.8060688972473145, 2.937844753265381, 3.0696208477020264]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 3.0, 5.0, 4.0, 8.0, 14.0, 14.0, 16.0, 26.0, 32.0, 33.0, 40.0, 45.0, 51.0, 50.0, 50.0, 64.0, 67.0, 56.0, 45.0, 65.0, 50.0, 47.0, 35.0, 41.0, 33.0, 25.0, 24.0, 18.0, 11.0, 8.0, 5.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515451192855835, -2.3930253982543945, -2.270599842071533, -2.148174285888672, -2.0257484912872314, -1.9033228158950806, -1.7808971405029297, -1.6584714651107788, -1.536045789718628, -1.413620114326477, -1.2911944389343262, -1.1687687635421753, -1.0463430881500244, -0.9239174127578735, -0.8014917373657227, -0.6790660619735718, -0.5566403865814209, -0.43421471118927, -0.31178903579711914, -0.18936336040496826, -0.06693768501281738, 0.055487990379333496, 0.17791366577148438, 0.30033934116363525, 0.42276501655578613, 0.545190691947937, 0.6676163673400879, 0.7900420427322388, 0.9124677181243896, 1.0348933935165405, 1.1573190689086914, 1.2797447443008423, 1.402170181274414, 1.524595856666565, 1.6470215320587158, 1.7694472074508667, 1.8918728828430176, 2.014298439025879, 2.1367242336273193, 2.2591500282287598, 2.381575584411621, 2.5040011405944824, 2.626426935195923, 2.7488527297973633, 2.8712782859802246, 2.993703842163086, 3.1161296367645264, 3.238555431365967, 3.360980987548828, 3.4834065437316895, 3.60583233833313, 3.7282581329345703, 3.8506836891174316, 3.973109245300293, 4.0955352783203125, 4.217960834503174, 4.340386390686035, 4.4628119468688965, 4.585237503051758, 4.707663536071777, 4.830089092254639, 4.9525146484375, 5.0749406814575195, 5.197366237640381, 5.319791793823242]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 5.0, 7.0, 14.0, 10.0, 14.0, 8.0, 16.0, 12.0, 18.0, 33.0, 42.0, 39.0, 79.0, 114.0, 241.0, 461.0, 1210.0, 5910.0, 2078111.0, 2099369.0, 6270.0, 1184.0, 467.0, 220.0, 143.0, 78.0, 41.0, 32.0, 25.0, 19.0, 23.0, 11.0, 10.0, 3.0, 2.0, 10.0, 3.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.359375, -6.14739990234375, -5.9354248046875, -5.72344970703125, -5.511474609375, -5.29949951171875, -5.0875244140625, -4.87554931640625, -4.66357421875, -4.45159912109375, -4.2396240234375, -4.02764892578125, -3.815673828125, -3.60369873046875, -3.3917236328125, -3.17974853515625, -2.9677734375, -2.75579833984375, -2.5438232421875, -2.33184814453125, -2.119873046875, -1.90789794921875, -1.6959228515625, -1.48394775390625, -1.27197265625, -1.05999755859375, -0.8480224609375, -0.63604736328125, -0.424072265625, -0.21209716796875, -0.0001220703125, 0.21185302734375, 0.423828125, 0.63580322265625, 0.8477783203125, 1.05975341796875, 1.271728515625, 1.48370361328125, 1.6956787109375, 1.90765380859375, 2.11962890625, 2.33160400390625, 2.5435791015625, 2.75555419921875, 2.967529296875, 3.17950439453125, 3.3914794921875, 3.60345458984375, 3.8154296875, 4.02740478515625, 4.2393798828125, 4.45135498046875, 4.663330078125, 4.87530517578125, 5.0872802734375, 5.29925537109375, 5.51123046875, 5.72320556640625, 5.9351806640625, 6.14715576171875, 6.359130859375, 6.57110595703125, 6.7830810546875, 6.99505615234375, 7.20703125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 8.0, 16.0, 16.0, 18.0, 28.0, 25.0, 41.0, 40.0, 49.0, 53.0, 63.0, 68.0, 68.0, 57.0, 60.0, 64.0, 57.0, 54.0, 34.0, 38.0, 27.0, 23.0, 20.0, 12.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.880859375, -1.8299560546875, -1.779052734375, -1.7281494140625, -1.67724609375, -1.6263427734375, -1.575439453125, -1.5245361328125, -1.4736328125, -1.4227294921875, -1.371826171875, -1.3209228515625, -1.27001953125, -1.2191162109375, -1.168212890625, -1.1173095703125, -1.06640625, -1.0155029296875, -0.964599609375, -0.9136962890625, -0.86279296875, -0.8118896484375, -0.760986328125, -0.7100830078125, -0.6591796875, -0.6082763671875, -0.557373046875, -0.5064697265625, -0.45556640625, -0.4046630859375, -0.353759765625, -0.3028564453125, -0.251953125, -0.2010498046875, -0.150146484375, -0.0992431640625, -0.04833984375, 0.0025634765625, 0.053466796875, 0.1043701171875, 0.1552734375, 0.2061767578125, 0.257080078125, 0.3079833984375, 0.35888671875, 0.4097900390625, 0.460693359375, 0.5115966796875, 0.5625, 0.6134033203125, 0.664306640625, 0.7152099609375, 0.76611328125, 0.8170166015625, 0.867919921875, 0.9188232421875, 0.9697265625, 1.0206298828125, 1.071533203125, 1.1224365234375, 1.17333984375, 1.2242431640625, 1.275146484375, 1.3260498046875, 1.376953125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 9.0, 14.0, 20.0, 66.0, 208.0, 1175.0, 3583173.0, 608237.0, 991.0, 192.0, 71.0, 39.0, 27.0, 9.0, 10.0, 5.0, 8.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.3515625, -13.9027099609375, -13.453857421875, -13.0050048828125, -12.55615234375, -12.1072998046875, -11.658447265625, -11.2095947265625, -10.7607421875, -10.3118896484375, -9.863037109375, -9.4141845703125, -8.96533203125, -8.5164794921875, -8.067626953125, -7.6187744140625, -7.169921875, -6.7210693359375, -6.272216796875, -5.8233642578125, -5.37451171875, -4.9256591796875, -4.476806640625, -4.0279541015625, -3.5791015625, -3.1302490234375, -2.681396484375, -2.2325439453125, -1.78369140625, -1.3348388671875, -0.885986328125, -0.4371337890625, 0.01171875, 0.4605712890625, 0.909423828125, 1.3582763671875, 1.80712890625, 2.2559814453125, 2.704833984375, 3.1536865234375, 3.6025390625, 4.0513916015625, 4.500244140625, 4.9490966796875, 5.39794921875, 5.8468017578125, 6.295654296875, 6.7445068359375, 7.193359375, 7.6422119140625, 8.091064453125, 8.5399169921875, 8.98876953125, 9.4376220703125, 9.886474609375, 10.3353271484375, 10.7841796875, 11.2330322265625, 11.681884765625, 12.1307373046875, 12.57958984375, 13.0284423828125, 13.477294921875, 13.9261474609375, 14.375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 12.0, 23.0, 36.0, 74.0, 260.0, 1573.0, 1606.0, 321.0, 86.0, 35.0, 15.0, 15.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.3364715576171875, -1.295989990234375, -1.2555084228515625, -1.21502685546875, -1.1745452880859375, -1.134063720703125, -1.0935821533203125, -1.0531005859375, -1.0126190185546875, -0.972137451171875, -0.9316558837890625, -0.89117431640625, -0.8506927490234375, -0.810211181640625, -0.7697296142578125, -0.729248046875, -0.6887664794921875, -0.648284912109375, -0.6078033447265625, -0.56732177734375, -0.5268402099609375, -0.486358642578125, -0.4458770751953125, -0.4053955078125, -0.3649139404296875, -0.324432373046875, -0.2839508056640625, -0.24346923828125, -0.2029876708984375, -0.162506103515625, -0.1220245361328125, -0.08154296875, -0.0410614013671875, -0.000579833984375, 0.0399017333984375, 0.08038330078125, 0.1208648681640625, 0.161346435546875, 0.2018280029296875, 0.2423095703125, 0.2827911376953125, 0.323272705078125, 0.3637542724609375, 0.40423583984375, 0.4447174072265625, 0.485198974609375, 0.5256805419921875, 0.566162109375, 0.6066436767578125, 0.647125244140625, 0.6876068115234375, 0.72808837890625, 0.7685699462890625, 0.809051513671875, 0.8495330810546875, 0.8900146484375, 0.9304962158203125, 0.970977783203125, 1.0114593505859375, 1.05194091796875, 1.0924224853515625, 1.132904052734375, 1.1733856201171875, 1.2138671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 10.0, 17.0, 24.0, 49.0, 77.0, 128.0, 197.0, 177.0, 124.0, 72.0, 48.0, 25.0, 17.0, 13.0, 3.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4512486457824707, -3.3520452976226807, -3.2528417110443115, -3.1536383628845215, -3.0544350147247314, -2.9552314281463623, -2.8560280799865723, -2.756824493408203, -2.657621145248413, -2.558417797088623, -2.459214210510254, -2.360010862350464, -2.260807514190674, -2.1616039276123047, -2.0624005794525146, -1.963197112083435, -1.863993763923645, -1.7647902965545654, -1.6655869483947754, -1.5663834810256958, -1.4671800136566162, -1.3679766654968262, -1.2687731981277466, -1.169569730758667, -1.070366382598877, -0.9711629748344421, -0.8719595074653625, -0.7727560997009277, -0.6735526323318481, -0.5743492245674133, -0.4751458168029785, -0.3759423494338989, -0.27673888206481934, -0.17753544449806213, -0.07833202183246613, 0.020871400833129883, 0.12007483839988708, 0.2192782759666443, 0.3184816837310791, 0.4176851511001587, 0.5168885588645935, 0.6160919666290283, 0.7152954339981079, 0.8144988417625427, 0.9137022495269775, 1.0129057168960571, 1.1121091842651367, 1.2113125324249268, 1.3105159997940063, 1.409719467163086, 1.508922815322876, 1.6081262826919556, 1.7073297500610352, 1.8065330982208252, 1.9057365655899048, 2.0049400329589844, 2.1041433811187744, 2.2033467292785645, 2.3025503158569336, 2.4017536640167236, 2.5009570121765137, 2.600160598754883, 2.699363946914673, 2.798567295074463, 2.897770881652832]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 3.0, 5.0, 9.0, 16.0, 16.0, 19.0, 33.0, 32.0, 32.0, 52.0, 46.0, 42.0, 55.0, 58.0, 61.0, 53.0, 58.0, 61.0, 50.0, 43.0, 53.0, 45.0, 32.0, 25.0, 21.0, 24.0, 20.0, 8.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7910429239273071, -1.7389572858810425, -1.6868716478347778, -1.6347860097885132, -1.5827003717422485, -1.5306147336959839, -1.4785289764404297, -1.426443338394165, -1.3743577003479004, -1.3222720623016357, -1.270186424255371, -1.2181007862091064, -1.1660151481628418, -1.1139295101165771, -1.0618438720703125, -1.0097582340240479, -0.9576725959777832, -0.9055869579315186, -0.8535013198852539, -0.8014156818389893, -0.7493300437927246, -0.69724440574646, -0.6451587080955505, -0.5930730700492859, -0.5409874320030212, -0.4889017939567566, -0.43681615591049194, -0.3847304880619049, -0.33264485001564026, -0.2805592119693756, -0.22847354412078857, -0.17638790607452393, -0.12430238723754883, -0.07221674174070358, -0.020131096243858337, 0.031954556703567505, 0.08404019474983215, 0.1361258327960968, 0.18821150064468384, 0.2402971386909485, 0.29238277673721313, 0.3444684147834778, 0.39655405282974243, 0.44863972067832947, 0.5007253885269165, 0.5528110265731812, 0.6048966646194458, 0.6569823026657104, 0.7090679407119751, 0.7611535787582397, 0.8132392168045044, 0.865324854850769, 0.9174104928970337, 0.9694961309432983, 1.0215818881988525, 1.0736675262451172, 1.1257531642913818, 1.1778388023376465, 1.2299244403839111, 1.2820100784301758, 1.3340957164764404, 1.386181354522705, 1.4382669925689697, 1.4903526306152344, 1.542438268661499]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 6.0, 7.0, 16.0, 17.0, 34.0, 64.0, 142.0, 350.0, 865.0, 2737.0, 10385.0, 70445.0, 909373.0, 42752.0, 7928.0, 2161.0, 718.0, 278.0, 126.0, 61.0, 30.0, 13.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6762847900390625, -1.628936767578125, -1.5815887451171875, -1.53424072265625, -1.4868927001953125, -1.439544677734375, -1.3921966552734375, -1.3448486328125, -1.2975006103515625, -1.250152587890625, -1.2028045654296875, -1.15545654296875, -1.1081085205078125, -1.060760498046875, -1.0134124755859375, -0.966064453125, -0.9187164306640625, -0.871368408203125, -0.8240203857421875, -0.77667236328125, -0.7293243408203125, -0.681976318359375, -0.6346282958984375, -0.5872802734375, -0.5399322509765625, -0.492584228515625, -0.4452362060546875, -0.39788818359375, -0.3505401611328125, -0.303192138671875, -0.2558441162109375, -0.20849609375, -0.1611480712890625, -0.113800048828125, -0.0664520263671875, -0.01910400390625, 0.0282440185546875, 0.075592041015625, 0.1229400634765625, 0.1702880859375, 0.2176361083984375, 0.264984130859375, 0.3123321533203125, 0.35968017578125, 0.4070281982421875, 0.454376220703125, 0.5017242431640625, 0.549072265625, 0.5964202880859375, 0.643768310546875, 0.6911163330078125, 0.73846435546875, 0.7858123779296875, 0.833160400390625, 0.8805084228515625, 0.9278564453125, 0.9752044677734375, 1.022552490234375, 1.0699005126953125, 1.11724853515625, 1.1645965576171875, 1.211944580078125, 1.2592926025390625, 1.306640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 6.0, 8.0, 18.0, 22.0, 27.0, 38.0, 53.0, 62.0, 72.0, 81.0, 85.0, 81.0, 92.0, 78.0, 60.0, 56.0, 39.0, 40.0, 19.0, 27.0, 12.0, 12.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.7027130126953125, -1.659332275390625, -1.6159515380859375, -1.57257080078125, -1.5291900634765625, -1.485809326171875, -1.4424285888671875, -1.3990478515625, -1.3556671142578125, -1.312286376953125, -1.2689056396484375, -1.22552490234375, -1.1821441650390625, -1.138763427734375, -1.0953826904296875, -1.052001953125, -1.0086212158203125, -0.965240478515625, -0.9218597412109375, -0.87847900390625, -0.8350982666015625, -0.791717529296875, -0.7483367919921875, -0.7049560546875, -0.6615753173828125, -0.618194580078125, -0.5748138427734375, -0.53143310546875, -0.4880523681640625, -0.444671630859375, -0.4012908935546875, -0.35791015625, -0.3145294189453125, -0.271148681640625, -0.2277679443359375, -0.18438720703125, -0.1410064697265625, -0.097625732421875, -0.0542449951171875, -0.0108642578125, 0.0325164794921875, 0.075897216796875, 0.1192779541015625, 0.16265869140625, 0.2060394287109375, 0.249420166015625, 0.2928009033203125, 0.336181640625, 0.3795623779296875, 0.422943115234375, 0.4663238525390625, 0.50970458984375, 0.5530853271484375, 0.596466064453125, 0.6398468017578125, 0.6832275390625, 0.7266082763671875, 0.769989013671875, 0.8133697509765625, 0.85675048828125, 0.9001312255859375, 0.943511962890625, 0.9868927001953125, 1.0302734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 13.0, 9.0, 12.0, 18.0, 33.0, 40.0, 88.0, 126.0, 216.0, 459.0, 826.0, 1847.0, 4413.0, 12832.0, 51023.0, 612549.0, 313743.0, 34027.0, 9528.0, 3621.0, 1485.0, 745.0, 383.0, 198.0, 110.0, 80.0, 34.0, 22.0, 24.0, 4.0, 6.0, 8.0, 7.0, 6.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.515625, -0.49892425537109375, -0.4822235107421875, -0.46552276611328125, -0.448822021484375, -0.43212127685546875, -0.4154205322265625, -0.39871978759765625, -0.38201904296875, -0.36531829833984375, -0.3486175537109375, -0.33191680908203125, -0.315216064453125, -0.29851531982421875, -0.2818145751953125, -0.26511383056640625, -0.2484130859375, -0.23171234130859375, -0.2150115966796875, -0.19831085205078125, -0.181610107421875, -0.16490936279296875, -0.1482086181640625, -0.13150787353515625, -0.11480712890625, -0.09810638427734375, -0.0814056396484375, -0.06470489501953125, -0.048004150390625, -0.03130340576171875, -0.0146026611328125, 0.00209808349609375, 0.018798828125, 0.03549957275390625, 0.0522003173828125, 0.06890106201171875, 0.085601806640625, 0.10230255126953125, 0.1190032958984375, 0.13570404052734375, 0.15240478515625, 0.16910552978515625, 0.1858062744140625, 0.20250701904296875, 0.219207763671875, 0.23590850830078125, 0.2526092529296875, 0.26930999755859375, 0.2860107421875, 0.30271148681640625, 0.3194122314453125, 0.33611297607421875, 0.352813720703125, 0.36951446533203125, 0.3862152099609375, 0.40291595458984375, 0.41961669921875, 0.43631744384765625, 0.4530181884765625, 0.46971893310546875, 0.486419677734375, 0.5031204223632812, 0.5198211669921875, 0.5365219116210938, 0.55322265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 1.0, 8.0, 12.0, 16.0, 15.0, 16.0, 21.0, 27.0, 30.0, 44.0, 41.0, 49.0, 49.0, 42.0, 62.0, 55.0, 60.0, 47.0, 40.0, 54.0, 45.0, 47.0, 38.0, 39.0, 24.0, 11.0, 26.0, 15.0, 18.0, 7.0, 7.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.69140625, -1.6441192626953125, -1.596832275390625, -1.5495452880859375, -1.50225830078125, -1.4549713134765625, -1.407684326171875, -1.3603973388671875, -1.3131103515625, -1.2658233642578125, -1.218536376953125, -1.1712493896484375, -1.12396240234375, -1.0766754150390625, -1.029388427734375, -0.9821014404296875, -0.934814453125, -0.8875274658203125, -0.840240478515625, -0.7929534912109375, -0.74566650390625, -0.6983795166015625, -0.651092529296875, -0.6038055419921875, -0.5565185546875, -0.5092315673828125, -0.461944580078125, -0.4146575927734375, -0.36737060546875, -0.3200836181640625, -0.272796630859375, -0.2255096435546875, -0.17822265625, -0.1309356689453125, -0.083648681640625, -0.0363616943359375, 0.01092529296875, 0.0582122802734375, 0.105499267578125, 0.1527862548828125, 0.2000732421875, 0.2473602294921875, 0.294647216796875, 0.3419342041015625, 0.38922119140625, 0.4365081787109375, 0.483795166015625, 0.5310821533203125, 0.578369140625, 0.6256561279296875, 0.672943115234375, 0.7202301025390625, 0.76751708984375, 0.8148040771484375, 0.862091064453125, 0.9093780517578125, 0.9566650390625, 1.0039520263671875, 1.051239013671875, 1.0985260009765625, 1.14581298828125, 1.1930999755859375, 1.240386962890625, 1.2876739501953125, 1.3349609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 10.0, 9.0, 18.0, 23.0, 36.0, 41.0, 71.0, 85.0, 136.0, 195.0, 343.0, 552.0, 1033.0, 2053.0, 5045.0, 16951.0, 111584.0, 782196.0, 102506.0, 16211.0, 4873.0, 2016.0, 1029.0, 539.0, 349.0, 185.0, 136.0, 85.0, 71.0, 47.0, 29.0, 27.0, 14.0, 11.0, 14.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10308837890625, -0.09946918487548828, -0.09584999084472656, -0.09223079681396484, -0.08861160278320312, -0.0849924087524414, -0.08137321472167969, -0.07775402069091797, -0.07413482666015625, -0.07051563262939453, -0.06689643859863281, -0.0632772445678711, -0.059658050537109375, -0.056038856506347656, -0.05241966247558594, -0.04880046844482422, -0.0451812744140625, -0.04156208038330078, -0.03794288635253906, -0.034323692321777344, -0.030704498291015625, -0.027085304260253906, -0.023466110229492188, -0.01984691619873047, -0.01622772216796875, -0.012608528137207031, -0.008989334106445312, -0.005370140075683594, -0.001750946044921875, 0.0018682479858398438, 0.0054874420166015625, 0.009106636047363281, 0.012725830078125, 0.01634502410888672, 0.019964218139648438, 0.023583412170410156, 0.027202606201171875, 0.030821800231933594, 0.03444099426269531, 0.03806018829345703, 0.04167938232421875, 0.04529857635498047, 0.04891777038574219, 0.052536964416503906, 0.056156158447265625, 0.059775352478027344, 0.06339454650878906, 0.06701374053955078, 0.0706329345703125, 0.07425212860107422, 0.07787132263183594, 0.08149051666259766, 0.08510971069335938, 0.0887289047241211, 0.09234809875488281, 0.09596729278564453, 0.09958648681640625, 0.10320568084716797, 0.10682487487792969, 0.1104440689086914, 0.11406326293945312, 0.11768245697021484, 0.12130165100097656, 0.12492084503173828, 0.1285400390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 10.0, 28.0, 32.0, 67.0, 118.0, 203.0, 184.0, 139.0, 86.0, 43.0, 29.0, 13.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.562471389770508e-05, -6.311200559139252e-05, -6.0599297285079956e-05, -5.8086588978767395e-05, -5.5573880672454834e-05, -5.306117236614227e-05, -5.054846405982971e-05, -4.803575575351715e-05, -4.552304744720459e-05, -4.301033914089203e-05, -4.049763083457947e-05, -3.798492252826691e-05, -3.5472214221954346e-05, -3.2959505915641785e-05, -3.0446797609329224e-05, -2.7934089303016663e-05, -2.54213809967041e-05, -2.290867269039154e-05, -2.039596438407898e-05, -1.788325607776642e-05, -1.5370547771453857e-05, -1.2857839465141296e-05, -1.0345131158828735e-05, -7.832422852516174e-06, -5.319714546203613e-06, -2.8070062398910522e-06, -2.942979335784912e-07, 2.21841037273407e-06, 4.731118679046631e-06, 7.243826985359192e-06, 9.756535291671753e-06, 1.2269243597984314e-05, 1.4781951904296875e-05, 1.7294660210609436e-05, 1.9807368516921997e-05, 2.2320076823234558e-05, 2.483278512954712e-05, 2.734549343585968e-05, 2.985820174217224e-05, 3.23709100484848e-05, 3.488361835479736e-05, 3.7396326661109924e-05, 3.9909034967422485e-05, 4.2421743273735046e-05, 4.493445158004761e-05, 4.744715988636017e-05, 4.995986819267273e-05, 5.247257649898529e-05, 5.498528480529785e-05, 5.749799311161041e-05, 6.0010701417922974e-05, 6.252340972423553e-05, 6.50361180305481e-05, 6.754882633686066e-05, 7.006153464317322e-05, 7.257424294948578e-05, 7.508695125579834e-05, 7.75996595621109e-05, 8.011236786842346e-05, 8.262507617473602e-05, 8.513778448104858e-05, 8.765049278736115e-05, 9.01632010936737e-05, 9.267590939998627e-05, 9.518861770629883e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 10.0, 10.0, 12.0, 14.0, 37.0, 72.0, 245.0, 654.0, 2726.0, 30165.0, 990137.0, 21225.0, 2305.0, 573.0, 196.0, 70.0, 30.0, 17.0, 16.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3935546875, -0.38245391845703125, -0.3713531494140625, -0.36025238037109375, -0.349151611328125, -0.33805084228515625, -0.3269500732421875, -0.31584930419921875, -0.30474853515625, -0.29364776611328125, -0.2825469970703125, -0.27144622802734375, -0.260345458984375, -0.24924468994140625, -0.2381439208984375, -0.22704315185546875, -0.2159423828125, -0.20484161376953125, -0.1937408447265625, -0.18264007568359375, -0.171539306640625, -0.16043853759765625, -0.1493377685546875, -0.13823699951171875, -0.12713623046875, -0.11603546142578125, -0.1049346923828125, -0.09383392333984375, -0.082733154296875, -0.07163238525390625, -0.0605316162109375, -0.04943084716796875, -0.038330078125, -0.02722930908203125, -0.0161285400390625, -0.00502777099609375, 0.006072998046875, 0.01717376708984375, 0.0282745361328125, 0.03937530517578125, 0.05047607421875, 0.06157684326171875, 0.0726776123046875, 0.08377838134765625, 0.094879150390625, 0.10597991943359375, 0.1170806884765625, 0.12818145751953125, 0.1392822265625, 0.15038299560546875, 0.1614837646484375, 0.17258453369140625, 0.183685302734375, 0.19478607177734375, 0.2058868408203125, 0.21698760986328125, 0.22808837890625, 0.23918914794921875, 0.2502899169921875, 0.26139068603515625, 0.272491455078125, 0.28359222412109375, 0.2946929931640625, 0.30579376220703125, 0.31689453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 20.0, 29.0, 34.0, 31.0, 71.0, 103.0, 141.0, 133.0, 118.0, 80.0, 60.0, 35.0, 27.0, 18.0, 20.0, 11.0, 7.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0280914306640625, -0.027221202850341797, -0.026350975036621094, -0.02548074722290039, -0.024610519409179688, -0.023740291595458984, -0.02287006378173828, -0.021999835968017578, -0.021129608154296875, -0.020259380340576172, -0.01938915252685547, -0.018518924713134766, -0.017648696899414062, -0.01677846908569336, -0.015908241271972656, -0.015038013458251953, -0.01416778564453125, -0.013297557830810547, -0.012427330017089844, -0.01155710220336914, -0.010686874389648438, -0.009816646575927734, -0.008946418762207031, -0.008076190948486328, -0.007205963134765625, -0.006335735321044922, -0.005465507507324219, -0.004595279693603516, -0.0037250518798828125, -0.0028548240661621094, -0.0019845962524414062, -0.0011143684387207031, -0.000244140625, 0.0006260871887207031, 0.0014963150024414062, 0.0023665428161621094, 0.0032367706298828125, 0.004106998443603516, 0.004977226257324219, 0.005847454071044922, 0.006717681884765625, 0.007587909698486328, 0.008458137512207031, 0.009328365325927734, 0.010198593139648438, 0.01106882095336914, 0.011939048767089844, 0.012809276580810547, 0.01367950439453125, 0.014549732208251953, 0.015419960021972656, 0.01629018783569336, 0.017160415649414062, 0.018030643463134766, 0.01890087127685547, 0.019771099090576172, 0.020641326904296875, 0.021511554718017578, 0.02238178253173828, 0.023252010345458984, 0.024122238159179688, 0.02499246597290039, 0.025862693786621094, 0.026732921600341797, 0.0276031494140625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 16.0, 30.0, 53.0, 102.0, 263.0, 260.0, 140.0, 71.0, 23.0, 10.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.3868608474731445, -3.309995412826538, -3.2331299781799316, -3.1562647819519043, -3.079399347305298, -3.0025339126586914, -2.925668478012085, -2.8488030433654785, -2.771937847137451, -2.6950724124908447, -2.6182069778442383, -2.541341781616211, -2.4644763469696045, -2.387610912322998, -2.3107454776763916, -2.233880043029785, -2.1570146083831787, -2.0801491737365723, -2.003283739089966, -1.926418423652649, -1.849553108215332, -1.7726876735687256, -1.6958222389221191, -1.6189568042755127, -1.5420914888381958, -1.4652260541915894, -1.3883607387542725, -1.311495304107666, -1.2346298694610596, -1.1577645540237427, -1.0808991193771362, -1.0040338039398193, -0.9271682500839233, -0.8503028750419617, -0.7734375, -0.6965720653533936, -0.6197066903114319, -0.5428413152694702, -0.46597591042518616, -0.3891105055809021, -0.31224513053894043, -0.23537974059581757, -0.1585143506526947, -0.08164896070957184, -0.004783570766448975, 0.0720818042755127, 0.14894720911979675, 0.2258126139640808, 0.3026779890060425, 0.37954336404800415, 0.4564087688922882, 0.5332741737365723, 0.6101395487785339, 0.6870049238204956, 0.763870358467102, 0.8407357335090637, 0.9176011085510254, 0.9944664835929871, 1.0713318586349487, 1.1481972932815552, 1.225062608718872, 1.3019280433654785, 1.378793478012085, 1.4556589126586914, 1.5325242280960083]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 13.0, 28.0, 33.0, 41.0, 57.0, 63.0, 55.0, 72.0, 84.0, 67.0, 90.0, 68.0, 58.0, 64.0, 39.0, 41.0, 35.0, 16.0, 23.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5457602739334106, -1.5074880123138428, -1.4692156314849854, -1.430943250656128, -1.39267098903656, -1.3543987274169922, -1.3161263465881348, -1.2778539657592773, -1.2395817041397095, -1.2013094425201416, -1.1630370616912842, -1.1247646808624268, -1.0864924192428589, -1.048220157623291, -1.0099477767944336, -0.971675455570221, -0.9334031343460083, -0.8951308131217957, -0.856858491897583, -0.8185861706733704, -0.7803138494491577, -0.7420415282249451, -0.7037692070007324, -0.6654968857765198, -0.6272245645523071, -0.5889522433280945, -0.5506799221038818, -0.5124076008796692, -0.47413527965545654, -0.4358629584312439, -0.39759063720703125, -0.3593183159828186, -0.32104605436325073, -0.2827737331390381, -0.24450141191482544, -0.2062290906906128, -0.16795676946640015, -0.1296844482421875, -0.09141212701797485, -0.05313980579376221, -0.01486748456954956, 0.023404836654663086, 0.06167715787887573, 0.09994947910308838, 0.13822180032730103, 0.17649412155151367, 0.21476644277572632, 0.25303876399993896, 0.2913110852241516, 0.32958340644836426, 0.3678557276725769, 0.40612804889678955, 0.4444003701210022, 0.48267269134521484, 0.5209450125694275, 0.5592173337936401, 0.5974896550178528, 0.6357619762420654, 0.6740342974662781, 0.7123066186904907, 0.7505789399147034, 0.788851261138916, 0.8271235823631287, 0.8653959035873413, 0.903668224811554]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 13.0, 18.0, 44.0, 78.0, 140.0, 310.0, 805.0, 2258.0, 7211.0, 28975.0, 857963.0, 127729.0, 15924.0, 4493.0, 1500.0, 601.0, 245.0, 99.0, 41.0, 29.0, 19.0, 5.0, 9.0, 3.0, 4.0, 9.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.676605224609375, -2.58367919921875, -2.490753173828125, -2.3978271484375, -2.304901123046875, -2.21197509765625, -2.119049072265625, -2.026123046875, -1.933197021484375, -1.84027099609375, -1.747344970703125, -1.6544189453125, -1.561492919921875, -1.46856689453125, -1.375640869140625, -1.28271484375, -1.189788818359375, -1.09686279296875, -1.003936767578125, -0.9110107421875, -0.818084716796875, -0.72515869140625, -0.632232666015625, -0.539306640625, -0.446380615234375, -0.35345458984375, -0.260528564453125, -0.1676025390625, -0.074676513671875, 0.01824951171875, 0.111175537109375, 0.2041015625, 0.297027587890625, 0.38995361328125, 0.482879638671875, 0.5758056640625, 0.668731689453125, 0.76165771484375, 0.854583740234375, 0.947509765625, 1.040435791015625, 1.13336181640625, 1.226287841796875, 1.3192138671875, 1.412139892578125, 1.50506591796875, 1.597991943359375, 1.69091796875, 1.783843994140625, 1.87677001953125, 1.969696044921875, 2.0626220703125, 2.155548095703125, 2.24847412109375, 2.341400146484375, 2.434326171875, 2.527252197265625, 2.62017822265625, 2.713104248046875, 2.8060302734375, 2.898956298828125, 2.99188232421875, 3.084808349609375, 3.177734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 13.0, 8.0, 15.0, 10.0, 26.0, 25.0, 18.0, 31.0, 33.0, 26.0, 46.0, 50.0, 48.0, 49.0, 47.0, 48.0, 61.0, 59.0, 55.0, 42.0, 42.0, 44.0, 35.0, 20.0, 32.0, 18.0, 11.0, 20.0, 11.0, 9.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6748046875, -1.6140289306640625, -1.553253173828125, -1.4924774169921875, -1.43170166015625, -1.3709259033203125, -1.310150146484375, -1.2493743896484375, -1.1885986328125, -1.1278228759765625, -1.067047119140625, -1.0062713623046875, -0.94549560546875, -0.8847198486328125, -0.823944091796875, -0.7631683349609375, -0.702392578125, -0.6416168212890625, -0.580841064453125, -0.5200653076171875, -0.45928955078125, -0.3985137939453125, -0.337738037109375, -0.2769622802734375, -0.2161865234375, -0.1554107666015625, -0.094635009765625, -0.0338592529296875, 0.02691650390625, 0.0876922607421875, 0.148468017578125, 0.2092437744140625, 0.27001953125, 0.3307952880859375, 0.391571044921875, 0.4523468017578125, 0.51312255859375, 0.5738983154296875, 0.634674072265625, 0.6954498291015625, 0.7562255859375, 0.8170013427734375, 0.877777099609375, 0.9385528564453125, 0.99932861328125, 1.0601043701171875, 1.120880126953125, 1.1816558837890625, 1.242431640625, 1.3032073974609375, 1.363983154296875, 1.4247589111328125, 1.48553466796875, 1.5463104248046875, 1.607086181640625, 1.6678619384765625, 1.7286376953125, 1.7894134521484375, 1.850189208984375, 1.9109649658203125, 1.97174072265625, 2.0325164794921875, 2.093292236328125, 2.1540679931640625, 2.21484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 14.0, 12.0, 13.0, 26.0, 25.0, 15.0, 27.0, 23.0, 33.0, 42.0, 74.0, 86.0, 184.0, 479.0, 2553.0, 36455.0, 994964.0, 11429.0, 1236.0, 325.0, 147.0, 62.0, 57.0, 47.0, 34.0, 34.0, 18.0, 15.0, 17.0, 22.0, 12.0, 8.0, 13.0, 7.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.04296875, -5.86163330078125, -5.6802978515625, -5.49896240234375, -5.317626953125, -5.13629150390625, -4.9549560546875, -4.77362060546875, -4.59228515625, -4.41094970703125, -4.2296142578125, -4.04827880859375, -3.866943359375, -3.68560791015625, -3.5042724609375, -3.32293701171875, -3.1416015625, -2.96026611328125, -2.7789306640625, -2.59759521484375, -2.416259765625, -2.23492431640625, -2.0535888671875, -1.87225341796875, -1.69091796875, -1.50958251953125, -1.3282470703125, -1.14691162109375, -0.965576171875, -0.78424072265625, -0.6029052734375, -0.42156982421875, -0.240234375, -0.05889892578125, 0.1224365234375, 0.30377197265625, 0.485107421875, 0.66644287109375, 0.8477783203125, 1.02911376953125, 1.21044921875, 1.39178466796875, 1.5731201171875, 1.75445556640625, 1.935791015625, 2.11712646484375, 2.2984619140625, 2.47979736328125, 2.6611328125, 2.84246826171875, 3.0238037109375, 3.20513916015625, 3.386474609375, 3.56781005859375, 3.7491455078125, 3.93048095703125, 4.11181640625, 4.29315185546875, 4.4744873046875, 4.65582275390625, 4.837158203125, 5.01849365234375, 5.1998291015625, 5.38116455078125, 5.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 8.0, 13.0, 13.0, 24.0, 18.0, 21.0, 19.0, 26.0, 31.0, 34.0, 54.0, 44.0, 43.0, 54.0, 43.0, 58.0, 57.0, 56.0, 42.0, 35.0, 39.0, 31.0, 32.0, 30.0, 17.0, 21.0, 18.0, 19.0, 21.0, 10.0, 7.0, 7.0, 7.0, 13.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.708984375, -1.653228759765625, -1.59747314453125, -1.541717529296875, -1.4859619140625, -1.430206298828125, -1.37445068359375, -1.318695068359375, -1.262939453125, -1.207183837890625, -1.15142822265625, -1.095672607421875, -1.0399169921875, -0.984161376953125, -0.92840576171875, -0.872650146484375, -0.81689453125, -0.761138916015625, -0.70538330078125, -0.649627685546875, -0.5938720703125, -0.538116455078125, -0.48236083984375, -0.426605224609375, -0.370849609375, -0.315093994140625, -0.25933837890625, -0.203582763671875, -0.1478271484375, -0.092071533203125, -0.03631591796875, 0.019439697265625, 0.0751953125, 0.130950927734375, 0.18670654296875, 0.242462158203125, 0.2982177734375, 0.353973388671875, 0.40972900390625, 0.465484619140625, 0.521240234375, 0.576995849609375, 0.63275146484375, 0.688507080078125, 0.7442626953125, 0.800018310546875, 0.85577392578125, 0.911529541015625, 0.96728515625, 1.023040771484375, 1.07879638671875, 1.134552001953125, 1.1903076171875, 1.246063232421875, 1.30181884765625, 1.357574462890625, 1.413330078125, 1.469085693359375, 1.52484130859375, 1.580596923828125, 1.6363525390625, 1.692108154296875, 1.74786376953125, 1.803619384765625, 1.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 3.0, 8.0, 3.0, 8.0, 11.0, 18.0, 26.0, 30.0, 47.0, 94.0, 156.0, 341.0, 899.0, 2617.0, 10008.0, 217973.0, 798886.0, 12419.0, 2960.0, 1029.0, 465.0, 225.0, 97.0, 68.0, 39.0, 28.0, 24.0, 15.0, 11.0, 4.0, 11.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9715957641601562, -0.9446563720703125, -0.9177169799804688, -0.890777587890625, -0.8638381958007812, -0.8368988037109375, -0.8099594116210938, -0.78302001953125, -0.7560806274414062, -0.7291412353515625, -0.7022018432617188, -0.675262451171875, -0.6483230590820312, -0.6213836669921875, -0.5944442749023438, -0.5675048828125, -0.5405654907226562, -0.5136260986328125, -0.48668670654296875, -0.459747314453125, -0.43280792236328125, -0.4058685302734375, -0.37892913818359375, -0.35198974609375, -0.32505035400390625, -0.2981109619140625, -0.27117156982421875, -0.244232177734375, -0.21729278564453125, -0.1903533935546875, -0.16341400146484375, -0.136474609375, -0.10953521728515625, -0.0825958251953125, -0.05565643310546875, -0.028717041015625, -0.00177764892578125, 0.0251617431640625, 0.05210113525390625, 0.07904052734375, 0.10597991943359375, 0.1329193115234375, 0.15985870361328125, 0.186798095703125, 0.21373748779296875, 0.2406768798828125, 0.26761627197265625, 0.2945556640625, 0.32149505615234375, 0.3484344482421875, 0.37537384033203125, 0.402313232421875, 0.42925262451171875, 0.4561920166015625, 0.48313140869140625, 0.51007080078125, 0.5370101928710938, 0.5639495849609375, 0.5908889770507812, 0.617828369140625, 0.6447677612304688, 0.6717071533203125, 0.6986465454101562, 0.7255859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 3.0, 10.0, 9.0, 11.0, 35.0, 54.0, 138.0, 487.0, 109.0, 54.0, 19.0, 11.0, 6.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.0001100366935133934, -0.00010664574801921844, -0.00010325480252504349, -9.986385703086853e-05, -9.647291153669357e-05, -9.308196604251862e-05, -8.969102054834366e-05, -8.63000750541687e-05, -8.290912955999374e-05, -7.951818406581879e-05, -7.612723857164383e-05, -7.273629307746887e-05, -6.934534758329391e-05, -6.595440208911896e-05, -6.2563456594944e-05, -5.917251110076904e-05, -5.5781565606594086e-05, -5.239062011241913e-05, -4.899967461824417e-05, -4.5608729124069214e-05, -4.2217783629894257e-05, -3.88268381357193e-05, -3.543589264154434e-05, -3.2044947147369385e-05, -2.8654001653194427e-05, -2.526305615901947e-05, -2.1872110664844513e-05, -1.8481165170669556e-05, -1.5090219676494598e-05, -1.1699274182319641e-05, -8.308328688144684e-06, -4.9173831939697266e-06, -1.5264376997947693e-06, 1.864507794380188e-06, 5.255453288555145e-06, 8.646398782730103e-06, 1.203734427690506e-05, 1.5428289771080017e-05, 1.8819235265254974e-05, 2.221018075942993e-05, 2.560112625360489e-05, 2.8992071747779846e-05, 3.2383017241954803e-05, 3.577396273612976e-05, 3.916490823030472e-05, 4.2555853724479675e-05, 4.594679921865463e-05, 4.933774471282959e-05, 5.272869020700455e-05, 5.6119635701179504e-05, 5.951058119535446e-05, 6.290152668952942e-05, 6.629247218370438e-05, 6.968341767787933e-05, 7.307436317205429e-05, 7.646530866622925e-05, 7.98562541604042e-05, 8.324719965457916e-05, 8.663814514875412e-05, 9.002909064292908e-05, 9.342003613710403e-05, 9.681098163127899e-05, 0.00010020192712545395, 0.0001035928726196289]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 5.0, 9.0, 4.0, 17.0, 31.0, 53.0, 67.0, 143.0, 373.0, 974.0, 3387.0, 21421.0, 992084.0, 24486.0, 3724.0, 1029.0, 362.0, 165.0, 73.0, 47.0, 32.0, 19.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96435546875, -0.9280014038085938, -0.8916473388671875, -0.8552932739257812, -0.818939208984375, -0.7825851440429688, -0.7462310791015625, -0.7098770141601562, -0.67352294921875, -0.6371688842773438, -0.6008148193359375, -0.5644607543945312, -0.528106689453125, -0.49175262451171875, -0.4553985595703125, -0.41904449462890625, -0.3826904296875, -0.34633636474609375, -0.3099822998046875, -0.27362823486328125, -0.237274169921875, -0.20092010498046875, -0.1645660400390625, -0.12821197509765625, -0.09185791015625, -0.05550384521484375, -0.0191497802734375, 0.01720428466796875, 0.053558349609375, 0.08991241455078125, 0.1262664794921875, 0.16262054443359375, 0.198974609375, 0.23532867431640625, 0.2716827392578125, 0.30803680419921875, 0.344390869140625, 0.38074493408203125, 0.4170989990234375, 0.45345306396484375, 0.48980712890625, 0.5261611938476562, 0.5625152587890625, 0.5988693237304688, 0.635223388671875, 0.6715774536132812, 0.7079315185546875, 0.7442855834960938, 0.7806396484375, 0.8169937133789062, 0.8533477783203125, 0.8897018432617188, 0.926055908203125, 0.9624099731445312, 0.9987640380859375, 1.0351181030273438, 1.07147216796875, 1.1078262329101562, 1.1441802978515625, 1.1805343627929688, 1.216888427734375, 1.2532424926757812, 1.2895965576171875, 1.3259506225585938, 1.3623046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 15.0, 20.0, 53.0, 103.0, 380.0, 219.0, 72.0, 40.0, 17.0, 6.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.339599609375, -0.3306083679199219, -0.32161712646484375, -0.3126258850097656, -0.3036346435546875, -0.2946434020996094, -0.28565216064453125, -0.2766609191894531, -0.267669677734375, -0.2586784362792969, -0.24968719482421875, -0.24069595336914062, -0.2317047119140625, -0.22271347045898438, -0.21372222900390625, -0.20473098754882812, -0.19573974609375, -0.18674850463867188, -0.17775726318359375, -0.16876602172851562, -0.1597747802734375, -0.15078353881835938, -0.14179229736328125, -0.13280105590820312, -0.123809814453125, -0.11481857299804688, -0.10582733154296875, -0.09683609008789062, -0.0878448486328125, -0.07885360717773438, -0.06986236572265625, -0.060871124267578125, -0.0518798828125, -0.042888641357421875, -0.03389739990234375, -0.024906158447265625, -0.0159149169921875, -0.006923675537109375, 0.00206756591796875, 0.011058807373046875, 0.020050048828125, 0.029041290283203125, 0.03803253173828125, 0.047023773193359375, 0.0560150146484375, 0.06500625610351562, 0.07399749755859375, 0.08298873901367188, 0.09197998046875, 0.10097122192382812, 0.10996246337890625, 0.11895370483398438, 0.1279449462890625, 0.13693618774414062, 0.14592742919921875, 0.15491867065429688, 0.163909912109375, 0.17290115356445312, 0.18189239501953125, 0.19088363647460938, 0.1998748779296875, 0.20886611938476562, 0.21785736083984375, 0.22684860229492188, 0.23583984375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 22.0, 131.0, 596.0, 201.0, 45.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-22.348182678222656, -21.938617706298828, -21.529050827026367, -21.11948585510254, -20.709918975830078, -20.30035400390625, -19.89078712463379, -19.48122215270996, -19.0716552734375, -18.662090301513672, -18.25252342224121, -17.842958450317383, -17.433391571044922, -17.023826599121094, -16.614259719848633, -16.204694747924805, -15.795129776000977, -15.385563850402832, -14.975997924804688, -14.566431999206543, -14.156866073608398, -13.74730110168457, -13.33773422241211, -12.928169250488281, -12.51860237121582, -12.109036445617676, -11.699470520019531, -11.289904594421387, -10.880338668823242, -10.470773696899414, -10.061206817626953, -9.651641845703125, -9.242074966430664, -8.83250904083252, -8.422943115234375, -8.01337718963623, -7.603811740875244, -7.1942458152771, -6.784679889678955, -6.375114440917969, -5.965548515319824, -5.55598258972168, -5.146416664123535, -4.736850738525391, -4.327285289764404, -3.9177193641662598, -3.5081534385681152, -3.09858775138855, -2.6890218257904053, -2.2794559001922607, -1.8698902130126953, -1.4603242874145508, -1.0507584810256958, -0.6411926746368408, -0.2316267490386963, 0.17793893814086914, 0.5875048637390137, 0.9970706701278687, 1.4066364765167236, 1.8162024021148682, 2.2257680892944336, 2.635334014892578, 3.0448999404907227, 3.454465627670288, 3.8640315532684326]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 9.0, 12.0, 12.0, 12.0, 14.0, 13.0, 27.0, 38.0, 23.0, 20.0, 33.0, 30.0, 41.0, 35.0, 52.0, 39.0, 38.0, 54.0, 51.0, 42.0, 34.0, 38.0, 26.0, 32.0, 20.0, 27.0, 30.0, 19.0, 25.0, 24.0, 27.0, 14.0, 16.0, 7.0, 9.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0938031673431396, -3.0046226978302, -2.9154422283172607, -2.826261520385742, -2.7370810508728027, -2.6479005813598633, -2.558720111846924, -2.4695396423339844, -2.380359172821045, -2.2911787033081055, -2.201998233795166, -2.1128177642822266, -2.023637056350708, -1.9344565868377686, -1.845276117324829, -1.7560956478118896, -1.666914939880371, -1.5777344703674316, -1.4885538816452026, -1.3993734121322632, -1.3101928234100342, -1.2210123538970947, -1.1318318843841553, -1.0426514148712158, -0.9534708261489868, -0.8642902970314026, -0.7751097679138184, -0.6859292984008789, -0.5967487692832947, -0.5075682401657104, -0.418387770652771, -0.32920724153518677, -0.24002671241760254, -0.1508461982011795, -0.06166568398475647, 0.02751481533050537, 0.1166953444480896, 0.20587587356567383, 0.2950563430786133, 0.3842368721961975, 0.47341740131378174, 0.562597930431366, 0.6517784595489502, 0.7409589290618896, 0.8301394581794739, 0.9193199872970581, 1.0085004568099976, 1.0976810455322266, 1.186861515045166, 1.2760419845581055, 1.3652225732803345, 1.454403042793274, 1.543583631515503, 1.6327641010284424, 1.7219445705413818, 1.8111250400543213, 1.9003056287765503, 1.9894860982894897, 2.0786666870117188, 2.167847156524658, 2.2570276260375977, 2.346208095550537, 2.4353885650634766, 2.524569272994995, 2.6137497425079346]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 9.0, 15.0, 19.0, 34.0, 48.0, 69.0, 117.0, 178.0, 342.0, 609.0, 1176.0, 2565.0, 7696.0, 56772.0, 2193297.0, 1868468.0, 50135.0, 6914.0, 3087.0, 1183.0, 623.0, 354.0, 211.0, 124.0, 86.0, 41.0, 36.0, 20.0, 14.0, 10.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.52880859375, -2.4521484375, -2.37548828125, -2.298828125, -2.22216796875, -2.1455078125, -2.06884765625, -1.9921875, -1.91552734375, -1.8388671875, -1.76220703125, -1.685546875, -1.60888671875, -1.5322265625, -1.45556640625, -1.37890625, -1.30224609375, -1.2255859375, -1.14892578125, -1.072265625, -0.99560546875, -0.9189453125, -0.84228515625, -0.765625, -0.68896484375, -0.6123046875, -0.53564453125, -0.458984375, -0.38232421875, -0.3056640625, -0.22900390625, -0.15234375, -0.07568359375, 0.0009765625, 0.07763671875, 0.154296875, 0.23095703125, 0.3076171875, 0.38427734375, 0.4609375, 0.53759765625, 0.6142578125, 0.69091796875, 0.767578125, 0.84423828125, 0.9208984375, 0.99755859375, 1.07421875, 1.15087890625, 1.2275390625, 1.30419921875, 1.380859375, 1.45751953125, 1.5341796875, 1.61083984375, 1.6875, 1.76416015625, 1.8408203125, 1.91748046875, 1.994140625, 2.07080078125, 2.1474609375, 2.22412109375, 2.30078125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 11.0, 9.0, 18.0, 22.0, 24.0, 48.0, 43.0, 45.0, 58.0, 74.0, 49.0, 76.0, 81.0, 63.0, 58.0, 67.0, 52.0, 52.0, 33.0, 28.0, 26.0, 20.0, 15.0, 6.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8133697509765625, -1.764434814453125, -1.7154998779296875, -1.66656494140625, -1.6176300048828125, -1.568695068359375, -1.5197601318359375, -1.4708251953125, -1.4218902587890625, -1.372955322265625, -1.3240203857421875, -1.27508544921875, -1.2261505126953125, -1.177215576171875, -1.1282806396484375, -1.079345703125, -1.0304107666015625, -0.981475830078125, -0.9325408935546875, -0.88360595703125, -0.8346710205078125, -0.785736083984375, -0.7368011474609375, -0.6878662109375, -0.6389312744140625, -0.589996337890625, -0.5410614013671875, -0.49212646484375, -0.4431915283203125, -0.394256591796875, -0.3453216552734375, -0.29638671875, -0.2474517822265625, -0.198516845703125, -0.1495819091796875, -0.10064697265625, -0.0517120361328125, -0.002777099609375, 0.0461578369140625, 0.0950927734375, 0.1440277099609375, 0.192962646484375, 0.2418975830078125, 0.29083251953125, 0.3397674560546875, 0.388702392578125, 0.4376373291015625, 0.486572265625, 0.5355072021484375, 0.584442138671875, 0.6333770751953125, 0.68231201171875, 0.7312469482421875, 0.780181884765625, 0.8291168212890625, 0.8780517578125, 0.9269866943359375, 0.975921630859375, 1.0248565673828125, 1.07379150390625, 1.1227264404296875, 1.171661376953125, 1.2205963134765625, 1.26953125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 12.0, 20.0, 31.0, 104.0, 274.0, 1266.0, 25191.0, 4161344.0, 5151.0, 580.0, 154.0, 59.0, 32.0, 23.0, 7.0, 12.0, 5.0, 0.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.34375, -10.0234375, -9.703125, -9.3828125, -9.0625, -8.7421875, -8.421875, -8.1015625, -7.78125, -7.4609375, -7.140625, -6.8203125, -6.5, -6.1796875, -5.859375, -5.5390625, -5.21875, -4.8984375, -4.578125, -4.2578125, -3.9375, -3.6171875, -3.296875, -2.9765625, -2.65625, -2.3359375, -2.015625, -1.6953125, -1.375, -1.0546875, -0.734375, -0.4140625, -0.09375, 0.2265625, 0.546875, 0.8671875, 1.1875, 1.5078125, 1.828125, 2.1484375, 2.46875, 2.7890625, 3.109375, 3.4296875, 3.75, 4.0703125, 4.390625, 4.7109375, 5.03125, 5.3515625, 5.671875, 5.9921875, 6.3125, 6.6328125, 6.953125, 7.2734375, 7.59375, 7.9140625, 8.234375, 8.5546875, 8.875, 9.1953125, 9.515625, 9.8359375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 0.0, 7.0, 8.0, 6.0, 12.0, 28.0, 30.0, 64.0, 179.0, 906.0, 2105.0, 512.0, 122.0, 45.0, 18.0, 10.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9482421875, -0.91796875, -0.8876953125, -0.857421875, -0.8271484375, -0.796875, -0.7666015625, -0.736328125, -0.7060546875, -0.67578125, -0.6455078125, -0.615234375, -0.5849609375, -0.5546875, -0.5244140625, -0.494140625, -0.4638671875, -0.43359375, -0.4033203125, -0.373046875, -0.3427734375, -0.3125, -0.2822265625, -0.251953125, -0.2216796875, -0.19140625, -0.1611328125, -0.130859375, -0.1005859375, -0.0703125, -0.0400390625, -0.009765625, 0.0205078125, 0.05078125, 0.0810546875, 0.111328125, 0.1416015625, 0.171875, 0.2021484375, 0.232421875, 0.2626953125, 0.29296875, 0.3232421875, 0.353515625, 0.3837890625, 0.4140625, 0.4443359375, 0.474609375, 0.5048828125, 0.53515625, 0.5654296875, 0.595703125, 0.6259765625, 0.65625, 0.6865234375, 0.716796875, 0.7470703125, 0.77734375, 0.8076171875, 0.837890625, 0.8681640625, 0.8984375, 0.9287109375, 0.958984375, 0.9892578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 23.0, 34.0, 66.0, 143.0, 232.0, 228.0, 111.0, 69.0, 40.0, 11.0, 17.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.052628517150879, -3.945894718170166, -3.8391611576080322, -3.7324273586273193, -3.6256935596466064, -3.5189599990844727, -3.4122262001037598, -3.305492401123047, -3.198758602142334, -3.092024803161621, -2.9852912425994873, -2.8785574436187744, -2.7718236446380615, -2.6650900840759277, -2.558356285095215, -2.451622486114502, -2.344888925552368, -2.2381551265716553, -2.1314215660095215, -2.0246877670288086, -1.9179539680480957, -1.8112202882766724, -1.704486608505249, -1.5977528095245361, -1.4910191297531128, -1.3842854499816895, -1.2775516510009766, -1.1708179712295532, -1.0640842914581299, -0.957350492477417, -0.8506168127059937, -0.7438830733299255, -0.6371493339538574, -0.5304155945777893, -0.4236818850040436, -0.31694817543029785, -0.21021443605422974, -0.10348069667816162, 0.0032529830932617188, 0.10998672246932983, 0.21672046184539795, 0.32345420122146606, 0.4301879107952118, 0.5369216203689575, 0.6436553597450256, 0.7503890991210938, 0.8571227788925171, 0.9638565182685852, 1.0705902576446533, 1.1773239374160767, 1.2840577363967896, 1.390791416168213, 1.4975252151489258, 1.6042588949203491, 1.7109925746917725, 1.8177263736724854, 1.9244600534439087, 2.031193733215332, 2.137927532196045, 2.244661331176758, 2.3513948917388916, 2.4581286907196045, 2.5648622512817383, 2.671596050262451, 2.778329849243164]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 7.0, 8.0, 15.0, 22.0, 19.0, 30.0, 51.0, 39.0, 59.0, 65.0, 70.0, 64.0, 71.0, 88.0, 70.0, 66.0, 66.0, 48.0, 35.0, 34.0, 25.0, 15.0, 9.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2870242595672607, -2.230461835861206, -2.1738996505737305, -2.117337226867676, -2.060774803161621, -2.0042126178741455, -1.9476501941680908, -1.8910878896713257, -1.8345255851745605, -1.7779632806777954, -1.7214008569717407, -1.6648385524749756, -1.6082762479782104, -1.5517139434814453, -1.4951515197753906, -1.4385892152786255, -1.3820269107818604, -1.3254646062850952, -1.2689021825790405, -1.2123398780822754, -1.1557775735855103, -1.0992152690887451, -1.0426528453826904, -0.9860905408859253, -0.9295281171798706, -0.8729657530784607, -0.8164034485816956, -0.7598410844802856, -0.7032787799835205, -0.6467164158821106, -0.5901540517807007, -0.5335917472839355, -0.4770294427871704, -0.4204671084880829, -0.36390477418899536, -0.30734241008758545, -0.2507801055908203, -0.1942177414894104, -0.13765540719032288, -0.08109307289123535, -0.024530738592147827, 0.032031599432229996, 0.08859393745660782, 0.14515627920627594, 0.20171861350536346, 0.2582809627056122, 0.3148432970046997, 0.37140563130378723, 0.42796796560287476, 0.4845302999019623, 0.5410926342010498, 0.5976549983024597, 0.6542173027992249, 0.7107796669006348, 0.7673419713973999, 0.8239043354988098, 0.8804666996002197, 0.9370290637016296, 0.9935913681983948, 1.0501537322998047, 1.1067160367965698, 1.163278341293335, 1.2198407649993896, 1.2764030694961548, 1.33296537399292]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 10.0, 10.0, 20.0, 31.0, 44.0, 57.0, 121.0, 219.0, 377.0, 759.0, 1781.0, 4496.0, 14461.0, 75425.0, 680279.0, 228599.0, 29365.0, 7514.0, 2662.0, 1157.0, 484.0, 295.0, 140.0, 73.0, 53.0, 38.0, 19.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.336669921875, -0.3240776062011719, -0.31148529052734375, -0.2988929748535156, -0.2863006591796875, -0.2737083435058594, -0.26111602783203125, -0.24852371215820312, -0.235931396484375, -0.22333908081054688, -0.21074676513671875, -0.19815444946289062, -0.1855621337890625, -0.17296981811523438, -0.16037750244140625, -0.14778518676757812, -0.13519287109375, -0.12260055541992188, -0.11000823974609375, -0.09741592407226562, -0.0848236083984375, -0.07223129272460938, -0.05963897705078125, -0.047046661376953125, -0.034454345703125, -0.021862030029296875, -0.00926971435546875, 0.003322601318359375, 0.0159149169921875, 0.028507232666015625, 0.04109954833984375, 0.053691864013671875, 0.0662841796875, 0.07887649536132812, 0.09146881103515625, 0.10406112670898438, 0.1166534423828125, 0.12924575805664062, 0.14183807373046875, 0.15443038940429688, 0.167022705078125, 0.17961502075195312, 0.19220733642578125, 0.20479965209960938, 0.2173919677734375, 0.22998428344726562, 0.24257659912109375, 0.2551689147949219, 0.26776123046875, 0.2803535461425781, 0.29294586181640625, 0.3055381774902344, 0.3181304931640625, 0.3307228088378906, 0.34331512451171875, 0.3559074401855469, 0.368499755859375, 0.3810920715332031, 0.39368438720703125, 0.4062767028808594, 0.4188690185546875, 0.4314613342285156, 0.44405364990234375, 0.4566459655761719, 0.46923828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 17.0, 22.0, 33.0, 55.0, 69.0, 82.0, 99.0, 103.0, 118.0, 106.0, 85.0, 57.0, 54.0, 38.0, 22.0, 10.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.947418212890625, -1.89483642578125, -1.842254638671875, -1.7896728515625, -1.737091064453125, -1.68450927734375, -1.631927490234375, -1.579345703125, -1.526763916015625, -1.47418212890625, -1.421600341796875, -1.3690185546875, -1.316436767578125, -1.26385498046875, -1.211273193359375, -1.15869140625, -1.106109619140625, -1.05352783203125, -1.000946044921875, -0.9483642578125, -0.895782470703125, -0.84320068359375, -0.790618896484375, -0.738037109375, -0.685455322265625, -0.63287353515625, -0.580291748046875, -0.5277099609375, -0.475128173828125, -0.42254638671875, -0.369964599609375, -0.3173828125, -0.264801025390625, -0.21221923828125, -0.159637451171875, -0.1070556640625, -0.054473876953125, -0.00189208984375, 0.050689697265625, 0.103271484375, 0.155853271484375, 0.20843505859375, 0.261016845703125, 0.3135986328125, 0.366180419921875, 0.41876220703125, 0.471343994140625, 0.52392578125, 0.576507568359375, 0.62908935546875, 0.681671142578125, 0.7342529296875, 0.786834716796875, 0.83941650390625, 0.891998291015625, 0.944580078125, 0.997161865234375, 1.04974365234375, 1.102325439453125, 1.1549072265625, 1.207489013671875, 1.26007080078125, 1.312652587890625, 1.365234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 9.0, 6.0, 7.0, 11.0, 10.0, 17.0, 34.0, 41.0, 63.0, 87.0, 123.0, 203.0, 263.0, 423.0, 633.0, 968.0, 1684.0, 3043.0, 6238.0, 13890.0, 35238.0, 108347.0, 406200.0, 329752.0, 87505.0, 29454.0, 11821.0, 5435.0, 2831.0, 1522.0, 887.0, 549.0, 389.0, 274.0, 174.0, 128.0, 109.0, 54.0, 40.0, 34.0, 22.0, 15.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.180419921875, -0.17476463317871094, -0.16910934448242188, -0.1634540557861328, -0.15779876708984375, -0.1521434783935547, -0.14648818969726562, -0.14083290100097656, -0.1351776123046875, -0.12952232360839844, -0.12386703491210938, -0.11821174621582031, -0.11255645751953125, -0.10690116882324219, -0.10124588012695312, -0.09559059143066406, -0.089935302734375, -0.08428001403808594, -0.07862472534179688, -0.07296943664550781, -0.06731414794921875, -0.06165885925292969, -0.056003570556640625, -0.05034828186035156, -0.0446929931640625, -0.03903770446777344, -0.033382415771484375, -0.027727127075195312, -0.02207183837890625, -0.016416549682617188, -0.010761260986328125, -0.0051059722900390625, 0.00054931640625, 0.0062046051025390625, 0.011859893798828125, 0.017515182495117188, 0.02317047119140625, 0.028825759887695312, 0.034481048583984375, 0.04013633728027344, 0.0457916259765625, 0.05144691467285156, 0.057102203369140625, 0.06275749206542969, 0.06841278076171875, 0.07406806945800781, 0.07972335815429688, 0.08537864685058594, 0.091033935546875, 0.09668922424316406, 0.10234451293945312, 0.10799980163574219, 0.11365509033203125, 0.11931037902832031, 0.12496566772460938, 0.13062095642089844, 0.1362762451171875, 0.14193153381347656, 0.14758682250976562, 0.1532421112060547, 0.15889739990234375, 0.1645526885986328, 0.17020797729492188, 0.17586326599121094, 0.1815185546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 12.0, 9.0, 9.0, 17.0, 22.0, 20.0, 28.0, 40.0, 53.0, 52.0, 54.0, 42.0, 55.0, 71.0, 52.0, 65.0, 68.0, 52.0, 48.0, 42.0, 36.0, 24.0, 26.0, 20.0, 21.0, 20.0, 8.0, 12.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.5984344482421875, -1.542572021484375, -1.4867095947265625, -1.43084716796875, -1.3749847412109375, -1.319122314453125, -1.2632598876953125, -1.2073974609375, -1.1515350341796875, -1.095672607421875, -1.0398101806640625, -0.98394775390625, -0.9280853271484375, -0.872222900390625, -0.8163604736328125, -0.760498046875, -0.7046356201171875, -0.648773193359375, -0.5929107666015625, -0.53704833984375, -0.4811859130859375, -0.425323486328125, -0.3694610595703125, -0.3135986328125, -0.2577362060546875, -0.201873779296875, -0.1460113525390625, -0.09014892578125, -0.0342864990234375, 0.021575927734375, 0.0774383544921875, 0.13330078125, 0.1891632080078125, 0.245025634765625, 0.3008880615234375, 0.35675048828125, 0.4126129150390625, 0.468475341796875, 0.5243377685546875, 0.5802001953125, 0.6360626220703125, 0.691925048828125, 0.7477874755859375, 0.80364990234375, 0.8595123291015625, 0.915374755859375, 0.9712371826171875, 1.027099609375, 1.0829620361328125, 1.138824462890625, 1.1946868896484375, 1.25054931640625, 1.3064117431640625, 1.362274169921875, 1.4181365966796875, 1.4739990234375, 1.5298614501953125, 1.585723876953125, 1.6415863037109375, 1.69744873046875, 1.7533111572265625, 1.809173583984375, 1.8650360107421875, 1.9208984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 13.0, 8.0, 21.0, 28.0, 29.0, 58.0, 78.0, 126.0, 193.0, 339.0, 772.0, 1447.0, 3128.0, 7886.0, 24737.0, 117379.0, 649130.0, 191485.0, 34275.0, 10130.0, 3816.0, 1645.0, 791.0, 419.0, 236.0, 122.0, 84.0, 51.0, 33.0, 24.0, 20.0, 9.0, 6.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.07354736328125, -0.07122135162353516, -0.06889533996582031, -0.06656932830810547, -0.06424331665039062, -0.06191730499267578, -0.05959129333496094, -0.057265281677246094, -0.05493927001953125, -0.052613258361816406, -0.05028724670410156, -0.04796123504638672, -0.045635223388671875, -0.04330921173095703, -0.04098320007324219, -0.038657188415527344, -0.0363311767578125, -0.034005165100097656, -0.03167915344238281, -0.02935314178466797, -0.027027130126953125, -0.02470111846923828, -0.022375106811523438, -0.020049095153808594, -0.01772308349609375, -0.015397071838378906, -0.013071060180664062, -0.010745048522949219, -0.008419036865234375, -0.006093025207519531, -0.0037670135498046875, -0.0014410018920898438, 0.000885009765625, 0.0032110214233398438, 0.0055370330810546875, 0.007863044738769531, 0.010189056396484375, 0.012515068054199219, 0.014841079711914062, 0.017167091369628906, 0.01949310302734375, 0.021819114685058594, 0.024145126342773438, 0.02647113800048828, 0.028797149658203125, 0.03112316131591797, 0.03344917297363281, 0.035775184631347656, 0.0381011962890625, 0.040427207946777344, 0.04275321960449219, 0.04507923126220703, 0.047405242919921875, 0.04973125457763672, 0.05205726623535156, 0.054383277893066406, 0.05670928955078125, 0.059035301208496094, 0.06136131286621094, 0.06368732452392578, 0.06601333618164062, 0.06833934783935547, 0.07066535949707031, 0.07299137115478516, 0.0753173828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 14.0, 6.0, 14.0, 27.0, 21.0, 30.0, 45.0, 81.0, 84.0, 116.0, 147.0, 101.0, 82.0, 61.0, 38.0, 32.0, 20.0, 13.0, 13.0, 14.0, 11.0, 3.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.707408905029297e-05, -3.5713426768779755e-05, -3.435276448726654e-05, -3.2992102205753326e-05, -3.163143992424011e-05, -3.0270777642726898e-05, -2.8910115361213684e-05, -2.754945307970047e-05, -2.6188790798187256e-05, -2.4828128516674042e-05, -2.3467466235160828e-05, -2.2106803953647614e-05, -2.07461416721344e-05, -1.9385479390621185e-05, -1.802481710910797e-05, -1.6664154827594757e-05, -1.5303492546081543e-05, -1.3942830264568329e-05, -1.2582167983055115e-05, -1.12215057015419e-05, -9.860843420028687e-06, -8.500181138515472e-06, -7.139518857002258e-06, -5.778856575489044e-06, -4.41819429397583e-06, -3.057532012462616e-06, -1.6968697309494019e-06, -3.3620744943618774e-07, 1.0244548320770264e-06, 2.3851171135902405e-06, 3.7457793951034546e-06, 5.106441676616669e-06, 6.467103958129883e-06, 7.827766239643097e-06, 9.188428521156311e-06, 1.0549090802669525e-05, 1.190975308418274e-05, 1.3270415365695953e-05, 1.4631077647209167e-05, 1.599173992872238e-05, 1.7352402210235596e-05, 1.871306449174881e-05, 2.0073726773262024e-05, 2.1434389054775238e-05, 2.2795051336288452e-05, 2.4155713617801666e-05, 2.551637589931488e-05, 2.6877038180828094e-05, 2.823770046234131e-05, 2.9598362743854523e-05, 3.095902502536774e-05, 3.231968730688095e-05, 3.3680349588394165e-05, 3.504101186990738e-05, 3.640167415142059e-05, 3.776233643293381e-05, 3.912299871444702e-05, 4.0483660995960236e-05, 4.184432327747345e-05, 4.3204985558986664e-05, 4.456564784049988e-05, 4.592631012201309e-05, 4.7286972403526306e-05, 4.864763468503952e-05, 5.0008296966552734e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 10.0, 9.0, 13.0, 25.0, 36.0, 46.0, 82.0, 168.0, 410.0, 966.0, 2814.0, 10819.0, 61322.0, 626469.0, 303313.0, 32262.0, 6591.0, 1906.0, 654.0, 296.0, 133.0, 72.0, 44.0, 25.0, 22.0, 15.0, 7.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10919189453125, -0.10605716705322266, -0.10292243957519531, -0.09978771209716797, -0.09665298461914062, -0.09351825714111328, -0.09038352966308594, -0.0872488021850586, -0.08411407470703125, -0.0809793472290039, -0.07784461975097656, -0.07470989227294922, -0.07157516479492188, -0.06844043731689453, -0.06530570983886719, -0.062170982360839844, -0.0590362548828125, -0.055901527404785156, -0.05276679992675781, -0.04963207244873047, -0.046497344970703125, -0.04336261749267578, -0.04022789001464844, -0.037093162536621094, -0.03395843505859375, -0.030823707580566406, -0.027688980102539062, -0.02455425262451172, -0.021419525146484375, -0.01828479766845703, -0.015150070190429688, -0.012015342712402344, -0.008880615234375, -0.005745887756347656, -0.0026111602783203125, 0.0005235671997070312, 0.003658294677734375, 0.006793022155761719, 0.009927749633789062, 0.013062477111816406, 0.01619720458984375, 0.019331932067871094, 0.022466659545898438, 0.02560138702392578, 0.028736114501953125, 0.03187084197998047, 0.03500556945800781, 0.038140296936035156, 0.0412750244140625, 0.044409751892089844, 0.04754447937011719, 0.05067920684814453, 0.053813934326171875, 0.05694866180419922, 0.06008338928222656, 0.0632181167602539, 0.06635284423828125, 0.0694875717163086, 0.07262229919433594, 0.07575702667236328, 0.07889175415039062, 0.08202648162841797, 0.08516120910644531, 0.08829593658447266, 0.0914306640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 8.0, 9.0, 10.0, 7.0, 21.0, 22.0, 16.0, 33.0, 33.0, 60.0, 49.0, 59.0, 88.0, 66.0, 67.0, 76.0, 73.0, 64.0, 65.0, 38.0, 27.0, 26.0, 16.0, 13.0, 17.0, 10.0, 5.0, 7.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01541900634765625, -0.014920353889465332, -0.014421701431274414, -0.013923048973083496, -0.013424396514892578, -0.01292574405670166, -0.012427091598510742, -0.011928439140319824, -0.011429786682128906, -0.010931134223937988, -0.01043248176574707, -0.009933829307556152, -0.009435176849365234, -0.008936524391174316, -0.008437871932983398, -0.00793921947479248, -0.0074405670166015625, -0.0069419145584106445, -0.0064432621002197266, -0.005944609642028809, -0.005445957183837891, -0.004947304725646973, -0.004448652267456055, -0.003949999809265137, -0.0034513473510742188, -0.0029526948928833008, -0.002454042434692383, -0.001955389976501465, -0.0014567375183105469, -0.0009580850601196289, -0.00045943260192871094, 3.921985626220703e-05, 0.000537872314453125, 0.001036524772644043, 0.001535177230834961, 0.002033829689025879, 0.002532482147216797, 0.003031134605407715, 0.003529787063598633, 0.004028439521789551, 0.004527091979980469, 0.005025744438171387, 0.005524396896362305, 0.006023049354553223, 0.006521701812744141, 0.007020354270935059, 0.0075190067291259766, 0.008017659187316895, 0.008516311645507812, 0.00901496410369873, 0.009513616561889648, 0.010012269020080566, 0.010510921478271484, 0.011009573936462402, 0.01150822639465332, 0.012006878852844238, 0.012505531311035156, 0.013004183769226074, 0.013502836227416992, 0.01400148868560791, 0.014500141143798828, 0.014998793601989746, 0.015497446060180664, 0.015996098518371582, 0.0164947509765625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 11.0, 17.0, 51.0, 143.0, 376.0, 252.0, 98.0, 23.0, 18.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140503406524658, -4.036479473114014, -3.932455062866211, -3.8284311294555664, -3.7244069576263428, -3.620382785797119, -3.5163586139678955, -3.412334442138672, -3.3083105087280273, -3.2042863368988037, -3.10026216506958, -2.9962382316589355, -2.892214059829712, -2.7881898880004883, -2.6841657161712646, -2.580141544342041, -2.4761176109313965, -2.372093439102173, -2.268069267272949, -2.1640453338623047, -2.060021162033081, -1.9559969902038574, -1.8519728183746338, -1.7479487657546997, -1.6439244747161865, -1.539900302886963, -1.4358762502670288, -1.3318520784378052, -1.227828025817871, -1.1238038539886475, -1.0197796821594238, -0.9157556295394897, -0.8117315769195557, -0.7077074646949768, -0.603683352470398, -0.4996592104434967, -0.39563509821891785, -0.2916109561920166, -0.18758684396743774, -0.08356273174285889, 0.02046138048171997, 0.12448550015687943, 0.22850961983203888, 0.33253374695777893, 0.4365578591823578, 0.540582001209259, 0.6446061134338379, 0.7486302256584167, 0.8526543378829956, 0.9566784501075745, 1.0607025623321533, 1.164726734161377, 1.268750786781311, 1.3727749586105347, 1.4767990112304688, 1.5808231830596924, 1.684847354888916, 1.7888715267181396, 1.8928955793380737, 1.9969197511672974, 2.1009438037872314, 2.204967975616455, 2.3089921474456787, 2.4130163192749023, 2.517040252685547]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 10.0, 9.0, 24.0, 32.0, 40.0, 54.0, 80.0, 87.0, 96.0, 97.0, 121.0, 82.0, 76.0, 64.0, 47.0, 32.0, 17.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8105216026306152, -1.762357234954834, -1.7141928672790527, -1.6660284996032715, -1.6178641319274902, -1.569699764251709, -1.5215353965759277, -1.4733710289001465, -1.4252066612243652, -1.377042293548584, -1.3288779258728027, -1.2807135581970215, -1.2325491905212402, -1.184384822845459, -1.1362204551696777, -1.0880560874938965, -1.0398917198181152, -0.991727352142334, -0.9435629844665527, -0.8953986167907715, -0.8472342491149902, -0.799069881439209, -0.7509055137634277, -0.7027411460876465, -0.6545767784118652, -0.606412410736084, -0.5582480430603027, -0.5100836753845215, -0.46191930770874023, -0.413754940032959, -0.36559057235717773, -0.3174262046813965, -0.26926183700561523, -0.22109746932983398, -0.17293310165405273, -0.12476873397827148, -0.07660436630249023, -0.028439998626708984, 0.019724369049072266, 0.06788873672485352, 0.11605310440063477, 0.16421747207641602, 0.21238183975219727, 0.2605462074279785, 0.30871057510375977, 0.356874942779541, 0.40503931045532227, 0.4532036781311035, 0.5013680458068848, 0.549532413482666, 0.5976967811584473, 0.6458611488342285, 0.6940255165100098, 0.742189884185791, 0.7903542518615723, 0.8385186195373535, 0.8866829872131348, 0.934847354888916, 0.9830117225646973, 1.0311760902404785, 1.0793404579162598, 1.127504825592041, 1.1756691932678223, 1.2238335609436035, 1.2719979286193848]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 6.0, 19.0, 46.0, 182.0, 635.0, 3850.0, 153918.0, 883016.0, 5693.0, 869.0, 188.0, 54.0, 33.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.401123046875, -5.25146484375, -5.101806640625, -4.9521484375, -4.802490234375, -4.65283203125, -4.503173828125, -4.353515625, -4.203857421875, -4.05419921875, -3.904541015625, -3.7548828125, -3.605224609375, -3.45556640625, -3.305908203125, -3.15625, -3.006591796875, -2.85693359375, -2.707275390625, -2.5576171875, -2.407958984375, -2.25830078125, -2.108642578125, -1.958984375, -1.809326171875, -1.65966796875, -1.510009765625, -1.3603515625, -1.210693359375, -1.06103515625, -0.911376953125, -0.76171875, -0.612060546875, -0.46240234375, -0.312744140625, -0.1630859375, -0.013427734375, 0.13623046875, 0.285888671875, 0.435546875, 0.585205078125, 0.73486328125, 0.884521484375, 1.0341796875, 1.183837890625, 1.33349609375, 1.483154296875, 1.6328125, 1.782470703125, 1.93212890625, 2.081787109375, 2.2314453125, 2.381103515625, 2.53076171875, 2.680419921875, 2.830078125, 2.979736328125, 3.12939453125, 3.279052734375, 3.4287109375, 3.578369140625, 3.72802734375, 3.877685546875, 4.02734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 18.0, 41.0, 52.0, 87.0, 148.0, 146.0, 184.0, 122.0, 85.0, 61.0, 23.0, 13.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.409027099609375, -2.25750732421875, -2.105987548828125, -1.9544677734375, -1.802947998046875, -1.65142822265625, -1.499908447265625, -1.348388671875, -1.196868896484375, -1.04534912109375, -0.893829345703125, -0.7423095703125, -0.590789794921875, -0.43927001953125, -0.287750244140625, -0.13623046875, 0.015289306640625, 0.16680908203125, 0.318328857421875, 0.4698486328125, 0.621368408203125, 0.77288818359375, 0.924407958984375, 1.075927734375, 1.227447509765625, 1.37896728515625, 1.530487060546875, 1.6820068359375, 1.833526611328125, 1.98504638671875, 2.136566162109375, 2.2880859375, 2.439605712890625, 2.59112548828125, 2.742645263671875, 2.8941650390625, 3.045684814453125, 3.19720458984375, 3.348724365234375, 3.500244140625, 3.651763916015625, 3.80328369140625, 3.954803466796875, 4.1063232421875, 4.257843017578125, 4.40936279296875, 4.560882568359375, 4.71240234375, 4.863922119140625, 5.01544189453125, 5.166961669921875, 5.3184814453125, 5.470001220703125, 5.62152099609375, 5.773040771484375, 5.924560546875, 6.076080322265625, 6.22760009765625, 6.379119873046875, 6.5306396484375, 6.682159423828125, 6.83367919921875, 6.985198974609375, 7.13671875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 6.0, 5.0, 6.0, 7.0, 8.0, 21.0, 7.0, 19.0, 24.0, 36.0, 48.0, 48.0, 62.0, 82.0, 120.0, 193.0, 285.0, 536.0, 1225.0, 3680.0, 18013.0, 880941.0, 129064.0, 9440.0, 2419.0, 902.0, 449.0, 265.0, 141.0, 115.0, 96.0, 56.0, 55.0, 41.0, 32.0, 20.0, 18.0, 18.0, 15.0, 8.0, 7.0, 8.0, 5.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.532745361328125, -2.46002197265625, -2.387298583984375, -2.3145751953125, -2.241851806640625, -2.16912841796875, -2.096405029296875, -2.023681640625, -1.950958251953125, -1.87823486328125, -1.805511474609375, -1.7327880859375, -1.660064697265625, -1.58734130859375, -1.514617919921875, -1.44189453125, -1.369171142578125, -1.29644775390625, -1.223724365234375, -1.1510009765625, -1.078277587890625, -1.00555419921875, -0.932830810546875, -0.860107421875, -0.787384033203125, -0.71466064453125, -0.641937255859375, -0.5692138671875, -0.496490478515625, -0.42376708984375, -0.351043701171875, -0.2783203125, -0.205596923828125, -0.13287353515625, -0.060150146484375, 0.0125732421875, 0.085296630859375, 0.15802001953125, 0.230743408203125, 0.303466796875, 0.376190185546875, 0.44891357421875, 0.521636962890625, 0.5943603515625, 0.667083740234375, 0.73980712890625, 0.812530517578125, 0.88525390625, 0.957977294921875, 1.03070068359375, 1.103424072265625, 1.1761474609375, 1.248870849609375, 1.32159423828125, 1.394317626953125, 1.467041015625, 1.539764404296875, 1.61248779296875, 1.685211181640625, 1.7579345703125, 1.830657958984375, 1.90338134765625, 1.976104736328125, 2.048828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 10.0, 13.0, 8.0, 10.0, 18.0, 21.0, 23.0, 21.0, 24.0, 21.0, 28.0, 36.0, 47.0, 40.0, 49.0, 35.0, 38.0, 60.0, 40.0, 53.0, 36.0, 40.0, 32.0, 24.0, 33.0, 28.0, 24.0, 31.0, 22.0, 17.0, 19.0, 21.0, 9.0, 18.0, 7.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4453125, -1.4024200439453125, -1.359527587890625, -1.3166351318359375, -1.27374267578125, -1.2308502197265625, -1.187957763671875, -1.1450653076171875, -1.1021728515625, -1.0592803955078125, -1.016387939453125, -0.9734954833984375, -0.93060302734375, -0.8877105712890625, -0.844818115234375, -0.8019256591796875, -0.759033203125, -0.7161407470703125, -0.673248291015625, -0.6303558349609375, -0.58746337890625, -0.5445709228515625, -0.501678466796875, -0.4587860107421875, -0.4158935546875, -0.3730010986328125, -0.330108642578125, -0.2872161865234375, -0.24432373046875, -0.2014312744140625, -0.158538818359375, -0.1156463623046875, -0.07275390625, -0.0298614501953125, 0.013031005859375, 0.0559234619140625, 0.09881591796875, 0.1417083740234375, 0.184600830078125, 0.2274932861328125, 0.2703857421875, 0.3132781982421875, 0.356170654296875, 0.3990631103515625, 0.44195556640625, 0.4848480224609375, 0.527740478515625, 0.5706329345703125, 0.613525390625, 0.6564178466796875, 0.699310302734375, 0.7422027587890625, 0.78509521484375, 0.8279876708984375, 0.870880126953125, 0.9137725830078125, 0.9566650390625, 0.9995574951171875, 1.042449951171875, 1.0853424072265625, 1.12823486328125, 1.1711273193359375, 1.214019775390625, 1.2569122314453125, 1.2998046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 7.0, 7.0, 9.0, 13.0, 24.0, 29.0, 44.0, 72.0, 146.0, 268.0, 602.0, 1745.0, 7381.0, 64764.0, 913148.0, 51111.0, 6590.0, 1501.0, 551.0, 245.0, 105.0, 74.0, 37.0, 21.0, 21.0, 13.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2847442626953125, -0.273101806640625, -0.2614593505859375, -0.24981689453125, -0.2381744384765625, -0.226531982421875, -0.2148895263671875, -0.2032470703125, -0.1916046142578125, -0.179962158203125, -0.1683197021484375, -0.15667724609375, -0.1450347900390625, -0.133392333984375, -0.1217498779296875, -0.110107421875, -0.0984649658203125, -0.086822509765625, -0.0751800537109375, -0.06353759765625, -0.0518951416015625, -0.040252685546875, -0.0286102294921875, -0.0169677734375, -0.0053253173828125, 0.006317138671875, 0.0179595947265625, 0.02960205078125, 0.0412445068359375, 0.052886962890625, 0.0645294189453125, 0.076171875, 0.0878143310546875, 0.099456787109375, 0.1110992431640625, 0.12274169921875, 0.1343841552734375, 0.146026611328125, 0.1576690673828125, 0.1693115234375, 0.1809539794921875, 0.192596435546875, 0.2042388916015625, 0.21588134765625, 0.2275238037109375, 0.239166259765625, 0.2508087158203125, 0.262451171875, 0.2740936279296875, 0.285736083984375, 0.2973785400390625, 0.30902099609375, 0.3206634521484375, 0.332305908203125, 0.3439483642578125, 0.3555908203125, 0.3672332763671875, 0.378875732421875, 0.3905181884765625, 0.40216064453125, 0.4138031005859375, 0.425445556640625, 0.4370880126953125, 0.44873046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 11.0, 5.0, 12.0, 26.0, 25.0, 44.0, 93.0, 149.0, 207.0, 153.0, 100.0, 57.0, 28.0, 20.0, 11.0, 11.0, 10.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082918167114258e-05, -3.9686448872089386e-05, -3.8543716073036194e-05, -3.7400983273983e-05, -3.625825047492981e-05, -3.511551767587662e-05, -3.3972784876823425e-05, -3.283005207777023e-05, -3.168731927871704e-05, -3.054458647966385e-05, -2.9401853680610657e-05, -2.8259120881557465e-05, -2.7116388082504272e-05, -2.597365528345108e-05, -2.4830922484397888e-05, -2.3688189685344696e-05, -2.2545456886291504e-05, -2.1402724087238312e-05, -2.025999128818512e-05, -1.9117258489131927e-05, -1.7974525690078735e-05, -1.6831792891025543e-05, -1.568906009197235e-05, -1.4546327292919159e-05, -1.3403594493865967e-05, -1.2260861694812775e-05, -1.1118128895759583e-05, -9.97539609670639e-06, -8.832663297653198e-06, -7.689930498600006e-06, -6.547197699546814e-06, -5.404464900493622e-06, -4.26173210144043e-06, -3.1189993023872375e-06, -1.9762665033340454e-06, -8.335337042808533e-07, 3.0919909477233887e-07, 1.451931893825531e-06, 2.594664692878723e-06, 3.7373974919319153e-06, 4.880130290985107e-06, 6.0228630900382996e-06, 7.165595889091492e-06, 8.308328688144684e-06, 9.451061487197876e-06, 1.0593794286251068e-05, 1.173652708530426e-05, 1.2879259884357452e-05, 1.4021992683410645e-05, 1.5164725482463837e-05, 1.630745828151703e-05, 1.745019108057022e-05, 1.8592923879623413e-05, 1.9735656678676605e-05, 2.0878389477729797e-05, 2.202112227678299e-05, 2.316385507583618e-05, 2.4306587874889374e-05, 2.5449320673942566e-05, 2.6592053472995758e-05, 2.773478627204895e-05, 2.8877519071102142e-05, 3.0020251870155334e-05, 3.1162984669208527e-05, 3.230571746826172e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 15.0, 20.0, 35.0, 57.0, 77.0, 135.0, 204.0, 436.0, 952.0, 2307.0, 7574.0, 44677.0, 872694.0, 101725.0, 11885.0, 3242.0, 1199.0, 532.0, 290.0, 169.0, 95.0, 64.0, 41.0, 30.0, 18.0, 11.0, 10.0, 4.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.343017578125, -0.3321800231933594, -0.32134246826171875, -0.3105049133300781, -0.2996673583984375, -0.2888298034667969, -0.27799224853515625, -0.2671546936035156, -0.256317138671875, -0.24547958374023438, -0.23464202880859375, -0.22380447387695312, -0.2129669189453125, -0.20212936401367188, -0.19129180908203125, -0.18045425415039062, -0.16961669921875, -0.15877914428710938, -0.14794158935546875, -0.13710403442382812, -0.1262664794921875, -0.11542892456054688, -0.10459136962890625, -0.09375381469726562, -0.082916259765625, -0.07207870483398438, -0.06124114990234375, -0.050403594970703125, -0.0395660400390625, -0.028728485107421875, -0.01789093017578125, -0.007053375244140625, 0.0037841796875, 0.014621734619140625, 0.02545928955078125, 0.036296844482421875, 0.0471343994140625, 0.057971954345703125, 0.06880950927734375, 0.07964706420898438, 0.090484619140625, 0.10132217407226562, 0.11215972900390625, 0.12299728393554688, 0.1338348388671875, 0.14467239379882812, 0.15550994873046875, 0.16634750366210938, 0.17718505859375, 0.18802261352539062, 0.19886016845703125, 0.20969772338867188, 0.2205352783203125, 0.23137283325195312, 0.24221038818359375, 0.2530479431152344, 0.263885498046875, 0.2747230529785156, 0.28556060791015625, 0.2963981628417969, 0.3072357177734375, 0.3180732727050781, 0.32891082763671875, 0.3397483825683594, 0.3505859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 7.0, 6.0, 13.0, 14.0, 15.0, 29.0, 36.0, 57.0, 107.0, 169.0, 206.0, 144.0, 60.0, 34.0, 26.0, 20.0, 10.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1260986328125, -0.12218761444091797, -0.11827659606933594, -0.1143655776977539, -0.11045455932617188, -0.10654354095458984, -0.10263252258300781, -0.09872150421142578, -0.09481048583984375, -0.09089946746826172, -0.08698844909667969, -0.08307743072509766, -0.07916641235351562, -0.0752553939819336, -0.07134437561035156, -0.06743335723876953, -0.0635223388671875, -0.05961132049560547, -0.05570030212402344, -0.051789283752441406, -0.047878265380859375, -0.043967247009277344, -0.04005622863769531, -0.03614521026611328, -0.03223419189453125, -0.02832317352294922, -0.024412155151367188, -0.020501136779785156, -0.016590118408203125, -0.012679100036621094, -0.008768081665039062, -0.004857063293457031, -0.000946044921875, 0.0029649734497070312, 0.0068759918212890625, 0.010787010192871094, 0.014698028564453125, 0.018609046936035156, 0.022520065307617188, 0.02643108367919922, 0.03034210205078125, 0.03425312042236328, 0.03816413879394531, 0.042075157165527344, 0.045986175537109375, 0.049897193908691406, 0.05380821228027344, 0.05771923065185547, 0.0616302490234375, 0.06554126739501953, 0.06945228576660156, 0.0733633041381836, 0.07727432250976562, 0.08118534088134766, 0.08509635925292969, 0.08900737762451172, 0.09291839599609375, 0.09682941436767578, 0.10074043273925781, 0.10465145111083984, 0.10856246948242188, 0.1124734878540039, 0.11638450622558594, 0.12029552459716797, 0.12420654296875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 28.0, 79.0, 204.0, 351.0, 197.0, 66.0, 33.0, 12.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.962121963500977, -7.778932094573975, -7.5957417488098145, -7.4125518798828125, -7.2293620109558105, -7.046172142028809, -6.862981796264648, -6.6797919273376465, -6.4966020584106445, -6.313412189483643, -6.130221843719482, -5.9470319747924805, -5.7638421058654785, -5.580652236938477, -5.397461891174316, -5.2142720222473145, -5.031081676483154, -4.847891807556152, -4.664701461791992, -4.48151159286499, -4.298321723937988, -4.115131378173828, -3.931941509246826, -3.748751640319824, -3.565561532974243, -3.382371425628662, -3.19918155670166, -3.015991449356079, -2.832801342010498, -2.649611473083496, -2.466421365737915, -2.283231258392334, -2.100041389465332, -1.9168514013290405, -1.733661413192749, -1.550471305847168, -1.3672813177108765, -1.184091329574585, -1.000901222229004, -0.8177112340927124, -0.6345212459564209, -0.451331228017807, -0.2681412100791931, -0.08495116233825684, 0.09823882579803467, 0.28142881393432617, 0.4646189212799072, 0.6478089094161987, 0.8309988975524902, 1.0141888856887817, 1.1973788738250732, 1.3805689811706543, 1.5637589693069458, 1.7469489574432373, 1.9301390647888184, 2.1133289337158203, 2.2965190410614014, 2.4797091484069824, 2.6628990173339844, 2.8460891246795654, 3.0292792320251465, 3.2124691009521484, 3.3956592082977295, 3.5788493156433105, 3.7620391845703125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 15.0, 23.0, 19.0, 32.0, 44.0, 52.0, 59.0, 59.0, 74.0, 82.0, 63.0, 73.0, 72.0, 68.0, 64.0, 44.0, 36.0, 41.0, 21.0, 21.0, 10.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.457720994949341, -2.319880962371826, -2.1820411682128906, -2.044201374053955, -1.9063613414764404, -1.7685214281082153, -1.6306815147399902, -1.4928416013717651, -1.35500168800354, -1.217161774635315, -1.0793218612670898, -0.9414819478988647, -0.8036420345306396, -0.6658021211624146, -0.5279622077941895, -0.39012229442596436, -0.25228238105773926, -0.11444246768951416, 0.023397445678710938, 0.16123735904693604, 0.29907727241516113, 0.43691718578338623, 0.5747570991516113, 0.7125970125198364, 0.8504369258880615, 0.9882768392562866, 1.1261167526245117, 1.2639566659927368, 1.401796579360962, 1.539636492729187, 1.677476406097412, 1.8153163194656372, 1.9531564712524414, 2.090996265411377, 2.2288362979888916, 2.3666763305664062, 2.504516124725342, 2.6423559188842773, 2.780195951461792, 2.9180359840393066, 3.055875778198242, 3.1937155723571777, 3.3315556049346924, 3.469395637512207, 3.6072354316711426, 3.745075225830078, 3.8829152584075928, 4.020755290985107, 4.158595085144043, 4.2964348793029785, 4.434274673461914, 4.572114944458008, 4.709954738616943, 4.847794532775879, 4.985634803771973, 5.123474597930908, 5.261314392089844, 5.399154186248779, 5.536993980407715, 5.674834251403809, 5.812674045562744, 5.95051383972168, 6.088354110717773, 6.226193904876709, 6.3640336990356445]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 12.0, 16.0, 32.0, 32.0, 52.0, 112.0, 165.0, 290.0, 513.0, 1064.0, 2546.0, 7845.0, 82427.0, 3549404.0, 519146.0, 22727.0, 4165.0, 2004.0, 843.0, 373.0, 194.0, 102.0, 76.0, 47.0, 31.0, 21.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.056640625, -2.975677490234375, -2.89471435546875, -2.813751220703125, -2.7327880859375, -2.651824951171875, -2.57086181640625, -2.489898681640625, -2.408935546875, -2.327972412109375, -2.24700927734375, -2.166046142578125, -2.0850830078125, -2.004119873046875, -1.92315673828125, -1.842193603515625, -1.76123046875, -1.680267333984375, -1.59930419921875, -1.518341064453125, -1.4373779296875, -1.356414794921875, -1.27545166015625, -1.194488525390625, -1.113525390625, -1.032562255859375, -0.95159912109375, -0.870635986328125, -0.7896728515625, -0.708709716796875, -0.62774658203125, -0.546783447265625, -0.4658203125, -0.384857177734375, -0.30389404296875, -0.222930908203125, -0.1419677734375, -0.061004638671875, 0.01995849609375, 0.100921630859375, 0.181884765625, 0.262847900390625, 0.34381103515625, 0.424774169921875, 0.5057373046875, 0.586700439453125, 0.66766357421875, 0.748626708984375, 0.82958984375, 0.910552978515625, 0.99151611328125, 1.072479248046875, 1.1534423828125, 1.234405517578125, 1.31536865234375, 1.396331787109375, 1.477294921875, 1.558258056640625, 1.63922119140625, 1.720184326171875, 1.8011474609375, 1.882110595703125, 1.96307373046875, 2.044036865234375, 2.125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 6.0, 6.0, 10.0, 14.0, 18.0, 17.0, 34.0, 51.0, 59.0, 75.0, 78.0, 85.0, 106.0, 104.0, 81.0, 61.0, 64.0, 43.0, 29.0, 13.0, 14.0, 13.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.12109375, -2.0625, -2.00390625, -1.9453125, -1.88671875, -1.828125, -1.76953125, -1.7109375, -1.65234375, -1.59375, -1.53515625, -1.4765625, -1.41796875, -1.359375, -1.30078125, -1.2421875, -1.18359375, -1.125, -1.06640625, -1.0078125, -0.94921875, -0.890625, -0.83203125, -0.7734375, -0.71484375, -0.65625, -0.59765625, -0.5390625, -0.48046875, -0.421875, -0.36328125, -0.3046875, -0.24609375, -0.1875, -0.12890625, -0.0703125, -0.01171875, 0.046875, 0.10546875, 0.1640625, 0.22265625, 0.28125, 0.33984375, 0.3984375, 0.45703125, 0.515625, 0.57421875, 0.6328125, 0.69140625, 0.75, 0.80859375, 0.8671875, 0.92578125, 0.984375, 1.04296875, 1.1015625, 1.16015625, 1.21875, 1.27734375, 1.3359375, 1.39453125, 1.453125, 1.51171875, 1.5703125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 13.0, 26.0, 55.0, 163.0, 632.0, 9759.0, 4178438.0, 4553.0, 441.0, 117.0, 32.0, 24.0, 12.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.4014892578125, -15.029541015625, -14.6575927734375, -14.28564453125, -13.9136962890625, -13.541748046875, -13.1697998046875, -12.7978515625, -12.4259033203125, -12.053955078125, -11.6820068359375, -11.31005859375, -10.9381103515625, -10.566162109375, -10.1942138671875, -9.822265625, -9.4503173828125, -9.078369140625, -8.7064208984375, -8.33447265625, -7.9625244140625, -7.590576171875, -7.2186279296875, -6.8466796875, -6.4747314453125, -6.102783203125, -5.7308349609375, -5.35888671875, -4.9869384765625, -4.614990234375, -4.2430419921875, -3.87109375, -3.4991455078125, -3.127197265625, -2.7552490234375, -2.38330078125, -2.0113525390625, -1.639404296875, -1.2674560546875, -0.8955078125, -0.5235595703125, -0.151611328125, 0.2203369140625, 0.59228515625, 0.9642333984375, 1.336181640625, 1.7081298828125, 2.080078125, 2.4520263671875, 2.823974609375, 3.1959228515625, 3.56787109375, 3.9398193359375, 4.311767578125, 4.6837158203125, 5.0556640625, 5.4276123046875, 5.799560546875, 6.1715087890625, 6.54345703125, 6.9154052734375, 7.287353515625, 7.6593017578125, 8.03125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 12.0, 31.0, 78.0, 422.0, 2589.0, 742.0, 99.0, 39.0, 21.0, 16.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.7972564697265625, -0.758575439453125, -0.7198944091796875, -0.68121337890625, -0.6425323486328125, -0.603851318359375, -0.5651702880859375, -0.5264892578125, -0.4878082275390625, -0.449127197265625, -0.4104461669921875, -0.37176513671875, -0.3330841064453125, -0.294403076171875, -0.2557220458984375, -0.217041015625, -0.1783599853515625, -0.139678955078125, -0.1009979248046875, -0.06231689453125, -0.0236358642578125, 0.015045166015625, 0.0537261962890625, 0.0924072265625, 0.1310882568359375, 0.169769287109375, 0.2084503173828125, 0.24713134765625, 0.2858123779296875, 0.324493408203125, 0.3631744384765625, 0.40185546875, 0.4405364990234375, 0.479217529296875, 0.5178985595703125, 0.55657958984375, 0.5952606201171875, 0.633941650390625, 0.6726226806640625, 0.7113037109375, 0.7499847412109375, 0.788665771484375, 0.8273468017578125, 0.86602783203125, 0.9047088623046875, 0.943389892578125, 0.9820709228515625, 1.020751953125, 1.0594329833984375, 1.098114013671875, 1.1367950439453125, 1.17547607421875, 1.2141571044921875, 1.252838134765625, 1.2915191650390625, 1.3302001953125, 1.3688812255859375, 1.407562255859375, 1.4462432861328125, 1.48492431640625, 1.5236053466796875, 1.562286376953125, 1.6009674072265625, 1.6396484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 10.0, 19.0, 39.0, 74.0, 173.0, 277.0, 184.0, 105.0, 47.0, 34.0, 13.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.185263633728027, -4.067671775817871, -3.9500796794891357, -3.8324875831604004, -3.714895486831665, -3.5973033905029297, -3.4797115325927734, -3.362119436264038, -3.2445273399353027, -3.1269352436065674, -3.009343385696411, -2.891751289367676, -2.7741591930389404, -2.656567096710205, -2.538975238800049, -2.4213831424713135, -2.3037912845611572, -2.186199188232422, -2.0686073303222656, -1.9510152339935303, -1.833423137664795, -1.7158311605453491, -1.5982391834259033, -1.480647087097168, -1.3630551099777222, -1.2454631328582764, -1.127871036529541, -1.0102790594100952, -0.8926870226860046, -0.7750949859619141, -0.6575030088424683, -0.5399109721183777, -0.4223191738128662, -0.30472713708877563, -0.18713513016700745, -0.06954312324523926, 0.04804891347885132, 0.1656409502029419, 0.2832329273223877, 0.40082496404647827, 0.5184170007705688, 0.6360090374946594, 0.75360107421875, 0.8711930513381958, 0.9887850880622864, 1.106377124786377, 1.2239691019058228, 1.3415610790252686, 1.459153175354004, 1.5767451524734497, 1.694337248802185, 1.8119292259216309, 1.9295213222503662, 2.0471134185791016, 2.164705276489258, 2.282297372817993, 2.3998894691467285, 2.517481565475464, 2.63507342338562, 2.7526655197143555, 2.870257616043091, 2.987849712371826, 3.1054415702819824, 3.2230336666107178, 3.340625524520874]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 14.0, 8.0, 15.0, 18.0, 34.0, 38.0, 39.0, 51.0, 66.0, 67.0, 77.0, 76.0, 68.0, 75.0, 58.0, 65.0, 55.0, 49.0, 33.0, 24.0, 21.0, 11.0, 11.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0943245887756348, -2.038926124572754, -1.9835278987884521, -1.9281295537948608, -1.8727312088012695, -1.8173328638076782, -1.761934518814087, -1.7065361738204956, -1.6511378288269043, -1.595739483833313, -1.5403411388397217, -1.4849427938461304, -1.429544448852539, -1.3741461038589478, -1.3187477588653564, -1.2633494138717651, -1.2079510688781738, -1.1525527238845825, -1.0971543788909912, -1.0417560338974, -0.9863576889038086, -0.9309593439102173, -0.875560998916626, -0.8201626539230347, -0.7647643089294434, -0.709365963935852, -0.6539676189422607, -0.5985692739486694, -0.5431709289550781, -0.4877725839614868, -0.4323742389678955, -0.3769758939743042, -0.32157766819000244, -0.26617932319641113, -0.21078097820281982, -0.15538263320922852, -0.09998428821563721, -0.0445859432220459, 0.01081240177154541, 0.06621074676513672, 0.12160909175872803, 0.17700743675231934, 0.23240578174591064, 0.28780412673950195, 0.34320247173309326, 0.39860081672668457, 0.4539991617202759, 0.5093975067138672, 0.5647958517074585, 0.6201941967010498, 0.6755925416946411, 0.7309908866882324, 0.7863892316818237, 0.841787576675415, 0.8971859216690063, 0.9525842666625977, 1.007982611656189, 1.0633809566497803, 1.1187793016433716, 1.174177646636963, 1.2295759916305542, 1.2849743366241455, 1.3403726816177368, 1.3957710266113281, 1.4511693716049194]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 1.0, 2.0, 7.0, 6.0, 6.0, 14.0, 19.0, 30.0, 54.0, 78.0, 164.0, 301.0, 589.0, 1272.0, 2850.0, 7962.0, 33878.0, 671775.0, 296371.0, 22463.0, 6190.0, 2353.0, 1077.0, 495.0, 254.0, 137.0, 77.0, 41.0, 30.0, 18.0, 12.0, 5.0, 13.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69091796875, -0.671112060546875, -0.65130615234375, -0.631500244140625, -0.6116943359375, -0.591888427734375, -0.57208251953125, -0.552276611328125, -0.532470703125, -0.512664794921875, -0.49285888671875, -0.473052978515625, -0.4532470703125, -0.433441162109375, -0.41363525390625, -0.393829345703125, -0.3740234375, -0.354217529296875, -0.33441162109375, -0.314605712890625, -0.2947998046875, -0.274993896484375, -0.25518798828125, -0.235382080078125, -0.215576171875, -0.195770263671875, -0.17596435546875, -0.156158447265625, -0.1363525390625, -0.116546630859375, -0.09674072265625, -0.076934814453125, -0.05712890625, -0.037322998046875, -0.01751708984375, 0.002288818359375, 0.0220947265625, 0.041900634765625, 0.06170654296875, 0.081512451171875, 0.101318359375, 0.121124267578125, 0.14093017578125, 0.160736083984375, 0.1805419921875, 0.200347900390625, 0.22015380859375, 0.239959716796875, 0.259765625, 0.279571533203125, 0.29937744140625, 0.319183349609375, 0.3389892578125, 0.358795166015625, 0.37860107421875, 0.398406982421875, 0.418212890625, 0.438018798828125, 0.45782470703125, 0.477630615234375, 0.4974365234375, 0.517242431640625, 0.53704833984375, 0.556854248046875, 0.57666015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 12.0, 11.0, 15.0, 23.0, 35.0, 38.0, 56.0, 86.0, 91.0, 108.0, 98.0, 86.0, 85.0, 66.0, 56.0, 46.0, 26.0, 19.0, 14.0, 11.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.07421875, -2.0261688232421875, -1.978118896484375, -1.9300689697265625, -1.88201904296875, -1.8339691162109375, -1.785919189453125, -1.7378692626953125, -1.6898193359375, -1.6417694091796875, -1.593719482421875, -1.5456695556640625, -1.49761962890625, -1.4495697021484375, -1.401519775390625, -1.3534698486328125, -1.305419921875, -1.2573699951171875, -1.209320068359375, -1.1612701416015625, -1.11322021484375, -1.0651702880859375, -1.017120361328125, -0.9690704345703125, -0.9210205078125, -0.8729705810546875, -0.824920654296875, -0.7768707275390625, -0.72882080078125, -0.6807708740234375, -0.632720947265625, -0.5846710205078125, -0.53662109375, -0.4885711669921875, -0.440521240234375, -0.3924713134765625, -0.34442138671875, -0.2963714599609375, -0.248321533203125, -0.2002716064453125, -0.1522216796875, -0.1041717529296875, -0.056121826171875, -0.0080718994140625, 0.03997802734375, 0.0880279541015625, 0.136077880859375, 0.1841278076171875, 0.232177734375, 0.2802276611328125, 0.328277587890625, 0.3763275146484375, 0.42437744140625, 0.4724273681640625, 0.520477294921875, 0.5685272216796875, 0.6165771484375, 0.6646270751953125, 0.712677001953125, 0.7607269287109375, 0.80877685546875, 0.8568267822265625, 0.904876708984375, 0.9529266357421875, 1.0009765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 8.0, 13.0, 12.0, 36.0, 40.0, 45.0, 57.0, 79.0, 124.0, 184.0, 283.0, 459.0, 649.0, 1008.0, 1651.0, 3000.0, 5629.0, 12389.0, 33426.0, 133220.0, 572796.0, 206510.0, 45924.0, 15471.0, 6828.0, 3461.0, 1925.0, 1170.0, 719.0, 486.0, 271.0, 198.0, 165.0, 79.0, 64.0, 42.0, 39.0, 21.0, 22.0, 17.0, 7.0, 10.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2578125, -0.2499103546142578, -0.24200820922851562, -0.23410606384277344, -0.22620391845703125, -0.21830177307128906, -0.21039962768554688, -0.2024974822998047, -0.1945953369140625, -0.1866931915283203, -0.17879104614257812, -0.17088890075683594, -0.16298675537109375, -0.15508460998535156, -0.14718246459960938, -0.1392803192138672, -0.131378173828125, -0.12347602844238281, -0.11557388305664062, -0.10767173767089844, -0.09976959228515625, -0.09186744689941406, -0.08396530151367188, -0.07606315612792969, -0.0681610107421875, -0.06025886535644531, -0.052356719970703125, -0.04445457458496094, -0.03655242919921875, -0.028650283813476562, -0.020748138427734375, -0.012845993041992188, -0.00494384765625, 0.0029582977294921875, 0.010860443115234375, 0.018762588500976562, 0.02666473388671875, 0.03456687927246094, 0.042469024658203125, 0.05037117004394531, 0.0582733154296875, 0.06617546081542969, 0.07407760620117188, 0.08197975158691406, 0.08988189697265625, 0.09778404235839844, 0.10568618774414062, 0.11358833312988281, 0.121490478515625, 0.1293926239013672, 0.13729476928710938, 0.14519691467285156, 0.15309906005859375, 0.16100120544433594, 0.16890335083007812, 0.1768054962158203, 0.1847076416015625, 0.1926097869873047, 0.20051193237304688, 0.20841407775878906, 0.21631622314453125, 0.22421836853027344, 0.23212051391601562, 0.2400226593017578, 0.2479248046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 9.0, 7.0, 11.0, 10.0, 17.0, 17.0, 22.0, 28.0, 27.0, 36.0, 34.0, 38.0, 45.0, 34.0, 54.0, 46.0, 56.0, 58.0, 57.0, 40.0, 33.0, 38.0, 39.0, 38.0, 30.0, 35.0, 23.0, 18.0, 13.0, 18.0, 9.0, 12.0, 9.0, 7.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.708984375, -1.6570587158203125, -1.605133056640625, -1.5532073974609375, -1.50128173828125, -1.4493560791015625, -1.397430419921875, -1.3455047607421875, -1.2935791015625, -1.2416534423828125, -1.189727783203125, -1.1378021240234375, -1.08587646484375, -1.0339508056640625, -0.982025146484375, -0.9300994873046875, -0.878173828125, -0.8262481689453125, -0.774322509765625, -0.7223968505859375, -0.67047119140625, -0.6185455322265625, -0.566619873046875, -0.5146942138671875, -0.4627685546875, -0.4108428955078125, -0.358917236328125, -0.3069915771484375, -0.25506591796875, -0.2031402587890625, -0.151214599609375, -0.0992889404296875, -0.04736328125, 0.0045623779296875, 0.056488037109375, 0.1084136962890625, 0.16033935546875, 0.2122650146484375, 0.264190673828125, 0.3161163330078125, 0.3680419921875, 0.4199676513671875, 0.471893310546875, 0.5238189697265625, 0.57574462890625, 0.6276702880859375, 0.679595947265625, 0.7315216064453125, 0.783447265625, 0.8353729248046875, 0.887298583984375, 0.9392242431640625, 0.99114990234375, 1.0430755615234375, 1.095001220703125, 1.1469268798828125, 1.1988525390625, 1.2507781982421875, 1.302703857421875, 1.3546295166015625, 1.40655517578125, 1.4584808349609375, 1.510406494140625, 1.5623321533203125, 1.6142578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 12.0, 16.0, 14.0, 13.0, 29.0, 38.0, 65.0, 84.0, 113.0, 194.0, 318.0, 480.0, 866.0, 1527.0, 2990.0, 7101.0, 19018.0, 69654.0, 501464.0, 360428.0, 55683.0, 16161.0, 6054.0, 2779.0, 1413.0, 755.0, 426.0, 288.0, 172.0, 107.0, 81.0, 63.0, 46.0, 25.0, 16.0, 22.0, 8.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.09039306640625, -0.08780479431152344, -0.08521652221679688, -0.08262825012207031, -0.08003997802734375, -0.07745170593261719, -0.07486343383789062, -0.07227516174316406, -0.0696868896484375, -0.06709861755371094, -0.06451034545898438, -0.06192207336425781, -0.05933380126953125, -0.05674552917480469, -0.054157257080078125, -0.05156898498535156, -0.048980712890625, -0.04639244079589844, -0.043804168701171875, -0.04121589660644531, -0.03862762451171875, -0.03603935241699219, -0.033451080322265625, -0.030862808227539062, -0.0282745361328125, -0.025686264038085938, -0.023097991943359375, -0.020509719848632812, -0.01792144775390625, -0.015333175659179688, -0.012744903564453125, -0.010156631469726562, -0.007568359375, -0.0049800872802734375, -0.002391815185546875, 0.0001964569091796875, 0.00278472900390625, 0.0053730010986328125, 0.007961273193359375, 0.010549545288085938, 0.0131378173828125, 0.015726089477539062, 0.018314361572265625, 0.020902633666992188, 0.02349090576171875, 0.026079177856445312, 0.028667449951171875, 0.03125572204589844, 0.033843994140625, 0.03643226623535156, 0.039020538330078125, 0.04160881042480469, 0.04419708251953125, 0.04678535461425781, 0.049373626708984375, 0.05196189880371094, 0.0545501708984375, 0.05713844299316406, 0.059726715087890625, 0.06231498718261719, 0.06490325927734375, 0.06749153137207031, 0.07007980346679688, 0.07266807556152344, 0.07525634765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 12.0, 9.0, 8.0, 17.0, 26.0, 44.0, 56.0, 94.0, 136.0, 187.0, 133.0, 75.0, 36.0, 42.0, 23.0, 23.0, 7.0, 10.0, 10.0, 3.0, 7.0, 6.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.227327346801758e-05, -5.043204873800278e-05, -4.8590824007987976e-05, -4.6749599277973175e-05, -4.4908374547958374e-05, -4.306714981794357e-05, -4.122592508792877e-05, -3.938470035791397e-05, -3.754347562789917e-05, -3.570225089788437e-05, -3.386102616786957e-05, -3.201980143785477e-05, -3.0178576707839966e-05, -2.8337351977825165e-05, -2.6496127247810364e-05, -2.4654902517795563e-05, -2.2813677787780762e-05, -2.097245305776596e-05, -1.913122832775116e-05, -1.729000359773636e-05, -1.5448778867721558e-05, -1.3607554137706757e-05, -1.1766329407691956e-05, -9.925104677677155e-06, -8.083879947662354e-06, -6.2426552176475525e-06, -4.4014304876327515e-06, -2.5602057576179504e-06, -7.189810276031494e-07, 1.1222437024116516e-06, 2.9634684324264526e-06, 4.804693162441254e-06, 6.645917892456055e-06, 8.487142622470856e-06, 1.0328367352485657e-05, 1.2169592082500458e-05, 1.4010816812515259e-05, 1.585204154253006e-05, 1.769326627254486e-05, 1.9534491002559662e-05, 2.1375715732574463e-05, 2.3216940462589264e-05, 2.5058165192604065e-05, 2.6899389922618866e-05, 2.8740614652633667e-05, 3.058183938264847e-05, 3.242306411266327e-05, 3.426428884267807e-05, 3.610551357269287e-05, 3.794673830270767e-05, 3.978796303272247e-05, 4.1629187762737274e-05, 4.3470412492752075e-05, 4.5311637222766876e-05, 4.715286195278168e-05, 4.899408668279648e-05, 5.083531141281128e-05, 5.267653614282608e-05, 5.451776087284088e-05, 5.635898560285568e-05, 5.8200210332870483e-05, 6.0041435062885284e-05, 6.188265979290009e-05, 6.372388452291489e-05, 6.556510925292969e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 16.0, 14.0, 24.0, 32.0, 59.0, 97.0, 185.0, 349.0, 591.0, 1360.0, 3029.0, 8969.0, 41416.0, 623962.0, 328696.0, 28016.0, 6883.0, 2524.0, 1120.0, 544.0, 283.0, 145.0, 76.0, 56.0, 25.0, 25.0, 12.0, 13.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11419677734375, -0.11010265350341797, -0.10600852966308594, -0.1019144058227539, -0.09782028198242188, -0.09372615814208984, -0.08963203430175781, -0.08553791046142578, -0.08144378662109375, -0.07734966278076172, -0.07325553894042969, -0.06916141510009766, -0.06506729125976562, -0.060973167419433594, -0.05687904357910156, -0.05278491973876953, -0.0486907958984375, -0.04459667205810547, -0.04050254821777344, -0.036408424377441406, -0.032314300537109375, -0.028220176696777344, -0.024126052856445312, -0.02003192901611328, -0.01593780517578125, -0.011843681335449219, -0.0077495574951171875, -0.0036554336547851562, 0.000438690185546875, 0.004532814025878906, 0.008626937866210938, 0.012721061706542969, 0.016815185546875, 0.02090930938720703, 0.025003433227539062, 0.029097557067871094, 0.033191680908203125, 0.037285804748535156, 0.04137992858886719, 0.04547405242919922, 0.04956817626953125, 0.05366230010986328, 0.05775642395019531, 0.061850547790527344, 0.06594467163085938, 0.0700387954711914, 0.07413291931152344, 0.07822704315185547, 0.0823211669921875, 0.08641529083251953, 0.09050941467285156, 0.0946035385131836, 0.09869766235351562, 0.10279178619384766, 0.10688591003417969, 0.11098003387451172, 0.11507415771484375, 0.11916828155517578, 0.12326240539550781, 0.12735652923583984, 0.13145065307617188, 0.1355447769165039, 0.13963890075683594, 0.14373302459716797, 0.1478271484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 4.0, 8.0, 12.0, 13.0, 18.0, 23.0, 35.0, 51.0, 65.0, 77.0, 100.0, 140.0, 98.0, 89.0, 64.0, 37.0, 31.0, 35.0, 17.0, 19.0, 9.0, 8.0, 9.0, 4.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.024383544921875, -0.023694276809692383, -0.023005008697509766, -0.02231574058532715, -0.02162647247314453, -0.020937204360961914, -0.020247936248779297, -0.01955866813659668, -0.018869400024414062, -0.018180131912231445, -0.017490863800048828, -0.01680159568786621, -0.016112327575683594, -0.015423059463500977, -0.01473379135131836, -0.014044523239135742, -0.013355255126953125, -0.012665987014770508, -0.01197671890258789, -0.011287450790405273, -0.010598182678222656, -0.009908914566040039, -0.009219646453857422, -0.008530378341674805, -0.007841110229492188, -0.00715184211730957, -0.006462574005126953, -0.005773305892944336, -0.005084037780761719, -0.0043947696685791016, -0.0037055015563964844, -0.003016233444213867, -0.00232696533203125, -0.0016376972198486328, -0.0009484291076660156, -0.00025916099548339844, 0.00043010711669921875, 0.001119375228881836, 0.0018086433410644531, 0.0024979114532470703, 0.0031871795654296875, 0.0038764476776123047, 0.004565715789794922, 0.005254983901977539, 0.005944252014160156, 0.0066335201263427734, 0.007322788238525391, 0.008012056350708008, 0.008701324462890625, 0.009390592575073242, 0.01007986068725586, 0.010769128799438477, 0.011458396911621094, 0.012147665023803711, 0.012836933135986328, 0.013526201248168945, 0.014215469360351562, 0.01490473747253418, 0.015594005584716797, 0.016283273696899414, 0.01697254180908203, 0.01766180992126465, 0.018351078033447266, 0.019040346145629883, 0.0197296142578125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 26.0, 48.0, 204.0, 433.0, 192.0, 55.0, 24.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.729193687438965, -5.6084513664245605, -5.4877095222473145, -5.36696720123291, -5.246224880218506, -5.125482559204102, -5.0047407150268555, -4.883998394012451, -4.763256072998047, -4.642513751983643, -4.5217719078063965, -4.401029586791992, -4.280287265777588, -4.159544944763184, -4.0388031005859375, -3.918060779571533, -3.797318696975708, -3.676576614379883, -3.5558342933654785, -3.4350922107696533, -3.314349889755249, -3.193607807159424, -3.0728654861450195, -2.9521234035491943, -2.831381320953369, -2.710639238357544, -2.5898969173431396, -2.4691548347473145, -2.34841251373291, -2.227670431137085, -2.1069283485412598, -1.9861860275268555, -1.8654435873031616, -1.7447013854980469, -1.6239591836929321, -1.5032169818878174, -1.3824748992919922, -1.261732578277588, -1.1409904956817627, -1.020248293876648, -0.8995060920715332, -0.7787638902664185, -0.6580216884613037, -0.5372795462608337, -0.416537344455719, -0.29579514265060425, -0.17505300045013428, -0.05431079864501953, 0.06643140316009521, 0.18717359006404877, 0.3079157769680023, 0.4286579489707947, 0.5494001507759094, 0.6701423525810242, 0.7908844947814941, 0.9116266965866089, 1.0323688983917236, 1.1531111001968384, 1.2738533020019531, 1.3945953845977783, 1.5153377056121826, 1.6360797882080078, 1.7568219900131226, 1.8775641918182373, 1.998306393623352]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 13.0, 11.0, 17.0, 21.0, 39.0, 49.0, 53.0, 83.0, 86.0, 102.0, 95.0, 82.0, 89.0, 56.0, 68.0, 47.0, 31.0, 19.0, 13.0, 9.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9014041423797607, -1.8563053607940674, -1.811206579208374, -1.7661077976226807, -1.7210090160369873, -1.675910234451294, -1.6308114528656006, -1.5857127904891968, -1.5406140089035034, -1.49551522731781, -1.4504164457321167, -1.4053176641464233, -1.36021888256073, -1.3151202201843262, -1.2700214385986328, -1.2249226570129395, -1.179823875427246, -1.1347250938415527, -1.0896263122558594, -1.044527530670166, -0.9994288086891174, -0.9543300271034241, -0.9092312455177307, -0.8641325235366821, -0.8190336227416992, -0.7739348411560059, -0.7288360595703125, -0.6837372779846191, -0.6386385560035706, -0.5935397744178772, -0.5484409928321838, -0.5033422708511353, -0.4582434892654419, -0.41314470767974854, -0.36804595589637756, -0.3229471743106842, -0.27784842252731323, -0.23274964094161987, -0.1876508593559265, -0.14255210757255554, -0.09745332598686218, -0.05235455557703972, -0.007255785167217255, 0.03784298896789551, 0.08294175565242767, 0.12804052233695984, 0.1731393039226532, 0.21823805570602417, 0.26333683729171753, 0.3084356188774109, 0.35353437066078186, 0.3986331522464752, 0.4437319040298462, 0.48883068561553955, 0.5339294672012329, 0.5790282487869263, 0.6241270303726196, 0.669225811958313, 0.7143245935440063, 0.7594233751296997, 0.8045220971107483, 0.8496208786964417, 0.894719660282135, 0.9398183822631836, 0.984917163848877]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 0.0, 4.0, 15.0, 15.0, 17.0, 37.0, 49.0, 107.0, 176.0, 421.0, 793.0, 1890.0, 5246.0, 23085.0, 703177.0, 290624.0, 15727.0, 4199.0, 1560.0, 678.0, 310.0, 182.0, 74.0, 56.0, 34.0, 21.0, 23.0, 12.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.892578125, -1.8426361083984375, -1.792694091796875, -1.7427520751953125, -1.69281005859375, -1.6428680419921875, -1.592926025390625, -1.5429840087890625, -1.4930419921875, -1.4430999755859375, -1.393157958984375, -1.3432159423828125, -1.29327392578125, -1.2433319091796875, -1.193389892578125, -1.1434478759765625, -1.093505859375, -1.0435638427734375, -0.993621826171875, -0.9436798095703125, -0.89373779296875, -0.8437957763671875, -0.793853759765625, -0.7439117431640625, -0.6939697265625, -0.6440277099609375, -0.594085693359375, -0.5441436767578125, -0.49420166015625, -0.4442596435546875, -0.394317626953125, -0.3443756103515625, -0.29443359375, -0.2444915771484375, -0.194549560546875, -0.1446075439453125, -0.09466552734375, -0.0447235107421875, 0.005218505859375, 0.0551605224609375, 0.1051025390625, 0.1550445556640625, 0.204986572265625, 0.2549285888671875, 0.30487060546875, 0.3548126220703125, 0.404754638671875, 0.4546966552734375, 0.504638671875, 0.5545806884765625, 0.604522705078125, 0.6544647216796875, 0.70440673828125, 0.7543487548828125, 0.804290771484375, 0.8542327880859375, 0.9041748046875, 0.9541168212890625, 1.004058837890625, 1.0540008544921875, 1.10394287109375, 1.1538848876953125, 1.203826904296875, 1.2537689208984375, 1.3037109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 11.0, 15.0, 21.0, 33.0, 55.0, 75.0, 118.0, 123.0, 139.0, 129.0, 93.0, 57.0, 56.0, 37.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.449005126953125, -2.32183837890625, -2.194671630859375, -2.0675048828125, -1.940338134765625, -1.81317138671875, -1.686004638671875, -1.558837890625, -1.431671142578125, -1.30450439453125, -1.177337646484375, -1.0501708984375, -0.923004150390625, -0.79583740234375, -0.668670654296875, -0.54150390625, -0.414337158203125, -0.28717041015625, -0.160003662109375, -0.0328369140625, 0.094329833984375, 0.22149658203125, 0.348663330078125, 0.475830078125, 0.602996826171875, 0.73016357421875, 0.857330322265625, 0.9844970703125, 1.111663818359375, 1.23883056640625, 1.365997314453125, 1.4931640625, 1.620330810546875, 1.74749755859375, 1.874664306640625, 2.0018310546875, 2.128997802734375, 2.25616455078125, 2.383331298828125, 2.510498046875, 2.637664794921875, 2.76483154296875, 2.891998291015625, 3.0191650390625, 3.146331787109375, 3.27349853515625, 3.400665283203125, 3.52783203125, 3.654998779296875, 3.78216552734375, 3.909332275390625, 4.0364990234375, 4.163665771484375, 4.29083251953125, 4.417999267578125, 4.545166015625, 4.672332763671875, 4.79949951171875, 4.926666259765625, 5.0538330078125, 5.180999755859375, 5.30816650390625, 5.435333251953125, 5.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 4.0, 6.0, 10.0, 15.0, 13.0, 23.0, 44.0, 67.0, 69.0, 116.0, 202.0, 342.0, 598.0, 1440.0, 4065.0, 17497.0, 621294.0, 381574.0, 14793.0, 3621.0, 1311.0, 629.0, 322.0, 169.0, 116.0, 55.0, 38.0, 33.0, 25.0, 11.0, 13.0, 11.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5927734375, -1.54443359375, -1.49609375, -1.44775390625, -1.3994140625, -1.35107421875, -1.302734375, -1.25439453125, -1.2060546875, -1.15771484375, -1.109375, -1.06103515625, -1.0126953125, -0.96435546875, -0.916015625, -0.86767578125, -0.8193359375, -0.77099609375, -0.72265625, -0.67431640625, -0.6259765625, -0.57763671875, -0.529296875, -0.48095703125, -0.4326171875, -0.38427734375, -0.3359375, -0.28759765625, -0.2392578125, -0.19091796875, -0.142578125, -0.09423828125, -0.0458984375, 0.00244140625, 0.05078125, 0.09912109375, 0.1474609375, 0.19580078125, 0.244140625, 0.29248046875, 0.3408203125, 0.38916015625, 0.4375, 0.48583984375, 0.5341796875, 0.58251953125, 0.630859375, 0.67919921875, 0.7275390625, 0.77587890625, 0.82421875, 0.87255859375, 0.9208984375, 0.96923828125, 1.017578125, 1.06591796875, 1.1142578125, 1.16259765625, 1.2109375, 1.25927734375, 1.3076171875, 1.35595703125, 1.404296875, 1.45263671875, 1.5009765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 6.0, 4.0, 14.0, 11.0, 15.0, 15.0, 10.0, 21.0, 18.0, 17.0, 23.0, 31.0, 27.0, 28.0, 15.0, 34.0, 40.0, 53.0, 41.0, 36.0, 43.0, 34.0, 41.0, 39.0, 33.0, 41.0, 27.0, 29.0, 30.0, 19.0, 38.0, 22.0, 20.0, 19.0, 18.0, 13.0, 7.0, 10.0, 9.0, 9.0, 3.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-1.505859375, -1.4591217041015625, -1.412384033203125, -1.3656463623046875, -1.31890869140625, -1.2721710205078125, -1.225433349609375, -1.1786956787109375, -1.1319580078125, -1.0852203369140625, -1.038482666015625, -0.9917449951171875, -0.94500732421875, -0.8982696533203125, -0.851531982421875, -0.8047943115234375, -0.758056640625, -0.7113189697265625, -0.664581298828125, -0.6178436279296875, -0.57110595703125, -0.5243682861328125, -0.477630615234375, -0.4308929443359375, -0.3841552734375, -0.3374176025390625, -0.290679931640625, -0.2439422607421875, -0.19720458984375, -0.1504669189453125, -0.103729248046875, -0.0569915771484375, -0.01025390625, 0.0364837646484375, 0.083221435546875, 0.1299591064453125, 0.17669677734375, 0.2234344482421875, 0.270172119140625, 0.3169097900390625, 0.3636474609375, 0.4103851318359375, 0.457122802734375, 0.5038604736328125, 0.55059814453125, 0.5973358154296875, 0.644073486328125, 0.6908111572265625, 0.737548828125, 0.7842864990234375, 0.831024169921875, 0.8777618408203125, 0.92449951171875, 0.9712371826171875, 1.017974853515625, 1.0647125244140625, 1.1114501953125, 1.1581878662109375, 1.204925537109375, 1.2516632080078125, 1.29840087890625, 1.3451385498046875, 1.391876220703125, 1.4386138916015625, 1.4853515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 11.0, 19.0, 32.0, 49.0, 61.0, 68.0, 125.0, 209.0, 328.0, 520.0, 1078.0, 2222.0, 5485.0, 19302.0, 253061.0, 724926.0, 28389.0, 7054.0, 2698.0, 1233.0, 630.0, 367.0, 208.0, 129.0, 108.0, 60.0, 39.0, 26.0, 28.0, 11.0, 6.0, 8.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.4403877258300781, -0.42667388916015625, -0.4129600524902344, -0.3992462158203125, -0.3855323791503906, -0.37181854248046875, -0.3581047058105469, -0.344390869140625, -0.3306770324707031, -0.31696319580078125, -0.3032493591308594, -0.2895355224609375, -0.2758216857910156, -0.26210784912109375, -0.24839401245117188, -0.23468017578125, -0.22096633911132812, -0.20725250244140625, -0.19353866577148438, -0.1798248291015625, -0.16611099243164062, -0.15239715576171875, -0.13868331909179688, -0.124969482421875, -0.11125564575195312, -0.09754180908203125, -0.08382797241210938, -0.0701141357421875, -0.056400299072265625, -0.04268646240234375, -0.028972625732421875, -0.0152587890625, -0.001544952392578125, 0.01216888427734375, 0.025882720947265625, 0.0395965576171875, 0.053310394287109375, 0.06702423095703125, 0.08073806762695312, 0.094451904296875, 0.10816574096679688, 0.12187957763671875, 0.13559341430664062, 0.1493072509765625, 0.16302108764648438, 0.17673492431640625, 0.19044876098632812, 0.20416259765625, 0.21787643432617188, 0.23159027099609375, 0.24530410766601562, 0.2590179443359375, 0.2727317810058594, 0.28644561767578125, 0.3001594543457031, 0.313873291015625, 0.3275871276855469, 0.34130096435546875, 0.3550148010253906, 0.3687286376953125, 0.3824424743652344, 0.39615631103515625, 0.4098701477050781, 0.423583984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 15.0, 22.0, 38.0, 76.0, 153.0, 283.0, 174.0, 86.0, 49.0, 36.0, 14.0, 6.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4849853515625e-05, -6.266124546527863e-05, -6.047263741493225e-05, -5.8284029364585876e-05, -5.60954213142395e-05, -5.390681326389313e-05, -5.171820521354675e-05, -4.952959716320038e-05, -4.7340989112854004e-05, -4.515238106250763e-05, -4.2963773012161255e-05, -4.077516496181488e-05, -3.8586556911468506e-05, -3.639794886112213e-05, -3.420934081077576e-05, -3.202073276042938e-05, -2.9832124710083008e-05, -2.7643516659736633e-05, -2.545490860939026e-05, -2.3266300559043884e-05, -2.107769250869751e-05, -1.8889084458351135e-05, -1.670047640800476e-05, -1.4511868357658386e-05, -1.2323260307312012e-05, -1.0134652256965637e-05, -7.946044206619263e-06, -5.757436156272888e-06, -3.5688281059265137e-06, -1.3802200555801392e-06, 8.083879947662354e-07, 2.99699604511261e-06, 5.185604095458984e-06, 7.374212145805359e-06, 9.562820196151733e-06, 1.1751428246498108e-05, 1.3940036296844482e-05, 1.6128644347190857e-05, 1.831725239753723e-05, 2.0505860447883606e-05, 2.269446849822998e-05, 2.4883076548576355e-05, 2.707168459892273e-05, 2.9260292649269104e-05, 3.144890069961548e-05, 3.363750874996185e-05, 3.582611680030823e-05, 3.80147248506546e-05, 4.0203332901000977e-05, 4.239194095134735e-05, 4.4580549001693726e-05, 4.67691570520401e-05, 4.8957765102386475e-05, 5.114637315273285e-05, 5.3334981203079224e-05, 5.55235892534256e-05, 5.771219730377197e-05, 5.990080535411835e-05, 6.208941340446472e-05, 6.42780214548111e-05, 6.646662950515747e-05, 6.865523755550385e-05, 7.084384560585022e-05, 7.30324536561966e-05, 7.522106170654297e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 13.0, 6.0, 16.0, 22.0, 22.0, 62.0, 81.0, 147.0, 314.0, 679.0, 1864.0, 5856.0, 31259.0, 913260.0, 80837.0, 9608.0, 2692.0, 909.0, 411.0, 197.0, 100.0, 56.0, 27.0, 29.0, 16.0, 12.0, 7.0, 8.0, 4.0, 2.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6545028686523438, -0.6361541748046875, -0.6178054809570312, -0.599456787109375, -0.5811080932617188, -0.5627593994140625, -0.5444107055664062, -0.52606201171875, -0.5077133178710938, -0.4893646240234375, -0.47101593017578125, -0.452667236328125, -0.43431854248046875, -0.4159698486328125, -0.39762115478515625, -0.3792724609375, -0.36092376708984375, -0.3425750732421875, -0.32422637939453125, -0.305877685546875, -0.28752899169921875, -0.2691802978515625, -0.25083160400390625, -0.23248291015625, -0.21413421630859375, -0.1957855224609375, -0.17743682861328125, -0.159088134765625, -0.14073944091796875, -0.1223907470703125, -0.10404205322265625, -0.085693359375, -0.06734466552734375, -0.0489959716796875, -0.03064727783203125, -0.012298583984375, 0.00605010986328125, 0.0243988037109375, 0.04274749755859375, 0.06109619140625, 0.07944488525390625, 0.0977935791015625, 0.11614227294921875, 0.134490966796875, 0.15283966064453125, 0.1711883544921875, 0.18953704833984375, 0.2078857421875, 0.22623443603515625, 0.2445831298828125, 0.26293182373046875, 0.281280517578125, 0.29962921142578125, 0.3179779052734375, 0.33632659912109375, 0.35467529296875, 0.37302398681640625, 0.3913726806640625, 0.40972137451171875, 0.428070068359375, 0.44641876220703125, 0.4647674560546875, 0.48311614990234375, 0.50146484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 9.0, 12.0, 17.0, 24.0, 13.0, 32.0, 75.0, 137.0, 245.0, 188.0, 86.0, 42.0, 27.0, 18.0, 14.0, 15.0, 6.0, 8.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.16821861267089844, -0.16236495971679688, -0.1565113067626953, -0.15065765380859375, -0.1448040008544922, -0.13895034790039062, -0.13309669494628906, -0.1272430419921875, -0.12138938903808594, -0.11553573608398438, -0.10968208312988281, -0.10382843017578125, -0.09797477722167969, -0.09212112426757812, -0.08626747131347656, -0.080413818359375, -0.07456016540527344, -0.06870651245117188, -0.06285285949707031, -0.05699920654296875, -0.05114555358886719, -0.045291900634765625, -0.03943824768066406, -0.0335845947265625, -0.027730941772460938, -0.021877288818359375, -0.016023635864257812, -0.01016998291015625, -0.0043163299560546875, 0.001537322998046875, 0.0073909759521484375, 0.01324462890625, 0.019098281860351562, 0.024951934814453125, 0.030805587768554688, 0.03665924072265625, 0.04251289367675781, 0.048366546630859375, 0.05422019958496094, 0.0600738525390625, 0.06592750549316406, 0.07178115844726562, 0.07763481140136719, 0.08348846435546875, 0.08934211730957031, 0.09519577026367188, 0.10104942321777344, 0.106903076171875, 0.11275672912597656, 0.11861038208007812, 0.12446403503417969, 0.13031768798828125, 0.1361713409423828, 0.14202499389648438, 0.14787864685058594, 0.1537322998046875, 0.15958595275878906, 0.16543960571289062, 0.1712932586669922, 0.17714691162109375, 0.1830005645751953, 0.18885421752929688, 0.19470787048339844, 0.2005615234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 3.0, 8.0, 17.0, 29.0, 47.0, 96.0, 216.0, 258.0, 149.0, 87.0, 42.0, 19.0, 12.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.628633975982666, -4.489284515380859, -4.349935054779053, -4.210585594177246, -4.0712361335754395, -3.931886672973633, -3.792536973953247, -3.6531875133514404, -3.513838052749634, -3.374488592147827, -3.2351391315460205, -3.095789670944214, -2.956439971923828, -2.8170905113220215, -2.677741050720215, -2.538391590118408, -2.3990421295166016, -2.259692668914795, -2.1203432083129883, -1.980993628501892, -1.8416441679000854, -1.7022947072982788, -1.5629451274871826, -1.423595666885376, -1.2842462062835693, -1.1448967456817627, -1.005547285079956, -0.8661977052688599, -0.7268482446670532, -0.5874987840652466, -0.44814926385879517, -0.30879974365234375, -0.1694507598876953, -0.030101269483566284, 0.10924822092056274, 0.24859771132469177, 0.3879472017288208, 0.5272966623306274, 0.6666461825370789, 0.8059957027435303, 0.9453451633453369, 1.0846946239471436, 1.2240440845489502, 1.3633936643600464, 1.502743124961853, 1.6420925855636597, 1.7814421653747559, 1.9207916259765625, 2.060141086578369, 2.199490547180176, 2.3388400077819824, 2.478189468383789, 2.6175389289855957, 2.7568883895874023, 2.896238088607788, 3.0355875492095947, 3.1749370098114014, 3.314286470413208, 3.4536359310150146, 3.5929853916168213, 3.732335090637207, 3.8716845512390137, 4.01103401184082, 4.150383472442627, 4.289732933044434]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 10.0, 11.0, 15.0, 20.0, 18.0, 24.0, 32.0, 22.0, 37.0, 41.0, 49.0, 62.0, 52.0, 50.0, 64.0, 78.0, 53.0, 68.0, 31.0, 50.0, 36.0, 32.0, 35.0, 33.0, 23.0, 21.0, 9.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9645183086395264, -2.838589668273926, -2.7126612663269043, -2.5867326259613037, -2.4608042240142822, -2.3348755836486816, -2.20894718170166, -2.0830185413360596, -1.9570900201797485, -1.8311614990234375, -1.7052329778671265, -1.5793044567108154, -1.4533758163452148, -1.3274474143981934, -1.2015187740325928, -1.0755902528762817, -0.9496617317199707, -0.8237332105636597, -0.6978046894073486, -0.5718761086463928, -0.4459475874900818, -0.32001906633377075, -0.19409048557281494, -0.0681619644165039, 0.05776655673980713, 0.18369509279727936, 0.3096236288547516, 0.435552179813385, 0.561480700969696, 0.6874092221260071, 0.8133378028869629, 0.9392663240432739, 1.065195083618164, 1.191123604774475, 1.3170521259307861, 1.4429807662963867, 1.5689091682434082, 1.6948378086090088, 1.8207663297653198, 1.9466948509216309, 2.0726232528686523, 2.198551893234253, 2.3244802951812744, 2.450408935546875, 2.5763373374938965, 2.702265977859497, 2.8281946182250977, 2.954123020172119, 3.0800516605377197, 3.2059803009033203, 3.331908702850342, 3.4578373432159424, 3.583765745162964, 3.7096943855285645, 3.835622787475586, 3.9615514278411865, 4.087480068206787, 4.213408470153809, 4.339337348937988, 4.46526575088501, 4.591194152832031, 4.717122554779053, 4.843051433563232, 4.968979835510254, 5.094908237457275]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 9.0, 8.0, 11.0, 28.0, 29.0, 47.0, 79.0, 174.0, 269.0, 567.0, 1381.0, 5354.0, 120878.0, 3994405.0, 63151.0, 4865.0, 1897.0, 537.0, 245.0, 136.0, 80.0, 46.0, 30.0, 21.0, 12.0, 8.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.203125, -5.08331298828125, -4.9635009765625, -4.84368896484375, -4.723876953125, -4.60406494140625, -4.4842529296875, -4.36444091796875, -4.24462890625, -4.12481689453125, -4.0050048828125, -3.88519287109375, -3.765380859375, -3.64556884765625, -3.5257568359375, -3.40594482421875, -3.2861328125, -3.16632080078125, -3.0465087890625, -2.92669677734375, -2.806884765625, -2.68707275390625, -2.5672607421875, -2.44744873046875, -2.32763671875, -2.20782470703125, -2.0880126953125, -1.96820068359375, -1.848388671875, -1.72857666015625, -1.6087646484375, -1.48895263671875, -1.369140625, -1.24932861328125, -1.1295166015625, -1.00970458984375, -0.889892578125, -0.77008056640625, -0.6502685546875, -0.53045654296875, -0.41064453125, -0.29083251953125, -0.1710205078125, -0.05120849609375, 0.068603515625, 0.18841552734375, 0.3082275390625, 0.42803955078125, 0.5478515625, 0.66766357421875, 0.7874755859375, 0.90728759765625, 1.027099609375, 1.14691162109375, 1.2667236328125, 1.38653564453125, 1.50634765625, 1.62615966796875, 1.7459716796875, 1.86578369140625, 1.985595703125, 2.10540771484375, 2.2252197265625, 2.34503173828125, 2.46484375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 7.0, 15.0, 24.0, 46.0, 50.0, 56.0, 84.0, 90.0, 109.0, 100.0, 87.0, 87.0, 62.0, 56.0, 35.0, 23.0, 12.0, 17.0, 7.0, 6.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.2640838623046875, -2.205902099609375, -2.1477203369140625, -2.08953857421875, -2.0313568115234375, -1.973175048828125, -1.9149932861328125, -1.8568115234375, -1.7986297607421875, -1.740447998046875, -1.6822662353515625, -1.62408447265625, -1.5659027099609375, -1.507720947265625, -1.4495391845703125, -1.391357421875, -1.3331756591796875, -1.274993896484375, -1.2168121337890625, -1.15863037109375, -1.1004486083984375, -1.042266845703125, -0.9840850830078125, -0.9259033203125, -0.8677215576171875, -0.809539794921875, -0.7513580322265625, -0.69317626953125, -0.6349945068359375, -0.576812744140625, -0.5186309814453125, -0.46044921875, -0.4022674560546875, -0.344085693359375, -0.2859039306640625, -0.22772216796875, -0.1695404052734375, -0.111358642578125, -0.0531768798828125, 0.0050048828125, 0.0631866455078125, 0.121368408203125, 0.1795501708984375, 0.23773193359375, 0.2959136962890625, 0.354095458984375, 0.4122772216796875, 0.470458984375, 0.5286407470703125, 0.586822509765625, 0.6450042724609375, 0.70318603515625, 0.7613677978515625, 0.819549560546875, 0.8777313232421875, 0.9359130859375, 0.9940948486328125, 1.052276611328125, 1.1104583740234375, 1.16864013671875, 1.2268218994140625, 1.285003662109375, 1.3431854248046875, 1.4013671875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 15.0, 9.0, 18.0, 35.0, 75.0, 116.0, 259.0, 594.0, 1912.0, 8790.0, 271441.0, 3890439.0, 16413.0, 2678.0, 808.0, 311.0, 143.0, 85.0, 48.0, 23.0, 19.0, 11.0, 12.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.936981201171875, -4.80755615234375, -4.678131103515625, -4.5487060546875, -4.419281005859375, -4.28985595703125, -4.160430908203125, -4.031005859375, -3.901580810546875, -3.77215576171875, -3.642730712890625, -3.5133056640625, -3.383880615234375, -3.25445556640625, -3.125030517578125, -2.99560546875, -2.866180419921875, -2.73675537109375, -2.607330322265625, -2.4779052734375, -2.348480224609375, -2.21905517578125, -2.089630126953125, -1.960205078125, -1.830780029296875, -1.70135498046875, -1.571929931640625, -1.4425048828125, -1.313079833984375, -1.18365478515625, -1.054229736328125, -0.9248046875, -0.795379638671875, -0.66595458984375, -0.536529541015625, -0.4071044921875, -0.277679443359375, -0.14825439453125, -0.018829345703125, 0.110595703125, 0.240020751953125, 0.36944580078125, 0.498870849609375, 0.6282958984375, 0.757720947265625, 0.88714599609375, 1.016571044921875, 1.14599609375, 1.275421142578125, 1.40484619140625, 1.534271240234375, 1.6636962890625, 1.793121337890625, 1.92254638671875, 2.051971435546875, 2.181396484375, 2.310821533203125, 2.44024658203125, 2.569671630859375, 2.6990966796875, 2.828521728515625, 2.95794677734375, 3.087371826171875, 3.216796875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 3.0, 16.0, 19.0, 14.0, 34.0, 73.0, 307.0, 1480.0, 1544.0, 376.0, 97.0, 44.0, 14.0, 13.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6707687377929688, -0.6428070068359375, -0.6148452758789062, -0.586883544921875, -0.5589218139648438, -0.5309600830078125, -0.5029983520507812, -0.47503662109375, -0.44707489013671875, -0.4191131591796875, -0.39115142822265625, -0.363189697265625, -0.33522796630859375, -0.3072662353515625, -0.27930450439453125, -0.2513427734375, -0.22338104248046875, -0.1954193115234375, -0.16745758056640625, -0.139495849609375, -0.11153411865234375, -0.0835723876953125, -0.05561065673828125, -0.02764892578125, 0.00031280517578125, 0.0282745361328125, 0.05623626708984375, 0.084197998046875, 0.11215972900390625, 0.1401214599609375, 0.16808319091796875, 0.196044921875, 0.22400665283203125, 0.2519683837890625, 0.27993011474609375, 0.307891845703125, 0.33585357666015625, 0.3638153076171875, 0.39177703857421875, 0.41973876953125, 0.44770050048828125, 0.4756622314453125, 0.5036239624023438, 0.531585693359375, 0.5595474243164062, 0.5875091552734375, 0.6154708862304688, 0.6434326171875, 0.6713943481445312, 0.6993560791015625, 0.7273178100585938, 0.755279541015625, 0.7832412719726562, 0.8112030029296875, 0.8391647338867188, 0.86712646484375, 0.8950881958007812, 0.9230499267578125, 0.9510116577148438, 0.978973388671875, 1.0069351196289062, 1.0348968505859375, 1.0628585815429688, 1.0908203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 12.0, 16.0, 39.0, 62.0, 142.0, 231.0, 237.0, 126.0, 50.0, 28.0, 21.0, 10.0, 11.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6737101078033447, -3.565480947494507, -3.457251787185669, -3.349022626876831, -3.2407937049865723, -3.1325645446777344, -3.0243353843688965, -2.9161062240600586, -2.8078770637512207, -2.699647903442383, -2.591418743133545, -2.483189582824707, -2.374960422515869, -2.2667312622070312, -2.1585023403167725, -2.0502731800079346, -1.9420440196990967, -1.8338148593902588, -1.725585699081421, -1.6173566579818726, -1.5091274976730347, -1.4008983373641968, -1.2926692962646484, -1.1844401359558105, -1.0762109756469727, -0.9679818153381348, -0.8597527146339417, -0.7515236139297485, -0.6432944536209106, -0.5350652933120728, -0.42683619260787964, -0.3186070919036865, -0.21037769317626953, -0.10214856266975403, 0.006080567836761475, 0.11430969834327698, 0.22253882884979248, 0.33076798915863037, 0.4389970898628235, 0.5472261905670166, 0.6554553508758545, 0.7636845111846924, 0.8719136118888855, 0.9801427125930786, 1.0883718729019165, 1.1966010332107544, 1.3048300743103027, 1.4130592346191406, 1.5212883949279785, 1.6295175552368164, 1.7377467155456543, 1.8459757566452026, 1.9542049169540405, 2.062434196472168, 2.1706631183624268, 2.2788922786712646, 2.3871214389801025, 2.4953505992889404, 2.6035797595977783, 2.711808919906616, 2.820037841796875, 2.928267002105713, 3.036496162414551, 3.1447253227233887, 3.2529544830322266]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 17.0, 12.0, 21.0, 29.0, 32.0, 41.0, 70.0, 62.0, 66.0, 82.0, 80.0, 88.0, 66.0, 73.0, 63.0, 56.0, 37.0, 37.0, 16.0, 14.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9855552911758423, -1.9296249151229858, -1.8736945390701294, -1.817764163017273, -1.7618337869644165, -1.70590341091156, -1.6499730348587036, -1.5940426588058472, -1.5381122827529907, -1.4821819067001343, -1.4262515306472778, -1.3703211545944214, -1.314390778541565, -1.2584604024887085, -1.202530026435852, -1.1465996503829956, -1.0906693935394287, -1.0347390174865723, -0.9788086414337158, -0.9228782653808594, -0.8669478893280029, -0.8110175132751465, -0.75508713722229, -0.6991567611694336, -0.6432263851165771, -0.5872960090637207, -0.5313656330108643, -0.4754352569580078, -0.41950488090515137, -0.3635745346546173, -0.30764415860176086, -0.2517137825489044, -0.19578337669372559, -0.13985300064086914, -0.08392263203859329, -0.027992263436317444, 0.027938112616539, 0.08386847376823425, 0.1397988498210907, 0.19572922587394714, 0.2516596019268036, 0.30758997797966003, 0.3635203540325165, 0.41945070028305054, 0.475381076335907, 0.5313114523887634, 0.5872418284416199, 0.6431722044944763, 0.6991025805473328, 0.7550329566001892, 0.8109633326530457, 0.8668937087059021, 0.9228240847587585, 0.9787544012069702, 1.0346847772598267, 1.090615153312683, 1.1465455293655396, 1.202475905418396, 1.2584062814712524, 1.3143366575241089, 1.3702670335769653, 1.4261974096298218, 1.4821277856826782, 1.5380581617355347, 1.5939885377883911]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 11.0, 5.0, 9.0, 12.0, 10.0, 17.0, 27.0, 41.0, 55.0, 66.0, 128.0, 223.0, 491.0, 1025.0, 2941.0, 8834.0, 33302.0, 193004.0, 658880.0, 116154.0, 22947.0, 6427.0, 2202.0, 843.0, 400.0, 183.0, 119.0, 61.0, 47.0, 28.0, 15.0, 11.0, 12.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240478515625, -0.23200225830078125, -0.2235260009765625, -0.21504974365234375, -0.206573486328125, -0.19809722900390625, -0.1896209716796875, -0.18114471435546875, -0.17266845703125, -0.16419219970703125, -0.1557159423828125, -0.14723968505859375, -0.138763427734375, -0.13028717041015625, -0.1218109130859375, -0.11333465576171875, -0.1048583984375, -0.09638214111328125, -0.0879058837890625, -0.07942962646484375, -0.070953369140625, -0.06247711181640625, -0.0540008544921875, -0.04552459716796875, -0.03704833984375, -0.02857208251953125, -0.0200958251953125, -0.01161956787109375, -0.003143310546875, 0.00533294677734375, 0.0138092041015625, 0.02228546142578125, 0.03076171875, 0.03923797607421875, 0.0477142333984375, 0.05619049072265625, 0.064666748046875, 0.07314300537109375, 0.0816192626953125, 0.09009552001953125, 0.09857177734375, 0.10704803466796875, 0.1155242919921875, 0.12400054931640625, 0.132476806640625, 0.14095306396484375, 0.1494293212890625, 0.15790557861328125, 0.1663818359375, 0.17485809326171875, 0.1833343505859375, 0.19181060791015625, 0.200286865234375, 0.20876312255859375, 0.2172393798828125, 0.22571563720703125, 0.23419189453125, 0.24266815185546875, 0.2511444091796875, 0.25962066650390625, 0.268096923828125, 0.27657318115234375, 0.2850494384765625, 0.29352569580078125, 0.302001953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 11.0, 7.0, 8.0, 20.0, 23.0, 36.0, 49.0, 70.0, 79.0, 97.0, 120.0, 98.0, 113.0, 84.0, 69.0, 42.0, 33.0, 17.0, 10.0, 10.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -2.0111541748046875, -1.961761474609375, -1.9123687744140625, -1.86297607421875, -1.8135833740234375, -1.764190673828125, -1.7147979736328125, -1.6654052734375, -1.6160125732421875, -1.566619873046875, -1.5172271728515625, -1.46783447265625, -1.4184417724609375, -1.369049072265625, -1.3196563720703125, -1.270263671875, -1.2208709716796875, -1.171478271484375, -1.1220855712890625, -1.07269287109375, -1.0233001708984375, -0.973907470703125, -0.9245147705078125, -0.8751220703125, -0.8257293701171875, -0.776336669921875, -0.7269439697265625, -0.67755126953125, -0.6281585693359375, -0.578765869140625, -0.5293731689453125, -0.47998046875, -0.4305877685546875, -0.381195068359375, -0.3318023681640625, -0.28240966796875, -0.2330169677734375, -0.183624267578125, -0.1342315673828125, -0.0848388671875, -0.0354461669921875, 0.013946533203125, 0.0633392333984375, 0.11273193359375, 0.1621246337890625, 0.211517333984375, 0.2609100341796875, 0.310302734375, 0.3596954345703125, 0.409088134765625, 0.4584808349609375, 0.50787353515625, 0.5572662353515625, 0.606658935546875, 0.6560516357421875, 0.7054443359375, 0.7548370361328125, 0.804229736328125, 0.8536224365234375, 0.90301513671875, 0.9524078369140625, 1.001800537109375, 1.0511932373046875, 1.1005859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 11.0, 11.0, 17.0, 17.0, 34.0, 36.0, 49.0, 78.0, 114.0, 184.0, 265.0, 418.0, 681.0, 1276.0, 2469.0, 5341.0, 12929.0, 36642.0, 124762.0, 505197.0, 257423.0, 64055.0, 20859.0, 7931.0, 3522.0, 1780.0, 876.0, 546.0, 326.0, 224.0, 142.0, 96.0, 61.0, 47.0, 37.0, 25.0, 16.0, 17.0, 8.0, 8.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.1433887481689453, -0.13821792602539062, -0.13304710388183594, -0.12787628173828125, -0.12270545959472656, -0.11753463745117188, -0.11236381530761719, -0.1071929931640625, -0.10202217102050781, -0.09685134887695312, -0.09168052673339844, -0.08650970458984375, -0.08133888244628906, -0.07616806030273438, -0.07099723815917969, -0.065826416015625, -0.06065559387207031, -0.055484771728515625, -0.05031394958496094, -0.04514312744140625, -0.03997230529785156, -0.034801483154296875, -0.029630661010742188, -0.0244598388671875, -0.019289016723632812, -0.014118194580078125, -0.008947372436523438, -0.00377655029296875, 0.0013942718505859375, 0.006565093994140625, 0.011735916137695312, 0.01690673828125, 0.022077560424804688, 0.027248382568359375, 0.03241920471191406, 0.03759002685546875, 0.04276084899902344, 0.047931671142578125, 0.05310249328613281, 0.0582733154296875, 0.06344413757324219, 0.06861495971679688, 0.07378578186035156, 0.07895660400390625, 0.08412742614746094, 0.08929824829101562, 0.09446907043457031, 0.099639892578125, 0.10481071472167969, 0.10998153686523438, 0.11515235900878906, 0.12032318115234375, 0.12549400329589844, 0.13066482543945312, 0.1358356475830078, 0.1410064697265625, 0.1461772918701172, 0.15134811401367188, 0.15651893615722656, 0.16168975830078125, 0.16686058044433594, 0.17203140258789062, 0.1772022247314453, 0.182373046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 11.0, 14.0, 14.0, 10.0, 21.0, 12.0, 26.0, 25.0, 24.0, 31.0, 29.0, 27.0, 33.0, 44.0, 50.0, 63.0, 59.0, 50.0, 56.0, 55.0, 41.0, 30.0, 40.0, 43.0, 28.0, 29.0, 22.0, 15.0, 17.0, 13.0, 14.0, 6.0, 4.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1776580810546875, -1.135589599609375, -1.0935211181640625, -1.05145263671875, -1.0093841552734375, -0.967315673828125, -0.9252471923828125, -0.8831787109375, -0.8411102294921875, -0.799041748046875, -0.7569732666015625, -0.71490478515625, -0.6728363037109375, -0.630767822265625, -0.5886993408203125, -0.546630859375, -0.5045623779296875, -0.462493896484375, -0.4204254150390625, -0.37835693359375, -0.3362884521484375, -0.294219970703125, -0.2521514892578125, -0.2100830078125, -0.1680145263671875, -0.125946044921875, -0.0838775634765625, -0.04180908203125, 0.0002593994140625, 0.042327880859375, 0.0843963623046875, 0.12646484375, 0.1685333251953125, 0.210601806640625, 0.2526702880859375, 0.29473876953125, 0.3368072509765625, 0.378875732421875, 0.4209442138671875, 0.4630126953125, 0.5050811767578125, 0.547149658203125, 0.5892181396484375, 0.63128662109375, 0.6733551025390625, 0.715423583984375, 0.7574920654296875, 0.799560546875, 0.8416290283203125, 0.883697509765625, 0.9257659912109375, 0.96783447265625, 1.0099029541015625, 1.051971435546875, 1.0940399169921875, 1.1361083984375, 1.1781768798828125, 1.220245361328125, 1.2623138427734375, 1.30438232421875, 1.3464508056640625, 1.388519287109375, 1.4305877685546875, 1.47265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 9.0, 6.0, 14.0, 13.0, 16.0, 29.0, 51.0, 53.0, 89.0, 191.0, 265.0, 478.0, 985.0, 2166.0, 5905.0, 20534.0, 123271.0, 733148.0, 129521.0, 21549.0, 5891.0, 2161.0, 1016.0, 460.0, 301.0, 143.0, 92.0, 66.0, 39.0, 27.0, 15.0, 19.0, 15.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0618896484375, -0.059861183166503906, -0.05783271789550781, -0.05580425262451172, -0.053775787353515625, -0.05174732208251953, -0.04971885681152344, -0.047690391540527344, -0.04566192626953125, -0.043633460998535156, -0.04160499572753906, -0.03957653045654297, -0.037548065185546875, -0.03551959991455078, -0.03349113464355469, -0.031462669372558594, -0.0294342041015625, -0.027405738830566406, -0.025377273559570312, -0.02334880828857422, -0.021320343017578125, -0.01929187774658203, -0.017263412475585938, -0.015234947204589844, -0.01320648193359375, -0.011178016662597656, -0.009149551391601562, -0.007121086120605469, -0.005092620849609375, -0.0030641555786132812, -0.0010356903076171875, 0.0009927749633789062, 0.003021240234375, 0.005049705505371094, 0.0070781707763671875, 0.009106636047363281, 0.011135101318359375, 0.013163566589355469, 0.015192031860351562, 0.017220497131347656, 0.01924896240234375, 0.021277427673339844, 0.023305892944335938, 0.02533435821533203, 0.027362823486328125, 0.02939128875732422, 0.03141975402832031, 0.033448219299316406, 0.0354766845703125, 0.037505149841308594, 0.03953361511230469, 0.04156208038330078, 0.043590545654296875, 0.04561901092529297, 0.04764747619628906, 0.049675941467285156, 0.05170440673828125, 0.053732872009277344, 0.05576133728027344, 0.05778980255126953, 0.059818267822265625, 0.06184673309326172, 0.06387519836425781, 0.0659036636352539, 0.06793212890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 9.0, 11.0, 16.0, 22.0, 37.0, 62.0, 122.0, 170.0, 214.0, 147.0, 88.0, 44.0, 27.0, 11.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.574392318725586e-05, -6.418582051992416e-05, -6.262771785259247e-05, -6.106961518526077e-05, -5.951151251792908e-05, -5.795340985059738e-05, -5.6395307183265686e-05, -5.483720451593399e-05, -5.3279101848602295e-05, -5.17209991812706e-05, -5.0162896513938904e-05, -4.860479384660721e-05, -4.704669117927551e-05, -4.548858851194382e-05, -4.393048584461212e-05, -4.2372383177280426e-05, -4.081428050994873e-05, -3.9256177842617035e-05, -3.769807517528534e-05, -3.6139972507953644e-05, -3.458186984062195e-05, -3.302376717329025e-05, -3.146566450595856e-05, -2.990756183862686e-05, -2.8349459171295166e-05, -2.679135650396347e-05, -2.5233253836631775e-05, -2.367515116930008e-05, -2.2117048501968384e-05, -2.0558945834636688e-05, -1.9000843167304993e-05, -1.7442740499973297e-05, -1.58846378326416e-05, -1.4326535165309906e-05, -1.276843249797821e-05, -1.1210329830646515e-05, -9.65222716331482e-06, -8.094124495983124e-06, -6.536021828651428e-06, -4.977919161319733e-06, -3.419816493988037e-06, -1.8617138266563416e-06, -3.03611159324646e-07, 1.2544915080070496e-06, 2.812594175338745e-06, 4.370696842670441e-06, 5.928799510002136e-06, 7.486902177333832e-06, 9.045004844665527e-06, 1.0603107511997223e-05, 1.2161210179328918e-05, 1.3719312846660614e-05, 1.527741551399231e-05, 1.6835518181324005e-05, 1.83936208486557e-05, 1.9951723515987396e-05, 2.1509826183319092e-05, 2.3067928850650787e-05, 2.4626031517982483e-05, 2.618413418531418e-05, 2.7742236852645874e-05, 2.930033951997757e-05, 3.0858442187309265e-05, 3.241654485464096e-05, 3.3974647521972656e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 10.0, 12.0, 21.0, 21.0, 32.0, 37.0, 62.0, 105.0, 165.0, 249.0, 422.0, 701.0, 1285.0, 2485.0, 5369.0, 13566.0, 40479.0, 169521.0, 561103.0, 184145.0, 43317.0, 14034.0, 5588.0, 2537.0, 1419.0, 727.0, 413.0, 262.0, 164.0, 91.0, 66.0, 38.0, 21.0, 23.0, 22.0, 5.0, 4.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.046112060546875, -0.0446014404296875, -0.0430908203125, -0.0415802001953125, -0.040069580078125, -0.0385589599609375, -0.03704833984375, -0.0355377197265625, -0.034027099609375, -0.0325164794921875, -0.031005859375, -0.0294952392578125, -0.027984619140625, -0.0264739990234375, -0.02496337890625, -0.0234527587890625, -0.021942138671875, -0.0204315185546875, -0.0189208984375, -0.0174102783203125, -0.015899658203125, -0.0143890380859375, -0.01287841796875, -0.0113677978515625, -0.009857177734375, -0.0083465576171875, -0.0068359375, -0.0053253173828125, -0.003814697265625, -0.0023040771484375, -0.00079345703125, 0.0007171630859375, 0.002227783203125, 0.0037384033203125, 0.0052490234375, 0.0067596435546875, 0.008270263671875, 0.0097808837890625, 0.01129150390625, 0.0128021240234375, 0.014312744140625, 0.0158233642578125, 0.017333984375, 0.0188446044921875, 0.020355224609375, 0.0218658447265625, 0.02337646484375, 0.0248870849609375, 0.026397705078125, 0.0279083251953125, 0.0294189453125, 0.0309295654296875, 0.032440185546875, 0.0339508056640625, 0.03546142578125, 0.0369720458984375, 0.038482666015625, 0.0399932861328125, 0.04150390625, 0.0430145263671875, 0.044525146484375, 0.0460357666015625, 0.04754638671875, 0.0490570068359375, 0.050567626953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 15.0, 12.0, 25.0, 29.0, 41.0, 46.0, 56.0, 58.0, 81.0, 84.0, 87.0, 73.0, 66.0, 56.0, 58.0, 27.0, 32.0, 24.0, 30.0, 16.0, 9.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013031005859375, -0.012640237808227539, -0.012249469757080078, -0.011858701705932617, -0.011467933654785156, -0.011077165603637695, -0.010686397552490234, -0.010295629501342773, -0.009904861450195312, -0.009514093399047852, -0.00912332534790039, -0.00873255729675293, -0.008341789245605469, -0.007951021194458008, -0.007560253143310547, -0.007169485092163086, -0.006778717041015625, -0.006387948989868164, -0.005997180938720703, -0.005606412887573242, -0.005215644836425781, -0.00482487678527832, -0.004434108734130859, -0.0040433406829833984, -0.0036525726318359375, -0.0032618045806884766, -0.0028710365295410156, -0.0024802684783935547, -0.0020895004272460938, -0.0016987323760986328, -0.0013079643249511719, -0.0009171962738037109, -0.00052642822265625, -0.00013566017150878906, 0.0002551078796386719, 0.0006458759307861328, 0.0010366439819335938, 0.0014274120330810547, 0.0018181800842285156, 0.0022089481353759766, 0.0025997161865234375, 0.0029904842376708984, 0.0033812522888183594, 0.0037720203399658203, 0.004162788391113281, 0.004553556442260742, 0.004944324493408203, 0.005335092544555664, 0.005725860595703125, 0.006116628646850586, 0.006507396697998047, 0.006898164749145508, 0.007288932800292969, 0.00767970085144043, 0.00807046890258789, 0.008461236953735352, 0.008852005004882812, 0.009242773056030273, 0.009633541107177734, 0.010024309158325195, 0.010415077209472656, 0.010805845260620117, 0.011196613311767578, 0.011587381362915039, 0.0119781494140625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 11.0, 20.0, 76.0, 219.0, 443.0, 151.0, 42.0, 17.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.538624286651611, -5.421570777893066, -5.3045172691345215, -5.187463760375977, -5.070409774780273, -4.9533562660217285, -4.836302757263184, -4.719249248504639, -4.602195739746094, -4.485142230987549, -4.368088722229004, -4.251034736633301, -4.133981227874756, -4.016927719116211, -3.899874210357666, -3.782820701599121, -3.665766716003418, -3.548713207244873, -3.431659460067749, -3.314605951309204, -3.197552442550659, -3.080498695373535, -2.9634451866149902, -2.8463916778564453, -2.7293381690979004, -2.6122846603393555, -2.4952309131622314, -2.3781774044036865, -2.2611238956451416, -2.1440701484680176, -2.0270166397094727, -1.9099630117416382, -1.7929093837738037, -1.6758557558059692, -1.5588022470474243, -1.4417486190795898, -1.3246949911117554, -1.207641363143921, -1.090587854385376, -0.9735342264175415, -0.8564806580543518, -0.7394270896911621, -0.6223734617233276, -0.5053198933601379, -0.38826629519462585, -0.27121269702911377, -0.15415912866592407, -0.0371055006980896, 0.0799480676651001, 0.19700166583061218, 0.31405526399612427, 0.43110883235931396, 0.5481624603271484, 0.6652160286903381, 0.7822695970535278, 0.8993232250213623, 1.0163767337799072, 1.1334303617477417, 1.2504838705062866, 1.367537498474121, 1.4845911264419556, 1.60164475440979, 1.718698263168335, 1.8357518911361694, 1.952805519104004]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 10.0, 11.0, 26.0, 33.0, 39.0, 61.0, 84.0, 87.0, 101.0, 103.0, 105.0, 81.0, 74.0, 63.0, 37.0, 25.0, 16.0, 11.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8379266262054443, -1.7933305501937866, -1.7487343549728394, -1.7041382789611816, -1.6595420837402344, -1.6149460077285767, -1.570349931716919, -1.5257537364959717, -1.4811575412750244, -1.4365614652633667, -1.3919652700424194, -1.3473691940307617, -1.3027729988098145, -1.2581769227981567, -1.213580846786499, -1.1689846515655518, -1.124388575553894, -1.0797924995422363, -1.035196304321289, -0.9906002283096313, -0.9460040330886841, -0.9014079570770264, -0.8568118214607239, -0.8122156858444214, -0.7676195502281189, -0.7230234146118164, -0.6784272789955139, -0.6338311433792114, -0.5892350673675537, -0.5446388721466064, -0.5000427961349487, -0.45544666051864624, -0.41085052490234375, -0.36625438928604126, -0.32165825366973877, -0.27706214785575867, -0.23246601223945618, -0.1878698766231537, -0.14327377080917358, -0.0986776351928711, -0.054081499576568604, -0.00948537141084671, 0.03511075675487518, 0.07970687747001648, 0.12430301308631897, 0.16889914870262146, 0.21349525451660156, 0.25809139013290405, 0.30268752574920654, 0.34728366136550903, 0.3918797969818115, 0.4364759027957916, 0.4810720384120941, 0.5256681442260742, 0.5702642798423767, 0.6148604154586792, 0.6594565510749817, 0.7040526866912842, 0.7486488223075867, 0.7932449579238892, 0.8378410339355469, 0.8824372291564941, 0.9270333051681519, 0.9716294407844543, 1.0162255764007568]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 14.0, 16.0, 23.0, 35.0, 35.0, 57.0, 76.0, 106.0, 171.0, 255.0, 391.0, 586.0, 967.0, 1604.0, 2866.0, 5421.0, 11688.0, 31004.0, 206334.0, 692358.0, 60578.0, 17201.0, 7445.0, 3817.0, 2066.0, 1245.0, 767.0, 448.0, 285.0, 211.0, 135.0, 100.0, 57.0, 53.0, 33.0, 28.0, 18.0, 10.0, 8.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.17578125, -1.1403961181640625, -1.105010986328125, -1.0696258544921875, -1.03424072265625, -0.9988555908203125, -0.963470458984375, -0.9280853271484375, -0.8927001953125, -0.8573150634765625, -0.821929931640625, -0.7865447998046875, -0.75115966796875, -0.7157745361328125, -0.680389404296875, -0.6450042724609375, -0.609619140625, -0.5742340087890625, -0.538848876953125, -0.5034637451171875, -0.46807861328125, -0.4326934814453125, -0.397308349609375, -0.3619232177734375, -0.3265380859375, -0.2911529541015625, -0.255767822265625, -0.2203826904296875, -0.18499755859375, -0.1496124267578125, -0.114227294921875, -0.0788421630859375, -0.04345703125, -0.0080718994140625, 0.027313232421875, 0.0626983642578125, 0.09808349609375, 0.1334686279296875, 0.168853759765625, 0.2042388916015625, 0.2396240234375, 0.2750091552734375, 0.310394287109375, 0.3457794189453125, 0.38116455078125, 0.4165496826171875, 0.451934814453125, 0.4873199462890625, 0.522705078125, 0.5580902099609375, 0.593475341796875, 0.6288604736328125, 0.66424560546875, 0.6996307373046875, 0.735015869140625, 0.7704010009765625, 0.8057861328125, 0.8411712646484375, 0.876556396484375, 0.9119415283203125, 0.94732666015625, 0.9827117919921875, 1.018096923828125, 1.0534820556640625, 1.0888671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 7.0, 6.0, 8.0, 12.0, 19.0, 17.0, 34.0, 28.0, 50.0, 57.0, 51.0, 70.0, 77.0, 89.0, 83.0, 80.0, 64.0, 46.0, 43.0, 50.0, 27.0, 21.0, 14.0, 14.0, 5.0, 7.0, 9.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.117218017578125, -2.04302978515625, -1.968841552734375, -1.8946533203125, -1.820465087890625, -1.74627685546875, -1.672088623046875, -1.597900390625, -1.523712158203125, -1.44952392578125, -1.375335693359375, -1.3011474609375, -1.226959228515625, -1.15277099609375, -1.078582763671875, -1.00439453125, -0.930206298828125, -0.85601806640625, -0.781829833984375, -0.7076416015625, -0.633453369140625, -0.55926513671875, -0.485076904296875, -0.410888671875, -0.336700439453125, -0.26251220703125, -0.188323974609375, -0.1141357421875, -0.039947509765625, 0.03424072265625, 0.108428955078125, 0.1826171875, 0.256805419921875, 0.33099365234375, 0.405181884765625, 0.4793701171875, 0.553558349609375, 0.62774658203125, 0.701934814453125, 0.776123046875, 0.850311279296875, 0.92449951171875, 0.998687744140625, 1.0728759765625, 1.147064208984375, 1.22125244140625, 1.295440673828125, 1.36962890625, 1.443817138671875, 1.51800537109375, 1.592193603515625, 1.6663818359375, 1.740570068359375, 1.81475830078125, 1.888946533203125, 1.963134765625, 2.037322998046875, 2.11151123046875, 2.185699462890625, 2.2598876953125, 2.334075927734375, 2.40826416015625, 2.482452392578125, 2.556640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 10.0, 11.0, 12.0, 16.0, 29.0, 38.0, 43.0, 59.0, 98.0, 141.0, 241.0, 427.0, 845.0, 1945.0, 5255.0, 18788.0, 142750.0, 808032.0, 52579.0, 10753.0, 3432.0, 1420.0, 646.0, 342.0, 196.0, 117.0, 100.0, 57.0, 42.0, 31.0, 16.0, 16.0, 19.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.35577392578125, -1.3150634765625, -1.27435302734375, -1.233642578125, -1.19293212890625, -1.1522216796875, -1.11151123046875, -1.07080078125, -1.03009033203125, -0.9893798828125, -0.94866943359375, -0.907958984375, -0.86724853515625, -0.8265380859375, -0.78582763671875, -0.7451171875, -0.70440673828125, -0.6636962890625, -0.62298583984375, -0.582275390625, -0.54156494140625, -0.5008544921875, -0.46014404296875, -0.41943359375, -0.37872314453125, -0.3380126953125, -0.29730224609375, -0.256591796875, -0.21588134765625, -0.1751708984375, -0.13446044921875, -0.09375, -0.05303955078125, -0.0123291015625, 0.02838134765625, 0.069091796875, 0.10980224609375, 0.1505126953125, 0.19122314453125, 0.23193359375, 0.27264404296875, 0.3133544921875, 0.35406494140625, 0.394775390625, 0.43548583984375, 0.4761962890625, 0.51690673828125, 0.5576171875, 0.59832763671875, 0.6390380859375, 0.67974853515625, 0.720458984375, 0.76116943359375, 0.8018798828125, 0.84259033203125, 0.88330078125, 0.92401123046875, 0.9647216796875, 1.00543212890625, 1.046142578125, 1.08685302734375, 1.1275634765625, 1.16827392578125, 1.208984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 9.0, 4.0, 9.0, 10.0, 16.0, 11.0, 13.0, 16.0, 16.0, 19.0, 21.0, 24.0, 29.0, 19.0, 27.0, 35.0, 33.0, 40.0, 34.0, 39.0, 57.0, 45.0, 47.0, 48.0, 32.0, 29.0, 30.0, 27.0, 27.0, 24.0, 28.0, 18.0, 23.0, 27.0, 28.0, 13.0, 10.0, 12.0, 9.0, 8.0, 7.0, 8.0, 4.0, 9.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4931640625, -1.447998046875, -1.40283203125, -1.357666015625, -1.3125, -1.267333984375, -1.22216796875, -1.177001953125, -1.1318359375, -1.086669921875, -1.04150390625, -0.996337890625, -0.951171875, -0.906005859375, -0.86083984375, -0.815673828125, -0.7705078125, -0.725341796875, -0.68017578125, -0.635009765625, -0.58984375, -0.544677734375, -0.49951171875, -0.454345703125, -0.4091796875, -0.364013671875, -0.31884765625, -0.273681640625, -0.228515625, -0.183349609375, -0.13818359375, -0.093017578125, -0.0478515625, -0.002685546875, 0.04248046875, 0.087646484375, 0.1328125, 0.177978515625, 0.22314453125, 0.268310546875, 0.3134765625, 0.358642578125, 0.40380859375, 0.448974609375, 0.494140625, 0.539306640625, 0.58447265625, 0.629638671875, 0.6748046875, 0.719970703125, 0.76513671875, 0.810302734375, 0.85546875, 0.900634765625, 0.94580078125, 0.990966796875, 1.0361328125, 1.081298828125, 1.12646484375, 1.171630859375, 1.216796875, 1.261962890625, 1.30712890625, 1.352294921875, 1.3974609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 9.0, 13.0, 17.0, 15.0, 27.0, 33.0, 47.0, 104.0, 183.0, 345.0, 679.0, 1735.0, 5620.0, 28669.0, 892448.0, 102019.0, 11429.0, 3060.0, 1013.0, 465.0, 237.0, 128.0, 83.0, 65.0, 34.0, 18.0, 11.0, 14.0, 7.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.7358856201171875, -0.706146240234375, -0.6764068603515625, -0.64666748046875, -0.6169281005859375, -0.587188720703125, -0.5574493408203125, -0.5277099609375, -0.4979705810546875, -0.468231201171875, -0.4384918212890625, -0.40875244140625, -0.3790130615234375, -0.349273681640625, -0.3195343017578125, -0.289794921875, -0.2600555419921875, -0.230316162109375, -0.2005767822265625, -0.17083740234375, -0.1410980224609375, -0.111358642578125, -0.0816192626953125, -0.0518798828125, -0.0221405029296875, 0.007598876953125, 0.0373382568359375, 0.06707763671875, 0.0968170166015625, 0.126556396484375, 0.1562957763671875, 0.18603515625, 0.2157745361328125, 0.245513916015625, 0.2752532958984375, 0.30499267578125, 0.3347320556640625, 0.364471435546875, 0.3942108154296875, 0.4239501953125, 0.4536895751953125, 0.483428955078125, 0.5131683349609375, 0.54290771484375, 0.5726470947265625, 0.602386474609375, 0.6321258544921875, 0.661865234375, 0.6916046142578125, 0.721343994140625, 0.7510833740234375, 0.78082275390625, 0.8105621337890625, 0.840301513671875, 0.8700408935546875, 0.8997802734375, 0.9295196533203125, 0.959259033203125, 0.9889984130859375, 1.01873779296875, 1.0484771728515625, 1.078216552734375, 1.1079559326171875, 1.1376953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 27.0, 29.0, 66.0, 241.0, 414.0, 85.0, 42.0, 27.0, 16.0, 12.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002275705337524414, -0.00022274907678365707, -0.00021792761981487274, -0.0002131061628460884, -0.00020828470587730408, -0.00020346324890851974, -0.0001986417919397354, -0.00019382033497095108, -0.00018899887800216675, -0.00018417742103338242, -0.00017935596406459808, -0.00017453450709581375, -0.00016971305012702942, -0.0001648915931582451, -0.00016007013618946075, -0.00015524867922067642, -0.0001504272222518921, -0.00014560576528310776, -0.00014078430831432343, -0.0001359628513455391, -0.00013114139437675476, -0.00012631993740797043, -0.0001214984804391861, -0.00011667702347040176, -0.00011185556650161743, -0.0001070341095328331, -0.00010221265256404877, -9.739119559526443e-05, -9.25697386264801e-05, -8.774828165769577e-05, -8.292682468891144e-05, -7.81053677201271e-05, -7.328391075134277e-05, -6.846245378255844e-05, -6.364099681377411e-05, -5.8819539844989777e-05, -5.3998082876205444e-05, -4.917662590742111e-05, -4.435516893863678e-05, -3.953371196985245e-05, -3.4712255001068115e-05, -2.9890798032283783e-05, -2.506934106349945e-05, -2.024788409471512e-05, -1.5426427125930786e-05, -1.0604970157146454e-05, -5.783513188362122e-06, -9.620562195777893e-07, 3.859400749206543e-06, 8.680857717990875e-06, 1.3502314686775208e-05, 1.832377165555954e-05, 2.3145228624343872e-05, 2.7966685593128204e-05, 3.278814256191254e-05, 3.760959953069687e-05, 4.24310564994812e-05, 4.7252513468265533e-05, 5.2073970437049866e-05, 5.68954274058342e-05, 6.171688437461853e-05, 6.653834134340286e-05, 7.13597983121872e-05, 7.618125528097153e-05, 8.100271224975586e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 4.0, 5.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 20.0, 31.0, 48.0, 92.0, 156.0, 260.0, 512.0, 1051.0, 2506.0, 6495.0, 24248.0, 479521.0, 497582.0, 24652.0, 6736.0, 2417.0, 1052.0, 473.0, 232.0, 130.0, 75.0, 65.0, 40.0, 20.0, 21.0, 18.0, 8.0, 10.0, 8.0, 8.0, 6.0, 3.0, 5.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8100204467773438, -0.7875213623046875, -0.7650222778320312, -0.742523193359375, -0.7200241088867188, -0.6975250244140625, -0.6750259399414062, -0.65252685546875, -0.6300277709960938, -0.6075286865234375, -0.5850296020507812, -0.562530517578125, -0.5400314331054688, -0.5175323486328125, -0.49503326416015625, -0.4725341796875, -0.45003509521484375, -0.4275360107421875, -0.40503692626953125, -0.382537841796875, -0.36003875732421875, -0.3375396728515625, -0.31504058837890625, -0.29254150390625, -0.27004241943359375, -0.2475433349609375, -0.22504425048828125, -0.202545166015625, -0.18004608154296875, -0.1575469970703125, -0.13504791259765625, -0.112548828125, -0.09004974365234375, -0.0675506591796875, -0.04505157470703125, -0.022552490234375, -5.340576171875e-05, 0.0224456787109375, 0.04494476318359375, 0.06744384765625, 0.08994293212890625, 0.1124420166015625, 0.13494110107421875, 0.157440185546875, 0.17993927001953125, 0.2024383544921875, 0.22493743896484375, 0.2474365234375, 0.26993560791015625, 0.2924346923828125, 0.31493377685546875, 0.337432861328125, 0.35993194580078125, 0.3824310302734375, 0.40493011474609375, 0.42742919921875, 0.44992828369140625, 0.4724273681640625, 0.49492645263671875, 0.517425537109375, 0.5399246215820312, 0.5624237060546875, 0.5849227905273438, 0.607421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 0.0, 9.0, 7.0, 8.0, 6.0, 7.0, 23.0, 15.0, 19.0, 30.0, 57.0, 95.0, 278.0, 185.0, 78.0, 33.0, 38.0, 19.0, 20.0, 8.0, 10.0, 12.0, 12.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22328567504882812, -0.21463775634765625, -0.20598983764648438, -0.1973419189453125, -0.18869400024414062, -0.18004608154296875, -0.17139816284179688, -0.162750244140625, -0.15410232543945312, -0.14545440673828125, -0.13680648803710938, -0.1281585693359375, -0.11951065063476562, -0.11086273193359375, -0.10221481323242188, -0.09356689453125, -0.08491897583007812, -0.07627105712890625, -0.06762313842773438, -0.0589752197265625, -0.050327301025390625, -0.04167938232421875, -0.033031463623046875, -0.024383544921875, -0.015735626220703125, -0.00708770751953125, 0.001560211181640625, 0.0102081298828125, 0.018856048583984375, 0.02750396728515625, 0.036151885986328125, 0.0447998046875, 0.053447723388671875, 0.06209564208984375, 0.07074356079101562, 0.0793914794921875, 0.08803939819335938, 0.09668731689453125, 0.10533523559570312, 0.113983154296875, 0.12263107299804688, 0.13127899169921875, 0.13992691040039062, 0.1485748291015625, 0.15722274780273438, 0.16587066650390625, 0.17451858520507812, 0.18316650390625, 0.19181442260742188, 0.20046234130859375, 0.20911026000976562, 0.2177581787109375, 0.22640609741210938, 0.23505401611328125, 0.24370193481445312, 0.252349853515625, 0.2609977722167969, 0.26964569091796875, 0.2782936096191406, 0.2869415283203125, 0.2955894470214844, 0.30423736572265625, 0.3128852844238281, 0.321533203125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 37.0, 166.0, 544.0, 175.0, 46.0, 18.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5871992111206055, -5.2689971923828125, -4.9507951736450195, -4.632593631744385, -4.314391613006592, -3.996189594268799, -3.677987813949585, -3.359786033630371, -3.041584014892578, -2.723381996154785, -2.4051802158355713, -2.0869784355163574, -1.7687764167785645, -1.450574517250061, -1.1323726177215576, -0.8141708374023438, -0.4959688186645508, -0.17776691913604736, 0.14043498039245605, 0.4586368799209595, 0.7768387794494629, 1.0950406789779663, 1.4132425785064697, 1.7314443588256836, 2.0496463775634766, 2.3678483963012695, 2.6860501766204834, 3.0042519569396973, 3.3224539756774902, 3.640655994415283, 3.958857774734497, 4.277059555053711, 4.5952606201171875, 4.9134626388549805, 5.231664657592773, 5.549866199493408, 5.868068218231201, 6.186270236968994, 6.504471778869629, 6.822673797607422, 7.140875816345215, 7.459077835083008, 7.777279853820801, 8.095481872558594, 8.41368293762207, 8.731884956359863, 9.050086975097656, 9.36828899383545, 9.686491012573242, 10.004693031311035, 10.322895050048828, 10.641097068786621, 10.959299087524414, 11.27750015258789, 11.595702171325684, 11.913904190063477, 12.23210620880127, 12.550308227539062, 12.868510246276855, 13.186712265014648, 13.504913330078125, 13.823115348815918, 14.141317367553711, 14.459519386291504, 14.777721405029297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 9.0, 22.0, 20.0, 15.0, 21.0, 25.0, 34.0, 31.0, 22.0, 37.0, 32.0, 42.0, 45.0, 40.0, 45.0, 50.0, 48.0, 55.0, 51.0, 48.0, 31.0, 29.0, 39.0, 21.0, 23.0, 28.0, 27.0, 18.0, 15.0, 17.0, 9.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7176430225372314, -2.6250250339508057, -2.53240704536438, -2.439789295196533, -2.3471713066101074, -2.2545533180236816, -2.161935329437256, -2.06931734085083, -1.9766995906829834, -1.8840816020965576, -1.7914637327194214, -1.6988457441329956, -1.6062278747558594, -1.5136098861694336, -1.4209918975830078, -1.3283740282058716, -1.2357560396194458, -1.14313805103302, -1.0505201816558838, -0.957902193069458, -0.8652843236923218, -0.772666335105896, -0.680048406124115, -0.587430477142334, -0.494812548160553, -0.402194619178772, -0.30957669019699097, -0.21695873141288757, -0.12434080243110657, -0.03172287344932556, 0.06089508533477783, 0.15351301431655884, 0.24613094329833984, 0.33874887228012085, 0.43136680126190186, 0.5239847898483276, 0.6166026592254639, 0.7092206478118896, 0.8018385767936707, 0.8944565057754517, 0.9870744347572327, 1.0796923637390137, 1.1723103523254395, 1.2649282217025757, 1.3575462102890015, 1.4501640796661377, 1.5427820682525635, 1.6354000568389893, 1.7280179262161255, 1.8206359148025513, 1.9132537841796875, 2.0058717727661133, 2.098489761352539, 2.1911075115203857, 2.2837255001068115, 2.3763434886932373, 2.468961477279663, 2.561579465866089, 2.6541974544525146, 2.7468152046203613, 2.839433193206787, 2.932051181793213, 3.0246691703796387, 3.1172871589660645, 3.209904909133911]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 15.0, 21.0, 35.0, 53.0, 78.0, 146.0, 248.0, 621.0, 2846.0, 79248.0, 4097327.0, 11391.0, 1447.0, 404.0, 141.0, 97.0, 43.0, 43.0, 16.0, 13.0, 14.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4847412109375, -8.274169921875, -8.0635986328125, -7.85302734375, -7.6424560546875, -7.431884765625, -7.2213134765625, -7.0107421875, -6.8001708984375, -6.589599609375, -6.3790283203125, -6.16845703125, -5.9578857421875, -5.747314453125, -5.5367431640625, -5.326171875, -5.1156005859375, -4.905029296875, -4.6944580078125, -4.48388671875, -4.2733154296875, -4.062744140625, -3.8521728515625, -3.6416015625, -3.4310302734375, -3.220458984375, -3.0098876953125, -2.79931640625, -2.5887451171875, -2.378173828125, -2.1676025390625, -1.95703125, -1.7464599609375, -1.535888671875, -1.3253173828125, -1.11474609375, -0.9041748046875, -0.693603515625, -0.4830322265625, -0.2724609375, -0.0618896484375, 0.148681640625, 0.3592529296875, 0.56982421875, 0.7803955078125, 0.990966796875, 1.2015380859375, 1.412109375, 1.6226806640625, 1.833251953125, 2.0438232421875, 2.25439453125, 2.4649658203125, 2.675537109375, 2.8861083984375, 3.0966796875, 3.3072509765625, 3.517822265625, 3.7283935546875, 3.93896484375, 4.1495361328125, 4.360107421875, 4.5706787109375, 4.78125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 9.0, 15.0, 20.0, 26.0, 36.0, 49.0, 57.0, 79.0, 89.0, 113.0, 126.0, 86.0, 80.0, 64.0, 46.0, 34.0, 23.0, 18.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.2374420166015625, -2.179962158203125, -2.1224822998046875, -2.06500244140625, -2.0075225830078125, -1.950042724609375, -1.8925628662109375, -1.8350830078125, -1.7776031494140625, -1.720123291015625, -1.6626434326171875, -1.60516357421875, -1.5476837158203125, -1.490203857421875, -1.4327239990234375, -1.375244140625, -1.3177642822265625, -1.260284423828125, -1.2028045654296875, -1.14532470703125, -1.0878448486328125, -1.030364990234375, -0.9728851318359375, -0.9154052734375, -0.8579254150390625, -0.800445556640625, -0.7429656982421875, -0.68548583984375, -0.6280059814453125, -0.570526123046875, -0.5130462646484375, -0.45556640625, -0.3980865478515625, -0.340606689453125, -0.2831268310546875, -0.22564697265625, -0.1681671142578125, -0.110687255859375, -0.0532073974609375, 0.0042724609375, 0.0617523193359375, 0.119232177734375, 0.1767120361328125, 0.23419189453125, 0.2916717529296875, 0.349151611328125, 0.4066314697265625, 0.464111328125, 0.5215911865234375, 0.579071044921875, 0.6365509033203125, 0.69403076171875, 0.7515106201171875, 0.808990478515625, 0.8664703369140625, 0.9239501953125, 0.9814300537109375, 1.038909912109375, 1.0963897705078125, 1.15386962890625, 1.2113494873046875, 1.268829345703125, 1.3263092041015625, 1.3837890625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 3.0, 5.0, 8.0, 10.0, 10.0, 21.0, 30.0, 35.0, 73.0, 101.0, 158.0, 314.0, 554.0, 1172.0, 2778.0, 7993.0, 35155.0, 2764463.0, 1340196.0, 29375.0, 7044.0, 2490.0, 1096.0, 515.0, 255.0, 150.0, 84.0, 62.0, 41.0, 24.0, 16.0, 14.0, 9.0, 4.0, 10.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.84375, -2.7725830078125, -2.701416015625, -2.6302490234375, -2.55908203125, -2.4879150390625, -2.416748046875, -2.3455810546875, -2.2744140625, -2.2032470703125, -2.132080078125, -2.0609130859375, -1.98974609375, -1.9185791015625, -1.847412109375, -1.7762451171875, -1.705078125, -1.6339111328125, -1.562744140625, -1.4915771484375, -1.42041015625, -1.3492431640625, -1.278076171875, -1.2069091796875, -1.1357421875, -1.0645751953125, -0.993408203125, -0.9222412109375, -0.85107421875, -0.7799072265625, -0.708740234375, -0.6375732421875, -0.56640625, -0.4952392578125, -0.424072265625, -0.3529052734375, -0.28173828125, -0.2105712890625, -0.139404296875, -0.0682373046875, 0.0029296875, 0.0740966796875, 0.145263671875, 0.2164306640625, 0.28759765625, 0.3587646484375, 0.429931640625, 0.5010986328125, 0.572265625, 0.6434326171875, 0.714599609375, 0.7857666015625, 0.85693359375, 0.9281005859375, 0.999267578125, 1.0704345703125, 1.1416015625, 1.2127685546875, 1.283935546875, 1.3551025390625, 1.42626953125, 1.4974365234375, 1.568603515625, 1.6397705078125, 1.7109375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 11.0, 11.0, 18.0, 19.0, 54.0, 111.0, 310.0, 900.0, 1506.0, 613.0, 236.0, 91.0, 46.0, 26.0, 23.0, 19.0, 13.0, 13.0, 4.0, 4.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.4361114501953125, -0.416656494140625, -0.3972015380859375, -0.37774658203125, -0.3582916259765625, -0.338836669921875, -0.3193817138671875, -0.2999267578125, -0.2804718017578125, -0.261016845703125, -0.2415618896484375, -0.22210693359375, -0.2026519775390625, -0.183197021484375, -0.1637420654296875, -0.144287109375, -0.1248321533203125, -0.105377197265625, -0.0859222412109375, -0.06646728515625, -0.0470123291015625, -0.027557373046875, -0.0081024169921875, 0.0113525390625, 0.0308074951171875, 0.050262451171875, 0.0697174072265625, 0.08917236328125, 0.1086273193359375, 0.128082275390625, 0.1475372314453125, 0.1669921875, 0.1864471435546875, 0.205902099609375, 0.2253570556640625, 0.24481201171875, 0.2642669677734375, 0.283721923828125, 0.3031768798828125, 0.3226318359375, 0.3420867919921875, 0.361541748046875, 0.3809967041015625, 0.40045166015625, 0.4199066162109375, 0.439361572265625, 0.4588165283203125, 0.478271484375, 0.4977264404296875, 0.517181396484375, 0.5366363525390625, 0.55609130859375, 0.5755462646484375, 0.595001220703125, 0.6144561767578125, 0.6339111328125, 0.6533660888671875, 0.672821044921875, 0.6922760009765625, 0.71173095703125, 0.7311859130859375, 0.750640869140625, 0.7700958251953125, 0.78955078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 16.0, 6.0, 13.0, 16.0, 30.0, 68.0, 112.0, 182.0, 240.0, 133.0, 74.0, 36.0, 24.0, 20.0, 12.0, 3.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.897313117980957, -2.8127846717834473, -2.7282562255859375, -2.6437277793884277, -2.559199571609497, -2.4746711254119873, -2.3901426792144775, -2.3056142330169678, -2.221086025238037, -2.1365575790405273, -2.0520291328430176, -1.9675008058547974, -1.8829724788665771, -1.7984440326690674, -1.7139155864715576, -1.6293871402740479, -1.544858694076538, -1.4603302478790283, -1.375801920890808, -1.2912734746932983, -1.2067451477050781, -1.1222167015075684, -1.0376882553100586, -0.9531598687171936, -0.8686314821243286, -0.7841030955314636, -0.6995747089385986, -0.6150462627410889, -0.5305178761482239, -0.4459894895553589, -0.3614610433578491, -0.27693265676498413, -0.19240450859069824, -0.10787610709667206, -0.023347705602645874, 0.061180710792541504, 0.1457090973854065, 0.23023748397827148, 0.31476593017578125, 0.39929431676864624, 0.48382270336151123, 0.5683510899543762, 0.6528794765472412, 0.737407922744751, 0.821936309337616, 0.906464695930481, 0.9909931421279907, 1.075521469116211, 1.1600499153137207, 1.2445783615112305, 1.3291066884994507, 1.4136351346969604, 1.4981634616851807, 1.5826919078826904, 1.6672203540802002, 1.75174880027771, 1.8362771272659302, 1.92080557346344, 2.00533390045166, 2.08986234664917, 2.1743907928466797, 2.2589192390441895, 2.343447685241699, 2.42797589302063, 2.5125043392181396]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 13.0, 18.0, 27.0, 34.0, 35.0, 57.0, 51.0, 66.0, 78.0, 85.0, 74.0, 69.0, 76.0, 71.0, 48.0, 42.0, 36.0, 35.0, 31.0, 20.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.907869815826416, -1.8558416366577148, -1.8038134574890137, -1.7517852783203125, -1.6997569799423218, -1.6477288007736206, -1.5957006216049194, -1.5436724424362183, -1.491644263267517, -1.439616084098816, -1.3875879049301147, -1.335559606552124, -1.2835314273834229, -1.2315032482147217, -1.1794750690460205, -1.1274468898773193, -1.0754187107086182, -1.023390531539917, -0.971362292766571, -0.9193341135978699, -0.8673059344291687, -0.8152776956558228, -0.7632495164871216, -0.7112213373184204, -0.6591930389404297, -0.6071648597717285, -0.5551366209983826, -0.5031084418296814, -0.4510802626609802, -0.39905205368995667, -0.3470238447189331, -0.29499566555023193, -0.24296748638153076, -0.1909392923116684, -0.13891109824180603, -0.08688288927078247, -0.034854695200920105, 0.01717349886894226, 0.06920170783996582, 0.12122988700866699, 0.17325809597969055, 0.22528629004955292, 0.2773144841194153, 0.32934269309043884, 0.3813709020614624, 0.4333990812301636, 0.48542729020118713, 0.5374554395675659, 0.5894836783409119, 0.641511857509613, 0.693540096282959, 0.7455682754516602, 0.7975964546203613, 0.8496246337890625, 0.9016528725624084, 0.9536810517311096, 1.0057092905044556, 1.0577374696731567, 1.109765648841858, 1.1617939472198486, 1.2138221263885498, 1.265850305557251, 1.3178784847259521, 1.3699066638946533, 1.4219348430633545]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 13.0, 11.0, 29.0, 44.0, 73.0, 90.0, 170.0, 293.0, 606.0, 1302.0, 3725.0, 15752.0, 146734.0, 784529.0, 79224.0, 10818.0, 2946.0, 1075.0, 502.0, 263.0, 141.0, 79.0, 46.0, 21.0, 19.0, 9.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.2967987060546875, -0.283538818359375, -0.2702789306640625, -0.25701904296875, -0.2437591552734375, -0.230499267578125, -0.2172393798828125, -0.2039794921875, -0.1907196044921875, -0.177459716796875, -0.1641998291015625, -0.15093994140625, -0.1376800537109375, -0.124420166015625, -0.1111602783203125, -0.097900390625, -0.0846405029296875, -0.071380615234375, -0.0581207275390625, -0.04486083984375, -0.0316009521484375, -0.018341064453125, -0.0050811767578125, 0.0081787109375, 0.0214385986328125, 0.034698486328125, 0.0479583740234375, 0.06121826171875, 0.0744781494140625, 0.087738037109375, 0.1009979248046875, 0.1142578125, 0.1275177001953125, 0.140777587890625, 0.1540374755859375, 0.16729736328125, 0.1805572509765625, 0.193817138671875, 0.2070770263671875, 0.2203369140625, 0.2335968017578125, 0.246856689453125, 0.2601165771484375, 0.27337646484375, 0.2866363525390625, 0.299896240234375, 0.3131561279296875, 0.326416015625, 0.3396759033203125, 0.352935791015625, 0.3661956787109375, 0.37945556640625, 0.3927154541015625, 0.405975341796875, 0.4192352294921875, 0.4324951171875, 0.4457550048828125, 0.459014892578125, 0.4722747802734375, 0.48553466796875, 0.4987945556640625, 0.512054443359375, 0.5253143310546875, 0.53857421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 11.0, 13.0, 15.0, 39.0, 28.0, 56.0, 59.0, 75.0, 106.0, 103.0, 100.0, 83.0, 85.0, 56.0, 49.0, 39.0, 29.0, 25.0, 4.0, 4.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.7196197509765625, -1.675567626953125, -1.6315155029296875, -1.58746337890625, -1.5434112548828125, -1.499359130859375, -1.4553070068359375, -1.4112548828125, -1.3672027587890625, -1.323150634765625, -1.2790985107421875, -1.23504638671875, -1.1909942626953125, -1.146942138671875, -1.1028900146484375, -1.058837890625, -1.0147857666015625, -0.970733642578125, -0.9266815185546875, -0.88262939453125, -0.8385772705078125, -0.794525146484375, -0.7504730224609375, -0.7064208984375, -0.6623687744140625, -0.618316650390625, -0.5742645263671875, -0.53021240234375, -0.4861602783203125, -0.442108154296875, -0.3980560302734375, -0.35400390625, -0.3099517822265625, -0.265899658203125, -0.2218475341796875, -0.17779541015625, -0.1337432861328125, -0.089691162109375, -0.0456390380859375, -0.0015869140625, 0.0424652099609375, 0.086517333984375, 0.1305694580078125, 0.17462158203125, 0.2186737060546875, 0.262725830078125, 0.3067779541015625, 0.350830078125, 0.3948822021484375, 0.438934326171875, 0.4829864501953125, 0.52703857421875, 0.5710906982421875, 0.615142822265625, 0.6591949462890625, 0.7032470703125, 0.7472991943359375, 0.791351318359375, 0.8354034423828125, 0.87945556640625, 0.9235076904296875, 0.967559814453125, 1.0116119384765625, 1.0556640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 16.0, 15.0, 11.0, 18.0, 30.0, 56.0, 63.0, 102.0, 161.0, 192.0, 328.0, 447.0, 740.0, 1143.0, 1885.0, 3493.0, 7001.0, 16099.0, 42615.0, 144353.0, 472674.0, 247016.0, 66114.0, 23128.0, 9718.0, 4658.0, 2493.0, 1371.0, 893.0, 523.0, 382.0, 223.0, 152.0, 126.0, 83.0, 68.0, 49.0, 20.0, 19.0, 20.0, 18.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15652084350585938, -0.15142059326171875, -0.14632034301757812, -0.1412200927734375, -0.13611984252929688, -0.13101959228515625, -0.12591934204101562, -0.120819091796875, -0.11571884155273438, -0.11061859130859375, -0.10551834106445312, -0.1004180908203125, -0.09531784057617188, -0.09021759033203125, -0.08511734008789062, -0.08001708984375, -0.07491683959960938, -0.06981658935546875, -0.06471633911132812, -0.0596160888671875, -0.054515838623046875, -0.04941558837890625, -0.044315338134765625, -0.039215087890625, -0.034114837646484375, -0.02901458740234375, -0.023914337158203125, -0.0188140869140625, -0.013713836669921875, -0.00861358642578125, -0.003513336181640625, 0.0015869140625, 0.006687164306640625, 0.01178741455078125, 0.016887664794921875, 0.0219879150390625, 0.027088165283203125, 0.03218841552734375, 0.037288665771484375, 0.042388916015625, 0.047489166259765625, 0.05258941650390625, 0.057689666748046875, 0.0627899169921875, 0.06789016723632812, 0.07299041748046875, 0.07809066772460938, 0.08319091796875, 0.08829116821289062, 0.09339141845703125, 0.09849166870117188, 0.1035919189453125, 0.10869216918945312, 0.11379241943359375, 0.11889266967773438, 0.123992919921875, 0.12909317016601562, 0.13419342041015625, 0.13929367065429688, 0.1443939208984375, 0.14949417114257812, 0.15459442138671875, 0.15969467163085938, 0.164794921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 7.0, 9.0, 13.0, 8.0, 12.0, 13.0, 23.0, 28.0, 25.0, 32.0, 35.0, 33.0, 31.0, 43.0, 52.0, 38.0, 53.0, 38.0, 42.0, 52.0, 51.0, 34.0, 39.0, 33.0, 33.0, 24.0, 29.0, 22.0, 17.0, 17.0, 18.0, 17.0, 11.0, 12.0, 9.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1953125, -1.15576171875, -1.1162109375, -1.07666015625, -1.037109375, -0.99755859375, -0.9580078125, -0.91845703125, -0.87890625, -0.83935546875, -0.7998046875, -0.76025390625, -0.720703125, -0.68115234375, -0.6416015625, -0.60205078125, -0.5625, -0.52294921875, -0.4833984375, -0.44384765625, -0.404296875, -0.36474609375, -0.3251953125, -0.28564453125, -0.24609375, -0.20654296875, -0.1669921875, -0.12744140625, -0.087890625, -0.04833984375, -0.0087890625, 0.03076171875, 0.0703125, 0.10986328125, 0.1494140625, 0.18896484375, 0.228515625, 0.26806640625, 0.3076171875, 0.34716796875, 0.38671875, 0.42626953125, 0.4658203125, 0.50537109375, 0.544921875, 0.58447265625, 0.6240234375, 0.66357421875, 0.703125, 0.74267578125, 0.7822265625, 0.82177734375, 0.861328125, 0.90087890625, 0.9404296875, 0.97998046875, 1.01953125, 1.05908203125, 1.0986328125, 1.13818359375, 1.177734375, 1.21728515625, 1.2568359375, 1.29638671875, 1.3359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 7.0, 12.0, 16.0, 18.0, 16.0, 20.0, 39.0, 50.0, 84.0, 109.0, 167.0, 244.0, 440.0, 701.0, 1223.0, 2083.0, 4150.0, 9221.0, 25285.0, 101484.0, 531550.0, 289017.0, 52666.0, 16187.0, 6436.0, 3086.0, 1655.0, 958.0, 542.0, 349.0, 220.0, 159.0, 101.0, 56.0, 49.0, 36.0, 27.0, 30.0, 17.0, 8.0, 6.0, 8.0, 6.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.051971435546875, -0.05038642883300781, -0.048801422119140625, -0.04721641540527344, -0.04563140869140625, -0.04404640197753906, -0.042461395263671875, -0.04087638854980469, -0.0392913818359375, -0.03770637512207031, -0.036121368408203125, -0.03453636169433594, -0.03295135498046875, -0.03136634826660156, -0.029781341552734375, -0.028196334838867188, -0.026611328125, -0.025026321411132812, -0.023441314697265625, -0.021856307983398438, -0.02027130126953125, -0.018686294555664062, -0.017101287841796875, -0.015516281127929688, -0.0139312744140625, -0.012346267700195312, -0.010761260986328125, -0.009176254272460938, -0.00759124755859375, -0.0060062408447265625, -0.004421234130859375, -0.0028362274169921875, -0.001251220703125, 0.0003337860107421875, 0.001918792724609375, 0.0035037994384765625, 0.00508880615234375, 0.0066738128662109375, 0.008258819580078125, 0.009843826293945312, 0.0114288330078125, 0.013013839721679688, 0.014598846435546875, 0.016183853149414062, 0.01776885986328125, 0.019353866577148438, 0.020938873291015625, 0.022523880004882812, 0.02410888671875, 0.025693893432617188, 0.027278900146484375, 0.028863906860351562, 0.03044891357421875, 0.03203392028808594, 0.033618927001953125, 0.03520393371582031, 0.0367889404296875, 0.03837394714355469, 0.039958953857421875, 0.04154396057128906, 0.04312896728515625, 0.04471397399902344, 0.046298980712890625, 0.04788398742675781, 0.049468994140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 18.0, 26.0, 49.0, 94.0, 118.0, 154.0, 163.0, 113.0, 80.0, 46.0, 32.0, 30.0, 13.0, 7.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2988529205322266e-05, -5.137734115123749e-05, -4.976615309715271e-05, -4.815496504306793e-05, -4.6543776988983154e-05, -4.4932588934898376e-05, -4.33214008808136e-05, -4.171021282672882e-05, -4.009902477264404e-05, -3.8487836718559265e-05, -3.687664866447449e-05, -3.526546061038971e-05, -3.365427255630493e-05, -3.2043084502220154e-05, -3.0431896448135376e-05, -2.8820708394050598e-05, -2.720952033996582e-05, -2.5598332285881042e-05, -2.3987144231796265e-05, -2.2375956177711487e-05, -2.076476812362671e-05, -1.915358006954193e-05, -1.7542392015457153e-05, -1.5931203961372375e-05, -1.4320015907287598e-05, -1.270882785320282e-05, -1.1097639799118042e-05, -9.486451745033264e-06, -7.875263690948486e-06, -6.2640756368637085e-06, -4.652887582778931e-06, -3.041699528694153e-06, -1.430511474609375e-06, 1.8067657947540283e-07, 1.7918646335601807e-06, 3.4030526876449585e-06, 5.014240741729736e-06, 6.625428795814514e-06, 8.236616849899292e-06, 9.84780490398407e-06, 1.1458992958068848e-05, 1.3070181012153625e-05, 1.4681369066238403e-05, 1.629255712032318e-05, 1.790374517440796e-05, 1.9514933228492737e-05, 2.1126121282577515e-05, 2.2737309336662292e-05, 2.434849739074707e-05, 2.5959685444831848e-05, 2.7570873498916626e-05, 2.9182061553001404e-05, 3.079324960708618e-05, 3.240443766117096e-05, 3.401562571525574e-05, 3.5626813769340515e-05, 3.723800182342529e-05, 3.884918987751007e-05, 4.046037793159485e-05, 4.2071565985679626e-05, 4.3682754039764404e-05, 4.529394209384918e-05, 4.690513014793396e-05, 4.851631820201874e-05, 5.0127506256103516e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 13.0, 13.0, 20.0, 20.0, 40.0, 57.0, 68.0, 114.0, 129.0, 227.0, 351.0, 586.0, 925.0, 1762.0, 3307.0, 6981.0, 16810.0, 49474.0, 189472.0, 495007.0, 198672.0, 51857.0, 17590.0, 7307.0, 3398.0, 1762.0, 961.0, 569.0, 374.0, 210.0, 144.0, 94.0, 76.0, 42.0, 35.0, 20.0, 17.0, 11.0, 11.0, 4.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.04522705078125, -0.04391670227050781, -0.042606353759765625, -0.04129600524902344, -0.03998565673828125, -0.03867530822753906, -0.037364959716796875, -0.03605461120605469, -0.0347442626953125, -0.03343391418457031, -0.032123565673828125, -0.030813217163085938, -0.02950286865234375, -0.028192520141601562, -0.026882171630859375, -0.025571823120117188, -0.024261474609375, -0.022951126098632812, -0.021640777587890625, -0.020330429077148438, -0.01902008056640625, -0.017709732055664062, -0.016399383544921875, -0.015089035034179688, -0.0137786865234375, -0.012468338012695312, -0.011157989501953125, -0.009847640991210938, -0.00853729248046875, -0.0072269439697265625, -0.005916595458984375, -0.0046062469482421875, -0.0032958984375, -0.0019855499267578125, -0.000675201416015625, 0.0006351470947265625, 0.00194549560546875, 0.0032558441162109375, 0.004566192626953125, 0.0058765411376953125, 0.0071868896484375, 0.008497238159179688, 0.009807586669921875, 0.011117935180664062, 0.01242828369140625, 0.013738632202148438, 0.015048980712890625, 0.016359329223632812, 0.017669677734375, 0.018980026245117188, 0.020290374755859375, 0.021600723266601562, 0.02291107177734375, 0.024221420288085938, 0.025531768798828125, 0.026842117309570312, 0.0281524658203125, 0.029462814331054688, 0.030773162841796875, 0.03208351135253906, 0.03339385986328125, 0.03470420837402344, 0.036014556884765625, 0.03732490539550781, 0.03863525390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 12.0, 2.0, 13.0, 17.0, 28.0, 27.0, 46.0, 37.0, 52.0, 64.0, 70.0, 69.0, 78.0, 90.0, 62.0, 74.0, 38.0, 42.0, 29.0, 24.0, 25.0, 22.0, 10.0, 17.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010894775390625, -0.010493159294128418, -0.010091543197631836, -0.009689927101135254, -0.009288311004638672, -0.00888669490814209, -0.008485078811645508, -0.008083462715148926, -0.007681846618652344, -0.007280230522155762, -0.00687861442565918, -0.006476998329162598, -0.006075382232666016, -0.005673766136169434, -0.0052721500396728516, -0.0048705339431762695, -0.0044689178466796875, -0.0040673017501831055, -0.0036656856536865234, -0.0032640695571899414, -0.0028624534606933594, -0.0024608373641967773, -0.0020592212677001953, -0.0016576051712036133, -0.0012559890747070312, -0.0008543729782104492, -0.0004527568817138672, -5.1140785217285156e-05, 0.0003504753112792969, 0.0007520914077758789, 0.001153707504272461, 0.001555323600769043, 0.001956939697265625, 0.002358555793762207, 0.002760171890258789, 0.003161787986755371, 0.003563404083251953, 0.003965020179748535, 0.004366636276245117, 0.004768252372741699, 0.005169868469238281, 0.005571484565734863, 0.005973100662231445, 0.006374716758728027, 0.006776332855224609, 0.007177948951721191, 0.0075795650482177734, 0.007981181144714355, 0.008382797241210938, 0.00878441333770752, 0.009186029434204102, 0.009587645530700684, 0.009989261627197266, 0.010390877723693848, 0.01079249382019043, 0.011194109916687012, 0.011595726013183594, 0.011997342109680176, 0.012398958206176758, 0.01280057430267334, 0.013202190399169922, 0.013603806495666504, 0.014005422592163086, 0.014407038688659668, 0.01480865478515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 31.0, 54.0, 267.0, 478.0, 112.0, 37.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.457675933837891, -4.319665431976318, -4.181655406951904, -4.043644905090332, -3.905634641647339, -3.7676243782043457, -3.6296138763427734, -3.4916036128997803, -3.353593349456787, -3.215583086013794, -3.077572822570801, -2.9395623207092285, -2.8015520572662354, -2.663541793823242, -2.52553129196167, -2.3875210285186768, -2.2495107650756836, -2.1115005016326904, -1.9734901189804077, -1.835479736328125, -1.6974694728851318, -1.5594592094421387, -1.421448826789856, -1.2834384441375732, -1.14542818069458, -1.007417917251587, -0.8694075345993042, -0.7313972115516663, -0.5933868885040283, -0.4553765654563904, -0.31736624240875244, -0.1793559193611145, -0.04134511947631836, 0.09666520357131958, 0.23467552661895752, 0.37268584966659546, 0.5106961727142334, 0.6487064957618713, 0.7867168188095093, 0.9247271418571472, 1.0627374649047852, 1.2007477283477783, 1.338758111000061, 1.4767684936523438, 1.614778757095337, 1.75278902053833, 1.8907994031906128, 2.0288097858428955, 2.1668200492858887, 2.304830312728882, 2.442840576171875, 2.5808510780334473, 2.7188613414764404, 2.8568716049194336, 2.994882106781006, 3.132892370223999, 3.270902633666992, 3.4089128971099854, 3.5469231605529785, 3.684933662414551, 3.822943925857544, 3.960954189300537, 4.098964691162109, 4.236974716186523, 4.374985218048096]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 13.0, 19.0, 24.0, 51.0, 44.0, 75.0, 80.0, 102.0, 99.0, 104.0, 95.0, 78.0, 65.0, 43.0, 34.0, 35.0, 10.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8624941110610962, -1.8180227279663086, -1.7735512256622314, -1.7290798425674438, -1.6846084594726562, -1.640136957168579, -1.5956655740737915, -1.551194190979004, -1.5067226886749268, -1.4622513055801392, -1.417779803276062, -1.3733084201812744, -1.3288370370864868, -1.2843656539916992, -1.239894151687622, -1.1954227685928345, -1.1509513854980469, -1.1064800024032593, -1.0620085000991821, -1.0175371170043945, -0.9730657339096069, -0.9285942912101746, -0.8841228485107422, -0.8396514654159546, -0.7951800227165222, -0.7507085800170898, -0.7062371969223022, -0.6617657542228699, -0.6172943115234375, -0.5728229284286499, -0.5283514857292175, -0.48388007283210754, -0.4394086003303528, -0.3949371874332428, -0.3504657745361328, -0.30599433183670044, -0.26152291893959045, -0.21705150604248047, -0.1725800633430481, -0.1281086504459381, -0.08363723754882812, -0.03916581720113754, 0.0053056031465530396, 0.04977703094482422, 0.0942484438419342, 0.1387198567390442, 0.18319129943847656, 0.22766271233558655, 0.27213412523269653, 0.3166055381298065, 0.3610769510269165, 0.4055483937263489, 0.45001980662345886, 0.49449121952056885, 0.5389626622200012, 0.5834341049194336, 0.6279054880142212, 0.6723769307136536, 0.7168483138084412, 0.7613197565078735, 0.8057911396026611, 0.8502625823020935, 0.8947340250015259, 0.9392054080963135, 0.9836768507957458]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 12.0, 9.0, 17.0, 28.0, 39.0, 71.0, 125.0, 198.0, 386.0, 860.0, 2464.0, 11431.0, 390462.0, 624198.0, 13527.0, 2881.0, 949.0, 369.0, 200.0, 115.0, 76.0, 47.0, 31.0, 18.0, 14.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7783203125, -1.727569580078125, -1.67681884765625, -1.626068115234375, -1.5753173828125, -1.524566650390625, -1.47381591796875, -1.423065185546875, -1.372314453125, -1.321563720703125, -1.27081298828125, -1.220062255859375, -1.1693115234375, -1.118560791015625, -1.06781005859375, -1.017059326171875, -0.96630859375, -0.915557861328125, -0.86480712890625, -0.814056396484375, -0.7633056640625, -0.712554931640625, -0.66180419921875, -0.611053466796875, -0.560302734375, -0.509552001953125, -0.45880126953125, -0.408050537109375, -0.3572998046875, -0.306549072265625, -0.25579833984375, -0.205047607421875, -0.154296875, -0.103546142578125, -0.05279541015625, -0.002044677734375, 0.0487060546875, 0.099456787109375, 0.15020751953125, 0.200958251953125, 0.251708984375, 0.302459716796875, 0.35321044921875, 0.403961181640625, 0.4547119140625, 0.505462646484375, 0.55621337890625, 0.606964111328125, 0.65771484375, 0.708465576171875, 0.75921630859375, 0.809967041015625, 0.8607177734375, 0.911468505859375, 0.96221923828125, 1.012969970703125, 1.063720703125, 1.114471435546875, 1.16522216796875, 1.215972900390625, 1.2667236328125, 1.317474365234375, 1.36822509765625, 1.418975830078125, 1.4697265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 28.0, 39.0, 38.0, 56.0, 69.0, 89.0, 83.0, 95.0, 91.0, 75.0, 67.0, 60.0, 47.0, 31.0, 25.0, 25.0, 15.0, 3.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.56219482421875, -2.4837646484375, -2.40533447265625, -2.326904296875, -2.24847412109375, -2.1700439453125, -2.09161376953125, -2.01318359375, -1.93475341796875, -1.8563232421875, -1.77789306640625, -1.699462890625, -1.62103271484375, -1.5426025390625, -1.46417236328125, -1.3857421875, -1.30731201171875, -1.2288818359375, -1.15045166015625, -1.072021484375, -0.99359130859375, -0.9151611328125, -0.83673095703125, -0.75830078125, -0.67987060546875, -0.6014404296875, -0.52301025390625, -0.444580078125, -0.36614990234375, -0.2877197265625, -0.20928955078125, -0.130859375, -0.05242919921875, 0.0260009765625, 0.10443115234375, 0.182861328125, 0.26129150390625, 0.3397216796875, 0.41815185546875, 0.49658203125, 0.57501220703125, 0.6534423828125, 0.73187255859375, 0.810302734375, 0.88873291015625, 0.9671630859375, 1.04559326171875, 1.1240234375, 1.20245361328125, 1.2808837890625, 1.35931396484375, 1.437744140625, 1.51617431640625, 1.5946044921875, 1.67303466796875, 1.75146484375, 1.82989501953125, 1.9083251953125, 1.98675537109375, 2.065185546875, 2.14361572265625, 2.2220458984375, 2.30047607421875, 2.37890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 10.0, 3.0, 10.0, 4.0, 16.0, 13.0, 21.0, 25.0, 31.0, 66.0, 92.0, 125.0, 220.0, 314.0, 591.0, 975.0, 1654.0, 3594.0, 10190.0, 99596.0, 873907.0, 43284.0, 7294.0, 2893.0, 1432.0, 794.0, 486.0, 283.0, 189.0, 133.0, 77.0, 62.0, 44.0, 34.0, 20.0, 13.0, 10.0, 16.0, 9.0, 5.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.0166015625, -0.9870223999023438, -0.9574432373046875, -0.9278640747070312, -0.898284912109375, -0.8687057495117188, -0.8391265869140625, -0.8095474243164062, -0.77996826171875, -0.7503890991210938, -0.7208099365234375, -0.6912307739257812, -0.661651611328125, -0.6320724487304688, -0.6024932861328125, -0.5729141235351562, -0.5433349609375, -0.5137557983398438, -0.4841766357421875, -0.45459747314453125, -0.425018310546875, -0.39543914794921875, -0.3658599853515625, -0.33628082275390625, -0.30670166015625, -0.27712249755859375, -0.2475433349609375, -0.21796417236328125, -0.188385009765625, -0.15880584716796875, -0.1292266845703125, -0.09964752197265625, -0.070068359375, -0.04048919677734375, -0.0109100341796875, 0.01866912841796875, 0.048248291015625, 0.07782745361328125, 0.1074066162109375, 0.13698577880859375, 0.16656494140625, 0.19614410400390625, 0.2257232666015625, 0.25530242919921875, 0.284881591796875, 0.31446075439453125, 0.3440399169921875, 0.37361907958984375, 0.4031982421875, 0.43277740478515625, 0.4623565673828125, 0.49193572998046875, 0.521514892578125, 0.5510940551757812, 0.5806732177734375, 0.6102523803710938, 0.63983154296875, 0.6694107055664062, 0.6989898681640625, 0.7285690307617188, 0.758148193359375, 0.7877273559570312, 0.8173065185546875, 0.8468856811523438, 0.87646484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 12.0, 23.0, 10.0, 14.0, 15.0, 25.0, 26.0, 28.0, 41.0, 37.0, 44.0, 42.0, 43.0, 47.0, 38.0, 36.0, 38.0, 35.0, 41.0, 46.0, 34.0, 52.0, 34.0, 16.0, 25.0, 30.0, 25.0, 16.0, 17.0, 13.0, 14.0, 17.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.4248809814453125, -1.377105712890625, -1.3293304443359375, -1.28155517578125, -1.2337799072265625, -1.186004638671875, -1.1382293701171875, -1.0904541015625, -1.0426788330078125, -0.994903564453125, -0.9471282958984375, -0.89935302734375, -0.8515777587890625, -0.803802490234375, -0.7560272216796875, -0.708251953125, -0.6604766845703125, -0.612701416015625, -0.5649261474609375, -0.51715087890625, -0.4693756103515625, -0.421600341796875, -0.3738250732421875, -0.3260498046875, -0.2782745361328125, -0.230499267578125, -0.1827239990234375, -0.13494873046875, -0.0871734619140625, -0.039398193359375, 0.0083770751953125, 0.05615234375, 0.1039276123046875, 0.151702880859375, 0.1994781494140625, 0.24725341796875, 0.2950286865234375, 0.342803955078125, 0.3905792236328125, 0.4383544921875, 0.4861297607421875, 0.533905029296875, 0.5816802978515625, 0.62945556640625, 0.6772308349609375, 0.725006103515625, 0.7727813720703125, 0.820556640625, 0.8683319091796875, 0.916107177734375, 0.9638824462890625, 1.01165771484375, 1.0594329833984375, 1.107208251953125, 1.1549835205078125, 1.2027587890625, 1.2505340576171875, 1.298309326171875, 1.3460845947265625, 1.39385986328125, 1.4416351318359375, 1.489410400390625, 1.5371856689453125, 1.5849609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 12.0, 16.0, 14.0, 25.0, 51.0, 58.0, 96.0, 222.0, 423.0, 1072.0, 3416.0, 21238.0, 895455.0, 115656.0, 7585.0, 1873.0, 647.0, 307.0, 139.0, 108.0, 43.0, 27.0, 19.0, 12.0, 12.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6549148559570312, -0.6355133056640625, -0.6161117553710938, -0.596710205078125, -0.5773086547851562, -0.5579071044921875, -0.5385055541992188, -0.51910400390625, -0.49970245361328125, -0.4803009033203125, -0.46089935302734375, -0.441497802734375, -0.42209625244140625, -0.4026947021484375, -0.38329315185546875, -0.3638916015625, -0.34449005126953125, -0.3250885009765625, -0.30568695068359375, -0.286285400390625, -0.26688385009765625, -0.2474822998046875, -0.22808074951171875, -0.20867919921875, -0.18927764892578125, -0.1698760986328125, -0.15047454833984375, -0.131072998046875, -0.11167144775390625, -0.0922698974609375, -0.07286834716796875, -0.053466796875, -0.03406524658203125, -0.0146636962890625, 0.00473785400390625, 0.024139404296875, 0.04354095458984375, 0.0629425048828125, 0.08234405517578125, 0.10174560546875, 0.12114715576171875, 0.1405487060546875, 0.15995025634765625, 0.179351806640625, 0.19875335693359375, 0.2181549072265625, 0.23755645751953125, 0.2569580078125, 0.27635955810546875, 0.2957611083984375, 0.31516265869140625, 0.334564208984375, 0.35396575927734375, 0.3733673095703125, 0.39276885986328125, 0.41217041015625, 0.43157196044921875, 0.4509735107421875, 0.47037506103515625, 0.489776611328125, 0.5091781616210938, 0.5285797119140625, 0.5479812622070312, 0.5673828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 20.0, 28.0, 46.0, 130.0, 386.0, 215.0, 72.0, 45.0, 15.0, 16.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018095970153808594, -0.00017732474952936172, -0.0001736897975206375, -0.0001700548455119133, -0.0001664198935031891, -0.00016278494149446487, -0.00015914998948574066, -0.00015551503747701645, -0.00015188008546829224, -0.00014824513345956802, -0.0001446101814508438, -0.0001409752294421196, -0.00013734027743339539, -0.00013370532542467117, -0.00013007037341594696, -0.00012643542140722275, -0.00012280046939849854, -0.00011916551738977432, -0.00011553056538105011, -0.0001118956133723259, -0.00010826066136360168, -0.00010462570935487747, -0.00010099075734615326, -9.735580533742905e-05, -9.372085332870483e-05, -9.008590131998062e-05, -8.645094931125641e-05, -8.28159973025322e-05, -7.918104529380798e-05, -7.554609328508377e-05, -7.191114127635956e-05, -6.827618926763535e-05, -6.464123725891113e-05, -6.100628525018692e-05, -5.737133324146271e-05, -5.3736381232738495e-05, -5.010142922401428e-05, -4.646647721529007e-05, -4.283152520656586e-05, -3.9196573197841644e-05, -3.556162118911743e-05, -3.192666918039322e-05, -2.8291717171669006e-05, -2.4656765162944794e-05, -2.102181315422058e-05, -1.738686114549637e-05, -1.3751909136772156e-05, -1.0116957128047943e-05, -6.4820051193237305e-06, -2.847053110599518e-06, 7.878988981246948e-07, 4.4228509068489075e-06, 8.05780291557312e-06, 1.1692754924297333e-05, 1.5327706933021545e-05, 1.8962658941745758e-05, 2.259761095046997e-05, 2.6232562959194183e-05, 2.9867514967918396e-05, 3.350246697664261e-05, 3.713741898536682e-05, 4.0772370994091034e-05, 4.4407323002815247e-05, 4.804227501153946e-05, 5.167722702026367e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 12.0, 23.0, 26.0, 37.0, 80.0, 142.0, 299.0, 616.0, 1531.0, 4692.0, 23567.0, 858957.0, 142973.0, 10695.0, 3024.0, 944.0, 447.0, 216.0, 92.0, 54.0, 34.0, 24.0, 13.0, 9.0, 6.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.483154296875, -0.4651222229003906, -0.44709014892578125, -0.4290580749511719, -0.4110260009765625, -0.3929939270019531, -0.37496185302734375, -0.3569297790527344, -0.338897705078125, -0.3208656311035156, -0.30283355712890625, -0.2848014831542969, -0.2667694091796875, -0.24873733520507812, -0.23070526123046875, -0.21267318725585938, -0.19464111328125, -0.17660903930664062, -0.15857696533203125, -0.14054489135742188, -0.1225128173828125, -0.10448074340820312, -0.08644866943359375, -0.06841659545898438, -0.050384521484375, -0.032352447509765625, -0.01432037353515625, 0.003711700439453125, 0.0217437744140625, 0.039775848388671875, 0.05780792236328125, 0.07583999633789062, 0.0938720703125, 0.11190414428710938, 0.12993621826171875, 0.14796829223632812, 0.1660003662109375, 0.18403244018554688, 0.20206451416015625, 0.22009658813476562, 0.238128662109375, 0.2561607360839844, 0.27419281005859375, 0.2922248840332031, 0.3102569580078125, 0.3282890319824219, 0.34632110595703125, 0.3643531799316406, 0.38238525390625, 0.4004173278808594, 0.41844940185546875, 0.4364814758300781, 0.4545135498046875, 0.4725456237792969, 0.49057769775390625, 0.5086097717285156, 0.526641845703125, 0.5446739196777344, 0.5627059936523438, 0.5807380676269531, 0.5987701416015625, 0.6168022155761719, 0.6348342895507812, 0.6528663635253906, 0.6708984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 7.0, 5.0, 5.0, 20.0, 13.0, 29.0, 38.0, 57.0, 112.0, 171.0, 228.0, 97.0, 67.0, 51.0, 22.0, 14.0, 15.0, 9.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2041015625, -0.19887542724609375, -0.1936492919921875, -0.18842315673828125, -0.183197021484375, -0.17797088623046875, -0.1727447509765625, -0.16751861572265625, -0.16229248046875, -0.15706634521484375, -0.1518402099609375, -0.14661407470703125, -0.141387939453125, -0.13616180419921875, -0.1309356689453125, -0.12570953369140625, -0.1204833984375, -0.11525726318359375, -0.1100311279296875, -0.10480499267578125, -0.099578857421875, -0.09435272216796875, -0.0891265869140625, -0.08390045166015625, -0.07867431640625, -0.07344818115234375, -0.0682220458984375, -0.06299591064453125, -0.057769775390625, -0.05254364013671875, -0.0473175048828125, -0.04209136962890625, -0.036865234375, -0.03163909912109375, -0.0264129638671875, -0.02118682861328125, -0.015960693359375, -0.01073455810546875, -0.0055084228515625, -0.00028228759765625, 0.00494384765625, 0.01016998291015625, 0.0153961181640625, 0.02062225341796875, 0.025848388671875, 0.03107452392578125, 0.0363006591796875, 0.04152679443359375, 0.0467529296875, 0.05197906494140625, 0.0572052001953125, 0.06243133544921875, 0.067657470703125, 0.07288360595703125, 0.0781097412109375, 0.08333587646484375, 0.08856201171875, 0.09378814697265625, 0.0990142822265625, 0.10424041748046875, 0.109466552734375, 0.11469268798828125, 0.1199188232421875, 0.12514495849609375, 0.13037109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 16.0, 25.0, 46.0, 101.0, 196.0, 310.0, 149.0, 66.0, 34.0, 24.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.903681993484497, -2.7609798908233643, -2.6182777881622314, -2.4755756855010986, -2.3328733444213867, -2.190171241760254, -2.047469139099121, -1.9047670364379883, -1.7620649337768555, -1.6193628311157227, -1.4766607284545898, -1.3339585065841675, -1.1912564039230347, -1.0485543012619019, -0.9058521389961243, -0.7631499767303467, -0.6204478740692139, -0.47774574160575867, -0.33504360914230347, -0.19234147667884827, -0.049639344215393066, 0.09306275844573975, 0.23576492071151733, 0.3784670829772949, 0.5211691856384277, 0.6638712882995605, 0.8065734505653381, 0.9492756128311157, 1.0919777154922485, 1.2346798181533813, 1.3773820400238037, 1.5200841426849365, 1.6627860069274902, 1.805488109588623, 1.9481902122497559, 2.0908923149108887, 2.2335944175720215, 2.3762965202331543, 2.518998861312866, 2.661700963973999, 2.804403066635132, 2.9471051692962646, 3.0898072719573975, 3.2325093746185303, 3.375211715698242, 3.517913818359375, 3.660615921020508, 3.8033180236816406, 3.9460201263427734, 4.088722229003906, 4.231424331665039, 4.374126434326172, 4.516828536987305, 4.6595306396484375, 4.80223274230957, 4.944934844970703, 5.087636947631836, 5.230339050292969, 5.373041152954102, 5.515743255615234, 5.658445358276367, 5.8011474609375, 5.943849563598633, 6.086551666259766, 6.229254245758057]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 6.0, 5.0, 19.0, 17.0, 17.0, 24.0, 33.0, 29.0, 34.0, 51.0, 49.0, 44.0, 60.0, 47.0, 62.0, 52.0, 45.0, 58.0, 40.0, 51.0, 36.0, 42.0, 36.0, 27.0, 26.0, 23.0, 15.0, 15.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0103719234466553, -2.907381772994995, -2.804391384124756, -2.7014012336730957, -2.5984108448028564, -2.4954206943511963, -2.392430305480957, -2.289440155029297, -2.1864500045776367, -2.0834598541259766, -1.9804694652557373, -1.8774793148040771, -1.7744890451431274, -1.6714987754821777, -1.568508505821228, -1.4655182361602783, -1.3625279664993286, -1.259537696838379, -1.1565474271774292, -1.0535571575164795, -0.9505670070648193, -0.8475767374038696, -0.7445864677429199, -0.641596257686615, -0.5386059880256653, -0.43561574816703796, -0.33262550830841064, -0.22963523864746094, -0.12664499878883362, -0.0236547589302063, 0.07933551073074341, 0.18232572078704834, 0.28531599044799805, 0.38830623030662537, 0.4912964701652527, 0.5942867398262024, 0.6972769498825073, 0.800267219543457, 0.9032574892044067, 1.0062477588653564, 1.1092379093170166, 1.2122281789779663, 1.315218448638916, 1.4182085990905762, 1.5211988687515259, 1.6241891384124756, 1.7271794080734253, 1.830169677734375, 1.9331599473953247, 2.0361502170562744, 2.1391403675079346, 2.242130756378174, 2.345120906829834, 2.448111057281494, 2.5511014461517334, 2.6540915966033936, 2.757081985473633, 2.860072135925293, 2.9630625247955322, 3.0660526752471924, 3.1690430641174316, 3.272033214569092, 3.375023365020752, 3.478013753890991, 3.5810039043426514]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 5.0, 3.0, 2.0, 5.0, 9.0, 11.0, 11.0, 9.0, 12.0, 23.0, 34.0, 45.0, 68.0, 98.0, 160.0, 296.0, 461.0, 778.0, 1639.0, 3986.0, 15256.0, 213345.0, 3794245.0, 140270.0, 14421.0, 4736.0, 2041.0, 918.0, 490.0, 292.0, 203.0, 111.0, 88.0, 62.0, 39.0, 40.0, 25.0, 11.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.111328125, -3.0324859619140625, -2.953643798828125, -2.8748016357421875, -2.79595947265625, -2.7171173095703125, -2.638275146484375, -2.5594329833984375, -2.4805908203125, -2.4017486572265625, -2.322906494140625, -2.2440643310546875, -2.16522216796875, -2.0863800048828125, -2.007537841796875, -1.9286956787109375, -1.849853515625, -1.7710113525390625, -1.692169189453125, -1.6133270263671875, -1.53448486328125, -1.4556427001953125, -1.376800537109375, -1.2979583740234375, -1.2191162109375, -1.1402740478515625, -1.061431884765625, -0.9825897216796875, -0.90374755859375, -0.8249053955078125, -0.746063232421875, -0.6672210693359375, -0.58837890625, -0.5095367431640625, -0.430694580078125, -0.3518524169921875, -0.27301025390625, -0.1941680908203125, -0.115325927734375, -0.0364837646484375, 0.0423583984375, 0.1212005615234375, 0.200042724609375, 0.2788848876953125, 0.35772705078125, 0.4365692138671875, 0.515411376953125, 0.5942535400390625, 0.673095703125, 0.7519378662109375, 0.830780029296875, 0.9096221923828125, 0.98846435546875, 1.0673065185546875, 1.146148681640625, 1.2249908447265625, 1.3038330078125, 1.3826751708984375, 1.461517333984375, 1.5403594970703125, 1.61920166015625, 1.6980438232421875, 1.776885986328125, 1.8557281494140625, 1.9345703125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 6.0, 14.0, 22.0, 30.0, 42.0, 54.0, 65.0, 95.0, 110.0, 94.0, 93.0, 85.0, 71.0, 61.0, 38.0, 26.0, 26.0, 24.0, 13.0, 5.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8837890625, -1.833709716796875, -1.78363037109375, -1.733551025390625, -1.6834716796875, -1.633392333984375, -1.58331298828125, -1.533233642578125, -1.483154296875, -1.433074951171875, -1.38299560546875, -1.332916259765625, -1.2828369140625, -1.232757568359375, -1.18267822265625, -1.132598876953125, -1.08251953125, -1.032440185546875, -0.98236083984375, -0.932281494140625, -0.8822021484375, -0.832122802734375, -0.78204345703125, -0.731964111328125, -0.681884765625, -0.631805419921875, -0.58172607421875, -0.531646728515625, -0.4815673828125, -0.431488037109375, -0.38140869140625, -0.331329345703125, -0.28125, -0.231170654296875, -0.18109130859375, -0.131011962890625, -0.0809326171875, -0.030853271484375, 0.01922607421875, 0.069305419921875, 0.119384765625, 0.169464111328125, 0.21954345703125, 0.269622802734375, 0.3197021484375, 0.369781494140625, 0.41986083984375, 0.469940185546875, 0.52001953125, 0.570098876953125, 0.62017822265625, 0.670257568359375, 0.7203369140625, 0.770416259765625, 0.82049560546875, 0.870574951171875, 0.920654296875, 0.970733642578125, 1.02081298828125, 1.070892333984375, 1.1209716796875, 1.171051025390625, 1.22113037109375, 1.271209716796875, 1.3212890625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 5.0, 13.0, 16.0, 18.0, 31.0, 43.0, 55.0, 70.0, 112.0, 193.0, 336.0, 555.0, 1086.0, 2335.0, 5272.0, 15379.0, 82500.0, 3821435.0, 227651.0, 23966.0, 7162.0, 2847.0, 1383.0, 765.0, 379.0, 231.0, 149.0, 88.0, 56.0, 43.0, 22.0, 17.0, 12.0, 15.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.923828125, -1.861083984375, -1.79833984375, -1.735595703125, -1.6728515625, -1.610107421875, -1.54736328125, -1.484619140625, -1.421875, -1.359130859375, -1.29638671875, -1.233642578125, -1.1708984375, -1.108154296875, -1.04541015625, -0.982666015625, -0.919921875, -0.857177734375, -0.79443359375, -0.731689453125, -0.6689453125, -0.606201171875, -0.54345703125, -0.480712890625, -0.41796875, -0.355224609375, -0.29248046875, -0.229736328125, -0.1669921875, -0.104248046875, -0.04150390625, 0.021240234375, 0.083984375, 0.146728515625, 0.20947265625, 0.272216796875, 0.3349609375, 0.397705078125, 0.46044921875, 0.523193359375, 0.5859375, 0.648681640625, 0.71142578125, 0.774169921875, 0.8369140625, 0.899658203125, 0.96240234375, 1.025146484375, 1.087890625, 1.150634765625, 1.21337890625, 1.276123046875, 1.3388671875, 1.401611328125, 1.46435546875, 1.527099609375, 1.58984375, 1.652587890625, 1.71533203125, 1.778076171875, 1.8408203125, 1.903564453125, 1.96630859375, 2.029052734375, 2.091796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 3.0, 3.0, 10.0, 5.0, 8.0, 17.0, 12.0, 18.0, 29.0, 36.0, 83.0, 191.0, 476.0, 1287.0, 1072.0, 434.0, 161.0, 70.0, 43.0, 24.0, 17.0, 16.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5994491577148438, -0.5812225341796875, -0.5629959106445312, -0.544769287109375, -0.5265426635742188, -0.5083160400390625, -0.49008941650390625, -0.47186279296875, -0.45363616943359375, -0.4354095458984375, -0.41718292236328125, -0.398956298828125, -0.38072967529296875, -0.3625030517578125, -0.34427642822265625, -0.3260498046875, -0.30782318115234375, -0.2895965576171875, -0.27136993408203125, -0.253143310546875, -0.23491668701171875, -0.2166900634765625, -0.19846343994140625, -0.18023681640625, -0.16201019287109375, -0.1437835693359375, -0.12555694580078125, -0.107330322265625, -0.08910369873046875, -0.0708770751953125, -0.05265045166015625, -0.034423828125, -0.01619720458984375, 0.0020294189453125, 0.02025604248046875, 0.038482666015625, 0.05670928955078125, 0.0749359130859375, 0.09316253662109375, 0.11138916015625, 0.12961578369140625, 0.1478424072265625, 0.16606903076171875, 0.184295654296875, 0.20252227783203125, 0.2207489013671875, 0.23897552490234375, 0.2572021484375, 0.27542877197265625, 0.2936553955078125, 0.31188201904296875, 0.330108642578125, 0.34833526611328125, 0.3665618896484375, 0.38478851318359375, 0.40301513671875, 0.42124176025390625, 0.4394683837890625, 0.45769500732421875, 0.475921630859375, 0.49414825439453125, 0.5123748779296875, 0.5306015014648438, 0.548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 2.0, 1.0, 4.0, 5.0, 8.0, 19.0, 17.0, 52.0, 51.0, 103.0, 130.0, 176.0, 158.0, 100.0, 59.0, 34.0, 29.0, 16.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7705849409103394, -1.701843023300171, -1.6331011056900024, -1.564359188079834, -1.495617151260376, -1.4268752336502075, -1.358133316040039, -1.2893913984298706, -1.2206494808197021, -1.1519075632095337, -1.0831656455993652, -1.0144236087799072, -0.9456816911697388, -0.8769397735595703, -0.8081978559494019, -0.7394559383392334, -0.6707139015197754, -0.6019719839096069, -0.5332300066947937, -0.46448808908462524, -0.3957461416721344, -0.32700419425964355, -0.2582622766494751, -0.18952032923698425, -0.12077838182449341, -0.05203644186258316, 0.016705498099327087, 0.08544743061065674, 0.15418937802314758, 0.22293132543563843, 0.2916732430458069, 0.36041519045829773, 0.4291572570800781, 0.49789920449256897, 0.5666411519050598, 0.6353830695152283, 0.7041250467300415, 0.77286696434021, 0.8416088819503784, 0.9103507995605469, 0.9790927767753601, 1.0478347539901733, 1.1165766716003418, 1.1853185892105103, 1.2540605068206787, 1.3228025436401367, 1.3915443420410156, 1.4602863788604736, 1.529028296470642, 1.5977702140808105, 1.666512131690979, 1.7352540493011475, 1.8039960861206055, 1.872738003730774, 1.9414799213409424, 2.0102219581604004, 2.0789637565612793, 2.1477057933807373, 2.216447591781616, 2.285189628601074, 2.353931427001953, 2.422673463821411, 2.491415500640869, 2.560157299041748, 2.628899335861206]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 1.0, 12.0, 13.0, 20.0, 22.0, 30.0, 42.0, 36.0, 41.0, 52.0, 69.0, 67.0, 65.0, 61.0, 55.0, 57.0, 61.0, 41.0, 53.0, 32.0, 43.0, 24.0, 27.0, 23.0, 9.0, 16.0, 12.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4072253704071045, -1.364511489868164, -1.3217976093292236, -1.2790837287902832, -1.2363698482513428, -1.1936559677124023, -1.150942087173462, -1.1082282066345215, -1.065514326095581, -1.0228004455566406, -0.9800865650177002, -0.9373726844787598, -0.8946588039398193, -0.8519449234008789, -0.8092310428619385, -0.766517162322998, -0.7238032817840576, -0.6810894012451172, -0.6383755207061768, -0.5956616401672363, -0.5529477596282959, -0.5102338790893555, -0.46751999855041504, -0.4248061180114746, -0.3820922374725342, -0.33937835693359375, -0.2966644763946533, -0.2539505958557129, -0.21123671531677246, -0.16852283477783203, -0.1258089542388916, -0.08309507369995117, -0.04038119316101074, 0.0023326873779296875, 0.04504656791687012, 0.08776044845581055, 0.13047432899475098, 0.1731882095336914, 0.21590209007263184, 0.25861597061157227, 0.3013298511505127, 0.3440437316894531, 0.38675761222839355, 0.429471492767334, 0.4721853733062744, 0.5148992538452148, 0.5576131343841553, 0.6003270149230957, 0.6430408954620361, 0.6857547760009766, 0.728468656539917, 0.7711825370788574, 0.8138964176177979, 0.8566102981567383, 0.8993241786956787, 0.9420380592346191, 0.9847519397735596, 1.0274658203125, 1.0701797008514404, 1.1128935813903809, 1.1556074619293213, 1.1983213424682617, 1.2410352230072021, 1.2837491035461426, 1.326462984085083]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 13.0, 17.0, 23.0, 56.0, 82.0, 151.0, 290.0, 519.0, 1208.0, 3037.0, 9980.0, 69193.0, 847330.0, 98462.0, 12087.0, 3389.0, 1388.0, 643.0, 299.0, 150.0, 65.0, 40.0, 36.0, 33.0, 11.0, 13.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.43233489990234375, -0.4139862060546875, -0.39563751220703125, -0.377288818359375, -0.35894012451171875, -0.3405914306640625, -0.32224273681640625, -0.30389404296875, -0.28554534912109375, -0.2671966552734375, -0.24884796142578125, -0.230499267578125, -0.21215057373046875, -0.1938018798828125, -0.17545318603515625, -0.1571044921875, -0.13875579833984375, -0.1204071044921875, -0.10205841064453125, -0.083709716796875, -0.06536102294921875, -0.0470123291015625, -0.02866363525390625, -0.01031494140625, 0.00803375244140625, 0.0263824462890625, 0.04473114013671875, 0.063079833984375, 0.08142852783203125, 0.0997772216796875, 0.11812591552734375, 0.136474609375, 0.15482330322265625, 0.1731719970703125, 0.19152069091796875, 0.209869384765625, 0.22821807861328125, 0.2465667724609375, 0.26491546630859375, 0.28326416015625, 0.30161285400390625, 0.3199615478515625, 0.33831024169921875, 0.356658935546875, 0.37500762939453125, 0.3933563232421875, 0.41170501708984375, 0.4300537109375, 0.44840240478515625, 0.4667510986328125, 0.48509979248046875, 0.503448486328125, 0.5217971801757812, 0.5401458740234375, 0.5584945678710938, 0.57684326171875, 0.5951919555664062, 0.6135406494140625, 0.6318893432617188, 0.650238037109375, 0.6685867309570312, 0.6869354248046875, 0.7052841186523438, 0.7236328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 2.0, 4.0, 8.0, 11.0, 16.0, 23.0, 43.0, 51.0, 48.0, 73.0, 87.0, 105.0, 103.0, 87.0, 80.0, 73.0, 50.0, 42.0, 28.0, 24.0, 23.0, 14.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6376953125, -1.5970611572265625, -1.556427001953125, -1.5157928466796875, -1.47515869140625, -1.4345245361328125, -1.393890380859375, -1.3532562255859375, -1.3126220703125, -1.2719879150390625, -1.231353759765625, -1.1907196044921875, -1.15008544921875, -1.1094512939453125, -1.068817138671875, -1.0281829833984375, -0.987548828125, -0.9469146728515625, -0.906280517578125, -0.8656463623046875, -0.82501220703125, -0.7843780517578125, -0.743743896484375, -0.7031097412109375, -0.6624755859375, -0.6218414306640625, -0.581207275390625, -0.5405731201171875, -0.49993896484375, -0.4593048095703125, -0.418670654296875, -0.3780364990234375, -0.33740234375, -0.2967681884765625, -0.256134033203125, -0.2154998779296875, -0.17486572265625, -0.1342315673828125, -0.093597412109375, -0.0529632568359375, -0.0123291015625, 0.0283050537109375, 0.068939208984375, 0.1095733642578125, 0.15020751953125, 0.1908416748046875, 0.231475830078125, 0.2721099853515625, 0.312744140625, 0.3533782958984375, 0.394012451171875, 0.4346466064453125, 0.47528076171875, 0.5159149169921875, 0.556549072265625, 0.5971832275390625, 0.6378173828125, 0.6784515380859375, 0.719085693359375, 0.7597198486328125, 0.80035400390625, 0.8409881591796875, 0.881622314453125, 0.9222564697265625, 0.962890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 20.0, 22.0, 27.0, 56.0, 73.0, 144.0, 220.0, 299.0, 552.0, 942.0, 1705.0, 3222.0, 7259.0, 21659.0, 112437.0, 694756.0, 161212.0, 27231.0, 8364.0, 3823.0, 1815.0, 1053.0, 620.0, 343.0, 217.0, 149.0, 98.0, 64.0, 42.0, 23.0, 24.0, 14.0, 13.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2727622985839844, -0.26354217529296875, -0.2543220520019531, -0.2451019287109375, -0.23588180541992188, -0.22666168212890625, -0.21744155883789062, -0.208221435546875, -0.19900131225585938, -0.18978118896484375, -0.18056106567382812, -0.1713409423828125, -0.16212081909179688, -0.15290069580078125, -0.14368057250976562, -0.13446044921875, -0.12524032592773438, -0.11602020263671875, -0.10680007934570312, -0.0975799560546875, -0.08835983276367188, -0.07913970947265625, -0.06991958618164062, -0.060699462890625, -0.051479339599609375, -0.04225921630859375, -0.033039093017578125, -0.0238189697265625, -0.014598846435546875, -0.00537872314453125, 0.003841400146484375, 0.0130615234375, 0.022281646728515625, 0.03150177001953125, 0.040721893310546875, 0.0499420166015625, 0.059162139892578125, 0.06838226318359375, 0.07760238647460938, 0.086822509765625, 0.09604263305664062, 0.10526275634765625, 0.11448287963867188, 0.1237030029296875, 0.13292312622070312, 0.14214324951171875, 0.15136337280273438, 0.16058349609375, 0.16980361938476562, 0.17902374267578125, 0.18824386596679688, 0.1974639892578125, 0.20668411254882812, 0.21590423583984375, 0.22512435913085938, 0.234344482421875, 0.24356460571289062, 0.25278472900390625, 0.2620048522949219, 0.2712249755859375, 0.2804450988769531, 0.28966522216796875, 0.2988853454589844, 0.30810546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 3.0, 10.0, 4.0, 11.0, 7.0, 10.0, 14.0, 15.0, 29.0, 18.0, 25.0, 31.0, 38.0, 34.0, 35.0, 52.0, 40.0, 46.0, 56.0, 38.0, 49.0, 35.0, 47.0, 40.0, 38.0, 48.0, 30.0, 29.0, 30.0, 19.0, 23.0, 20.0, 9.0, 8.0, 7.0, 10.0, 12.0, 3.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0264739990234375, -0.989471435546875, -0.9524688720703125, -0.91546630859375, -0.8784637451171875, -0.841461181640625, -0.8044586181640625, -0.7674560546875, -0.7304534912109375, -0.693450927734375, -0.6564483642578125, -0.61944580078125, -0.5824432373046875, -0.545440673828125, -0.5084381103515625, -0.471435546875, -0.4344329833984375, -0.397430419921875, -0.3604278564453125, -0.32342529296875, -0.2864227294921875, -0.249420166015625, -0.2124176025390625, -0.1754150390625, -0.1384124755859375, -0.101409912109375, -0.0644073486328125, -0.02740478515625, 0.0095977783203125, 0.046600341796875, 0.0836029052734375, 0.12060546875, 0.1576080322265625, 0.194610595703125, 0.2316131591796875, 0.26861572265625, 0.3056182861328125, 0.342620849609375, 0.3796234130859375, 0.4166259765625, 0.4536285400390625, 0.490631103515625, 0.5276336669921875, 0.56463623046875, 0.6016387939453125, 0.638641357421875, 0.6756439208984375, 0.712646484375, 0.7496490478515625, 0.786651611328125, 0.8236541748046875, 0.86065673828125, 0.8976593017578125, 0.934661865234375, 0.9716644287109375, 1.0086669921875, 1.0456695556640625, 1.082672119140625, 1.1196746826171875, 1.15667724609375, 1.1936798095703125, 1.230682373046875, 1.2676849365234375, 1.3046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 13.0, 15.0, 23.0, 31.0, 71.0, 130.0, 241.0, 640.0, 1949.0, 8591.0, 86737.0, 883729.0, 56718.0, 6816.0, 1680.0, 605.0, 234.0, 116.0, 77.0, 38.0, 39.0, 16.0, 12.0, 7.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.1275005340576172, -0.12267684936523438, -0.11785316467285156, -0.11302947998046875, -0.10820579528808594, -0.10338211059570312, -0.09855842590332031, -0.0937347412109375, -0.08891105651855469, -0.08408737182617188, -0.07926368713378906, -0.07444000244140625, -0.06961631774902344, -0.06479263305664062, -0.05996894836425781, -0.055145263671875, -0.05032157897949219, -0.045497894287109375, -0.04067420959472656, -0.03585052490234375, -0.031026840209960938, -0.026203155517578125, -0.021379470825195312, -0.0165557861328125, -0.011732101440429688, -0.006908416748046875, -0.0020847320556640625, 0.00273895263671875, 0.0075626373291015625, 0.012386322021484375, 0.017210006713867188, 0.02203369140625, 0.026857376098632812, 0.031681060791015625, 0.03650474548339844, 0.04132843017578125, 0.04615211486816406, 0.050975799560546875, 0.05579948425292969, 0.0606231689453125, 0.06544685363769531, 0.07027053833007812, 0.07509422302246094, 0.07991790771484375, 0.08474159240722656, 0.08956527709960938, 0.09438896179199219, 0.099212646484375, 0.10403633117675781, 0.10886001586914062, 0.11368370056152344, 0.11850738525390625, 0.12333106994628906, 0.12815475463867188, 0.1329784393310547, 0.1378021240234375, 0.1426258087158203, 0.14744949340820312, 0.15227317810058594, 0.15709686279296875, 0.16192054748535156, 0.16674423217773438, 0.1715679168701172, 0.1763916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 32.0, 57.0, 148.0, 276.0, 254.0, 115.0, 41.0, 12.0, 13.0, 10.0, 6.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011628866195678711, -0.00011304859071969986, -0.00010980851948261261, -0.00010656844824552536, -0.00010332837700843811, -0.00010008830577135086, -9.684823453426361e-05, -9.360816329717636e-05, -9.036809206008911e-05, -8.712802082300186e-05, -8.388794958591461e-05, -8.064787834882736e-05, -7.740780711174011e-05, -7.416773587465286e-05, -7.092766463756561e-05, -6.768759340047836e-05, -6.444752216339111e-05, -6.120745092630386e-05, -5.7967379689216614e-05, -5.4727308452129364e-05, -5.1487237215042114e-05, -4.8247165977954865e-05, -4.5007094740867615e-05, -4.1767023503780365e-05, -3.8526952266693115e-05, -3.5286881029605865e-05, -3.2046809792518616e-05, -2.8806738555431366e-05, -2.5566667318344116e-05, -2.2326596081256866e-05, -1.9086524844169617e-05, -1.5846453607082367e-05, -1.2606382369995117e-05, -9.366311132907867e-06, -6.126239895820618e-06, -2.886168658733368e-06, 3.5390257835388184e-07, 3.5939738154411316e-06, 6.834045052528381e-06, 1.0074116289615631e-05, 1.3314187526702881e-05, 1.655425876379013e-05, 1.979433000087738e-05, 2.303440123796463e-05, 2.627447247505188e-05, 2.951454371213913e-05, 3.275461494922638e-05, 3.599468618631363e-05, 3.923475742340088e-05, 4.247482866048813e-05, 4.571489989757538e-05, 4.895497113466263e-05, 5.219504237174988e-05, 5.543511360883713e-05, 5.867518484592438e-05, 6.191525608301163e-05, 6.515532732009888e-05, 6.839539855718613e-05, 7.163546979427338e-05, 7.487554103136063e-05, 7.811561226844788e-05, 8.135568350553513e-05, 8.459575474262238e-05, 8.783582597970963e-05, 9.107589721679688e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 4.0, 8.0, 8.0, 8.0, 13.0, 18.0, 35.0, 40.0, 52.0, 74.0, 107.0, 169.0, 240.0, 379.0, 580.0, 980.0, 1519.0, 2935.0, 5630.0, 13212.0, 41811.0, 213342.0, 585486.0, 130760.0, 29874.0, 10464.0, 4631.0, 2353.0, 1390.0, 813.0, 537.0, 345.0, 209.0, 138.0, 112.0, 78.0, 44.0, 44.0, 28.0, 19.0, 10.0, 23.0, 6.0, 5.0, 3.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07021045684814453, -0.06797218322753906, -0.0657339096069336, -0.06349563598632812, -0.061257362365722656, -0.05901908874511719, -0.05678081512451172, -0.05454254150390625, -0.05230426788330078, -0.05006599426269531, -0.047827720642089844, -0.045589447021484375, -0.043351173400878906, -0.04111289978027344, -0.03887462615966797, -0.0366363525390625, -0.03439807891845703, -0.03215980529785156, -0.029921531677246094, -0.027683258056640625, -0.025444984436035156, -0.023206710815429688, -0.02096843719482422, -0.01873016357421875, -0.01649188995361328, -0.014253616333007812, -0.012015342712402344, -0.009777069091796875, -0.007538795471191406, -0.0053005218505859375, -0.0030622482299804688, -0.000823974609375, 0.0014142990112304688, 0.0036525726318359375, 0.005890846252441406, 0.008129119873046875, 0.010367393493652344, 0.012605667114257812, 0.014843940734863281, 0.01708221435546875, 0.01932048797607422, 0.021558761596679688, 0.023797035217285156, 0.026035308837890625, 0.028273582458496094, 0.030511856079101562, 0.03275012969970703, 0.0349884033203125, 0.03722667694091797, 0.03946495056152344, 0.041703224182128906, 0.043941497802734375, 0.046179771423339844, 0.04841804504394531, 0.05065631866455078, 0.05289459228515625, 0.05513286590576172, 0.05737113952636719, 0.059609413146972656, 0.061847686767578125, 0.0640859603881836, 0.06632423400878906, 0.06856250762939453, 0.07080078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 18.0, 14.0, 26.0, 41.0, 51.0, 94.0, 117.0, 140.0, 123.0, 89.0, 77.0, 56.0, 43.0, 25.0, 17.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024139404296875, -0.02335071563720703, -0.022562026977539062, -0.021773338317871094, -0.020984649658203125, -0.020195960998535156, -0.019407272338867188, -0.01861858367919922, -0.01782989501953125, -0.01704120635986328, -0.016252517700195312, -0.015463829040527344, -0.014675140380859375, -0.013886451721191406, -0.013097763061523438, -0.012309074401855469, -0.0115203857421875, -0.010731697082519531, -0.009943008422851562, -0.009154319763183594, -0.008365631103515625, -0.007576942443847656, -0.0067882537841796875, -0.005999565124511719, -0.00521087646484375, -0.004422187805175781, -0.0036334991455078125, -0.0028448104858398438, -0.002056121826171875, -0.0012674331665039062, -0.0004787445068359375, 0.00030994415283203125, 0.0010986328125, 0.0018873214721679688, 0.0026760101318359375, 0.0034646987915039062, 0.004253387451171875, 0.005042076110839844, 0.0058307647705078125, 0.006619453430175781, 0.00740814208984375, 0.008196830749511719, 0.008985519409179688, 0.009774208068847656, 0.010562896728515625, 0.011351585388183594, 0.012140274047851562, 0.012928962707519531, 0.0137176513671875, 0.014506340026855469, 0.015295028686523438, 0.016083717346191406, 0.016872406005859375, 0.017661094665527344, 0.018449783325195312, 0.01923847198486328, 0.02002716064453125, 0.02081584930419922, 0.021604537963867188, 0.022393226623535156, 0.023181915283203125, 0.023970603942871094, 0.024759292602539062, 0.02554798126220703, 0.026336669921875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 16.0, 50.0, 109.0, 299.0, 309.0, 125.0, 47.0, 13.0, 13.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.703280448913574, -3.613175392150879, -3.5230703353881836, -3.4329652786254883, -3.342860221862793, -3.2527554035186768, -3.1626503467559814, -3.072545289993286, -2.982440233230591, -2.8923351764678955, -2.8022301197052, -2.712125062942505, -2.6220202445983887, -2.5319151878356934, -2.441810131072998, -2.3517050743103027, -2.2616000175476074, -2.171494960784912, -2.081389904022217, -1.991284966468811, -1.9011799097061157, -1.8110748529434204, -1.7209699153900146, -1.6308648586273193, -1.540759801864624, -1.4506547451019287, -1.3605496883392334, -1.2704447507858276, -1.1803396940231323, -1.090234637260437, -1.0001296997070312, -0.9100246429443359, -0.8199193477630615, -0.7298142910003662, -0.6397092938423157, -0.5496042966842651, -0.4594992399215698, -0.3693942129611969, -0.279289186000824, -0.18918418884277344, -0.09907913208007812, -0.0089741051197052, 0.08113092184066772, 0.17123594880104065, 0.2613409757614136, 0.3514460027217865, 0.4415510296821594, 0.53165602684021, 0.6217610836029053, 0.7118661403656006, 0.8019711375236511, 0.8920761346817017, 0.982181191444397, 1.0722862482070923, 1.162391185760498, 1.2524962425231934, 1.3426012992858887, 1.432706356048584, 1.5228114128112793, 1.612916350364685, 1.7030214071273804, 1.7931264638900757, 1.8832314014434814, 1.9733364582061768, 2.063441514968872]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 17.0, 19.0, 26.0, 41.0, 52.0, 55.0, 64.0, 102.0, 96.0, 78.0, 81.0, 78.0, 66.0, 55.0, 41.0, 36.0, 29.0, 23.0, 16.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.436684250831604, -1.4001200199127197, -1.3635557889938354, -1.3269915580749512, -1.2904272079467773, -1.253862977027893, -1.2172987461090088, -1.1807345151901245, -1.1441702842712402, -1.107606053352356, -1.0710418224334717, -1.0344775915145874, -0.9979133009910583, -0.9613490700721741, -0.924784779548645, -0.8882205486297607, -0.8516563177108765, -0.8150920867919922, -0.7785278558731079, -0.7419635653495789, -0.7053993344306946, -0.6688351035118103, -0.6322708129882812, -0.595706582069397, -0.5591423511505127, -0.5225781202316284, -0.48601385951042175, -0.4494495987892151, -0.4128853678703308, -0.37632113695144653, -0.33975687623023987, -0.3031926155090332, -0.2666285037994385, -0.230064257979393, -0.19350001215934753, -0.15693576633930206, -0.12037152051925659, -0.08380727469921112, -0.04724302887916565, -0.010678768157958984, 0.025885462760925293, 0.062449708580970764, 0.09901395440101624, 0.1355782002210617, 0.17214244604110718, 0.20870669186115265, 0.24527093768119812, 0.2818351984024048, 0.31839942932128906, 0.35496366024017334, 0.39152792096138, 0.42809218168258667, 0.46465641260147095, 0.5012206435203552, 0.5377849340438843, 0.5743491649627686, 0.6109133958816528, 0.6474776268005371, 0.6840418577194214, 0.7206061482429504, 0.7571703791618347, 0.793734610080719, 0.830298900604248, 0.8668631315231323, 0.9034273624420166]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 17.0, 21.0, 32.0, 36.0, 54.0, 101.0, 137.0, 227.0, 414.0, 719.0, 1419.0, 3575.0, 9913.0, 41643.0, 758965.0, 196415.0, 23149.0, 6718.0, 2482.0, 1082.0, 561.0, 301.0, 207.0, 113.0, 83.0, 50.0, 34.0, 22.0, 11.0, 13.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.802734375, -0.7775039672851562, -0.7522735595703125, -0.7270431518554688, -0.701812744140625, -0.6765823364257812, -0.6513519287109375, -0.6261215209960938, -0.60089111328125, -0.5756607055664062, -0.5504302978515625, -0.5251998901367188, -0.499969482421875, -0.47473907470703125, -0.4495086669921875, -0.42427825927734375, -0.3990478515625, -0.37381744384765625, -0.3485870361328125, -0.32335662841796875, -0.298126220703125, -0.27289581298828125, -0.2476654052734375, -0.22243499755859375, -0.19720458984375, -0.17197418212890625, -0.1467437744140625, -0.12151336669921875, -0.096282958984375, -0.07105255126953125, -0.0458221435546875, -0.02059173583984375, 0.004638671875, 0.02986907958984375, 0.0550994873046875, 0.08032989501953125, 0.105560302734375, 0.13079071044921875, 0.1560211181640625, 0.18125152587890625, 0.20648193359375, 0.23171234130859375, 0.2569427490234375, 0.28217315673828125, 0.307403564453125, 0.33263397216796875, 0.3578643798828125, 0.38309478759765625, 0.4083251953125, 0.43355560302734375, 0.4587860107421875, 0.48401641845703125, 0.509246826171875, 0.5344772338867188, 0.5597076416015625, 0.5849380493164062, 0.61016845703125, 0.6353988647460938, 0.6606292724609375, 0.6858596801757812, 0.711090087890625, 0.7363204956054688, 0.7615509033203125, 0.7867813110351562, 0.81201171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 5.0, 8.0, 24.0, 19.0, 29.0, 31.0, 44.0, 46.0, 61.0, 80.0, 81.0, 87.0, 72.0, 76.0, 68.0, 52.0, 48.0, 32.0, 24.0, 26.0, 25.0, 14.0, 16.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.984466552734375, -1.92010498046875, -1.855743408203125, -1.7913818359375, -1.727020263671875, -1.66265869140625, -1.598297119140625, -1.533935546875, -1.469573974609375, -1.40521240234375, -1.340850830078125, -1.2764892578125, -1.212127685546875, -1.14776611328125, -1.083404541015625, -1.01904296875, -0.954681396484375, -0.89031982421875, -0.825958251953125, -0.7615966796875, -0.697235107421875, -0.63287353515625, -0.568511962890625, -0.504150390625, -0.439788818359375, -0.37542724609375, -0.311065673828125, -0.2467041015625, -0.182342529296875, -0.11798095703125, -0.053619384765625, 0.0107421875, 0.075103759765625, 0.13946533203125, 0.203826904296875, 0.2681884765625, 0.332550048828125, 0.39691162109375, 0.461273193359375, 0.525634765625, 0.589996337890625, 0.65435791015625, 0.718719482421875, 0.7830810546875, 0.847442626953125, 0.91180419921875, 0.976165771484375, 1.04052734375, 1.104888916015625, 1.16925048828125, 1.233612060546875, 1.2979736328125, 1.362335205078125, 1.42669677734375, 1.491058349609375, 1.555419921875, 1.619781494140625, 1.68414306640625, 1.748504638671875, 1.8128662109375, 1.877227783203125, 1.94158935546875, 2.005950927734375, 2.0703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 10.0, 16.0, 24.0, 30.0, 31.0, 46.0, 54.0, 77.0, 237.0, 1648.0, 75516.0, 966168.0, 3843.0, 398.0, 126.0, 81.0, 49.0, 37.0, 35.0, 26.0, 19.0, 14.0, 22.0, 10.0, 3.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8011474609375, -1.723388671875, -1.6456298828125, -1.56787109375, -1.4901123046875, -1.412353515625, -1.3345947265625, -1.2568359375, -1.1790771484375, -1.101318359375, -1.0235595703125, -0.94580078125, -0.8680419921875, -0.790283203125, -0.7125244140625, -0.634765625, -0.5570068359375, -0.479248046875, -0.4014892578125, -0.32373046875, -0.2459716796875, -0.168212890625, -0.0904541015625, -0.0126953125, 0.0650634765625, 0.142822265625, 0.2205810546875, 0.29833984375, 0.3760986328125, 0.453857421875, 0.5316162109375, 0.609375, 0.6871337890625, 0.764892578125, 0.8426513671875, 0.92041015625, 0.9981689453125, 1.075927734375, 1.1536865234375, 1.2314453125, 1.3092041015625, 1.386962890625, 1.4647216796875, 1.54248046875, 1.6202392578125, 1.697998046875, 1.7757568359375, 1.853515625, 1.9312744140625, 2.009033203125, 2.0867919921875, 2.16455078125, 2.2423095703125, 2.320068359375, 2.3978271484375, 2.4755859375, 2.5533447265625, 2.631103515625, 2.7088623046875, 2.78662109375, 2.8643798828125, 2.942138671875, 3.0198974609375, 3.09765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 7.0, 14.0, 16.0, 27.0, 29.0, 32.0, 53.0, 41.0, 58.0, 49.0, 50.0, 57.0, 72.0, 65.0, 48.0, 78.0, 52.0, 42.0, 36.0, 32.0, 24.0, 25.0, 21.0, 17.0, 9.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.34649658203125, -1.2886962890625, -1.23089599609375, -1.173095703125, -1.11529541015625, -1.0574951171875, -0.99969482421875, -0.94189453125, -0.88409423828125, -0.8262939453125, -0.76849365234375, -0.710693359375, -0.65289306640625, -0.5950927734375, -0.53729248046875, -0.4794921875, -0.42169189453125, -0.3638916015625, -0.30609130859375, -0.248291015625, -0.19049072265625, -0.1326904296875, -0.07489013671875, -0.01708984375, 0.04071044921875, 0.0985107421875, 0.15631103515625, 0.214111328125, 0.27191162109375, 0.3297119140625, 0.38751220703125, 0.4453125, 0.50311279296875, 0.5609130859375, 0.61871337890625, 0.676513671875, 0.73431396484375, 0.7921142578125, 0.84991455078125, 0.90771484375, 0.96551513671875, 1.0233154296875, 1.08111572265625, 1.138916015625, 1.19671630859375, 1.2545166015625, 1.31231689453125, 1.3701171875, 1.42791748046875, 1.4857177734375, 1.54351806640625, 1.601318359375, 1.65911865234375, 1.7169189453125, 1.77471923828125, 1.83251953125, 1.89031982421875, 1.9481201171875, 2.00592041015625, 2.063720703125, 2.12152099609375, 2.1793212890625, 2.23712158203125, 2.294921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 7.0, 2.0, 5.0, 4.0, 6.0, 14.0, 11.0, 17.0, 25.0, 41.0, 65.0, 108.0, 184.0, 371.0, 775.0, 1686.0, 4969.0, 26331.0, 921795.0, 79576.0, 7987.0, 2447.0, 1020.0, 491.0, 241.0, 141.0, 79.0, 43.0, 32.0, 21.0, 24.0, 7.0, 10.0, 4.0, 11.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.55810546875, -0.5432968139648438, -0.5284881591796875, -0.5136795043945312, -0.498870849609375, -0.48406219482421875, -0.4692535400390625, -0.45444488525390625, -0.43963623046875, -0.42482757568359375, -0.4100189208984375, -0.39521026611328125, -0.380401611328125, -0.36559295654296875, -0.3507843017578125, -0.33597564697265625, -0.3211669921875, -0.30635833740234375, -0.2915496826171875, -0.27674102783203125, -0.261932373046875, -0.24712371826171875, -0.2323150634765625, -0.21750640869140625, -0.20269775390625, -0.18788909912109375, -0.1730804443359375, -0.15827178955078125, -0.143463134765625, -0.12865447998046875, -0.1138458251953125, -0.09903717041015625, -0.084228515625, -0.06941986083984375, -0.0546112060546875, -0.03980255126953125, -0.024993896484375, -0.01018524169921875, 0.0046234130859375, 0.01943206787109375, 0.03424072265625, 0.04904937744140625, 0.0638580322265625, 0.07866668701171875, 0.093475341796875, 0.10828399658203125, 0.1230926513671875, 0.13790130615234375, 0.1527099609375, 0.16751861572265625, 0.1823272705078125, 0.19713592529296875, 0.211944580078125, 0.22675323486328125, 0.2415618896484375, 0.25637054443359375, 0.27117919921875, 0.28598785400390625, 0.3007965087890625, 0.31560516357421875, 0.330413818359375, 0.34522247314453125, 0.3600311279296875, 0.37483978271484375, 0.3896484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 21.0, 24.0, 45.0, 96.0, 381.0, 216.0, 83.0, 38.0, 24.0, 17.0, 15.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.599592208862305e-05, -7.368717342615128e-05, -7.13784247636795e-05, -6.906967610120773e-05, -6.676092743873596e-05, -6.445217877626419e-05, -6.214343011379242e-05, -5.983468145132065e-05, -5.752593278884888e-05, -5.5217184126377106e-05, -5.2908435463905334e-05, -5.059968680143356e-05, -4.829093813896179e-05, -4.598218947649002e-05, -4.367344081401825e-05, -4.136469215154648e-05, -3.905594348907471e-05, -3.6747194826602936e-05, -3.4438446164131165e-05, -3.212969750165939e-05, -2.9820948839187622e-05, -2.751220017671585e-05, -2.520345151424408e-05, -2.289470285177231e-05, -2.0585954189300537e-05, -1.8277205526828766e-05, -1.5968456864356995e-05, -1.3659708201885223e-05, -1.1350959539413452e-05, -9.042210876941681e-06, -6.73346221446991e-06, -4.4247135519981384e-06, -2.115964889526367e-06, 1.9278377294540405e-07, 2.5015324354171753e-06, 4.8102810978889465e-06, 7.119029760360718e-06, 9.427778422832489e-06, 1.173652708530426e-05, 1.4045275747776031e-05, 1.6354024410247803e-05, 1.8662773072719574e-05, 2.0971521735191345e-05, 2.3280270397663116e-05, 2.5589019060134888e-05, 2.789776772260666e-05, 3.020651638507843e-05, 3.25152650475502e-05, 3.482401371002197e-05, 3.7132762372493744e-05, 3.9441511034965515e-05, 4.1750259697437286e-05, 4.405900835990906e-05, 4.636775702238083e-05, 4.86765056848526e-05, 5.098525434732437e-05, 5.329400300979614e-05, 5.5602751672267914e-05, 5.7911500334739685e-05, 6.0220248997211456e-05, 6.252899765968323e-05, 6.4837746322155e-05, 6.714649498462677e-05, 6.945524364709854e-05, 7.176399230957031e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 10.0, 11.0, 19.0, 21.0, 35.0, 42.0, 78.0, 98.0, 145.0, 222.0, 385.0, 721.0, 1488.0, 4754.0, 26597.0, 925338.0, 76092.0, 8075.0, 2232.0, 906.0, 491.0, 249.0, 180.0, 110.0, 80.0, 49.0, 35.0, 29.0, 18.0, 8.0, 7.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.438232421875, -0.4211692810058594, -0.40410614013671875, -0.3870429992675781, -0.3699798583984375, -0.3529167175292969, -0.33585357666015625, -0.3187904357910156, -0.301727294921875, -0.2846641540527344, -0.26760101318359375, -0.2505378723144531, -0.2334747314453125, -0.21641159057617188, -0.19934844970703125, -0.18228530883789062, -0.16522216796875, -0.14815902709960938, -0.13109588623046875, -0.11403274536132812, -0.0969696044921875, -0.07990646362304688, -0.06284332275390625, -0.045780181884765625, -0.028717041015625, -0.011653900146484375, 0.00540924072265625, 0.022472381591796875, 0.0395355224609375, 0.056598663330078125, 0.07366180419921875, 0.09072494506835938, 0.1077880859375, 0.12485122680664062, 0.14191436767578125, 0.15897750854492188, 0.1760406494140625, 0.19310379028320312, 0.21016693115234375, 0.22723007202148438, 0.244293212890625, 0.2613563537597656, 0.27841949462890625, 0.2954826354980469, 0.3125457763671875, 0.3296089172363281, 0.34667205810546875, 0.3637351989746094, 0.38079833984375, 0.3978614807128906, 0.41492462158203125, 0.4319877624511719, 0.4490509033203125, 0.4661140441894531, 0.48317718505859375, 0.5002403259277344, 0.517303466796875, 0.5343666076660156, 0.5514297485351562, 0.5684928894042969, 0.5855560302734375, 0.6026191711425781, 0.6196823120117188, 0.6367454528808594, 0.65380859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 18.0, 31.0, 50.0, 137.0, 531.0, 109.0, 40.0, 32.0, 11.0, 7.0, 12.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3245868682861328, -0.3159217834472656, -0.30725669860839844, -0.29859161376953125, -0.28992652893066406, -0.2812614440917969, -0.2725963592529297, -0.2639312744140625, -0.2552661895751953, -0.24660110473632812, -0.23793601989746094, -0.22927093505859375, -0.22060585021972656, -0.21194076538085938, -0.2032756805419922, -0.194610595703125, -0.1859455108642578, -0.17728042602539062, -0.16861534118652344, -0.15995025634765625, -0.15128517150878906, -0.14262008666992188, -0.1339550018310547, -0.1252899169921875, -0.11662483215332031, -0.10795974731445312, -0.09929466247558594, -0.09062957763671875, -0.08196449279785156, -0.07329940795898438, -0.06463432312011719, -0.05596923828125, -0.04730415344238281, -0.038639068603515625, -0.029973983764648438, -0.02130889892578125, -0.012643814086914062, -0.003978729248046875, 0.0046863555908203125, 0.0133514404296875, 0.022016525268554688, 0.030681610107421875, 0.03934669494628906, 0.04801177978515625, 0.05667686462402344, 0.06534194946289062, 0.07400703430175781, 0.082672119140625, 0.09133720397949219, 0.10000228881835938, 0.10866737365722656, 0.11733245849609375, 0.12599754333496094, 0.13466262817382812, 0.1433277130126953, 0.1519927978515625, 0.1606578826904297, 0.16932296752929688, 0.17798805236816406, 0.18665313720703125, 0.19531822204589844, 0.20398330688476562, 0.2126483917236328, 0.2213134765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 16.0, 42.0, 108.0, 314.0, 312.0, 121.0, 42.0, 18.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.555488586425781, -9.352388381958008, -9.149288177490234, -8.946187019348145, -8.743086814880371, -8.539986610412598, -8.336885452270508, -8.133785247802734, -7.930685043334961, -7.7275848388671875, -7.524484157562256, -7.321383476257324, -7.118283271789551, -6.915183067321777, -6.712082386016846, -6.508981704711914, -6.305881500244141, -6.102781295776367, -5.8996806144714355, -5.696579933166504, -5.4934797286987305, -5.290379524230957, -5.087278842926025, -4.884178161621094, -4.68107795715332, -4.477977752685547, -4.274877071380615, -4.071776390075684, -3.86867618560791, -3.6655757427215576, -3.462475299835205, -3.2593748569488525, -3.056274890899658, -2.8531744480133057, -2.650074005126953, -2.4469735622406006, -2.243873119354248, -2.0407726764678955, -1.837672233581543, -1.6345717906951904, -1.431471347808838, -1.2283709049224854, -1.0252704620361328, -0.8221700191497803, -0.6190695762634277, -0.4159691333770752, -0.21286869049072266, -0.009768247604370117, 0.19333219528198242, 0.39643263816833496, 0.5995330810546875, 0.80263352394104, 1.0057339668273926, 1.2088344097137451, 1.4119348526000977, 1.6150352954864502, 1.8181357383728027, 2.0212361812591553, 2.224336624145508, 2.4274370670318604, 2.630537509918213, 2.8336379528045654, 3.036738395690918, 3.2398388385772705, 3.442939281463623]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 12.0, 3.0, 7.0, 7.0, 19.0, 9.0, 16.0, 18.0, 24.0, 27.0, 26.0, 31.0, 32.0, 21.0, 41.0, 36.0, 47.0, 41.0, 54.0, 34.0, 40.0, 47.0, 43.0, 40.0, 32.0, 39.0, 37.0, 27.0, 27.0, 19.0, 19.0, 22.0, 12.0, 20.0, 13.0, 7.0, 8.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.3098936080932617, -2.2411890029907227, -2.1724843978881836, -2.1037797927856445, -2.0350751876831055, -1.9663704633712769, -1.8976657390594482, -1.8289611339569092, -1.7602565288543701, -1.691551923751831, -1.622847318649292, -1.5541425943374634, -1.4854379892349243, -1.4167333841323853, -1.3480286598205566, -1.2793240547180176, -1.2106194496154785, -1.1419148445129395, -1.0732102394104004, -1.0045055150985718, -0.9358009099960327, -0.8670963048934937, -0.7983916401863098, -0.729686975479126, -0.6609823703765869, -0.5922777652740479, -0.523573100566864, -0.45486846566200256, -0.3861638307571411, -0.31745919585227966, -0.2487545609474182, -0.18004992604255676, -0.11134552955627441, -0.042640894651412964, 0.026063740253448486, 0.09476837515830994, 0.1634730100631714, 0.23217764496803284, 0.3008822798728943, 0.36958691477775574, 0.4382915496826172, 0.5069961547851562, 0.5757008194923401, 0.6444054841995239, 0.713110089302063, 0.781814694404602, 0.8505193591117859, 0.9192240238189697, 0.9879286289215088, 1.0566332340240479, 1.125337839126587, 1.1940425634384155, 1.2627471685409546, 1.3314517736434937, 1.4001564979553223, 1.4688611030578613, 1.5375657081604004, 1.6062703132629395, 1.6749749183654785, 1.7436796426773071, 1.8123842477798462, 1.8810888528823853, 1.9497935771942139, 2.018498182296753, 2.087202787399292]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 6.0, 2.0, 0.0, 9.0, 7.0, 8.0, 10.0, 17.0, 38.0, 48.0, 69.0, 119.0, 167.0, 263.0, 523.0, 918.0, 2076.0, 6992.0, 67754.0, 3995969.0, 105785.0, 8640.0, 2476.0, 1033.0, 532.0, 309.0, 178.0, 103.0, 76.0, 52.0, 29.0, 23.0, 21.0, 10.0, 2.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.35546875, -3.255462646484375, -3.15545654296875, -3.055450439453125, -2.9554443359375, -2.855438232421875, -2.75543212890625, -2.655426025390625, -2.555419921875, -2.455413818359375, -2.35540771484375, -2.255401611328125, -2.1553955078125, -2.055389404296875, -1.95538330078125, -1.855377197265625, -1.75537109375, -1.655364990234375, -1.55535888671875, -1.455352783203125, -1.3553466796875, -1.255340576171875, -1.15533447265625, -1.055328369140625, -0.955322265625, -0.855316162109375, -0.75531005859375, -0.655303955078125, -0.5552978515625, -0.455291748046875, -0.35528564453125, -0.255279541015625, -0.1552734375, -0.055267333984375, 0.04473876953125, 0.144744873046875, 0.2447509765625, 0.344757080078125, 0.44476318359375, 0.544769287109375, 0.644775390625, 0.744781494140625, 0.84478759765625, 0.944793701171875, 1.0447998046875, 1.144805908203125, 1.24481201171875, 1.344818115234375, 1.44482421875, 1.544830322265625, 1.64483642578125, 1.744842529296875, 1.8448486328125, 1.944854736328125, 2.04486083984375, 2.144866943359375, 2.244873046875, 2.344879150390625, 2.44488525390625, 2.544891357421875, 2.6448974609375, 2.744903564453125, 2.84490966796875, 2.944915771484375, 3.044921875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 11.0, 3.0, 6.0, 12.0, 17.0, 29.0, 30.0, 48.0, 47.0, 57.0, 77.0, 92.0, 98.0, 76.0, 95.0, 66.0, 50.0, 39.0, 38.0, 38.0, 22.0, 24.0, 9.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1889190673828125, -1.150299072265625, -1.1116790771484375, -1.07305908203125, -1.0344390869140625, -0.995819091796875, -0.9571990966796875, -0.9185791015625, -0.8799591064453125, -0.841339111328125, -0.8027191162109375, -0.76409912109375, -0.7254791259765625, -0.686859130859375, -0.6482391357421875, -0.609619140625, -0.5709991455078125, -0.532379150390625, -0.4937591552734375, -0.45513916015625, -0.4165191650390625, -0.377899169921875, -0.3392791748046875, -0.3006591796875, -0.2620391845703125, -0.223419189453125, -0.1847991943359375, -0.14617919921875, -0.1075592041015625, -0.068939208984375, -0.0303192138671875, 0.00830078125, 0.0469207763671875, 0.085540771484375, 0.1241607666015625, 0.16278076171875, 0.2014007568359375, 0.240020751953125, 0.2786407470703125, 0.3172607421875, 0.3558807373046875, 0.394500732421875, 0.4331207275390625, 0.47174072265625, 0.5103607177734375, 0.548980712890625, 0.5876007080078125, 0.626220703125, 0.6648406982421875, 0.703460693359375, 0.7420806884765625, 0.78070068359375, 0.8193206787109375, 0.857940673828125, 0.8965606689453125, 0.9351806640625, 0.9738006591796875, 1.012420654296875, 1.0510406494140625, 1.08966064453125, 1.1282806396484375, 1.166900634765625, 1.2055206298828125, 1.244140625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 7.0, 6.0, 12.0, 9.0, 24.0, 41.0, 66.0, 145.0, 261.0, 585.0, 1511.0, 4606.0, 22111.0, 741533.0, 3382705.0, 31462.0, 6049.0, 1757.0, 732.0, 311.0, 151.0, 70.0, 49.0, 23.0, 21.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.074951171875, -2.98974609375, -2.904541015625, -2.8193359375, -2.734130859375, -2.64892578125, -2.563720703125, -2.478515625, -2.393310546875, -2.30810546875, -2.222900390625, -2.1376953125, -2.052490234375, -1.96728515625, -1.882080078125, -1.796875, -1.711669921875, -1.62646484375, -1.541259765625, -1.4560546875, -1.370849609375, -1.28564453125, -1.200439453125, -1.115234375, -1.030029296875, -0.94482421875, -0.859619140625, -0.7744140625, -0.689208984375, -0.60400390625, -0.518798828125, -0.43359375, -0.348388671875, -0.26318359375, -0.177978515625, -0.0927734375, -0.007568359375, 0.07763671875, 0.162841796875, 0.248046875, 0.333251953125, 0.41845703125, 0.503662109375, 0.5888671875, 0.674072265625, 0.75927734375, 0.844482421875, 0.9296875, 1.014892578125, 1.10009765625, 1.185302734375, 1.2705078125, 1.355712890625, 1.44091796875, 1.526123046875, 1.611328125, 1.696533203125, 1.78173828125, 1.866943359375, 1.9521484375, 2.037353515625, 2.12255859375, 2.207763671875, 2.29296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 8.0, 8.0, 12.0, 9.0, 19.0, 24.0, 25.0, 60.0, 122.0, 305.0, 953.0, 1550.0, 536.0, 207.0, 86.0, 43.0, 31.0, 19.0, 17.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5350570678710938, -0.5154266357421875, -0.49579620361328125, -0.476165771484375, -0.45653533935546875, -0.4369049072265625, -0.41727447509765625, -0.39764404296875, -0.37801361083984375, -0.3583831787109375, -0.33875274658203125, -0.319122314453125, -0.29949188232421875, -0.2798614501953125, -0.26023101806640625, -0.2406005859375, -0.22097015380859375, -0.2013397216796875, -0.18170928955078125, -0.162078857421875, -0.14244842529296875, -0.1228179931640625, -0.10318756103515625, -0.08355712890625, -0.06392669677734375, -0.0442962646484375, -0.02466583251953125, -0.005035400390625, 0.01459503173828125, 0.0342254638671875, 0.05385589599609375, 0.073486328125, 0.09311676025390625, 0.1127471923828125, 0.13237762451171875, 0.152008056640625, 0.17163848876953125, 0.1912689208984375, 0.21089935302734375, 0.23052978515625, 0.25016021728515625, 0.2697906494140625, 0.28942108154296875, 0.309051513671875, 0.32868194580078125, 0.3483123779296875, 0.36794281005859375, 0.3875732421875, 0.40720367431640625, 0.4268341064453125, 0.44646453857421875, 0.466094970703125, 0.48572540283203125, 0.5053558349609375, 0.5249862670898438, 0.54461669921875, 0.5642471313476562, 0.5838775634765625, 0.6035079956054688, 0.623138427734375, 0.6427688598632812, 0.6623992919921875, 0.6820297241210938, 0.70166015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 10.0, 19.0, 32.0, 47.0, 89.0, 143.0, 198.0, 194.0, 97.0, 59.0, 38.0, 23.0, 15.0, 15.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3228342533111572, -3.2410762310028076, -3.159317970275879, -3.0775599479675293, -2.9958016872406006, -2.914043664932251, -2.8322854042053223, -2.7505273818969727, -2.668769359588623, -2.5870113372802734, -2.5052530765533447, -2.423495054244995, -2.3417367935180664, -2.259978771209717, -2.178220748901367, -2.0964624881744385, -2.0147042274475098, -1.9329460859298706, -1.8511879444122314, -1.7694299221038818, -1.6876717805862427, -1.6059136390686035, -1.5241554975509644, -1.4423973560333252, -1.3606393337249756, -1.2788811922073364, -1.1971230506896973, -1.1153650283813477, -1.0336068868637085, -0.9518487453460693, -0.8700906038284302, -0.7883325219154358, -0.7065744400024414, -0.6248162984848022, -0.5430582165718079, -0.4613000750541687, -0.37954196333885193, -0.29778385162353516, -0.216025710105896, -0.1342676281929016, -0.05250948667526245, 0.029248632490634918, 0.11100675165653229, 0.19276487827301025, 0.274522989988327, 0.3562811017036438, 0.43803924322128296, 0.5197973251342773, 0.6015554666519165, 0.6833136081695557, 0.76507169008255, 0.8468298316001892, 0.9285879135131836, 1.0103460550308228, 1.092104196548462, 1.1738622188568115, 1.2556204795837402, 1.3373786211013794, 1.4191367626190186, 1.5008947849273682, 1.5826529264450073, 1.6644110679626465, 1.7461692094802856, 1.8279273509979248, 1.9096853733062744]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 3.0, 11.0, 15.0, 15.0, 15.0, 28.0, 29.0, 27.0, 41.0, 29.0, 49.0, 56.0, 60.0, 44.0, 53.0, 50.0, 53.0, 61.0, 48.0, 46.0, 45.0, 38.0, 34.0, 32.0, 22.0, 15.0, 14.0, 13.0, 8.0, 12.0, 11.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0057085752487183, -0.9715639352798462, -0.9374192357063293, -0.9032745957374573, -0.8691298961639404, -0.8349852561950684, -0.8008406162261963, -0.7666959762573242, -0.7325512766838074, -0.6984066367149353, -0.6642619371414185, -0.6301172971725464, -0.5959726572036743, -0.5618279576301575, -0.5276833176612854, -0.49353864789009094, -0.4593939781188965, -0.425249308347702, -0.39110463857650757, -0.3569599986076355, -0.32281532883644104, -0.2886706590652466, -0.2545260190963745, -0.22038134932518005, -0.1862366795539856, -0.15209200978279114, -0.11794735491275787, -0.08380269259214401, -0.04965803027153015, -0.015513360500335693, 0.01863129436969757, 0.052775949239730835, 0.08692061901092529, 0.12106528133153915, 0.15520994365215302, 0.18935459852218628, 0.22349926829338074, 0.2576439380645752, 0.29178857803344727, 0.3259332478046417, 0.3600779175758362, 0.39422258734703064, 0.4283672571182251, 0.46251189708709717, 0.4966565668582916, 0.5308012366294861, 0.5649458765983582, 0.599090576171875, 0.6332352161407471, 0.6673798561096191, 0.701524555683136, 0.7356691956520081, 0.7698138952255249, 0.803958535194397, 0.838103175163269, 0.8722478151321411, 0.906392514705658, 0.94053715467453, 0.9746818542480469, 1.008826494216919, 1.042971134185791, 1.077115774154663, 1.1112605333328247, 1.1454051733016968, 1.1795498132705688]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 1.0, 8.0, 8.0, 18.0, 27.0, 38.0, 51.0, 125.0, 188.0, 320.0, 610.0, 1244.0, 2685.0, 7043.0, 25783.0, 331371.0, 629034.0, 35328.0, 8512.0, 3169.0, 1397.0, 681.0, 358.0, 229.0, 115.0, 68.0, 50.0, 24.0, 23.0, 16.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7705078125, -0.747222900390625, -0.72393798828125, -0.700653076171875, -0.6773681640625, -0.654083251953125, -0.63079833984375, -0.607513427734375, -0.584228515625, -0.560943603515625, -0.53765869140625, -0.514373779296875, -0.4910888671875, -0.467803955078125, -0.44451904296875, -0.421234130859375, -0.39794921875, -0.374664306640625, -0.35137939453125, -0.328094482421875, -0.3048095703125, -0.281524658203125, -0.25823974609375, -0.234954833984375, -0.211669921875, -0.188385009765625, -0.16510009765625, -0.141815185546875, -0.1185302734375, -0.095245361328125, -0.07196044921875, -0.048675537109375, -0.025390625, -0.002105712890625, 0.02117919921875, 0.044464111328125, 0.0677490234375, 0.091033935546875, 0.11431884765625, 0.137603759765625, 0.160888671875, 0.184173583984375, 0.20745849609375, 0.230743408203125, 0.2540283203125, 0.277313232421875, 0.30059814453125, 0.323883056640625, 0.34716796875, 0.370452880859375, 0.39373779296875, 0.417022705078125, 0.4403076171875, 0.463592529296875, 0.48687744140625, 0.510162353515625, 0.533447265625, 0.556732177734375, 0.58001708984375, 0.603302001953125, 0.6265869140625, 0.649871826171875, 0.67315673828125, 0.696441650390625, 0.7197265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 11.0, 13.0, 11.0, 27.0, 27.0, 45.0, 40.0, 36.0, 69.0, 75.0, 69.0, 69.0, 65.0, 72.0, 61.0, 62.0, 56.0, 47.0, 32.0, 25.0, 15.0, 10.0, 17.0, 14.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0458984375, -1.0159378051757812, -0.9859771728515625, -0.9560165405273438, -0.926055908203125, -0.8960952758789062, -0.8661346435546875, -0.8361740112304688, -0.80621337890625, -0.7762527465820312, -0.7462921142578125, -0.7163314819335938, -0.686370849609375, -0.6564102172851562, -0.6264495849609375, -0.5964889526367188, -0.5665283203125, -0.5365676879882812, -0.5066070556640625, -0.47664642333984375, -0.446685791015625, -0.41672515869140625, -0.3867645263671875, -0.35680389404296875, -0.32684326171875, -0.29688262939453125, -0.2669219970703125, -0.23696136474609375, -0.207000732421875, -0.17704010009765625, -0.1470794677734375, -0.11711883544921875, -0.087158203125, -0.05719757080078125, -0.0272369384765625, 0.00272369384765625, 0.032684326171875, 0.06264495849609375, 0.0926055908203125, 0.12256622314453125, 0.15252685546875, 0.18248748779296875, 0.2124481201171875, 0.24240875244140625, 0.272369384765625, 0.30233001708984375, 0.3322906494140625, 0.36225128173828125, 0.3922119140625, 0.42217254638671875, 0.4521331787109375, 0.48209381103515625, 0.512054443359375, 0.5420150756835938, 0.5719757080078125, 0.6019363403320312, 0.63189697265625, 0.6618576049804688, 0.6918182373046875, 0.7217788696289062, 0.751739501953125, 0.7817001342773438, 0.8116607666015625, 0.8416213989257812, 0.87158203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 4.0, 10.0, 13.0, 26.0, 29.0, 46.0, 78.0, 130.0, 210.0, 355.0, 686.0, 1357.0, 3040.0, 7381.0, 23880.0, 174959.0, 726814.0, 83043.0, 16053.0, 5517.0, 2391.0, 1089.0, 612.0, 326.0, 157.0, 97.0, 66.0, 42.0, 23.0, 29.0, 9.0, 17.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.46728515625, -0.45368194580078125, -0.4400787353515625, -0.42647552490234375, -0.412872314453125, -0.39926910400390625, -0.3856658935546875, -0.37206268310546875, -0.35845947265625, -0.34485626220703125, -0.3312530517578125, -0.31764984130859375, -0.304046630859375, -0.29044342041015625, -0.2768402099609375, -0.26323699951171875, -0.2496337890625, -0.23603057861328125, -0.2224273681640625, -0.20882415771484375, -0.195220947265625, -0.18161773681640625, -0.1680145263671875, -0.15441131591796875, -0.14080810546875, -0.12720489501953125, -0.1136016845703125, -0.09999847412109375, -0.086395263671875, -0.07279205322265625, -0.0591888427734375, -0.04558563232421875, -0.031982421875, -0.01837921142578125, -0.0047760009765625, 0.00882720947265625, 0.022430419921875, 0.03603363037109375, 0.0496368408203125, 0.06324005126953125, 0.07684326171875, 0.09044647216796875, 0.1040496826171875, 0.11765289306640625, 0.131256103515625, 0.14485931396484375, 0.1584625244140625, 0.17206573486328125, 0.1856689453125, 0.19927215576171875, 0.2128753662109375, 0.22647857666015625, 0.240081787109375, 0.25368499755859375, 0.2672882080078125, 0.28089141845703125, 0.29449462890625, 0.30809783935546875, 0.3217010498046875, 0.33530426025390625, 0.348907470703125, 0.36251068115234375, 0.3761138916015625, 0.38971710205078125, 0.4033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 7.0, 7.0, 10.0, 8.0, 19.0, 24.0, 20.0, 18.0, 32.0, 29.0, 29.0, 37.0, 44.0, 47.0, 44.0, 39.0, 46.0, 46.0, 58.0, 34.0, 42.0, 45.0, 27.0, 49.0, 46.0, 27.0, 30.0, 26.0, 24.0, 13.0, 13.0, 8.0, 12.0, 9.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.212890625, -1.1720123291015625, -1.131134033203125, -1.0902557373046875, -1.04937744140625, -1.0084991455078125, -0.967620849609375, -0.9267425537109375, -0.8858642578125, -0.8449859619140625, -0.804107666015625, -0.7632293701171875, -0.72235107421875, -0.6814727783203125, -0.640594482421875, -0.5997161865234375, -0.558837890625, -0.5179595947265625, -0.477081298828125, -0.4362030029296875, -0.39532470703125, -0.3544464111328125, -0.313568115234375, -0.2726898193359375, -0.2318115234375, -0.1909332275390625, -0.150054931640625, -0.1091766357421875, -0.06829833984375, -0.0274200439453125, 0.013458251953125, 0.0543365478515625, 0.09521484375, 0.1360931396484375, 0.176971435546875, 0.2178497314453125, 0.25872802734375, 0.2996063232421875, 0.340484619140625, 0.3813629150390625, 0.4222412109375, 0.4631195068359375, 0.503997802734375, 0.5448760986328125, 0.58575439453125, 0.6266326904296875, 0.667510986328125, 0.7083892822265625, 0.749267578125, 0.7901458740234375, 0.831024169921875, 0.8719024658203125, 0.91278076171875, 0.9536590576171875, 0.994537353515625, 1.0354156494140625, 1.0762939453125, 1.1171722412109375, 1.158050537109375, 1.1989288330078125, 1.23980712890625, 1.2806854248046875, 1.321563720703125, 1.3624420166015625, 1.4033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 8.0, 14.0, 18.0, 41.0, 43.0, 78.0, 94.0, 165.0, 232.0, 332.0, 567.0, 945.0, 1649.0, 3130.0, 6716.0, 19275.0, 84589.0, 621443.0, 248304.0, 39653.0, 11095.0, 4596.0, 2179.0, 1256.0, 768.0, 430.0, 314.0, 197.0, 106.0, 88.0, 61.0, 47.0, 30.0, 22.0, 12.0, 12.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07757568359375, -0.07505416870117188, -0.07253265380859375, -0.07001113891601562, -0.0674896240234375, -0.06496810913085938, -0.06244659423828125, -0.059925079345703125, -0.057403564453125, -0.054882049560546875, -0.05236053466796875, -0.049839019775390625, -0.0473175048828125, -0.044795989990234375, -0.04227447509765625, -0.039752960205078125, -0.0372314453125, -0.034709930419921875, -0.03218841552734375, -0.029666900634765625, -0.0271453857421875, -0.024623870849609375, -0.02210235595703125, -0.019580841064453125, -0.017059326171875, -0.014537811279296875, -0.01201629638671875, -0.009494781494140625, -0.0069732666015625, -0.004451751708984375, -0.00193023681640625, 0.000591278076171875, 0.00311279296875, 0.005634307861328125, 0.00815582275390625, 0.010677337646484375, 0.0131988525390625, 0.015720367431640625, 0.01824188232421875, 0.020763397216796875, 0.023284912109375, 0.025806427001953125, 0.02832794189453125, 0.030849456787109375, 0.0333709716796875, 0.035892486572265625, 0.03841400146484375, 0.040935516357421875, 0.04345703125, 0.045978546142578125, 0.04850006103515625, 0.051021575927734375, 0.0535430908203125, 0.056064605712890625, 0.05858612060546875, 0.061107635498046875, 0.063629150390625, 0.06615066528320312, 0.06867218017578125, 0.07119369506835938, 0.0737152099609375, 0.07623672485351562, 0.07875823974609375, 0.08127975463867188, 0.08380126953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 20.0, 33.0, 54.0, 79.0, 107.0, 198.0, 174.0, 126.0, 62.0, 35.0, 30.0, 13.0, 11.0, 13.0, 4.0, 7.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97834587097168e-05, -5.797017365694046e-05, -5.6156888604164124e-05, -5.434360355138779e-05, -5.253031849861145e-05, -5.0717033445835114e-05, -4.890374839305878e-05, -4.709046334028244e-05, -4.5277178287506104e-05, -4.346389323472977e-05, -4.165060818195343e-05, -3.9837323129177094e-05, -3.802403807640076e-05, -3.621075302362442e-05, -3.4397467970848083e-05, -3.258418291807175e-05, -3.077089786529541e-05, -2.8957612812519073e-05, -2.7144327759742737e-05, -2.53310427069664e-05, -2.3517757654190063e-05, -2.1704472601413727e-05, -1.989118754863739e-05, -1.8077902495861053e-05, -1.6264617443084717e-05, -1.445133239030838e-05, -1.2638047337532043e-05, -1.0824762284755707e-05, -9.01147723197937e-06, -7.1981921792030334e-06, -5.384907126426697e-06, -3.57162207365036e-06, -1.7583370208740234e-06, 5.494803190231323e-08, 1.86823308467865e-06, 3.6815181374549866e-06, 5.494803190231323e-06, 7.30808824300766e-06, 9.121373295783997e-06, 1.0934658348560333e-05, 1.274794340133667e-05, 1.4561228454113007e-05, 1.6374513506889343e-05, 1.818779855966568e-05, 2.0001083612442017e-05, 2.1814368665218353e-05, 2.362765371799469e-05, 2.5440938770771027e-05, 2.7254223823547363e-05, 2.90675088763237e-05, 3.088079392910004e-05, 3.269407898187637e-05, 3.450736403465271e-05, 3.632064908742905e-05, 3.813393414020538e-05, 3.994721919298172e-05, 4.176050424575806e-05, 4.357378929853439e-05, 4.538707435131073e-05, 4.720035940408707e-05, 4.90136444568634e-05, 5.082692950963974e-05, 5.264021456241608e-05, 5.445349961519241e-05, 5.626678466796875e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 13.0, 15.0, 29.0, 25.0, 33.0, 55.0, 92.0, 151.0, 218.0, 341.0, 528.0, 986.0, 1756.0, 3372.0, 6967.0, 16221.0, 44395.0, 156668.0, 530194.0, 198350.0, 53153.0, 18460.0, 7972.0, 3808.0, 1944.0, 1099.0, 610.0, 373.0, 232.0, 152.0, 98.0, 70.0, 53.0, 28.0, 23.0, 16.0, 4.0, 7.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.07537841796875, -0.07325983047485352, -0.07114124298095703, -0.06902265548706055, -0.06690406799316406, -0.06478548049926758, -0.0626668930053711, -0.06054830551147461, -0.058429718017578125, -0.05631113052368164, -0.054192543029785156, -0.05207395553588867, -0.04995536804199219, -0.0478367805480957, -0.04571819305419922, -0.043599605560302734, -0.04148101806640625, -0.039362430572509766, -0.03724384307861328, -0.0351252555847168, -0.03300666809082031, -0.030888080596923828, -0.028769493103027344, -0.02665090560913086, -0.024532318115234375, -0.02241373062133789, -0.020295143127441406, -0.018176555633544922, -0.016057968139648438, -0.013939380645751953, -0.011820793151855469, -0.009702205657958984, -0.0075836181640625, -0.005465030670166016, -0.0033464431762695312, -0.0012278556823730469, 0.0008907318115234375, 0.003009319305419922, 0.005127906799316406, 0.007246494293212891, 0.009365081787109375, 0.01148366928100586, 0.013602256774902344, 0.015720844268798828, 0.017839431762695312, 0.019958019256591797, 0.02207660675048828, 0.024195194244384766, 0.02631378173828125, 0.028432369232177734, 0.03055095672607422, 0.0326695442199707, 0.03478813171386719, 0.03690671920776367, 0.039025306701660156, 0.04114389419555664, 0.043262481689453125, 0.04538106918334961, 0.047499656677246094, 0.04961824417114258, 0.05173683166503906, 0.05385541915893555, 0.05597400665283203, 0.058092594146728516, 0.060211181640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 3.0, 6.0, 16.0, 19.0, 11.0, 18.0, 37.0, 39.0, 44.0, 54.0, 57.0, 88.0, 104.0, 120.0, 75.0, 60.0, 49.0, 30.0, 31.0, 20.0, 21.0, 20.0, 11.0, 7.0, 10.0, 10.0, 8.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186614990234375, -0.018013715744018555, -0.01736593246459961, -0.016718149185180664, -0.01607036590576172, -0.015422582626342773, -0.014774799346923828, -0.014127016067504883, -0.013479232788085938, -0.012831449508666992, -0.012183666229248047, -0.011535882949829102, -0.010888099670410156, -0.010240316390991211, -0.009592533111572266, -0.00894474983215332, -0.008296966552734375, -0.00764918327331543, -0.007001399993896484, -0.006353616714477539, -0.005705833435058594, -0.0050580501556396484, -0.004410266876220703, -0.003762483596801758, -0.0031147003173828125, -0.002466917037963867, -0.0018191337585449219, -0.0011713504791259766, -0.0005235671997070312, 0.00012421607971191406, 0.0007719993591308594, 0.0014197826385498047, 0.00206756591796875, 0.0027153491973876953, 0.0033631324768066406, 0.004010915756225586, 0.004658699035644531, 0.0053064823150634766, 0.005954265594482422, 0.006602048873901367, 0.0072498321533203125, 0.007897615432739258, 0.008545398712158203, 0.009193181991577148, 0.009840965270996094, 0.010488748550415039, 0.011136531829833984, 0.01178431510925293, 0.012432098388671875, 0.01307988166809082, 0.013727664947509766, 0.014375448226928711, 0.015023231506347656, 0.0156710147857666, 0.016318798065185547, 0.016966581344604492, 0.017614364624023438, 0.018262147903442383, 0.018909931182861328, 0.019557714462280273, 0.02020549774169922, 0.020853281021118164, 0.02150106430053711, 0.022148847579956055, 0.022796630859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 13.0, 10.0, 27.0, 41.0, 52.0, 81.0, 124.0, 143.0, 146.0, 111.0, 73.0, 49.0, 30.0, 17.0, 19.0, 10.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.304758071899414, -1.2662726640701294, -1.2277873754501343, -1.1893019676208496, -1.150816559791565, -1.1123311519622803, -1.0738458633422852, -1.0353604555130005, -0.9968751072883606, -0.9583897590637207, -0.919904351234436, -0.8814190030097961, -0.8429336547851562, -0.8044482469558716, -0.7659628987312317, -0.7274775505065918, -0.6889921426773071, -0.6505067944526672, -0.6120213866233826, -0.5735360383987427, -0.535050630569458, -0.4965652823448181, -0.4580799341201782, -0.41959455609321594, -0.38110917806625366, -0.3426238000392914, -0.3041384220123291, -0.2656530737876892, -0.22716769576072693, -0.18868231773376465, -0.15019695460796356, -0.11171159148216248, -0.07322633266448975, -0.03474096208810806, 0.0037444084882736206, 0.042229779064655304, 0.08071514964103699, 0.11920052766799927, 0.15768589079380035, 0.19617125391960144, 0.23465663194656372, 0.273142009973526, 0.3116273880004883, 0.3501127362251282, 0.38859811425209045, 0.42708349227905273, 0.4655688405036926, 0.5040541887283325, 0.5425395965576172, 0.5810249447822571, 0.6195103526115417, 0.6579957008361816, 0.6964811086654663, 0.7349664568901062, 0.7734518051147461, 0.8119372129440308, 0.8504225611686707, 0.8889079093933105, 0.9273933172225952, 0.9658786654472351, 1.004364013671875, 1.0428494215011597, 1.0813348293304443, 1.1198201179504395, 1.1583055257797241]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 10.0, 5.0, 8.0, 19.0, 9.0, 17.0, 28.0, 32.0, 37.0, 44.0, 43.0, 67.0, 67.0, 56.0, 56.0, 63.0, 69.0, 62.0, 45.0, 58.0, 39.0, 39.0, 31.0, 20.0, 9.0, 19.0, 19.0, 8.0, 9.0, 9.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9158645868301392, -0.8896703720092773, -0.8634761571884155, -0.8372819423675537, -0.8110877275466919, -0.7848935127258301, -0.7586992383003235, -0.7325050234794617, -0.7063108086585999, -0.680116593837738, -0.6539223790168762, -0.6277281641960144, -0.6015338897705078, -0.575339674949646, -0.5491454601287842, -0.5229512453079224, -0.49675703048706055, -0.47056281566619873, -0.4443686008453369, -0.4181743562221527, -0.3919801414012909, -0.3657859265804291, -0.3395916819572449, -0.31339746713638306, -0.28720325231552124, -0.2610090374946594, -0.2348148077726364, -0.2086205780506134, -0.1824263632297516, -0.15623214840888977, -0.13003791868686676, -0.10384368896484375, -0.07764947414398193, -0.05145525187253952, -0.025261029601097107, 0.0009331926703453064, 0.02712741494178772, 0.053321629762649536, 0.07951585948467255, 0.10571008920669556, 0.13190430402755737, 0.1580985188484192, 0.1842927485704422, 0.2104869782924652, 0.23668119311332703, 0.26287540793418884, 0.28906965255737305, 0.31526386737823486, 0.3414580821990967, 0.3676522970199585, 0.3938465118408203, 0.4200407564640045, 0.44623497128486633, 0.47242918610572815, 0.49862343072891235, 0.5248176455497742, 0.551011860370636, 0.5772060751914978, 0.6034002900123596, 0.6295945048332214, 0.655788779258728, 0.6819829940795898, 0.7081772089004517, 0.7343714237213135, 0.7605656385421753]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 11.0, 9.0, 14.0, 17.0, 25.0, 25.0, 48.0, 71.0, 105.0, 158.0, 245.0, 367.0, 578.0, 1086.0, 2016.0, 4324.0, 10959.0, 40761.0, 422892.0, 500046.0, 43922.0, 11549.0, 4357.0, 2091.0, 1102.0, 659.0, 378.0, 236.0, 164.0, 90.0, 71.0, 50.0, 27.0, 30.0, 17.0, 17.0, 12.0, 10.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7343902587890625, -0.711456298828125, -0.6885223388671875, -0.66558837890625, -0.6426544189453125, -0.619720458984375, -0.5967864990234375, -0.5738525390625, -0.5509185791015625, -0.527984619140625, -0.5050506591796875, -0.48211669921875, -0.4591827392578125, -0.436248779296875, -0.4133148193359375, -0.390380859375, -0.3674468994140625, -0.344512939453125, -0.3215789794921875, -0.29864501953125, -0.2757110595703125, -0.252777099609375, -0.2298431396484375, -0.2069091796875, -0.1839752197265625, -0.161041259765625, -0.1381072998046875, -0.11517333984375, -0.0922393798828125, -0.069305419921875, -0.0463714599609375, -0.0234375, -0.0005035400390625, 0.022430419921875, 0.0453643798828125, 0.06829833984375, 0.0912322998046875, 0.114166259765625, 0.1371002197265625, 0.1600341796875, 0.1829681396484375, 0.205902099609375, 0.2288360595703125, 0.25177001953125, 0.2747039794921875, 0.297637939453125, 0.3205718994140625, 0.343505859375, 0.3664398193359375, 0.389373779296875, 0.4123077392578125, 0.43524169921875, 0.4581756591796875, 0.481109619140625, 0.5040435791015625, 0.5269775390625, 0.5499114990234375, 0.572845458984375, 0.5957794189453125, 0.61871337890625, 0.6416473388671875, 0.664581298828125, 0.6875152587890625, 0.71044921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 3.0, 10.0, 8.0, 13.0, 12.0, 19.0, 23.0, 26.0, 38.0, 44.0, 38.0, 55.0, 55.0, 56.0, 45.0, 73.0, 81.0, 60.0, 55.0, 49.0, 48.0, 34.0, 31.0, 26.0, 17.0, 20.0, 8.0, 9.0, 12.0, 9.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.6640625, -1.61419677734375, -1.5643310546875, -1.51446533203125, -1.464599609375, -1.41473388671875, -1.3648681640625, -1.31500244140625, -1.26513671875, -1.21527099609375, -1.1654052734375, -1.11553955078125, -1.065673828125, -1.01580810546875, -0.9659423828125, -0.91607666015625, -0.8662109375, -0.81634521484375, -0.7664794921875, -0.71661376953125, -0.666748046875, -0.61688232421875, -0.5670166015625, -0.51715087890625, -0.46728515625, -0.41741943359375, -0.3675537109375, -0.31768798828125, -0.267822265625, -0.21795654296875, -0.1680908203125, -0.11822509765625, -0.068359375, -0.01849365234375, 0.0313720703125, 0.08123779296875, 0.131103515625, 0.18096923828125, 0.2308349609375, 0.28070068359375, 0.33056640625, 0.38043212890625, 0.4302978515625, 0.48016357421875, 0.530029296875, 0.57989501953125, 0.6297607421875, 0.67962646484375, 0.7294921875, 0.77935791015625, 0.8292236328125, 0.87908935546875, 0.928955078125, 0.97882080078125, 1.0286865234375, 1.07855224609375, 1.12841796875, 1.17828369140625, 1.2281494140625, 1.27801513671875, 1.327880859375, 1.37774658203125, 1.4276123046875, 1.47747802734375, 1.52734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 10.0, 11.0, 13.0, 11.0, 16.0, 19.0, 14.0, 21.0, 16.0, 29.0, 45.0, 54.0, 73.0, 175.0, 335.0, 1132.0, 8879.0, 956885.0, 76253.0, 3299.0, 582.0, 237.0, 111.0, 74.0, 34.0, 38.0, 34.0, 25.0, 22.0, 19.0, 10.0, 20.0, 10.0, 7.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.275390625, -2.20147705078125, -2.1275634765625, -2.05364990234375, -1.979736328125, -1.90582275390625, -1.8319091796875, -1.75799560546875, -1.68408203125, -1.61016845703125, -1.5362548828125, -1.46234130859375, -1.388427734375, -1.31451416015625, -1.2406005859375, -1.16668701171875, -1.0927734375, -1.01885986328125, -0.9449462890625, -0.87103271484375, -0.797119140625, -0.72320556640625, -0.6492919921875, -0.57537841796875, -0.50146484375, -0.42755126953125, -0.3536376953125, -0.27972412109375, -0.205810546875, -0.13189697265625, -0.0579833984375, 0.01593017578125, 0.08984375, 0.16375732421875, 0.2376708984375, 0.31158447265625, 0.385498046875, 0.45941162109375, 0.5333251953125, 0.60723876953125, 0.68115234375, 0.75506591796875, 0.8289794921875, 0.90289306640625, 0.976806640625, 1.05072021484375, 1.1246337890625, 1.19854736328125, 1.2724609375, 1.34637451171875, 1.4202880859375, 1.49420166015625, 1.568115234375, 1.64202880859375, 1.7159423828125, 1.78985595703125, 1.86376953125, 1.93768310546875, 2.0115966796875, 2.08551025390625, 2.159423828125, 2.23333740234375, 2.3072509765625, 2.38116455078125, 2.455078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 10.0, 11.0, 8.0, 16.0, 10.0, 9.0, 20.0, 24.0, 24.0, 28.0, 28.0, 31.0, 38.0, 31.0, 36.0, 42.0, 39.0, 35.0, 54.0, 56.0, 45.0, 45.0, 41.0, 38.0, 27.0, 42.0, 29.0, 30.0, 26.0, 23.0, 11.0, 17.0, 15.0, 13.0, 13.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.4541015625, -1.4105987548828125, -1.367095947265625, -1.3235931396484375, -1.28009033203125, -1.2365875244140625, -1.193084716796875, -1.1495819091796875, -1.1060791015625, -1.0625762939453125, -1.019073486328125, -0.9755706787109375, -0.93206787109375, -0.8885650634765625, -0.845062255859375, -0.8015594482421875, -0.758056640625, -0.7145538330078125, -0.671051025390625, -0.6275482177734375, -0.58404541015625, -0.5405426025390625, -0.497039794921875, -0.4535369873046875, -0.4100341796875, -0.3665313720703125, -0.323028564453125, -0.2795257568359375, -0.23602294921875, -0.1925201416015625, -0.149017333984375, -0.1055145263671875, -0.06201171875, -0.0185089111328125, 0.024993896484375, 0.0684967041015625, 0.11199951171875, 0.1555023193359375, 0.199005126953125, 0.2425079345703125, 0.2860107421875, 0.3295135498046875, 0.373016357421875, 0.4165191650390625, 0.46002197265625, 0.5035247802734375, 0.547027587890625, 0.5905303955078125, 0.634033203125, 0.6775360107421875, 0.721038818359375, 0.7645416259765625, 0.80804443359375, 0.8515472412109375, 0.895050048828125, 0.9385528564453125, 0.9820556640625, 1.0255584716796875, 1.069061279296875, 1.1125640869140625, 1.15606689453125, 1.1995697021484375, 1.243072509765625, 1.2865753173828125, 1.330078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 11.0, 10.0, 20.0, 24.0, 46.0, 76.0, 172.0, 364.0, 948.0, 2925.0, 12579.0, 139968.0, 849730.0, 33564.0, 5507.0, 1490.0, 537.0, 253.0, 111.0, 61.0, 39.0, 25.0, 20.0, 16.0, 9.0, 10.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3818359375, -0.3703498840332031, -0.35886383056640625, -0.3473777770996094, -0.3358917236328125, -0.3244056701660156, -0.31291961669921875, -0.3014335632324219, -0.289947509765625, -0.2784614562988281, -0.26697540283203125, -0.2554893493652344, -0.2440032958984375, -0.23251724243164062, -0.22103118896484375, -0.20954513549804688, -0.19805908203125, -0.18657302856445312, -0.17508697509765625, -0.16360092163085938, -0.1521148681640625, -0.14062881469726562, -0.12914276123046875, -0.11765670776367188, -0.106170654296875, -0.09468460083007812, -0.08319854736328125, -0.07171249389648438, -0.0602264404296875, -0.048740386962890625, -0.03725433349609375, -0.025768280029296875, -0.0142822265625, -0.002796173095703125, 0.00868988037109375, 0.020175933837890625, 0.0316619873046875, 0.043148040771484375, 0.05463409423828125, 0.06612014770507812, 0.077606201171875, 0.08909225463867188, 0.10057830810546875, 0.11206436157226562, 0.1235504150390625, 0.13503646850585938, 0.14652252197265625, 0.15800857543945312, 0.16949462890625, 0.18098068237304688, 0.19246673583984375, 0.20395278930664062, 0.2154388427734375, 0.22692489624023438, 0.23841094970703125, 0.24989700317382812, 0.261383056640625, 0.2728691101074219, 0.28435516357421875, 0.2958412170410156, 0.3073272705078125, 0.3188133239746094, 0.33029937744140625, 0.3417854309082031, 0.353271484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 11.0, 18.0, 34.0, 43.0, 91.0, 256.0, 301.0, 91.0, 54.0, 28.0, 13.0, 12.0, 12.0, 8.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.240606307983398e-05, -6.0395337641239166e-05, -5.838461220264435e-05, -5.637388676404953e-05, -5.436316132545471e-05, -5.2352435886859894e-05, -5.0341710448265076e-05, -4.833098500967026e-05, -4.632025957107544e-05, -4.430953413248062e-05, -4.22988086938858e-05, -4.0288083255290985e-05, -3.827735781669617e-05, -3.626663237810135e-05, -3.425590693950653e-05, -3.224518150091171e-05, -3.0234456062316895e-05, -2.8223730623722076e-05, -2.6213005185127258e-05, -2.420227974653244e-05, -2.2191554307937622e-05, -2.0180828869342804e-05, -1.8170103430747986e-05, -1.6159377992153168e-05, -1.414865255355835e-05, -1.2137927114963531e-05, -1.0127201676368713e-05, -8.116476237773895e-06, -6.105750799179077e-06, -4.095025360584259e-06, -2.084299921989441e-06, -7.35744833946228e-08, 1.9371509552001953e-06, 3.9478763937950134e-06, 5.9586018323898315e-06, 7.96932727098465e-06, 9.980052709579468e-06, 1.1990778148174286e-05, 1.4001503586769104e-05, 1.6012229025363922e-05, 1.802295446395874e-05, 2.003367990255356e-05, 2.2044405341148376e-05, 2.4055130779743195e-05, 2.6065856218338013e-05, 2.807658165693283e-05, 3.008730709552765e-05, 3.209803253412247e-05, 3.4108757972717285e-05, 3.61194834113121e-05, 3.813020884990692e-05, 4.014093428850174e-05, 4.215165972709656e-05, 4.4162385165691376e-05, 4.6173110604286194e-05, 4.818383604288101e-05, 5.019456148147583e-05, 5.220528692007065e-05, 5.4216012358665466e-05, 5.6226737797260284e-05, 5.82374632358551e-05, 6.024818867444992e-05, 6.225891411304474e-05, 6.426963955163956e-05, 6.628036499023438e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 9.0, 20.0, 22.0, 36.0, 53.0, 60.0, 148.0, 271.0, 562.0, 1355.0, 5568.0, 44041.0, 915266.0, 71124.0, 6955.0, 1655.0, 626.0, 314.0, 177.0, 104.0, 59.0, 37.0, 19.0, 16.0, 11.0, 2.0, 9.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36767578125, -0.35384368896484375, -0.3400115966796875, -0.32617950439453125, -0.312347412109375, -0.29851531982421875, -0.2846832275390625, -0.27085113525390625, -0.25701904296875, -0.24318695068359375, -0.2293548583984375, -0.21552276611328125, -0.201690673828125, -0.18785858154296875, -0.1740264892578125, -0.16019439697265625, -0.1463623046875, -0.13253021240234375, -0.1186981201171875, -0.10486602783203125, -0.091033935546875, -0.07720184326171875, -0.0633697509765625, -0.04953765869140625, -0.03570556640625, -0.02187347412109375, -0.0080413818359375, 0.00579071044921875, 0.019622802734375, 0.03345489501953125, 0.0472869873046875, 0.06111907958984375, 0.074951171875, 0.08878326416015625, 0.1026153564453125, 0.11644744873046875, 0.130279541015625, 0.14411163330078125, 0.1579437255859375, 0.17177581787109375, 0.18560791015625, 0.19944000244140625, 0.2132720947265625, 0.22710418701171875, 0.240936279296875, 0.25476837158203125, 0.2686004638671875, 0.28243255615234375, 0.2962646484375, 0.31009674072265625, 0.3239288330078125, 0.33776092529296875, 0.351593017578125, 0.36542510986328125, 0.3792572021484375, 0.39308929443359375, 0.40692138671875, 0.42075347900390625, 0.4345855712890625, 0.44841766357421875, 0.462249755859375, 0.47608184814453125, 0.4899139404296875, 0.5037460327148438, 0.517578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 6.0, 12.0, 13.0, 20.0, 48.0, 77.0, 178.0, 373.0, 141.0, 59.0, 35.0, 22.0, 12.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2556629180908203, -0.24863052368164062, -0.24159812927246094, -0.23456573486328125, -0.22753334045410156, -0.22050094604492188, -0.2134685516357422, -0.2064361572265625, -0.1994037628173828, -0.19237136840820312, -0.18533897399902344, -0.17830657958984375, -0.17127418518066406, -0.16424179077148438, -0.1572093963623047, -0.150177001953125, -0.1431446075439453, -0.13611221313476562, -0.12907981872558594, -0.12204742431640625, -0.11501502990722656, -0.10798263549804688, -0.10095024108886719, -0.0939178466796875, -0.08688545227050781, -0.07985305786132812, -0.07282066345214844, -0.06578826904296875, -0.05875587463378906, -0.051723480224609375, -0.04469108581542969, -0.03765869140625, -0.030626296997070312, -0.023593902587890625, -0.016561508178710938, -0.00952911376953125, -0.0024967193603515625, 0.004535675048828125, 0.011568069458007812, 0.0186004638671875, 0.025632858276367188, 0.032665252685546875, 0.03969764709472656, 0.04673004150390625, 0.05376243591308594, 0.060794830322265625, 0.06782722473144531, 0.074859619140625, 0.08189201354980469, 0.08892440795898438, 0.09595680236816406, 0.10298919677734375, 0.11002159118652344, 0.11705398559570312, 0.12408638000488281, 0.1311187744140625, 0.1381511688232422, 0.14518356323242188, 0.15221595764160156, 0.15924835205078125, 0.16628074645996094, 0.17331314086914062, 0.1803455352783203, 0.1873779296875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 12.0, 18.0, 39.0, 100.0, 234.0, 312.0, 151.0, 64.0, 35.0, 17.0, 16.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0284457206726074, -2.8633882999420166, -2.698330879211426, -2.533273696899414, -2.3682162761688232, -2.2031588554382324, -2.0381014347076416, -1.8730441331863403, -1.7079867124557495, -1.5429292917251587, -1.3778719902038574, -1.2128145694732666, -1.0477571487426758, -0.8826998472213745, -0.7176424264907837, -0.5525851249694824, -0.3875277042388916, -0.22247032821178436, -0.057412952184677124, 0.10764443874359131, 0.27270179986953735, 0.4377591609954834, 0.6028165817260742, 0.7678738832473755, 0.9329313039779663, 1.0979887247085571, 1.2630460262298584, 1.4281034469604492, 1.59316086769104, 1.7582181692123413, 1.9232755899429321, 2.0883328914642334, 2.253390312194824, 2.418447732925415, 2.583505153656006, 2.7485623359680176, 2.9136197566986084, 3.078677177429199, 3.24373459815979, 3.408792018890381, 3.5738492012023926, 3.7389066219329834, 3.903964042663574, 4.069021224975586, 4.234078884124756, 4.399136066436768, 4.5641937255859375, 4.729250907897949, 4.894308090209961, 5.059365272521973, 5.224422931671143, 5.389480113983154, 5.554537773132324, 5.719594955444336, 5.884652137756348, 6.049709796905518, 6.2147674560546875, 6.379824638366699, 6.544882297515869, 6.709939479827881, 6.874997138977051, 7.0400543212890625, 7.205111503601074, 7.370169162750244, 7.535226345062256]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 8.0, 11.0, 8.0, 14.0, 12.0, 13.0, 22.0, 20.0, 17.0, 26.0, 26.0, 28.0, 26.0, 32.0, 28.0, 29.0, 28.0, 51.0, 34.0, 33.0, 33.0, 45.0, 38.0, 40.0, 31.0, 26.0, 43.0, 31.0, 32.0, 29.0, 27.0, 14.0, 23.0, 12.0, 10.0, 14.0, 15.0, 11.0, 12.0, 10.0, 6.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.9444060325622559, -1.8847922086715698, -1.8251783847808838, -1.7655645608901978, -1.7059507369995117, -1.6463369131088257, -1.5867230892181396, -1.5271092653274536, -1.4674954414367676, -1.4078816175460815, -1.3482677936553955, -1.2886539697647095, -1.2290401458740234, -1.1694263219833374, -1.1098124980926514, -1.0501986742019653, -0.9905848503112793, -0.9309710264205933, -0.8713572025299072, -0.8117433786392212, -0.7521295547485352, -0.6925157308578491, -0.6329019069671631, -0.573288083076477, -0.513674259185791, -0.454060435295105, -0.39444661140441895, -0.3348327875137329, -0.2752189636230469, -0.21560513973236084, -0.1559913158416748, -0.09637749195098877, -0.036763668060302734, 0.0228501558303833, 0.08246397972106934, 0.14207780361175537, 0.2016916275024414, 0.26130545139312744, 0.3209192752838135, 0.3805330991744995, 0.44014692306518555, 0.4997607469558716, 0.5593745708465576, 0.6189883947372437, 0.6786022186279297, 0.7382160425186157, 0.7978298664093018, 0.8574436902999878, 0.9170575141906738, 0.9766713380813599, 1.036285161972046, 1.095898985862732, 1.155512809753418, 1.215126633644104, 1.27474045753479, 1.334354281425476, 1.393968105316162, 1.4535819292068481, 1.5131957530975342, 1.5728095769882202, 1.6324234008789062, 1.6920372247695923, 1.7516510486602783, 1.8112648725509644, 1.8708786964416504]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 7.0, 16.0, 18.0, 38.0, 35.0, 62.0, 96.0, 151.0, 259.0, 437.0, 757.0, 1415.0, 2520.0, 5225.0, 17767.0, 150203.0, 3615512.0, 364729.0, 21289.0, 7154.0, 2983.0, 1485.0, 818.0, 485.0, 290.0, 170.0, 108.0, 77.0, 47.0, 42.0, 21.0, 17.0, 7.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.846893310546875, -1.78656005859375, -1.726226806640625, -1.6658935546875, -1.605560302734375, -1.54522705078125, -1.484893798828125, -1.424560546875, -1.364227294921875, -1.30389404296875, -1.243560791015625, -1.1832275390625, -1.122894287109375, -1.06256103515625, -1.002227783203125, -0.94189453125, -0.881561279296875, -0.82122802734375, -0.760894775390625, -0.7005615234375, -0.640228271484375, -0.57989501953125, -0.519561767578125, -0.459228515625, -0.398895263671875, -0.33856201171875, -0.278228759765625, -0.2178955078125, -0.157562255859375, -0.09722900390625, -0.036895751953125, 0.0234375, 0.083770751953125, 0.14410400390625, 0.204437255859375, 0.2647705078125, 0.325103759765625, 0.38543701171875, 0.445770263671875, 0.506103515625, 0.566436767578125, 0.62677001953125, 0.687103271484375, 0.7474365234375, 0.807769775390625, 0.86810302734375, 0.928436279296875, 0.98876953125, 1.049102783203125, 1.10943603515625, 1.169769287109375, 1.2301025390625, 1.290435791015625, 1.35076904296875, 1.411102294921875, 1.471435546875, 1.531768798828125, 1.59210205078125, 1.652435302734375, 1.7127685546875, 1.773101806640625, 1.83343505859375, 1.893768310546875, 1.9541015625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 6.0, 8.0, 10.0, 20.0, 19.0, 21.0, 34.0, 47.0, 47.0, 66.0, 60.0, 76.0, 76.0, 77.0, 69.0, 68.0, 65.0, 55.0, 47.0, 29.0, 22.0, 28.0, 17.0, 9.0, 6.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.208984375, -1.1755828857421875, -1.142181396484375, -1.1087799072265625, -1.07537841796875, -1.0419769287109375, -1.008575439453125, -0.9751739501953125, -0.9417724609375, -0.9083709716796875, -0.874969482421875, -0.8415679931640625, -0.80816650390625, -0.7747650146484375, -0.741363525390625, -0.7079620361328125, -0.674560546875, -0.6411590576171875, -0.607757568359375, -0.5743560791015625, -0.54095458984375, -0.5075531005859375, -0.474151611328125, -0.4407501220703125, -0.4073486328125, -0.3739471435546875, -0.340545654296875, -0.3071441650390625, -0.27374267578125, -0.2403411865234375, -0.206939697265625, -0.1735382080078125, -0.14013671875, -0.1067352294921875, -0.073333740234375, -0.0399322509765625, -0.00653076171875, 0.0268707275390625, 0.060272216796875, 0.0936737060546875, 0.1270751953125, 0.1604766845703125, 0.193878173828125, 0.2272796630859375, 0.26068115234375, 0.2940826416015625, 0.327484130859375, 0.3608856201171875, 0.394287109375, 0.4276885986328125, 0.461090087890625, 0.4944915771484375, 0.52789306640625, 0.5612945556640625, 0.594696044921875, 0.6280975341796875, 0.6614990234375, 0.6949005126953125, 0.728302001953125, 0.7617034912109375, 0.79510498046875, 0.8285064697265625, 0.861907958984375, 0.8953094482421875, 0.9287109375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 23.0, 18.0, 23.0, 33.0, 39.0, 69.0, 105.0, 195.0, 360.0, 838.0, 2448.0, 8412.0, 45247.0, 3793443.0, 314737.0, 20619.0, 4856.0, 1591.0, 549.0, 247.0, 133.0, 79.0, 61.0, 43.0, 28.0, 20.0, 14.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-3.47265625, -3.38311767578125, -3.2935791015625, -3.20404052734375, -3.114501953125, -3.02496337890625, -2.9354248046875, -2.84588623046875, -2.75634765625, -2.66680908203125, -2.5772705078125, -2.48773193359375, -2.398193359375, -2.30865478515625, -2.2191162109375, -2.12957763671875, -2.0400390625, -1.95050048828125, -1.8609619140625, -1.77142333984375, -1.681884765625, -1.59234619140625, -1.5028076171875, -1.41326904296875, -1.32373046875, -1.23419189453125, -1.1446533203125, -1.05511474609375, -0.965576171875, -0.87603759765625, -0.7864990234375, -0.69696044921875, -0.607421875, -0.51788330078125, -0.4283447265625, -0.33880615234375, -0.249267578125, -0.15972900390625, -0.0701904296875, 0.01934814453125, 0.10888671875, 0.19842529296875, 0.2879638671875, 0.37750244140625, 0.467041015625, 0.55657958984375, 0.6461181640625, 0.73565673828125, 0.8251953125, 0.91473388671875, 1.0042724609375, 1.09381103515625, 1.183349609375, 1.27288818359375, 1.3624267578125, 1.45196533203125, 1.54150390625, 1.63104248046875, 1.7205810546875, 1.81011962890625, 1.899658203125, 1.98919677734375, 2.0787353515625, 2.16827392578125, 2.2578125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 3.0, 6.0, 15.0, 27.0, 16.0, 29.0, 52.0, 81.0, 245.0, 743.0, 1649.0, 747.0, 249.0, 74.0, 32.0, 31.0, 13.0, 10.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486572265625, -0.4628105163574219, -0.43904876708984375, -0.4152870178222656, -0.3915252685546875, -0.3677635192871094, -0.34400177001953125, -0.3202400207519531, -0.296478271484375, -0.2727165222167969, -0.24895477294921875, -0.22519302368164062, -0.2014312744140625, -0.17766952514648438, -0.15390777587890625, -0.13014602661132812, -0.10638427734375, -0.08262252807617188, -0.05886077880859375, -0.035099029541015625, -0.0113372802734375, 0.012424468994140625, 0.03618621826171875, 0.059947967529296875, 0.083709716796875, 0.10747146606445312, 0.13123321533203125, 0.15499496459960938, 0.1787567138671875, 0.20251846313476562, 0.22628021240234375, 0.2500419616699219, 0.2738037109375, 0.2975654602050781, 0.32132720947265625, 0.3450889587402344, 0.3688507080078125, 0.3926124572753906, 0.41637420654296875, 0.4401359558105469, 0.463897705078125, 0.4876594543457031, 0.5114212036132812, 0.5351829528808594, 0.5589447021484375, 0.5827064514160156, 0.6064682006835938, 0.6302299499511719, 0.65399169921875, 0.6777534484863281, 0.7015151977539062, 0.7252769470214844, 0.7490386962890625, 0.7728004455566406, 0.7965621948242188, 0.8203239440917969, 0.844085693359375, 0.8678474426269531, 0.8916091918945312, 0.9153709411621094, 0.9391326904296875, 0.9628944396972656, 0.9866561889648438, 1.0104179382324219, 1.0341796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 6.0, 12.0, 15.0, 27.0, 33.0, 53.0, 78.0, 115.0, 139.0, 139.0, 124.0, 81.0, 59.0, 41.0, 22.0, 18.0, 12.0, 8.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62961483001709, -2.5625107288360596, -2.4954066276550293, -2.428302526473999, -2.3611984252929688, -2.2940940856933594, -2.226990222930908, -2.159885883331299, -2.0927817821502686, -2.0256776809692383, -1.958573579788208, -1.8914694786071777, -1.824365258216858, -1.7572611570358276, -1.6901570558547974, -1.623052954673767, -1.5559488534927368, -1.4888447523117065, -1.4217406511306763, -1.3546364307403564, -1.2875323295593262, -1.220428228378296, -1.1533241271972656, -1.0862200260162354, -1.019115924835205, -0.9520118236541748, -0.8849076628684998, -0.8178035616874695, -0.7506994009017944, -0.6835952997207642, -0.6164911985397339, -0.5493870973587036, -0.48228275775909424, -0.4151786267757416, -0.3480744957923889, -0.28097039461135864, -0.21386626362800598, -0.14676213264465332, -0.07965803146362305, -0.012553900480270386, 0.054550230503082275, 0.12165435403585434, 0.1887584775686264, 0.25586259365081787, 0.32296672463417053, 0.3900708556175232, 0.45717495679855347, 0.5242791175842285, 0.5913832187652588, 0.6584873199462891, 0.7255914807319641, 0.7926955819129944, 0.8597997426986694, 0.9269038438796997, 0.99400794506073, 1.0611120462417603, 1.12821626663208, 1.1953203678131104, 1.2624244689941406, 1.329528570175171, 1.3966327905654907, 1.463736891746521, 1.5308409929275513, 1.5979450941085815, 1.6650491952896118]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 8.0, 11.0, 10.0, 24.0, 25.0, 27.0, 40.0, 31.0, 39.0, 53.0, 40.0, 43.0, 43.0, 45.0, 57.0, 49.0, 41.0, 46.0, 60.0, 36.0, 31.0, 34.0, 21.0, 28.0, 29.0, 26.0, 8.0, 12.0, 11.0, 10.0, 12.0, 7.0, 5.0, 7.0, 0.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9882547855377197, -0.9553248286247253, -0.922394871711731, -0.8894649147987366, -0.8565349578857422, -0.823604941368103, -0.7906749844551086, -0.7577450275421143, -0.7248150706291199, -0.6918851137161255, -0.6589551568031311, -0.6260251998901367, -0.5930951833724976, -0.560165286064148, -0.5272352695465088, -0.4943053126335144, -0.46137535572052, -0.42844539880752563, -0.39551544189453125, -0.3625854551792145, -0.3296554982662201, -0.2967255413532257, -0.26379555463790894, -0.23086559772491455, -0.19793564081192017, -0.16500568389892578, -0.1320757120847702, -0.09914574772119522, -0.06621578335762024, -0.033285826444625854, -0.0003558546304702759, 0.0325741171836853, 0.06550419330596924, 0.09843415766954422, 0.1313641220331192, 0.16429409384727478, 0.19722405076026917, 0.23015400767326355, 0.2630839943885803, 0.2960139513015747, 0.3289439082145691, 0.3618738651275635, 0.39480382204055786, 0.42773380875587463, 0.460663765668869, 0.4935937225818634, 0.5265237092971802, 0.5594536662101746, 0.592383623123169, 0.6253135800361633, 0.6582435369491577, 0.6911734938621521, 0.7241034507751465, 0.7570334672927856, 0.78996342420578, 0.8228933811187744, 0.8558233380317688, 0.8887532949447632, 0.9216832518577576, 0.954613208770752, 0.9875432252883911, 1.0204731225967407, 1.0534031391143799, 1.0863330364227295, 1.1192630529403687]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 12.0, 8.0, 12.0, 21.0, 35.0, 45.0, 53.0, 102.0, 161.0, 223.0, 372.0, 706.0, 1299.0, 2778.0, 6736.0, 23649.0, 217912.0, 719673.0, 55169.0, 11492.0, 4061.0, 1772.0, 922.0, 491.0, 298.0, 182.0, 103.0, 92.0, 61.0, 38.0, 26.0, 15.0, 9.0, 9.0, 6.0, 5.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.626953125, -0.6062164306640625, -0.585479736328125, -0.5647430419921875, -0.54400634765625, -0.5232696533203125, -0.502532958984375, -0.4817962646484375, -0.4610595703125, -0.4403228759765625, -0.419586181640625, -0.3988494873046875, -0.37811279296875, -0.3573760986328125, -0.336639404296875, -0.3159027099609375, -0.295166015625, -0.2744293212890625, -0.253692626953125, -0.2329559326171875, -0.21221923828125, -0.1914825439453125, -0.170745849609375, -0.1500091552734375, -0.1292724609375, -0.1085357666015625, -0.087799072265625, -0.0670623779296875, -0.04632568359375, -0.0255889892578125, -0.004852294921875, 0.0158843994140625, 0.03662109375, 0.0573577880859375, 0.078094482421875, 0.0988311767578125, 0.11956787109375, 0.1403045654296875, 0.161041259765625, 0.1817779541015625, 0.2025146484375, 0.2232513427734375, 0.243988037109375, 0.2647247314453125, 0.28546142578125, 0.3061981201171875, 0.326934814453125, 0.3476715087890625, 0.368408203125, 0.3891448974609375, 0.409881591796875, 0.4306182861328125, 0.45135498046875, 0.4720916748046875, 0.492828369140625, 0.5135650634765625, 0.5343017578125, 0.5550384521484375, 0.575775146484375, 0.5965118408203125, 0.61724853515625, 0.6379852294921875, 0.658721923828125, 0.6794586181640625, 0.7001953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 5.0, 11.0, 16.0, 14.0, 24.0, 16.0, 28.0, 39.0, 39.0, 60.0, 57.0, 62.0, 56.0, 68.0, 68.0, 64.0, 63.0, 52.0, 47.0, 39.0, 32.0, 30.0, 29.0, 17.0, 11.0, 11.0, 14.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7861328125, -0.7613601684570312, -0.7365875244140625, -0.7118148803710938, -0.687042236328125, -0.6622695922851562, -0.6374969482421875, -0.6127243041992188, -0.58795166015625, -0.5631790161132812, -0.5384063720703125, -0.5136337280273438, -0.488861083984375, -0.46408843994140625, -0.4393157958984375, -0.41454315185546875, -0.3897705078125, -0.36499786376953125, -0.3402252197265625, -0.31545257568359375, -0.290679931640625, -0.26590728759765625, -0.2411346435546875, -0.21636199951171875, -0.19158935546875, -0.16681671142578125, -0.1420440673828125, -0.11727142333984375, -0.092498779296875, -0.06772613525390625, -0.0429534912109375, -0.01818084716796875, 0.006591796875, 0.03136444091796875, 0.0561370849609375, 0.08090972900390625, 0.105682373046875, 0.13045501708984375, 0.1552276611328125, 0.18000030517578125, 0.20477294921875, 0.22954559326171875, 0.2543182373046875, 0.27909088134765625, 0.303863525390625, 0.32863616943359375, 0.3534088134765625, 0.37818145751953125, 0.4029541015625, 0.42772674560546875, 0.4524993896484375, 0.47727203369140625, 0.502044677734375, 0.5268173217773438, 0.5515899658203125, 0.5763626098632812, 0.60113525390625, 0.6259078979492188, 0.6506805419921875, 0.6754531860351562, 0.700225830078125, 0.7249984741210938, 0.7497711181640625, 0.7745437622070312, 0.79931640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 10.0, 20.0, 34.0, 58.0, 116.0, 201.0, 431.0, 926.0, 2478.0, 8355.0, 43527.0, 558814.0, 389976.0, 32953.0, 6829.0, 2185.0, 887.0, 347.0, 173.0, 85.0, 44.0, 30.0, 17.0, 11.0, 12.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.461181640625, -0.4471778869628906, -0.43317413330078125, -0.4191703796386719, -0.4051666259765625, -0.3911628723144531, -0.37715911865234375, -0.3631553649902344, -0.349151611328125, -0.3351478576660156, -0.32114410400390625, -0.3071403503417969, -0.2931365966796875, -0.2791328430175781, -0.26512908935546875, -0.2511253356933594, -0.23712158203125, -0.22311782836914062, -0.20911407470703125, -0.19511032104492188, -0.1811065673828125, -0.16710281372070312, -0.15309906005859375, -0.13909530639648438, -0.125091552734375, -0.11108779907226562, -0.09708404541015625, -0.08308029174804688, -0.0690765380859375, -0.055072784423828125, -0.04106903076171875, -0.027065277099609375, -0.0130615234375, 0.000942230224609375, 0.01494598388671875, 0.028949737548828125, 0.0429534912109375, 0.056957244873046875, 0.07096099853515625, 0.08496475219726562, 0.098968505859375, 0.11297225952148438, 0.12697601318359375, 0.14097976684570312, 0.1549835205078125, 0.16898727416992188, 0.18299102783203125, 0.19699478149414062, 0.21099853515625, 0.22500228881835938, 0.23900604248046875, 0.2530097961425781, 0.2670135498046875, 0.2810173034667969, 0.29502105712890625, 0.3090248107910156, 0.323028564453125, 0.3370323181152344, 0.35103607177734375, 0.3650398254394531, 0.3790435791015625, 0.3930473327636719, 0.40705108642578125, 0.4210548400878906, 0.43505859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 1.0, 3.0, 8.0, 5.0, 7.0, 9.0, 15.0, 13.0, 16.0, 15.0, 25.0, 20.0, 31.0, 32.0, 26.0, 42.0, 45.0, 36.0, 51.0, 48.0, 53.0, 52.0, 75.0, 41.0, 39.0, 37.0, 35.0, 30.0, 31.0, 25.0, 18.0, 21.0, 20.0, 11.0, 13.0, 7.0, 7.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3486328125, -1.3122634887695312, -1.2758941650390625, -1.2395248413085938, -1.203155517578125, -1.1667861938476562, -1.1304168701171875, -1.0940475463867188, -1.05767822265625, -1.0213088989257812, -0.9849395751953125, -0.9485702514648438, -0.912200927734375, -0.8758316040039062, -0.8394622802734375, -0.8030929565429688, -0.7667236328125, -0.7303543090820312, -0.6939849853515625, -0.6576156616210938, -0.621246337890625, -0.5848770141601562, -0.5485076904296875, -0.5121383666992188, -0.47576904296875, -0.43939971923828125, -0.4030303955078125, -0.36666107177734375, -0.330291748046875, -0.29392242431640625, -0.2575531005859375, -0.22118377685546875, -0.184814453125, -0.14844512939453125, -0.1120758056640625, -0.07570648193359375, -0.039337158203125, -0.00296783447265625, 0.0334014892578125, 0.06977081298828125, 0.10614013671875, 0.14250946044921875, 0.1788787841796875, 0.21524810791015625, 0.251617431640625, 0.28798675537109375, 0.3243560791015625, 0.36072540283203125, 0.3970947265625, 0.43346405029296875, 0.4698333740234375, 0.5062026977539062, 0.542572021484375, 0.5789413452148438, 0.6153106689453125, 0.6516799926757812, 0.68804931640625, 0.7244186401367188, 0.7607879638671875, 0.7971572875976562, 0.833526611328125, 0.8698959350585938, 0.9062652587890625, 0.9426345825195312, 0.97900390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 9.0, 7.0, 15.0, 14.0, 29.0, 42.0, 74.0, 83.0, 140.0, 226.0, 352.0, 640.0, 1293.0, 2747.0, 6982.0, 21630.0, 99719.0, 662744.0, 199559.0, 34613.0, 10045.0, 3909.0, 1664.0, 831.0, 480.0, 235.0, 168.0, 96.0, 62.0, 40.0, 29.0, 21.0, 11.0, 14.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10595703125, -0.10261154174804688, -0.09926605224609375, -0.09592056274414062, -0.0925750732421875, -0.08922958374023438, -0.08588409423828125, -0.08253860473632812, -0.079193115234375, -0.07584762573242188, -0.07250213623046875, -0.06915664672851562, -0.0658111572265625, -0.062465667724609375, -0.05912017822265625, -0.055774688720703125, -0.05242919921875, -0.049083709716796875, -0.04573822021484375, -0.042392730712890625, -0.0390472412109375, -0.035701751708984375, -0.03235626220703125, -0.029010772705078125, -0.025665283203125, -0.022319793701171875, -0.01897430419921875, -0.015628814697265625, -0.0122833251953125, -0.008937835693359375, -0.00559234619140625, -0.002246856689453125, 0.0010986328125, 0.004444122314453125, 0.00778961181640625, 0.011135101318359375, 0.0144805908203125, 0.017826080322265625, 0.02117156982421875, 0.024517059326171875, 0.027862548828125, 0.031208038330078125, 0.03455352783203125, 0.037899017333984375, 0.0412445068359375, 0.044589996337890625, 0.04793548583984375, 0.051280975341796875, 0.05462646484375, 0.057971954345703125, 0.06131744384765625, 0.06466293334960938, 0.0680084228515625, 0.07135391235351562, 0.07469940185546875, 0.07804489135742188, 0.081390380859375, 0.08473587036132812, 0.08808135986328125, 0.09142684936523438, 0.0947723388671875, 0.09811782836914062, 0.10146331787109375, 0.10480880737304688, 0.108154296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 10.0, 11.0, 17.0, 25.0, 40.0, 54.0, 85.0, 113.0, 192.0, 154.0, 81.0, 49.0, 39.0, 27.0, 32.0, 9.0, 11.0, 9.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.539987564086914e-05, -7.350090891122818e-05, -7.160194218158722e-05, -6.970297545194626e-05, -6.78040087223053e-05, -6.590504199266434e-05, -6.400607526302338e-05, -6.210710853338242e-05, -6.0208141803741455e-05, -5.8309175074100494e-05, -5.6410208344459534e-05, -5.451124161481857e-05, -5.261227488517761e-05, -5.071330815553665e-05, -4.881434142589569e-05, -4.691537469625473e-05, -4.501640796661377e-05, -4.311744123697281e-05, -4.121847450733185e-05, -3.931950777769089e-05, -3.742054104804993e-05, -3.5521574318408966e-05, -3.3622607588768005e-05, -3.1723640859127045e-05, -2.9824674129486084e-05, -2.7925707399845123e-05, -2.6026740670204163e-05, -2.4127773940563202e-05, -2.222880721092224e-05, -2.032984048128128e-05, -1.843087375164032e-05, -1.653190702199936e-05, -1.4632940292358398e-05, -1.2733973562717438e-05, -1.0835006833076477e-05, -8.936040103435516e-06, -7.037073373794556e-06, -5.138106644153595e-06, -3.2391399145126343e-06, -1.3401731848716736e-06, 5.587935447692871e-07, 2.457760274410248e-06, 4.3567270040512085e-06, 6.255693733692169e-06, 8.15466046333313e-06, 1.005362719297409e-05, 1.1952593922615051e-05, 1.3851560652256012e-05, 1.5750527381896973e-05, 1.7649494111537933e-05, 1.9548460841178894e-05, 2.1447427570819855e-05, 2.3346394300460815e-05, 2.5245361030101776e-05, 2.7144327759742737e-05, 2.9043294489383698e-05, 3.094226121902466e-05, 3.284122794866562e-05, 3.474019467830658e-05, 3.663916140794754e-05, 3.85381281375885e-05, 4.043709486722946e-05, 4.233606159687042e-05, 4.423502832651138e-05, 4.6133995056152344e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 11.0, 11.0, 14.0, 14.0, 28.0, 36.0, 59.0, 96.0, 171.0, 209.0, 344.0, 593.0, 978.0, 1552.0, 2726.0, 5051.0, 9586.0, 19531.0, 43465.0, 113458.0, 389513.0, 298276.0, 90794.0, 36319.0, 16905.0, 8282.0, 4415.0, 2454.0, 1446.0, 805.0, 533.0, 272.0, 204.0, 144.0, 80.0, 45.0, 47.0, 28.0, 17.0, 14.0, 8.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06494140625, -0.06276893615722656, -0.060596466064453125, -0.05842399597167969, -0.05625152587890625, -0.05407905578613281, -0.051906585693359375, -0.04973411560058594, -0.0475616455078125, -0.04538917541503906, -0.043216705322265625, -0.04104423522949219, -0.03887176513671875, -0.03669929504394531, -0.034526824951171875, -0.03235435485839844, -0.030181884765625, -0.028009414672851562, -0.025836944580078125, -0.023664474487304688, -0.02149200439453125, -0.019319534301757812, -0.017147064208984375, -0.014974594116210938, -0.0128021240234375, -0.010629653930664062, -0.008457183837890625, -0.0062847137451171875, -0.00411224365234375, -0.0019397735595703125, 0.000232696533203125, 0.0024051666259765625, 0.00457763671875, 0.0067501068115234375, 0.008922576904296875, 0.011095046997070312, 0.01326751708984375, 0.015439987182617188, 0.017612457275390625, 0.019784927368164062, 0.0219573974609375, 0.024129867553710938, 0.026302337646484375, 0.028474807739257812, 0.03064727783203125, 0.03281974792480469, 0.034992218017578125, 0.03716468811035156, 0.039337158203125, 0.04150962829589844, 0.043682098388671875, 0.04585456848144531, 0.04802703857421875, 0.05019950866699219, 0.052371978759765625, 0.05454444885253906, 0.0567169189453125, 0.05888938903808594, 0.061061859130859375, 0.06323432922363281, 0.06540679931640625, 0.06757926940917969, 0.06975173950195312, 0.07192420959472656, 0.0740966796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 10.0, 6.0, 8.0, 10.0, 15.0, 18.0, 23.0, 24.0, 23.0, 29.0, 39.0, 59.0, 64.0, 62.0, 89.0, 83.0, 83.0, 59.0, 51.0, 41.0, 38.0, 37.0, 19.0, 17.0, 16.0, 16.0, 13.0, 7.0, 7.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210113525390625, -0.02039480209350586, -0.01977825164794922, -0.019161701202392578, -0.018545150756835938, -0.017928600311279297, -0.017312049865722656, -0.016695499420166016, -0.016078948974609375, -0.015462398529052734, -0.014845848083496094, -0.014229297637939453, -0.013612747192382812, -0.012996196746826172, -0.012379646301269531, -0.01176309585571289, -0.01114654541015625, -0.01052999496459961, -0.009913444519042969, -0.009296894073486328, -0.008680343627929688, -0.008063793182373047, -0.007447242736816406, -0.006830692291259766, -0.006214141845703125, -0.005597591400146484, -0.004981040954589844, -0.004364490509033203, -0.0037479400634765625, -0.003131389617919922, -0.0025148391723632812, -0.0018982887268066406, -0.00128173828125, -0.0006651878356933594, -4.863739013671875e-05, 0.0005679130554199219, 0.0011844635009765625, 0.0018010139465332031, 0.0024175643920898438, 0.0030341148376464844, 0.003650665283203125, 0.004267215728759766, 0.004883766174316406, 0.005500316619873047, 0.0061168670654296875, 0.006733417510986328, 0.007349967956542969, 0.00796651840209961, 0.00858306884765625, 0.00919961929321289, 0.009816169738769531, 0.010432720184326172, 0.011049270629882812, 0.011665821075439453, 0.012282371520996094, 0.012898921966552734, 0.013515472412109375, 0.014132022857666016, 0.014748573303222656, 0.015365123748779297, 0.015981674194335938, 0.016598224639892578, 0.01721477508544922, 0.01783132553100586, 0.0184478759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 7.0, 8.0, 6.0, 16.0, 34.0, 35.0, 58.0, 68.0, 110.0, 137.0, 140.0, 116.0, 69.0, 60.0, 46.0, 27.0, 18.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1575431823730469, -1.1226516962051392, -1.087760090827942, -1.0528686046600342, -1.0179771184921265, -0.9830855131149292, -0.9481940269470215, -0.913302481174469, -0.8784109354019165, -0.843519389629364, -0.8086279034614563, -0.7737363576889038, -0.7388448119163513, -0.7039532661437988, -0.6690617799758911, -0.6341702342033386, -0.5992787480354309, -0.5643872022628784, -0.5294957160949707, -0.4946041703224182, -0.4597126245498657, -0.4248211085796356, -0.3899295926094055, -0.355038046836853, -0.3201465308666229, -0.2852550148963928, -0.25036346912384033, -0.21547195315361023, -0.18058042228221893, -0.14568889141082764, -0.11079737544059753, -0.07590584456920624, -0.04101431369781494, -0.0061227865517139435, 0.028768740594387054, 0.06366026401519775, 0.09855179488658905, 0.13344332575798035, 0.16833484172821045, 0.20322637259960175, 0.23811790347099304, 0.27300941944122314, 0.30790096521377563, 0.34279248118400574, 0.37768399715423584, 0.41257554292678833, 0.44746705889701843, 0.48235857486724854, 0.517250120639801, 0.5521416664123535, 0.5870331525802612, 0.6219246983528137, 0.6568162441253662, 0.6917077302932739, 0.7265992760658264, 0.7614908218383789, 0.7963823080062866, 0.8312738537788391, 0.8661653399467468, 0.9010568857192993, 0.9359484314918518, 0.9708399772644043, 1.005731463432312, 1.0406229496002197, 1.075514554977417]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 12.0, 15.0, 13.0, 35.0, 38.0, 45.0, 46.0, 63.0, 68.0, 56.0, 71.0, 74.0, 61.0, 77.0, 56.0, 50.0, 37.0, 36.0, 36.0, 22.0, 13.0, 18.0, 12.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9620012044906616, -0.9360266327857971, -0.9100520610809326, -0.8840775489807129, -0.8581029772758484, -0.8321284055709839, -0.8061538934707642, -0.7801793217658997, -0.7542047500610352, -0.7282301783561707, -0.7022556066513062, -0.6762810945510864, -0.6503065228462219, -0.6243319511413574, -0.5983574390411377, -0.5723828673362732, -0.5464082956314087, -0.5204337239265442, -0.4944591820240021, -0.46848464012145996, -0.44251006841659546, -0.41653549671173096, -0.39056095480918884, -0.36458641290664673, -0.3386118412017822, -0.3126372694969177, -0.2866627275943756, -0.2606881856918335, -0.234713613986969, -0.20873905718326569, -0.18276450037956238, -0.15678994357585907, -0.13081538677215576, -0.10484082996845245, -0.07886627316474915, -0.05289171636104584, -0.02691715955734253, -0.0009426027536392212, 0.025031954050064087, 0.051006510853767395, 0.0769810676574707, 0.10295562446117401, 0.12893018126487732, 0.15490473806858063, 0.18087929487228394, 0.20685385167598724, 0.23282840847969055, 0.25880295038223267, 0.28477752208709717, 0.31075209379196167, 0.3367266356945038, 0.3627011775970459, 0.3886757493019104, 0.4146503210067749, 0.440624862909317, 0.46659940481185913, 0.49257397651672363, 0.5185485482215881, 0.5445231199264526, 0.5704976320266724, 0.5964722037315369, 0.6224467754364014, 0.6484212875366211, 0.6743958592414856, 0.7003704309463501]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 4.0, 16.0, 27.0, 22.0, 43.0, 73.0, 118.0, 198.0, 325.0, 635.0, 1197.0, 2264.0, 5187.0, 14524.0, 94261.0, 842424.0, 65874.0, 12410.0, 4610.0, 2062.0, 989.0, 517.0, 292.0, 191.0, 99.0, 64.0, 34.0, 23.0, 19.0, 20.0, 4.0, 8.0, 4.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2387237548828125, -1.183502197265625, -1.1282806396484375, -1.07305908203125, -1.0178375244140625, -0.962615966796875, -0.9073944091796875, -0.8521728515625, -0.7969512939453125, -0.741729736328125, -0.6865081787109375, -0.63128662109375, -0.5760650634765625, -0.520843505859375, -0.4656219482421875, -0.410400390625, -0.3551788330078125, -0.299957275390625, -0.2447357177734375, -0.18951416015625, -0.1342926025390625, -0.079071044921875, -0.0238494873046875, 0.0313720703125, 0.0865936279296875, 0.141815185546875, 0.1970367431640625, 0.25225830078125, 0.3074798583984375, 0.362701416015625, 0.4179229736328125, 0.47314453125, 0.5283660888671875, 0.583587646484375, 0.6388092041015625, 0.69403076171875, 0.7492523193359375, 0.804473876953125, 0.8596954345703125, 0.9149169921875, 0.9701385498046875, 1.025360107421875, 1.0805816650390625, 1.13580322265625, 1.1910247802734375, 1.246246337890625, 1.3014678955078125, 1.356689453125, 1.4119110107421875, 1.467132568359375, 1.5223541259765625, 1.57757568359375, 1.6327972412109375, 1.688018798828125, 1.7432403564453125, 1.7984619140625, 1.8536834716796875, 1.908905029296875, 1.9641265869140625, 2.01934814453125, 2.0745697021484375, 2.129791259765625, 2.1850128173828125, 2.240234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 6.0, 4.0, 6.0, 10.0, 15.0, 18.0, 16.0, 32.0, 55.0, 51.0, 67.0, 60.0, 87.0, 69.0, 74.0, 66.0, 75.0, 54.0, 52.0, 41.0, 36.0, 25.0, 22.0, 13.0, 13.0, 11.0, 5.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.0403900146484375, -1.985076904296875, -1.9297637939453125, -1.87445068359375, -1.8191375732421875, -1.763824462890625, -1.7085113525390625, -1.6531982421875, -1.5978851318359375, -1.542572021484375, -1.4872589111328125, -1.43194580078125, -1.3766326904296875, -1.321319580078125, -1.2660064697265625, -1.210693359375, -1.1553802490234375, -1.100067138671875, -1.0447540283203125, -0.98944091796875, -0.9341278076171875, -0.878814697265625, -0.8235015869140625, -0.7681884765625, -0.7128753662109375, -0.657562255859375, -0.6022491455078125, -0.54693603515625, -0.4916229248046875, -0.436309814453125, -0.3809967041015625, -0.32568359375, -0.2703704833984375, -0.215057373046875, -0.1597442626953125, -0.10443115234375, -0.0491180419921875, 0.006195068359375, 0.0615081787109375, 0.1168212890625, 0.1721343994140625, 0.227447509765625, 0.2827606201171875, 0.33807373046875, 0.3933868408203125, 0.448699951171875, 0.5040130615234375, 0.559326171875, 0.6146392822265625, 0.669952392578125, 0.7252655029296875, 0.78057861328125, 0.8358917236328125, 0.891204833984375, 0.9465179443359375, 1.0018310546875, 1.0571441650390625, 1.112457275390625, 1.1677703857421875, 1.22308349609375, 1.2783966064453125, 1.333709716796875, 1.3890228271484375, 1.4443359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 16.0, 2.0, 13.0, 22.0, 13.0, 28.0, 35.0, 46.0, 94.0, 134.0, 176.0, 377.0, 642.0, 1132.0, 2330.0, 4767.0, 12747.0, 53016.0, 710364.0, 221088.0, 25985.0, 8110.0, 3493.0, 1759.0, 899.0, 505.0, 279.0, 159.0, 83.0, 79.0, 49.0, 40.0, 21.0, 13.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.0835723876953125, -1.043121337890625, -1.0026702880859375, -0.96221923828125, -0.9217681884765625, -0.881317138671875, -0.8408660888671875, -0.8004150390625, -0.7599639892578125, -0.719512939453125, -0.6790618896484375, -0.63861083984375, -0.5981597900390625, -0.557708740234375, -0.5172576904296875, -0.476806640625, -0.4363555908203125, -0.395904541015625, -0.3554534912109375, -0.31500244140625, -0.2745513916015625, -0.234100341796875, -0.1936492919921875, -0.1531982421875, -0.1127471923828125, -0.072296142578125, -0.0318450927734375, 0.00860595703125, 0.0490570068359375, 0.089508056640625, 0.1299591064453125, 0.17041015625, 0.2108612060546875, 0.251312255859375, 0.2917633056640625, 0.33221435546875, 0.3726654052734375, 0.413116455078125, 0.4535675048828125, 0.4940185546875, 0.5344696044921875, 0.574920654296875, 0.6153717041015625, 0.65582275390625, 0.6962738037109375, 0.736724853515625, 0.7771759033203125, 0.817626953125, 0.8580780029296875, 0.898529052734375, 0.9389801025390625, 0.97943115234375, 1.0198822021484375, 1.060333251953125, 1.1007843017578125, 1.1412353515625, 1.1816864013671875, 1.222137451171875, 1.2625885009765625, 1.30303955078125, 1.3434906005859375, 1.383941650390625, 1.4243927001953125, 1.46484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 10.0, 12.0, 9.0, 15.0, 18.0, 24.0, 32.0, 37.0, 37.0, 46.0, 49.0, 40.0, 48.0, 48.0, 53.0, 41.0, 54.0, 56.0, 52.0, 37.0, 39.0, 36.0, 24.0, 24.0, 23.0, 21.0, 18.0, 15.0, 14.0, 7.0, 15.0, 11.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4306640625, -1.3872222900390625, -1.343780517578125, -1.3003387451171875, -1.25689697265625, -1.2134552001953125, -1.170013427734375, -1.1265716552734375, -1.0831298828125, -1.0396881103515625, -0.996246337890625, -0.9528045654296875, -0.90936279296875, -0.8659210205078125, -0.822479248046875, -0.7790374755859375, -0.735595703125, -0.6921539306640625, -0.648712158203125, -0.6052703857421875, -0.56182861328125, -0.5183868408203125, -0.474945068359375, -0.4315032958984375, -0.3880615234375, -0.3446197509765625, -0.301177978515625, -0.2577362060546875, -0.21429443359375, -0.1708526611328125, -0.127410888671875, -0.0839691162109375, -0.04052734375, 0.0029144287109375, 0.046356201171875, 0.0897979736328125, 0.13323974609375, 0.1766815185546875, 0.220123291015625, 0.2635650634765625, 0.3070068359375, 0.3504486083984375, 0.393890380859375, 0.4373321533203125, 0.48077392578125, 0.5242156982421875, 0.567657470703125, 0.6110992431640625, 0.654541015625, 0.6979827880859375, 0.741424560546875, 0.7848663330078125, 0.82830810546875, 0.8717498779296875, 0.915191650390625, 0.9586334228515625, 1.0020751953125, 1.0455169677734375, 1.088958740234375, 1.1324005126953125, 1.17584228515625, 1.2192840576171875, 1.262725830078125, 1.3061676025390625, 1.349609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 9.0, 19.0, 23.0, 32.0, 55.0, 76.0, 124.0, 200.0, 254.0, 452.0, 817.0, 1416.0, 2925.0, 7840.0, 33002.0, 701655.0, 264636.0, 23239.0, 6206.0, 2541.0, 1105.0, 679.0, 444.0, 286.0, 186.0, 123.0, 57.0, 44.0, 22.0, 16.0, 15.0, 14.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.448486328125, -0.4356346130371094, -0.42278289794921875, -0.4099311828613281, -0.3970794677734375, -0.3842277526855469, -0.37137603759765625, -0.3585243225097656, -0.345672607421875, -0.3328208923339844, -0.31996917724609375, -0.3071174621582031, -0.2942657470703125, -0.2814140319824219, -0.26856231689453125, -0.2557106018066406, -0.24285888671875, -0.23000717163085938, -0.21715545654296875, -0.20430374145507812, -0.1914520263671875, -0.17860031127929688, -0.16574859619140625, -0.15289688110351562, -0.140045166015625, -0.12719345092773438, -0.11434173583984375, -0.10149002075195312, -0.0886383056640625, -0.07578659057617188, -0.06293487548828125, -0.050083160400390625, -0.0372314453125, -0.024379730224609375, -0.01152801513671875, 0.001323699951171875, 0.0141754150390625, 0.027027130126953125, 0.03987884521484375, 0.052730560302734375, 0.065582275390625, 0.07843399047851562, 0.09128570556640625, 0.10413742065429688, 0.1169891357421875, 0.12984085083007812, 0.14269256591796875, 0.15554428100585938, 0.16839599609375, 0.18124771118164062, 0.19409942626953125, 0.20695114135742188, 0.2198028564453125, 0.23265457153320312, 0.24550628662109375, 0.2583580017089844, 0.271209716796875, 0.2840614318847656, 0.29691314697265625, 0.3097648620605469, 0.3226165771484375, 0.3354682922363281, 0.34832000732421875, 0.3611717224121094, 0.3740234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 8.0, 11.0, 18.0, 24.0, 82.0, 198.0, 423.0, 127.0, 55.0, 25.0, 11.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.896257400512695e-05, -6.571691483259201e-05, -6.247125566005707e-05, -5.9225596487522125e-05, -5.597993731498718e-05, -5.273427814245224e-05, -4.94886189699173e-05, -4.6242959797382355e-05, -4.299730062484741e-05, -3.975164145231247e-05, -3.650598227977753e-05, -3.3260323107242584e-05, -3.001466393470764e-05, -2.67690047621727e-05, -2.3523345589637756e-05, -2.0277686417102814e-05, -1.703202724456787e-05, -1.3786368072032928e-05, -1.0540708899497986e-05, -7.295049726963043e-06, -4.049390554428101e-06, -8.03731381893158e-07, 2.4419277906417847e-06, 5.687586963176727e-06, 8.93324613571167e-06, 1.2178905308246613e-05, 1.5424564480781555e-05, 1.8670223653316498e-05, 2.191588282585144e-05, 2.5161541998386383e-05, 2.8407201170921326e-05, 3.165286034345627e-05, 3.489851951599121e-05, 3.8144178688526154e-05, 4.1389837861061096e-05, 4.463549703359604e-05, 4.788115620613098e-05, 5.1126815378665924e-05, 5.437247455120087e-05, 5.761813372373581e-05, 6.086379289627075e-05, 6.41094520688057e-05, 6.735511124134064e-05, 7.060077041387558e-05, 7.384642958641052e-05, 7.709208875894547e-05, 8.033774793148041e-05, 8.358340710401535e-05, 8.682906627655029e-05, 9.007472544908524e-05, 9.332038462162018e-05, 9.656604379415512e-05, 9.981170296669006e-05, 0.000103057362139225, 0.00010630302131175995, 0.00010954868048429489, 0.00011279433965682983, 0.00011603999882936478, 0.00011928565800189972, 0.00012253131717443466, 0.0001257769763469696, 0.00012902263551950455, 0.0001322682946920395, 0.00013551395386457443, 0.00013875961303710938]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 12.0, 6.0, 5.0, 34.0, 27.0, 37.0, 73.0, 93.0, 134.0, 193.0, 263.0, 402.0, 621.0, 1145.0, 2020.0, 3806.0, 8860.0, 30562.0, 311077.0, 627417.0, 41242.0, 10510.0, 4344.0, 2306.0, 1257.0, 701.0, 428.0, 298.0, 217.0, 148.0, 100.0, 68.0, 50.0, 30.0, 16.0, 14.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.37384796142578125, -0.3621978759765625, -0.35054779052734375, -0.338897705078125, -0.32724761962890625, -0.3155975341796875, -0.30394744873046875, -0.29229736328125, -0.28064727783203125, -0.2689971923828125, -0.25734710693359375, -0.245697021484375, -0.23404693603515625, -0.2223968505859375, -0.21074676513671875, -0.1990966796875, -0.18744659423828125, -0.1757965087890625, -0.16414642333984375, -0.152496337890625, -0.14084625244140625, -0.1291961669921875, -0.11754608154296875, -0.10589599609375, -0.09424591064453125, -0.0825958251953125, -0.07094573974609375, -0.059295654296875, -0.04764556884765625, -0.0359954833984375, -0.02434539794921875, -0.0126953125, -0.00104522705078125, 0.0106048583984375, 0.02225494384765625, 0.033905029296875, 0.04555511474609375, 0.0572052001953125, 0.06885528564453125, 0.08050537109375, 0.09215545654296875, 0.1038055419921875, 0.11545562744140625, 0.127105712890625, 0.13875579833984375, 0.1504058837890625, 0.16205596923828125, 0.1737060546875, 0.18535614013671875, 0.1970062255859375, 0.20865631103515625, 0.220306396484375, 0.23195648193359375, 0.2436065673828125, 0.25525665283203125, 0.26690673828125, 0.27855682373046875, 0.2902069091796875, 0.30185699462890625, 0.313507080078125, 0.32515716552734375, 0.3368072509765625, 0.34845733642578125, 0.360107421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 5.0, 20.0, 12.0, 12.0, 20.0, 22.0, 28.0, 47.0, 77.0, 79.0, 108.0, 158.0, 91.0, 65.0, 55.0, 40.0, 35.0, 22.0, 8.0, 15.0, 14.0, 10.0, 9.0, 10.0, 5.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06546783447265625, -0.0625152587890625, -0.05956268310546875, -0.056610107421875, -0.05365753173828125, -0.0507049560546875, -0.04775238037109375, -0.0447998046875, -0.04184722900390625, -0.0388946533203125, -0.03594207763671875, -0.032989501953125, -0.03003692626953125, -0.0270843505859375, -0.02413177490234375, -0.02117919921875, -0.01822662353515625, -0.0152740478515625, -0.01232147216796875, -0.009368896484375, -0.00641632080078125, -0.0034637451171875, -0.00051116943359375, 0.00244140625, 0.00539398193359375, 0.0083465576171875, 0.01129913330078125, 0.014251708984375, 0.01720428466796875, 0.0201568603515625, 0.02310943603515625, 0.02606201171875, 0.02901458740234375, 0.0319671630859375, 0.03491973876953125, 0.037872314453125, 0.04082489013671875, 0.0437774658203125, 0.04673004150390625, 0.0496826171875, 0.05263519287109375, 0.0555877685546875, 0.05854034423828125, 0.061492919921875, 0.06444549560546875, 0.0673980712890625, 0.07035064697265625, 0.07330322265625, 0.07625579833984375, 0.0792083740234375, 0.08216094970703125, 0.085113525390625, 0.08806610107421875, 0.0910186767578125, 0.09397125244140625, 0.096923828125, 0.09987640380859375, 0.1028289794921875, 0.10578155517578125, 0.108734130859375, 0.11168670654296875, 0.1146392822265625, 0.11759185791015625, 0.12054443359375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 17.0, 34.0, 20.0, 45.0, 50.0, 79.0, 104.0, 100.0, 137.0, 103.0, 97.0, 53.0, 41.0, 31.0, 16.0, 16.0, 12.0, 7.0, 5.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.9285340309143066, -2.860914945602417, -2.7932960987091064, -2.725677013397217, -2.658057928085327, -2.5904388427734375, -2.522819995880127, -2.4552009105682373, -2.3875818252563477, -2.319962739944458, -2.2523438930511475, -2.184724807739258, -2.117105722427368, -2.0494866371154785, -1.981867790222168, -1.9142487049102783, -1.8466298580169678, -1.7790108919143677, -1.711391806602478, -1.643772840499878, -1.5761537551879883, -1.5085347890853882, -1.440915822982788, -1.3732967376708984, -1.3056777715682983, -1.2380588054656982, -1.1704397201538086, -1.1028207540512085, -1.0352017879486084, -0.9675827026367188, -0.8999637365341187, -0.8323447108268738, -0.7647258043289185, -0.6971067786216736, -0.6294877529144287, -0.5618687868118286, -0.49424976110458374, -0.42663073539733887, -0.3590117394924164, -0.2913927435874939, -0.22377371788024902, -0.15615470707416534, -0.08853569626808167, -0.020916685461997986, 0.04670232534408569, 0.11432135105133057, 0.18194034695625305, 0.24955934286117554, 0.3171783685684204, 0.3847973942756653, 0.45241639018058777, 0.5200353860855103, 0.5876544117927551, 0.6552734375, 0.7228924036026001, 0.790511429309845, 0.8581304550170898, 0.9257494807243347, 0.9933685064315796, 1.0609874725341797, 1.1286065578460693, 1.1962255239486694, 1.2638444900512695, 1.3314635753631592, 1.3990825414657593]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 5.0, 6.0, 9.0, 11.0, 16.0, 16.0, 11.0, 28.0, 22.0, 30.0, 19.0, 29.0, 25.0, 31.0, 26.0, 42.0, 38.0, 34.0, 38.0, 48.0, 38.0, 27.0, 38.0, 38.0, 40.0, 40.0, 36.0, 33.0, 31.0, 28.0, 20.0, 20.0, 20.0, 10.0, 16.0, 17.0, 17.0, 12.0, 8.0, 6.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.734708309173584, -1.677946925163269, -1.621185541152954, -1.5644241571426392, -1.5076627731323242, -1.4509012699127197, -1.3941398859024048, -1.3373785018920898, -1.280617117881775, -1.22385573387146, -1.167094349861145, -1.11033296585083, -1.0535714626312256, -0.9968101382255554, -0.9400486946105957, -0.8832873106002808, -0.8265259265899658, -0.7697645425796509, -0.7130031585693359, -0.6562417149543762, -0.5994803309440613, -0.5427189469337463, -0.485957533121109, -0.4291961193084717, -0.37243473529815674, -0.3156733512878418, -0.25891193747520447, -0.20215053856372833, -0.1453891396522522, -0.08862775564193726, -0.03186634182929993, 0.024895071983337402, 0.0816565752029419, 0.13841797411441803, 0.19517937302589417, 0.2519407868385315, 0.30870217084884644, 0.3654635548591614, 0.4222249686717987, 0.47898638248443604, 0.535747766494751, 0.5925091505050659, 0.6492705345153809, 0.7060319781303406, 0.7627933621406555, 0.8195547461509705, 0.8763161897659302, 0.9330775737762451, 0.9898389577865601, 1.046600341796875, 1.10336172580719, 1.1601231098175049, 1.2168846130371094, 1.2736458778381348, 1.3304073810577393, 1.3871687650680542, 1.4439301490783691, 1.500691533088684, 1.557452917098999, 1.614214301109314, 1.670975685119629, 1.7277371883392334, 1.7844985723495483, 1.8412599563598633, 1.8980213403701782]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 12.0, 9.0, 20.0, 25.0, 28.0, 40.0, 50.0, 70.0, 98.0, 146.0, 225.0, 361.0, 536.0, 870.0, 1553.0, 3030.0, 6471.0, 18384.0, 84824.0, 2029415.0, 1929681.0, 86393.0, 18296.0, 6571.0, 3007.0, 1627.0, 911.0, 541.0, 354.0, 232.0, 148.0, 79.0, 65.0, 66.0, 25.0, 28.0, 23.0, 15.0, 7.0, 11.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.7275390625, -1.6781768798828125, -1.628814697265625, -1.5794525146484375, -1.53009033203125, -1.4807281494140625, -1.431365966796875, -1.3820037841796875, -1.3326416015625, -1.2832794189453125, -1.233917236328125, -1.1845550537109375, -1.13519287109375, -1.0858306884765625, -1.036468505859375, -0.9871063232421875, -0.937744140625, -0.8883819580078125, -0.839019775390625, -0.7896575927734375, -0.74029541015625, -0.6909332275390625, -0.641571044921875, -0.5922088623046875, -0.5428466796875, -0.4934844970703125, -0.444122314453125, -0.3947601318359375, -0.34539794921875, -0.2960357666015625, -0.246673583984375, -0.1973114013671875, -0.14794921875, -0.0985870361328125, -0.049224853515625, 0.0001373291015625, 0.04949951171875, 0.0988616943359375, 0.148223876953125, 0.1975860595703125, 0.2469482421875, 0.2963104248046875, 0.345672607421875, 0.3950347900390625, 0.44439697265625, 0.4937591552734375, 0.543121337890625, 0.5924835205078125, 0.641845703125, 0.6912078857421875, 0.740570068359375, 0.7899322509765625, 0.83929443359375, 0.8886566162109375, 0.938018798828125, 0.9873809814453125, 1.0367431640625, 1.0861053466796875, 1.135467529296875, 1.1848297119140625, 1.23419189453125, 1.2835540771484375, 1.332916259765625, 1.3822784423828125, 1.431640625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 10.0, 13.0, 20.0, 18.0, 23.0, 44.0, 42.0, 48.0, 53.0, 55.0, 84.0, 66.0, 70.0, 60.0, 75.0, 75.0, 40.0, 42.0, 29.0, 28.0, 28.0, 17.0, 7.0, 13.0, 7.0, 6.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80517578125, -0.778228759765625, -0.75128173828125, -0.724334716796875, -0.6973876953125, -0.670440673828125, -0.64349365234375, -0.616546630859375, -0.589599609375, -0.562652587890625, -0.53570556640625, -0.508758544921875, -0.4818115234375, -0.454864501953125, -0.42791748046875, -0.400970458984375, -0.3740234375, -0.347076416015625, -0.32012939453125, -0.293182373046875, -0.2662353515625, -0.239288330078125, -0.21234130859375, -0.185394287109375, -0.158447265625, -0.131500244140625, -0.10455322265625, -0.077606201171875, -0.0506591796875, -0.023712158203125, 0.00323486328125, 0.030181884765625, 0.05712890625, 0.084075927734375, 0.11102294921875, 0.137969970703125, 0.1649169921875, 0.191864013671875, 0.21881103515625, 0.245758056640625, 0.272705078125, 0.299652099609375, 0.32659912109375, 0.353546142578125, 0.3804931640625, 0.407440185546875, 0.43438720703125, 0.461334228515625, 0.48828125, 0.515228271484375, 0.54217529296875, 0.569122314453125, 0.5960693359375, 0.623016357421875, 0.64996337890625, 0.676910400390625, 0.703857421875, 0.730804443359375, 0.75775146484375, 0.784698486328125, 0.8116455078125, 0.838592529296875, 0.86553955078125, 0.892486572265625, 0.91943359375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 7.0, 7.0, 15.0, 18.0, 27.0, 46.0, 64.0, 168.0, 381.0, 1023.0, 3139.0, 11415.0, 60130.0, 3343917.0, 725429.0, 36759.0, 7995.0, 2309.0, 770.0, 308.0, 135.0, 70.0, 45.0, 25.0, 20.0, 10.0, 6.0, 9.0, 12.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.556976318359375, -2.47137451171875, -2.385772705078125, -2.3001708984375, -2.214569091796875, -2.12896728515625, -2.043365478515625, -1.957763671875, -1.872161865234375, -1.78656005859375, -1.700958251953125, -1.6153564453125, -1.529754638671875, -1.44415283203125, -1.358551025390625, -1.27294921875, -1.187347412109375, -1.10174560546875, -1.016143798828125, -0.9305419921875, -0.844940185546875, -0.75933837890625, -0.673736572265625, -0.588134765625, -0.502532958984375, -0.41693115234375, -0.331329345703125, -0.2457275390625, -0.160125732421875, -0.07452392578125, 0.011077880859375, 0.0966796875, 0.182281494140625, 0.26788330078125, 0.353485107421875, 0.4390869140625, 0.524688720703125, 0.61029052734375, 0.695892333984375, 0.781494140625, 0.867095947265625, 0.95269775390625, 1.038299560546875, 1.1239013671875, 1.209503173828125, 1.29510498046875, 1.380706787109375, 1.46630859375, 1.551910400390625, 1.63751220703125, 1.723114013671875, 1.8087158203125, 1.894317626953125, 1.97991943359375, 2.065521240234375, 2.151123046875, 2.236724853515625, 2.32232666015625, 2.407928466796875, 2.4935302734375, 2.579132080078125, 2.66473388671875, 2.750335693359375, 2.8359375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 8.0, 8.0, 13.0, 18.0, 16.0, 14.0, 23.0, 41.0, 68.0, 65.0, 126.0, 241.0, 559.0, 1055.0, 848.0, 408.0, 203.0, 100.0, 51.0, 51.0, 40.0, 22.0, 17.0, 15.0, 12.0, 12.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5979537963867188, -0.5792083740234375, -0.5604629516601562, -0.541717529296875, -0.5229721069335938, -0.5042266845703125, -0.48548126220703125, -0.46673583984375, -0.44799041748046875, -0.4292449951171875, -0.41049957275390625, -0.391754150390625, -0.37300872802734375, -0.3542633056640625, -0.33551788330078125, -0.3167724609375, -0.29802703857421875, -0.2792816162109375, -0.26053619384765625, -0.241790771484375, -0.22304534912109375, -0.2042999267578125, -0.18555450439453125, -0.16680908203125, -0.14806365966796875, -0.1293182373046875, -0.11057281494140625, -0.091827392578125, -0.07308197021484375, -0.0543365478515625, -0.03559112548828125, -0.016845703125, 0.00189971923828125, 0.0206451416015625, 0.03939056396484375, 0.058135986328125, 0.07688140869140625, 0.0956268310546875, 0.11437225341796875, 0.13311767578125, 0.15186309814453125, 0.1706085205078125, 0.18935394287109375, 0.208099365234375, 0.22684478759765625, 0.2455902099609375, 0.26433563232421875, 0.2830810546875, 0.30182647705078125, 0.3205718994140625, 0.33931732177734375, 0.358062744140625, 0.37680816650390625, 0.3955535888671875, 0.41429901123046875, 0.43304443359375, 0.45178985595703125, 0.4705352783203125, 0.48928070068359375, 0.508026123046875, 0.5267715454101562, 0.5455169677734375, 0.5642623901367188, 0.5830078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 8.0, 5.0, 6.0, 13.0, 12.0, 22.0, 27.0, 32.0, 53.0, 55.0, 76.0, 75.0, 86.0, 83.0, 82.0, 73.0, 65.0, 55.0, 31.0, 24.0, 33.0, 11.0, 16.0, 10.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1894127130508423, -1.1456818580627441, -1.1019511222839355, -1.058220386505127, -1.0144895315170288, -0.9707587361335754, -0.9270279407501221, -0.8832971453666687, -0.8395663499832153, -0.795835554599762, -0.7521047592163086, -0.7083739638328552, -0.6646431684494019, -0.6209123730659485, -0.5771815776824951, -0.5334507822990417, -0.4897199869155884, -0.445989191532135, -0.40225839614868164, -0.35852760076522827, -0.3147968053817749, -0.27106600999832153, -0.22733521461486816, -0.1836044192314148, -0.13987362384796143, -0.09614282846450806, -0.05241203308105469, -0.008681237697601318, 0.03504955768585205, 0.07878035306930542, 0.12251114845275879, 0.16624194383621216, 0.20997262001037598, 0.25370341539382935, 0.2974342107772827, 0.3411650061607361, 0.38489580154418945, 0.4286265969276428, 0.4723573923110962, 0.5160881876945496, 0.5598189830780029, 0.6035497784614563, 0.6472805738449097, 0.691011369228363, 0.7347421646118164, 0.7784729599952698, 0.8222037553787231, 0.8659345507621765, 0.9096653461456299, 0.9533961415290833, 0.9971269369125366, 1.0408577919006348, 1.0845885276794434, 1.128319263458252, 1.17205011844635, 1.2157809734344482, 1.2595117092132568, 1.3032424449920654, 1.3469732999801636, 1.3907041549682617, 1.4344348907470703, 1.478165626525879, 1.521896481513977, 1.5656273365020752, 1.6093580722808838]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 11.0, 7.0, 6.0, 12.0, 16.0, 18.0, 26.0, 24.0, 25.0, 32.0, 36.0, 39.0, 35.0, 36.0, 44.0, 41.0, 49.0, 37.0, 46.0, 42.0, 40.0, 45.0, 38.0, 37.0, 39.0, 19.0, 26.0, 33.0, 28.0, 17.0, 15.0, 14.0, 14.0, 13.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0004099607467651, -0.9704493880271912, -0.9404888153076172, -0.910528302192688, -0.880567729473114, -0.85060715675354, -0.8206465840339661, -0.7906860113143921, -0.7607254981994629, -0.7307649254798889, -0.7008043527603149, -0.6708438396453857, -0.6408832669258118, -0.6109226942062378, -0.5809621214866638, -0.5510015487670898, -0.5210410356521606, -0.49108046293258667, -0.4611199200153351, -0.4311593472957611, -0.4011988043785095, -0.37123823165893555, -0.3412776589393616, -0.31131711602211, -0.2813565135002136, -0.25139594078063965, -0.22143539786338806, -0.1914748251438141, -0.1615142822265625, -0.13155370950698853, -0.10159315168857574, -0.07163259387016296, -0.04167205095291138, -0.011711491271853447, 0.018249068409204483, 0.04820962995290756, 0.07817018777132034, 0.10813075304031372, 0.1380913108587265, 0.16805186867713928, 0.19801242649555206, 0.22797298431396484, 0.2579335570335388, 0.2878940999507904, 0.3178546726703644, 0.34781521558761597, 0.37777578830718994, 0.4077363610267639, 0.4376969039440155, 0.4676574766635895, 0.49761801958084106, 0.527578592300415, 0.557539165019989, 0.587499737739563, 0.6174602508544922, 0.6474208235740662, 0.6773813962936401, 0.7073419690132141, 0.7373025417327881, 0.7672630548477173, 0.7972236275672913, 0.8271842002868652, 0.8571447730064392, 0.8871053457260132, 0.9170658588409424]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 14.0, 18.0, 38.0, 34.0, 59.0, 118.0, 188.0, 292.0, 630.0, 1175.0, 2387.0, 5285.0, 12928.0, 48206.0, 615524.0, 311472.0, 31541.0, 10100.0, 4330.0, 1987.0, 975.0, 524.0, 240.0, 197.0, 96.0, 71.0, 46.0, 22.0, 16.0, 12.0, 7.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68359375, -0.6660079956054688, -0.6484222412109375, -0.6308364868164062, -0.613250732421875, -0.5956649780273438, -0.5780792236328125, -0.5604934692382812, -0.54290771484375, -0.5253219604492188, -0.5077362060546875, -0.49015045166015625, -0.472564697265625, -0.45497894287109375, -0.4373931884765625, -0.41980743408203125, -0.4022216796875, -0.38463592529296875, -0.3670501708984375, -0.34946441650390625, -0.331878662109375, -0.31429290771484375, -0.2967071533203125, -0.27912139892578125, -0.26153564453125, -0.24394989013671875, -0.2263641357421875, -0.20877838134765625, -0.191192626953125, -0.17360687255859375, -0.1560211181640625, -0.13843536376953125, -0.120849609375, -0.10326385498046875, -0.0856781005859375, -0.06809234619140625, -0.050506591796875, -0.03292083740234375, -0.0153350830078125, 0.00225067138671875, 0.01983642578125, 0.03742218017578125, 0.0550079345703125, 0.07259368896484375, 0.090179443359375, 0.10776519775390625, 0.1253509521484375, 0.14293670654296875, 0.1605224609375, 0.17810821533203125, 0.1956939697265625, 0.21327972412109375, 0.230865478515625, 0.24845123291015625, 0.2660369873046875, 0.28362274169921875, 0.30120849609375, 0.31879425048828125, 0.3363800048828125, 0.35396575927734375, 0.371551513671875, 0.38913726806640625, 0.4067230224609375, 0.42430877685546875, 0.44189453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 6.0, 10.0, 5.0, 11.0, 15.0, 15.0, 34.0, 21.0, 40.0, 30.0, 37.0, 46.0, 50.0, 36.0, 57.0, 49.0, 40.0, 53.0, 48.0, 50.0, 53.0, 38.0, 36.0, 37.0, 28.0, 36.0, 22.0, 19.0, 18.0, 17.0, 12.0, 4.0, 10.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.84765625, -0.825592041015625, -0.80352783203125, -0.781463623046875, -0.7593994140625, -0.737335205078125, -0.71527099609375, -0.693206787109375, -0.671142578125, -0.649078369140625, -0.62701416015625, -0.604949951171875, -0.5828857421875, -0.560821533203125, -0.53875732421875, -0.516693115234375, -0.49462890625, -0.472564697265625, -0.45050048828125, -0.428436279296875, -0.4063720703125, -0.384307861328125, -0.36224365234375, -0.340179443359375, -0.318115234375, -0.296051025390625, -0.27398681640625, -0.251922607421875, -0.2298583984375, -0.207794189453125, -0.18572998046875, -0.163665771484375, -0.1416015625, -0.119537353515625, -0.09747314453125, -0.075408935546875, -0.0533447265625, -0.031280517578125, -0.00921630859375, 0.012847900390625, 0.034912109375, 0.056976318359375, 0.07904052734375, 0.101104736328125, 0.1231689453125, 0.145233154296875, 0.16729736328125, 0.189361572265625, 0.21142578125, 0.233489990234375, 0.25555419921875, 0.277618408203125, 0.2996826171875, 0.321746826171875, 0.34381103515625, 0.365875244140625, 0.387939453125, 0.410003662109375, 0.43206787109375, 0.454132080078125, 0.4761962890625, 0.498260498046875, 0.52032470703125, 0.542388916015625, 0.564453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 22.0, 22.0, 46.0, 53.0, 114.0, 252.0, 520.0, 1207.0, 3482.0, 12540.0, 84895.0, 772555.0, 147641.0, 18077.0, 4414.0, 1412.0, 630.0, 290.0, 149.0, 66.0, 49.0, 37.0, 26.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4892578125, -0.47377777099609375, -0.4582977294921875, -0.44281768798828125, -0.427337646484375, -0.41185760498046875, -0.3963775634765625, -0.38089752197265625, -0.36541748046875, -0.34993743896484375, -0.3344573974609375, -0.31897735595703125, -0.303497314453125, -0.28801727294921875, -0.2725372314453125, -0.25705718994140625, -0.2415771484375, -0.22609710693359375, -0.2106170654296875, -0.19513702392578125, -0.179656982421875, -0.16417694091796875, -0.1486968994140625, -0.13321685791015625, -0.11773681640625, -0.10225677490234375, -0.0867767333984375, -0.07129669189453125, -0.055816650390625, -0.04033660888671875, -0.0248565673828125, -0.00937652587890625, 0.006103515625, 0.02158355712890625, 0.0370635986328125, 0.05254364013671875, 0.068023681640625, 0.08350372314453125, 0.0989837646484375, 0.11446380615234375, 0.12994384765625, 0.14542388916015625, 0.1609039306640625, 0.17638397216796875, 0.191864013671875, 0.20734405517578125, 0.2228240966796875, 0.23830413818359375, 0.2537841796875, 0.26926422119140625, 0.2847442626953125, 0.30022430419921875, 0.315704345703125, 0.33118438720703125, 0.3466644287109375, 0.36214447021484375, 0.37762451171875, 0.39310455322265625, 0.4085845947265625, 0.42406463623046875, 0.439544677734375, 0.45502471923828125, 0.4705047607421875, 0.48598480224609375, 0.50146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 6.0, 9.0, 5.0, 15.0, 7.0, 21.0, 23.0, 31.0, 37.0, 37.0, 40.0, 44.0, 47.0, 43.0, 55.0, 56.0, 59.0, 61.0, 55.0, 43.0, 37.0, 45.0, 37.0, 36.0, 29.0, 23.0, 16.0, 19.0, 11.0, 12.0, 10.0, 3.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6982421875, -1.643096923828125, -1.58795166015625, -1.532806396484375, -1.4776611328125, -1.422515869140625, -1.36737060546875, -1.312225341796875, -1.257080078125, -1.201934814453125, -1.14678955078125, -1.091644287109375, -1.0364990234375, -0.981353759765625, -0.92620849609375, -0.871063232421875, -0.81591796875, -0.760772705078125, -0.70562744140625, -0.650482177734375, -0.5953369140625, -0.540191650390625, -0.48504638671875, -0.429901123046875, -0.374755859375, -0.319610595703125, -0.26446533203125, -0.209320068359375, -0.1541748046875, -0.099029541015625, -0.04388427734375, 0.011260986328125, 0.06640625, 0.121551513671875, 0.17669677734375, 0.231842041015625, 0.2869873046875, 0.342132568359375, 0.39727783203125, 0.452423095703125, 0.507568359375, 0.562713623046875, 0.61785888671875, 0.673004150390625, 0.7281494140625, 0.783294677734375, 0.83843994140625, 0.893585205078125, 0.94873046875, 1.003875732421875, 1.05902099609375, 1.114166259765625, 1.1693115234375, 1.224456787109375, 1.27960205078125, 1.334747314453125, 1.389892578125, 1.445037841796875, 1.50018310546875, 1.555328369140625, 1.6104736328125, 1.665618896484375, 1.72076416015625, 1.775909423828125, 1.8310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 5.0, 19.0, 18.0, 28.0, 39.0, 54.0, 95.0, 140.0, 238.0, 440.0, 926.0, 1989.0, 5927.0, 28599.0, 635084.0, 346664.0, 19947.0, 4819.0, 1690.0, 751.0, 378.0, 233.0, 158.0, 85.0, 49.0, 44.0, 37.0, 20.0, 13.0, 14.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2506828308105469, -0.24306488037109375, -0.23544692993164062, -0.2278289794921875, -0.22021102905273438, -0.21259307861328125, -0.20497512817382812, -0.197357177734375, -0.18973922729492188, -0.18212127685546875, -0.17450332641601562, -0.1668853759765625, -0.15926742553710938, -0.15164947509765625, -0.14403152465820312, -0.13641357421875, -0.12879562377929688, -0.12117767333984375, -0.11355972290039062, -0.1059417724609375, -0.09832382202148438, -0.09070587158203125, -0.08308792114257812, -0.075469970703125, -0.06785202026367188, -0.06023406982421875, -0.052616119384765625, -0.0449981689453125, -0.037380218505859375, -0.02976226806640625, -0.022144317626953125, -0.0145263671875, -0.006908416748046875, 0.00070953369140625, 0.008327484130859375, 0.0159454345703125, 0.023563385009765625, 0.03118133544921875, 0.038799285888671875, 0.046417236328125, 0.054035186767578125, 0.06165313720703125, 0.06927108764648438, 0.0768890380859375, 0.08450698852539062, 0.09212493896484375, 0.09974288940429688, 0.10736083984375, 0.11497879028320312, 0.12259674072265625, 0.13021469116210938, 0.1378326416015625, 0.14545059204101562, 0.15306854248046875, 0.16068649291992188, 0.168304443359375, 0.17592239379882812, 0.18354034423828125, 0.19115829467773438, 0.1987762451171875, 0.20639419555664062, 0.21401214599609375, 0.22163009643554688, 0.229248046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 14.0, 9.0, 22.0, 26.0, 44.0, 68.0, 94.0, 127.0, 185.0, 162.0, 78.0, 60.0, 38.0, 16.0, 13.0, 10.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.814168930053711e-05, -7.53011554479599e-05, -7.246062159538269e-05, -6.962008774280548e-05, -6.677955389022827e-05, -6.393902003765106e-05, -6.109848618507385e-05, -5.825795233249664e-05, -5.5417418479919434e-05, -5.2576884627342224e-05, -4.9736350774765015e-05, -4.6895816922187805e-05, -4.4055283069610596e-05, -4.1214749217033386e-05, -3.837421536445618e-05, -3.553368151187897e-05, -3.269314765930176e-05, -2.985261380672455e-05, -2.701207995414734e-05, -2.417154610157013e-05, -2.133101224899292e-05, -1.849047839641571e-05, -1.56499445438385e-05, -1.2809410691261292e-05, -9.968876838684082e-06, -7.1283429861068726e-06, -4.287809133529663e-06, -1.4472752809524536e-06, 1.3932585716247559e-06, 4.233792424201965e-06, 7.074326276779175e-06, 9.914860129356384e-06, 1.2755393981933594e-05, 1.5595927834510803e-05, 1.8436461687088013e-05, 2.1276995539665222e-05, 2.411752939224243e-05, 2.695806324481964e-05, 2.979859709739685e-05, 3.263913094997406e-05, 3.547966480255127e-05, 3.832019865512848e-05, 4.116073250770569e-05, 4.40012663602829e-05, 4.684180021286011e-05, 4.968233406543732e-05, 5.2522867918014526e-05, 5.5363401770591736e-05, 5.8203935623168945e-05, 6.104446947574615e-05, 6.388500332832336e-05, 6.672553718090057e-05, 6.956607103347778e-05, 7.240660488605499e-05, 7.52471387386322e-05, 7.808767259120941e-05, 8.092820644378662e-05, 8.376874029636383e-05, 8.660927414894104e-05, 8.944980800151825e-05, 9.229034185409546e-05, 9.513087570667267e-05, 9.797140955924988e-05, 0.00010081194341182709, 0.0001036524772644043]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 9.0, 4.0, 18.0, 22.0, 25.0, 30.0, 45.0, 65.0, 91.0, 106.0, 173.0, 222.0, 288.0, 460.0, 601.0, 946.0, 1491.0, 2508.0, 4821.0, 10367.0, 27506.0, 89970.0, 385482.0, 383153.0, 90109.0, 27786.0, 10464.0, 4547.0, 2537.0, 1430.0, 995.0, 626.0, 445.0, 294.0, 241.0, 162.0, 129.0, 95.0, 63.0, 53.0, 58.0, 29.0, 27.0, 14.0, 15.0, 8.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1241455078125, -0.12026596069335938, -0.11638641357421875, -0.11250686645507812, -0.1086273193359375, -0.10474777221679688, -0.10086822509765625, -0.09698867797851562, -0.093109130859375, -0.08922958374023438, -0.08535003662109375, -0.08147048950195312, -0.0775909423828125, -0.07371139526367188, -0.06983184814453125, -0.06595230102539062, -0.06207275390625, -0.058193206787109375, -0.05431365966796875, -0.050434112548828125, -0.0465545654296875, -0.042675018310546875, -0.03879547119140625, -0.034915924072265625, -0.031036376953125, -0.027156829833984375, -0.02327728271484375, -0.019397735595703125, -0.0155181884765625, -0.011638641357421875, -0.00775909423828125, -0.003879547119140625, 0.0, 0.003879547119140625, 0.00775909423828125, 0.011638641357421875, 0.0155181884765625, 0.019397735595703125, 0.02327728271484375, 0.027156829833984375, 0.031036376953125, 0.034915924072265625, 0.03879547119140625, 0.042675018310546875, 0.0465545654296875, 0.050434112548828125, 0.05431365966796875, 0.058193206787109375, 0.06207275390625, 0.06595230102539062, 0.06983184814453125, 0.07371139526367188, 0.0775909423828125, 0.08147048950195312, 0.08535003662109375, 0.08922958374023438, 0.093109130859375, 0.09698867797851562, 0.10086822509765625, 0.10474777221679688, 0.1086273193359375, 0.11250686645507812, 0.11638641357421875, 0.12026596069335938, 0.1241455078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 4.0, 12.0, 10.0, 30.0, 40.0, 52.0, 62.0, 111.0, 115.0, 126.0, 110.0, 83.0, 66.0, 53.0, 34.0, 25.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048858642578125, -0.047251224517822266, -0.04564380645751953, -0.0440363883972168, -0.04242897033691406, -0.04082155227661133, -0.039214134216308594, -0.03760671615600586, -0.035999298095703125, -0.03439188003540039, -0.032784461975097656, -0.031177043914794922, -0.029569625854492188, -0.027962207794189453, -0.02635478973388672, -0.024747371673583984, -0.02313995361328125, -0.021532535552978516, -0.01992511749267578, -0.018317699432373047, -0.016710281372070312, -0.015102863311767578, -0.013495445251464844, -0.01188802719116211, -0.010280609130859375, -0.00867319107055664, -0.007065773010253906, -0.005458354949951172, -0.0038509368896484375, -0.002243518829345703, -0.0006361007690429688, 0.0009713172912597656, 0.0025787353515625, 0.004186153411865234, 0.005793571472167969, 0.007400989532470703, 0.009008407592773438, 0.010615825653076172, 0.012223243713378906, 0.01383066177368164, 0.015438079833984375, 0.01704549789428711, 0.018652915954589844, 0.020260334014892578, 0.021867752075195312, 0.023475170135498047, 0.02508258819580078, 0.026690006256103516, 0.02829742431640625, 0.029904842376708984, 0.03151226043701172, 0.03311967849731445, 0.03472709655761719, 0.03633451461791992, 0.037941932678222656, 0.03954935073852539, 0.041156768798828125, 0.04276418685913086, 0.044371604919433594, 0.04597902297973633, 0.04758644104003906, 0.0491938591003418, 0.05080127716064453, 0.052408695220947266, 0.05401611328125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 18.0, 16.0, 26.0, 25.0, 56.0, 46.0, 62.0, 72.0, 72.0, 80.0, 73.0, 74.0, 66.0, 59.0, 51.0, 40.0, 28.0, 17.0, 13.0, 18.0, 12.0, 11.0, 2.0, 4.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7586199641227722, -0.7334376573562622, -0.7082552909851074, -0.6830729842185974, -0.6578906178474426, -0.6327083110809326, -0.6075259447097778, -0.5823436379432678, -0.5571613311767578, -0.5319790244102478, -0.506796658039093, -0.481614351272583, -0.4564320147037506, -0.4312496781349182, -0.4060673415660858, -0.3808850049972534, -0.355702668428421, -0.3305203318595886, -0.3053379952907562, -0.28015565872192383, -0.2549733519554138, -0.22979101538658142, -0.20460867881774902, -0.17942635715007782, -0.15424402058124542, -0.12906168401241302, -0.10387936234474182, -0.07869702577590942, -0.05351469665765762, -0.028332367539405823, -0.0031500309705734253, 0.02203229069709778, 0.047214627265930176, 0.07239695638418198, 0.09757928550243378, 0.12276162207126617, 0.14794394373893738, 0.17312628030776978, 0.19830861687660217, 0.22349093854427338, 0.24867327511310577, 0.273855596780777, 0.2990379333496094, 0.3242202699184418, 0.34940260648727417, 0.3745849132537842, 0.39976727962493896, 0.424949586391449, 0.45013192296028137, 0.47531425952911377, 0.5004965662956238, 0.5256789326667786, 0.5508612394332886, 0.5760436058044434, 0.6012259125709534, 0.6264082193374634, 0.6515905857086182, 0.6767728924751282, 0.701955258846283, 0.727137565612793, 0.7523199319839478, 0.7775022387504578, 0.8026845455169678, 0.8278669118881226, 0.8530492186546326]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 14.0, 16.0, 21.0, 31.0, 26.0, 23.0, 28.0, 37.0, 44.0, 42.0, 41.0, 37.0, 55.0, 44.0, 43.0, 54.0, 47.0, 40.0, 32.0, 38.0, 34.0, 38.0, 24.0, 38.0, 24.0, 20.0, 19.0, 8.0, 14.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.7005771994590759, -0.6812631487846375, -0.6619490385055542, -0.6426349878311157, -0.6233208775520325, -0.604006826877594, -0.5846927165985107, -0.5653786659240723, -0.5460646152496338, -0.5267505645751953, -0.5074364542961121, -0.4881224036216736, -0.4688083231449127, -0.44949424266815186, -0.430180162191391, -0.4108660817146301, -0.39155200123786926, -0.3722379207611084, -0.35292384028434753, -0.33360975980758667, -0.3142957091331482, -0.29498162865638733, -0.27566754817962646, -0.256353497505188, -0.23703940212726593, -0.21772532165050507, -0.1984112560749054, -0.17909717559814453, -0.15978309512138367, -0.140469029545784, -0.12115494906902313, -0.10184088349342346, -0.0825268030166626, -0.06321272999048233, -0.043898653239011765, -0.0245845764875412, -0.005270503461360931, 0.014043569564819336, 0.0333576500415802, 0.05267171561717987, 0.07198579609394073, 0.091299869120121, 0.11061394214630127, 0.12992802262306213, 0.149242103099823, 0.16855616867542267, 0.18787024915218353, 0.2071843147277832, 0.22649839520454407, 0.24581247568130493, 0.2651265561580658, 0.28444063663482666, 0.30375468730926514, 0.323068767786026, 0.34238284826278687, 0.36169689893722534, 0.3810110092163086, 0.40032508969306946, 0.4196391701698303, 0.4389532208442688, 0.45826730132102966, 0.4775813817977905, 0.4968954622745514, 0.5162095427513123, 0.5355235934257507]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 2.0, 3.0, 8.0, 6.0, 21.0, 19.0, 20.0, 31.0, 35.0, 44.0, 87.0, 109.0, 165.0, 264.0, 480.0, 756.0, 1327.0, 2248.0, 4301.0, 8302.0, 18792.0, 54336.0, 236580.0, 524740.0, 132702.0, 35209.0, 13510.0, 6345.0, 3337.0, 1881.0, 1130.0, 654.0, 379.0, 226.0, 155.0, 105.0, 72.0, 36.0, 33.0, 30.0, 23.0, 15.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.95263671875, -0.9222183227539062, -0.8917999267578125, -0.8613815307617188, -0.830963134765625, -0.8005447387695312, -0.7701263427734375, -0.7397079467773438, -0.70928955078125, -0.6788711547851562, -0.6484527587890625, -0.6180343627929688, -0.587615966796875, -0.5571975708007812, -0.5267791748046875, -0.49636077880859375, -0.4659423828125, -0.43552398681640625, -0.4051055908203125, -0.37468719482421875, -0.344268798828125, -0.31385040283203125, -0.2834320068359375, -0.25301361083984375, -0.22259521484375, -0.19217681884765625, -0.1617584228515625, -0.13134002685546875, -0.100921630859375, -0.07050323486328125, -0.0400848388671875, -0.00966644287109375, 0.020751953125, 0.05117034912109375, 0.0815887451171875, 0.11200714111328125, 0.142425537109375, 0.17284393310546875, 0.2032623291015625, 0.23368072509765625, 0.26409912109375, 0.29451751708984375, 0.3249359130859375, 0.35535430908203125, 0.385772705078125, 0.41619110107421875, 0.4466094970703125, 0.47702789306640625, 0.5074462890625, 0.5378646850585938, 0.5682830810546875, 0.5987014770507812, 0.629119873046875, 0.6595382690429688, 0.6899566650390625, 0.7203750610351562, 0.75079345703125, 0.7812118530273438, 0.8116302490234375, 0.8420486450195312, 0.872467041015625, 0.9028854370117188, 0.9333038330078125, 0.9637222290039062, 0.994140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 9.0, 15.0, 14.0, 15.0, 22.0, 19.0, 18.0, 28.0, 38.0, 29.0, 40.0, 44.0, 28.0, 48.0, 53.0, 44.0, 62.0, 53.0, 47.0, 41.0, 34.0, 34.0, 41.0, 26.0, 29.0, 28.0, 22.0, 16.0, 17.0, 13.0, 11.0, 6.0, 10.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0615234375, -1.028961181640625, -0.99639892578125, -0.963836669921875, -0.9312744140625, -0.898712158203125, -0.86614990234375, -0.833587646484375, -0.801025390625, -0.768463134765625, -0.73590087890625, -0.703338623046875, -0.6707763671875, -0.638214111328125, -0.60565185546875, -0.573089599609375, -0.54052734375, -0.507965087890625, -0.47540283203125, -0.442840576171875, -0.4102783203125, -0.377716064453125, -0.34515380859375, -0.312591552734375, -0.280029296875, -0.247467041015625, -0.21490478515625, -0.182342529296875, -0.1497802734375, -0.117218017578125, -0.08465576171875, -0.052093505859375, -0.01953125, 0.013031005859375, 0.04559326171875, 0.078155517578125, 0.1107177734375, 0.143280029296875, 0.17584228515625, 0.208404541015625, 0.240966796875, 0.273529052734375, 0.30609130859375, 0.338653564453125, 0.3712158203125, 0.403778076171875, 0.43634033203125, 0.468902587890625, 0.50146484375, 0.534027099609375, 0.56658935546875, 0.599151611328125, 0.6317138671875, 0.664276123046875, 0.69683837890625, 0.729400634765625, 0.761962890625, 0.794525146484375, 0.82708740234375, 0.859649658203125, 0.8922119140625, 0.924774169921875, 0.95733642578125, 0.989898681640625, 1.0224609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 13.0, 17.0, 17.0, 26.0, 35.0, 47.0, 68.0, 94.0, 112.0, 166.0, 259.0, 403.0, 691.0, 1244.0, 2454.0, 5443.0, 14264.0, 43643.0, 188959.0, 586459.0, 145739.0, 36216.0, 12094.0, 4857.0, 2183.0, 1147.0, 630.0, 391.0, 259.0, 178.0, 125.0, 77.0, 58.0, 39.0, 46.0, 20.0, 17.0, 11.0, 8.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.275970458984375, -1.23260498046875, -1.189239501953125, -1.1458740234375, -1.102508544921875, -1.05914306640625, -1.015777587890625, -0.972412109375, -0.929046630859375, -0.88568115234375, -0.842315673828125, -0.7989501953125, -0.755584716796875, -0.71221923828125, -0.668853759765625, -0.62548828125, -0.582122802734375, -0.53875732421875, -0.495391845703125, -0.4520263671875, -0.408660888671875, -0.36529541015625, -0.321929931640625, -0.278564453125, -0.235198974609375, -0.19183349609375, -0.148468017578125, -0.1051025390625, -0.061737060546875, -0.01837158203125, 0.024993896484375, 0.068359375, 0.111724853515625, 0.15509033203125, 0.198455810546875, 0.2418212890625, 0.285186767578125, 0.32855224609375, 0.371917724609375, 0.415283203125, 0.458648681640625, 0.50201416015625, 0.545379638671875, 0.5887451171875, 0.632110595703125, 0.67547607421875, 0.718841552734375, 0.76220703125, 0.805572509765625, 0.84893798828125, 0.892303466796875, 0.9356689453125, 0.979034423828125, 1.02239990234375, 1.065765380859375, 1.109130859375, 1.152496337890625, 1.19586181640625, 1.239227294921875, 1.2825927734375, 1.325958251953125, 1.36932373046875, 1.412689208984375, 1.4560546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 4.0, 9.0, 6.0, 14.0, 8.0, 14.0, 15.0, 12.0, 17.0, 25.0, 31.0, 37.0, 22.0, 35.0, 42.0, 45.0, 44.0, 48.0, 40.0, 42.0, 31.0, 46.0, 44.0, 48.0, 38.0, 35.0, 38.0, 37.0, 37.0, 25.0, 15.0, 19.0, 12.0, 10.0, 8.0, 13.0, 11.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.171875, -1.13525390625, -1.0986328125, -1.06201171875, -1.025390625, -0.98876953125, -0.9521484375, -0.91552734375, -0.87890625, -0.84228515625, -0.8056640625, -0.76904296875, -0.732421875, -0.69580078125, -0.6591796875, -0.62255859375, -0.5859375, -0.54931640625, -0.5126953125, -0.47607421875, -0.439453125, -0.40283203125, -0.3662109375, -0.32958984375, -0.29296875, -0.25634765625, -0.2197265625, -0.18310546875, -0.146484375, -0.10986328125, -0.0732421875, -0.03662109375, 0.0, 0.03662109375, 0.0732421875, 0.10986328125, 0.146484375, 0.18310546875, 0.2197265625, 0.25634765625, 0.29296875, 0.32958984375, 0.3662109375, 0.40283203125, 0.439453125, 0.47607421875, 0.5126953125, 0.54931640625, 0.5859375, 0.62255859375, 0.6591796875, 0.69580078125, 0.732421875, 0.76904296875, 0.8056640625, 0.84228515625, 0.87890625, 0.91552734375, 0.9521484375, 0.98876953125, 1.025390625, 1.06201171875, 1.0986328125, 1.13525390625, 1.171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 10.0, 15.0, 18.0, 25.0, 38.0, 40.0, 81.0, 83.0, 138.0, 167.0, 303.0, 472.0, 809.0, 1425.0, 2705.0, 5335.0, 11501.0, 28575.0, 89616.0, 555786.0, 255008.0, 57938.0, 20360.0, 8752.0, 4214.0, 2117.0, 1179.0, 686.0, 356.0, 238.0, 180.0, 120.0, 78.0, 47.0, 42.0, 21.0, 22.0, 14.0, 10.0, 10.0, 8.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18408203125, -0.17811012268066406, -0.17213821411132812, -0.1661663055419922, -0.16019439697265625, -0.1542224884033203, -0.14825057983398438, -0.14227867126464844, -0.1363067626953125, -0.13033485412597656, -0.12436294555664062, -0.11839103698730469, -0.11241912841796875, -0.10644721984863281, -0.10047531127929688, -0.09450340270996094, -0.088531494140625, -0.08255958557128906, -0.07658767700195312, -0.07061576843261719, -0.06464385986328125, -0.05867195129394531, -0.052700042724609375, -0.04672813415527344, -0.0407562255859375, -0.03478431701660156, -0.028812408447265625, -0.022840499877929688, -0.01686859130859375, -0.010896682739257812, -0.004924774169921875, 0.0010471343994140625, 0.00701904296875, 0.012990951538085938, 0.018962860107421875, 0.024934768676757812, 0.03090667724609375, 0.03687858581542969, 0.042850494384765625, 0.04882240295410156, 0.0547943115234375, 0.06076622009277344, 0.06673812866210938, 0.07271003723144531, 0.07868194580078125, 0.08465385437011719, 0.09062576293945312, 0.09659767150878906, 0.102569580078125, 0.10854148864746094, 0.11451339721679688, 0.12048530578613281, 0.12645721435546875, 0.1324291229248047, 0.13840103149414062, 0.14437294006347656, 0.1503448486328125, 0.15631675720214844, 0.16228866577148438, 0.1682605743408203, 0.17423248291015625, 0.1802043914794922, 0.18617630004882812, 0.19214820861816406, 0.1981201171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 11.0, 27.0, 19.0, 28.0, 47.0, 63.0, 86.0, 239.0, 175.0, 79.0, 56.0, 49.0, 30.0, 18.0, 14.0, 15.0, 6.0, 4.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.1856040954589844e-05, -5.0487928092479706e-05, -4.911981523036957e-05, -4.775170236825943e-05, -4.638358950614929e-05, -4.5015476644039154e-05, -4.3647363781929016e-05, -4.227925091981888e-05, -4.091113805770874e-05, -3.95430251955986e-05, -3.8174912333488464e-05, -3.6806799471378326e-05, -3.543868660926819e-05, -3.407057374715805e-05, -3.270246088504791e-05, -3.1334348022937775e-05, -2.9966235160827637e-05, -2.85981222987175e-05, -2.723000943660736e-05, -2.5861896574497223e-05, -2.4493783712387085e-05, -2.3125670850276947e-05, -2.175755798816681e-05, -2.038944512605667e-05, -1.9021332263946533e-05, -1.7653219401836395e-05, -1.6285106539726257e-05, -1.491699367761612e-05, -1.3548880815505981e-05, -1.2180767953395844e-05, -1.0812655091285706e-05, -9.444542229175568e-06, -8.07642936706543e-06, -6.708316504955292e-06, -5.340203642845154e-06, -3.972090780735016e-06, -2.603977918624878e-06, -1.23586505651474e-06, 1.3224780559539795e-07, 1.5003606677055359e-06, 2.868473529815674e-06, 4.236586391925812e-06, 5.60469925403595e-06, 6.972812116146088e-06, 8.340924978256226e-06, 9.709037840366364e-06, 1.1077150702476501e-05, 1.244526356458664e-05, 1.3813376426696777e-05, 1.5181489288806915e-05, 1.6549602150917053e-05, 1.791771501302719e-05, 1.928582787513733e-05, 2.0653940737247467e-05, 2.2022053599357605e-05, 2.3390166461467743e-05, 2.475827932357788e-05, 2.612639218568802e-05, 2.7494505047798157e-05, 2.8862617909908295e-05, 3.0230730772018433e-05, 3.159884363412857e-05, 3.296695649623871e-05, 3.4335069358348846e-05, 3.5703182220458984e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 5.0, 15.0, 17.0, 24.0, 25.0, 36.0, 64.0, 88.0, 115.0, 161.0, 243.0, 370.0, 565.0, 909.0, 1498.0, 2737.0, 5152.0, 10620.0, 25096.0, 80468.0, 614696.0, 224532.0, 46868.0, 17058.0, 7766.0, 3769.0, 2189.0, 1227.0, 708.0, 451.0, 330.0, 209.0, 154.0, 120.0, 68.0, 50.0, 41.0, 28.0, 22.0, 10.0, 11.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.260498046875, -0.2523040771484375, -0.244110107421875, -0.2359161376953125, -0.22772216796875, -0.2195281982421875, -0.211334228515625, -0.2031402587890625, -0.1949462890625, -0.1867523193359375, -0.178558349609375, -0.1703643798828125, -0.16217041015625, -0.1539764404296875, -0.145782470703125, -0.1375885009765625, -0.12939453125, -0.1212005615234375, -0.113006591796875, -0.1048126220703125, -0.09661865234375, -0.0884246826171875, -0.080230712890625, -0.0720367431640625, -0.0638427734375, -0.0556488037109375, -0.047454833984375, -0.0392608642578125, -0.03106689453125, -0.0228729248046875, -0.014678955078125, -0.0064849853515625, 0.001708984375, 0.0099029541015625, 0.018096923828125, 0.0262908935546875, 0.03448486328125, 0.0426788330078125, 0.050872802734375, 0.0590667724609375, 0.0672607421875, 0.0754547119140625, 0.083648681640625, 0.0918426513671875, 0.10003662109375, 0.1082305908203125, 0.116424560546875, 0.1246185302734375, 0.1328125, 0.1410064697265625, 0.149200439453125, 0.1573944091796875, 0.16558837890625, 0.1737823486328125, 0.181976318359375, 0.1901702880859375, 0.1983642578125, 0.2065582275390625, 0.214752197265625, 0.2229461669921875, 0.23114013671875, 0.2393341064453125, 0.247528076171875, 0.2557220458984375, 0.263916015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 7.0, 7.0, 8.0, 5.0, 17.0, 8.0, 11.0, 23.0, 31.0, 30.0, 50.0, 67.0, 90.0, 163.0, 118.0, 98.0, 45.0, 42.0, 36.0, 18.0, 21.0, 14.0, 12.0, 10.0, 8.0, 13.0, 8.0, 2.0, 8.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.12017822265625, -0.1166372299194336, -0.11309623718261719, -0.10955524444580078, -0.10601425170898438, -0.10247325897216797, -0.09893226623535156, -0.09539127349853516, -0.09185028076171875, -0.08830928802490234, -0.08476829528808594, -0.08122730255126953, -0.07768630981445312, -0.07414531707763672, -0.07060432434082031, -0.0670633316040039, -0.0635223388671875, -0.059981346130371094, -0.05644035339355469, -0.05289936065673828, -0.049358367919921875, -0.04581737518310547, -0.04227638244628906, -0.038735389709472656, -0.03519439697265625, -0.031653404235839844, -0.028112411499023438, -0.02457141876220703, -0.021030426025390625, -0.01748943328857422, -0.013948440551757812, -0.010407447814941406, -0.006866455078125, -0.0033254623413085938, 0.0002155303955078125, 0.0037565231323242188, 0.007297515869140625, 0.010838508605957031, 0.014379501342773438, 0.017920494079589844, 0.02146148681640625, 0.025002479553222656, 0.028543472290039062, 0.03208446502685547, 0.035625457763671875, 0.03916645050048828, 0.04270744323730469, 0.046248435974121094, 0.0497894287109375, 0.053330421447753906, 0.05687141418457031, 0.06041240692138672, 0.06395339965820312, 0.06749439239501953, 0.07103538513183594, 0.07457637786865234, 0.07811737060546875, 0.08165836334228516, 0.08519935607910156, 0.08874034881591797, 0.09228134155273438, 0.09582233428955078, 0.09936332702636719, 0.1029043197631836, 0.1064453125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 14.0, 22.0, 28.0, 39.0, 76.0, 111.0, 117.0, 132.0, 148.0, 110.0, 67.0, 38.0, 29.0, 19.0, 11.0, 15.0, 4.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0309042930603027, -1.945160984992981, -1.8594176769256592, -1.7736742496490479, -1.687930941581726, -1.6021876335144043, -1.516444206237793, -1.4307008981704712, -1.3449575901031494, -1.2592142820358276, -1.1734709739685059, -1.0877275466918945, -1.0019842386245728, -0.916240930557251, -0.8304975628852844, -0.7447541952133179, -0.6590108871459961, -0.5732675790786743, -0.48752421140670776, -0.4017808735370636, -0.31603753566741943, -0.23029419779777527, -0.1445508599281311, -0.05880749225616455, 0.026935815811157227, 0.11267915368080139, 0.19842249155044556, 0.2841658294200897, 0.3699091672897339, 0.45565250515937805, 0.5413958430290222, 0.6271392107009888, 0.7128827571868896, 0.7986260652542114, 0.884369432926178, 0.9701128005981445, 1.0558561086654663, 1.141599416732788, 1.2273428440093994, 1.3130861520767212, 1.398829460144043, 1.4845727682113647, 1.5703160762786865, 1.6560595035552979, 1.7418028116226196, 1.8275461196899414, 1.9132895469665527, 1.9990328550338745, 2.0847761631011963, 2.1705195903778076, 2.25626277923584, 2.342006206512451, 2.4277496337890625, 2.5134928226470947, 2.599236249923706, 2.6849794387817383, 2.7707228660583496, 2.856466293334961, 2.942209482192993, 3.0279529094696045, 3.1136960983276367, 3.199439525604248, 3.2851829528808594, 3.3709263801574707, 3.456669569015503]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 5.0, 8.0, 6.0, 11.0, 17.0, 19.0, 15.0, 12.0, 16.0, 34.0, 26.0, 22.0, 26.0, 28.0, 36.0, 39.0, 40.0, 60.0, 44.0, 32.0, 45.0, 36.0, 39.0, 40.0, 28.0, 38.0, 33.0, 29.0, 31.0, 16.0, 20.0, 28.0, 16.0, 12.0, 16.0, 13.0, 10.0, 4.0, 5.0, 2.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8244893550872803, -1.7670289278030396, -1.7095686197280884, -1.6521081924438477, -1.5946478843688965, -1.5371874570846558, -1.479727029800415, -1.4222667217254639, -1.3648064136505127, -1.307345986366272, -1.2498856782913208, -1.19242525100708, -1.134964942932129, -1.0775045156478882, -1.0200440883636475, -0.9625837802886963, -0.9051233530044556, -0.8476629853248596, -0.7902026176452637, -0.732742190361023, -0.6752818822860718, -0.617821455001831, -0.5603610873222351, -0.5029007196426392, -0.4454403519630432, -0.38797998428344727, -0.3305196166038513, -0.273059219121933, -0.21559885144233704, -0.1581384837627411, -0.10067808628082275, -0.04321771860122681, 0.01424252986907959, 0.07170290499925613, 0.12916328012943268, 0.18662366271018982, 0.24408403038978577, 0.3015443980693817, 0.35900479555130005, 0.416465163230896, 0.47392553091049194, 0.5313858985900879, 0.5888462662696838, 0.6463066339492798, 0.7037670612335205, 0.7612273693084717, 0.8186877965927124, 0.8761481642723083, 0.9336085319519043, 0.9910688996315002, 1.0485292673110962, 1.105989694595337, 1.163450002670288, 1.2209104299545288, 1.2783708572387695, 1.3358311653137207, 1.3932914733886719, 1.4507519006729126, 1.5082122087478638, 1.5656726360321045, 1.6231329441070557, 1.6805933713912964, 1.738053798675537, 1.7955141067504883, 1.852974534034729]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 3.0, 11.0, 12.0, 5.0, 19.0, 24.0, 29.0, 33.0, 38.0, 41.0, 48.0, 79.0, 77.0, 126.0, 148.0, 158.0, 225.0, 313.0, 474.0, 1032.0, 3191.0, 1040823.0, 1503.0, 585.0, 363.0, 257.0, 198.0, 154.0, 147.0, 80.0, 92.0, 62.0, 46.0, 37.0, 40.0, 23.0, 19.0, 20.0, 15.0, 9.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.803248643875122, -2.71335506439209, -2.6234614849090576, -2.5335679054260254, -2.443674325942993, -2.353780746459961, -2.2638869285583496, -2.1739933490753174, -2.084099769592285, -1.994206190109253, -1.9043126106262207, -1.8144190311431885, -1.7245253324508667, -1.6346317529678345, -1.5447381734848022, -1.4548444747924805, -1.3649510145187378, -1.2750574350357056, -1.1851638555526733, -1.0952701568603516, -1.0053765773773193, -0.9154829978942871, -0.8255894184112549, -0.7356957793235779, -0.6458021998405457, -0.5559086203575134, -0.4660149812698364, -0.3761214017868042, -0.2862277925014496, -0.19633418321609497, -0.10644060373306274, -0.016546964645385742, 0.07334661483764648, 0.1632402241230011, 0.2531338334083557, 0.34302741289138794, 0.43292102217674255, 0.5228146314620972, 0.6127082109451294, 0.7026018500328064, 0.7924954295158386, 0.8823890089988708, 0.9722826480865479, 1.06217622756958, 1.1520698070526123, 1.2419633865356445, 1.3318569660186768, 1.4217506647109985, 1.5116442441940308, 1.601537823677063, 1.6914314031600952, 1.781325101852417, 1.8712186813354492, 1.9611122608184814, 2.0510058403015137, 2.140899419784546, 2.230792999267578, 2.3206865787506104, 2.4105801582336426, 2.500473737716675, 2.590367317199707, 2.6802611351013184, 2.7701544761657715, 2.860048294067383, 2.949941873550415]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 8.0, 12.0, 20.0, 36.0, 34.0, 52.0, 72.0, 104.0, 141.0, 189.0, 317.0, 541.0, 1109.0, 3470.0, 51455272.0, 5843.0, 1321.0, 668.0, 330.0, 216.0, 145.0, 102.0, 78.0, 74.0, 44.0, 40.0, 26.0, 14.0, 8.0, 13.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.327807426452637, -11.8970308303833, -11.466254234313965, -11.035478591918945, -10.60470199584961, -10.173925399780273, -9.743148803710938, -9.312372207641602, -8.881596565246582, -8.450819969177246, -8.02004337310791, -7.589267253875732, -7.158491134643555, -6.727714538574219, -6.296937942504883, -5.866161823272705, -5.435385227203369, -5.004608631134033, -4.5738325119018555, -4.1430559158325195, -3.712279796600342, -3.281503200531006, -2.850726842880249, -2.419950485229492, -1.9891741275787354, -1.5583977699279785, -1.1276214122772217, -0.6968449354171753, -0.26606857776641846, 0.16470789909362793, 0.5954842567443848, 1.0262606143951416, 1.4570369720458984, 1.8878133296966553, 2.318589687347412, 2.749366283416748, 3.180142402648926, 3.6109189987182617, 4.041695594787598, 4.472471714019775, 4.903247833251953, 5.334024429321289, 5.764800548553467, 6.195577144622803, 6.6263532638549805, 7.057129859924316, 7.487906455993652, 7.91868257522583, 8.349458694458008, 8.780235290527344, 9.21101188659668, 9.6417875289917, 10.072564125061035, 10.503340721130371, 10.934117317199707, 11.364892959594727, 11.795670509338379, 12.226447105407715, 12.65722370147705, 13.08799934387207, 13.518775939941406, 13.949552536010742, 14.380329132080078, 14.811105728149414, 15.241881370544434]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 12.0, 14.0, 21.0, 26.0, 45.0, 64.0, 85.0, 149.0, 228.0, 342.0, 473.0, 762.0, 1194.0, 1898.0, 2865.0, 4780.0, 7847.0, 13950.0, 24462.0, 46299.0, 87612.0, 169525.0, 320098.0, 567118.0, 3707758.0, 608206.0, 339730.0, 181425.0, 93769.0, 49019.0, 25884.0, 14412.0, 8160.0, 4854.0, 2985.0, 1858.0, 1228.0, 783.0, 496.0, 347.0, 241.0, 145.0, 88.0, 69.0, 43.0, 23.0, 15.0, 10.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.78759765625, -0.76263427734375, -0.7376708984375, -0.71270751953125, -0.687744140625, -0.66278076171875, -0.6378173828125, -0.61285400390625, -0.587890625, -0.56292724609375, -0.5379638671875, -0.51300048828125, -0.488037109375, -0.46307373046875, -0.4381103515625, -0.41314697265625, -0.38818359375, -0.36322021484375, -0.3382568359375, -0.31329345703125, -0.288330078125, -0.26336669921875, -0.2384033203125, -0.21343994140625, -0.1884765625, -0.16351318359375, -0.1385498046875, -0.11358642578125, -0.088623046875, -0.06365966796875, -0.0386962890625, -0.01373291015625, 0.01123046875, 0.03619384765625, 0.0611572265625, 0.08612060546875, 0.111083984375, 0.13604736328125, 0.1610107421875, 0.18597412109375, 0.2109375, 0.23590087890625, 0.2608642578125, 0.28582763671875, 0.310791015625, 0.33575439453125, 0.3607177734375, 0.38568115234375, 0.41064453125, 0.43560791015625, 0.4605712890625, 0.48553466796875, 0.510498046875, 0.53546142578125, 0.5604248046875, 0.58538818359375, 0.6103515625, 0.63531494140625, 0.6602783203125, 0.68524169921875, 0.710205078125, 0.73516845703125, 0.7601318359375, 0.78509521484375, 0.81005859375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 9.0, 20.0, 14.0, 22.0, 21.0, 29.0, 31.0, 34.0, 34.0, 42.0, 46.0, 43.0, 49.0, 90.0, 969.0, 108.0, 54.0, 57.0, 42.0, 41.0, 44.0, 31.0, 22.0, 32.0, 20.0, 24.0, 15.0, 11.0, 6.0, 16.0, 5.0, 7.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.390625, -9.110595703125, -8.83056640625, -8.550537109375, -8.2705078125, -7.990478515625, -7.71044921875, -7.430419921875, -7.150390625, -6.870361328125, -6.59033203125, -6.310302734375, -6.0302734375, -5.750244140625, -5.47021484375, -5.190185546875, -4.91015625, -4.630126953125, -4.35009765625, -4.070068359375, -3.7900390625, -3.510009765625, -3.22998046875, -2.949951171875, -2.669921875, -2.389892578125, -2.10986328125, -1.829833984375, -1.5498046875, -1.269775390625, -0.98974609375, -0.709716796875, -0.4296875, -0.149658203125, 0.13037109375, 0.410400390625, 0.6904296875, 0.970458984375, 1.25048828125, 1.530517578125, 1.810546875, 2.090576171875, 2.37060546875, 2.650634765625, 2.9306640625, 3.210693359375, 3.49072265625, 3.770751953125, 4.05078125, 4.330810546875, 4.61083984375, 4.890869140625, 5.1708984375, 5.450927734375, 5.73095703125, 6.010986328125, 6.291015625, 6.571044921875, 6.85107421875, 7.131103515625, 7.4111328125, 7.691162109375, 7.97119140625, 8.251220703125, 8.53125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 14.0, 21.0, 34.0, 44.0, 69.0, 118.0, 137.0, 203.0, 321.0, 456.0, 732.0, 1045.0, 1656.0, 2637.0, 4053.0, 6611.0, 10897.0, 17666.0, 30548.0, 51360.0, 89208.0, 149477.0, 243964.0, 362976.0, 608303.0, 3491047.0, 429515.0, 306232.0, 195766.0, 117228.0, 68352.0, 39872.0, 23387.0, 14168.0, 8637.0, 5303.0, 3302.0, 2136.0, 1305.0, 871.0, 578.0, 347.0, 268.0, 170.0, 125.0, 85.0, 61.0, 38.0, 26.0, 20.0, 12.0, 13.0, 7.0, 7.0, 1.0, 0.0, 2.0], "bins": [-0.4912109375, -0.4759864807128906, -0.46076202392578125, -0.4455375671386719, -0.4303131103515625, -0.4150886535644531, -0.39986419677734375, -0.3846397399902344, -0.369415283203125, -0.3541908264160156, -0.33896636962890625, -0.3237419128417969, -0.3085174560546875, -0.2932929992675781, -0.27806854248046875, -0.2628440856933594, -0.24761962890625, -0.23239517211914062, -0.21717071533203125, -0.20194625854492188, -0.1867218017578125, -0.17149734497070312, -0.15627288818359375, -0.14104843139648438, -0.125823974609375, -0.11059951782226562, -0.09537506103515625, -0.08015060424804688, -0.0649261474609375, -0.049701690673828125, -0.03447723388671875, -0.019252777099609375, -0.0040283203125, 0.011196136474609375, 0.02642059326171875, 0.041645050048828125, 0.0568695068359375, 0.07209396362304688, 0.08731842041015625, 0.10254287719726562, 0.117767333984375, 0.13299179077148438, 0.14821624755859375, 0.16344070434570312, 0.1786651611328125, 0.19388961791992188, 0.20911407470703125, 0.22433853149414062, 0.23956298828125, 0.2547874450683594, 0.27001190185546875, 0.2852363586425781, 0.3004608154296875, 0.3156852722167969, 0.33090972900390625, 0.3461341857910156, 0.361358642578125, 0.3765830993652344, 0.39180755615234375, 0.4070320129394531, 0.4222564697265625, 0.4374809265136719, 0.45270538330078125, 0.4679298400878906, 0.483154296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 12.0, 10.0, 14.0, 18.0, 25.0, 15.0, 22.0, 24.0, 33.0, 37.0, 35.0, 41.0, 36.0, 35.0, 37.0, 38.0, 422.0, 684.0, 46.0, 44.0, 38.0, 44.0, 27.0, 32.0, 31.0, 31.0, 25.0, 25.0, 30.0, 13.0, 14.0, 18.0, 9.0, 9.0, 6.0, 5.0, 6.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1640625, -6.94091796875, -6.7177734375, -6.49462890625, -6.271484375, -6.04833984375, -5.8251953125, -5.60205078125, -5.37890625, -5.15576171875, -4.9326171875, -4.70947265625, -4.486328125, -4.26318359375, -4.0400390625, -3.81689453125, -3.59375, -3.37060546875, -3.1474609375, -2.92431640625, -2.701171875, -2.47802734375, -2.2548828125, -2.03173828125, -1.80859375, -1.58544921875, -1.3623046875, -1.13916015625, -0.916015625, -0.69287109375, -0.4697265625, -0.24658203125, -0.0234375, 0.19970703125, 0.4228515625, 0.64599609375, 0.869140625, 1.09228515625, 1.3154296875, 1.53857421875, 1.76171875, 1.98486328125, 2.2080078125, 2.43115234375, 2.654296875, 2.87744140625, 3.1005859375, 3.32373046875, 3.546875, 3.77001953125, 3.9931640625, 4.21630859375, 4.439453125, 4.66259765625, 4.8857421875, 5.10888671875, 5.33203125, 5.55517578125, 5.7783203125, 6.00146484375, 6.224609375, 6.44775390625, 6.6708984375, 6.89404296875, 7.1171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 15.0, 14.0, 22.0, 33.0, 42.0, 65.0, 114.0, 155.0, 223.0, 292.0, 459.0, 693.0, 1046.0, 1751.0, 2905.0, 4997.0, 8948.0, 16815.0, 33974.0, 69716.0, 159678.0, 5644188.0, 188231.0, 77260.0, 37278.0, 18605.0, 9896.0, 5532.0, 3168.0, 1852.0, 1161.0, 733.0, 493.0, 328.0, 193.0, 170.0, 109.0, 75.0, 51.0, 42.0, 42.0, 15.0, 22.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.63671875, -1.584869384765625, -1.53302001953125, -1.481170654296875, -1.4293212890625, -1.377471923828125, -1.32562255859375, -1.273773193359375, -1.221923828125, -1.170074462890625, -1.11822509765625, -1.066375732421875, -1.0145263671875, -0.962677001953125, -0.91082763671875, -0.858978271484375, -0.80712890625, -0.755279541015625, -0.70343017578125, -0.651580810546875, -0.5997314453125, -0.547882080078125, -0.49603271484375, -0.444183349609375, -0.392333984375, -0.340484619140625, -0.28863525390625, -0.236785888671875, -0.1849365234375, -0.133087158203125, -0.08123779296875, -0.029388427734375, 0.0224609375, 0.074310302734375, 0.12615966796875, 0.178009033203125, 0.2298583984375, 0.281707763671875, 0.33355712890625, 0.385406494140625, 0.437255859375, 0.489105224609375, 0.54095458984375, 0.592803955078125, 0.6446533203125, 0.696502685546875, 0.74835205078125, 0.800201416015625, 0.85205078125, 0.903900146484375, 0.95574951171875, 1.007598876953125, 1.0594482421875, 1.111297607421875, 1.16314697265625, 1.214996337890625, 1.266845703125, 1.318695068359375, 1.37054443359375, 1.422393798828125, 1.4742431640625, 1.526092529296875, 1.57794189453125, 1.629791259765625, 1.681640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 6.0, 12.0, 8.0, 17.0, 12.0, 12.0, 14.0, 28.0, 19.0, 37.0, 29.0, 29.0, 38.0, 44.0, 43.0, 43.0, 27.0, 60.0, 1028.0, 78.0, 42.0, 40.0, 49.0, 41.0, 42.0, 37.0, 24.0, 26.0, 24.0, 13.0, 17.0, 14.0, 9.0, 12.0, 15.0, 14.0, 0.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.52801513671875, -7.2552490234375, -6.98248291015625, -6.709716796875, -6.43695068359375, -6.1641845703125, -5.89141845703125, -5.61865234375, -5.34588623046875, -5.0731201171875, -4.80035400390625, -4.527587890625, -4.25482177734375, -3.9820556640625, -3.70928955078125, -3.4365234375, -3.16375732421875, -2.8909912109375, -2.61822509765625, -2.345458984375, -2.07269287109375, -1.7999267578125, -1.52716064453125, -1.25439453125, -0.98162841796875, -0.7088623046875, -0.43609619140625, -0.163330078125, 0.10943603515625, 0.3822021484375, 0.65496826171875, 0.927734375, 1.20050048828125, 1.4732666015625, 1.74603271484375, 2.018798828125, 2.29156494140625, 2.5643310546875, 2.83709716796875, 3.10986328125, 3.38262939453125, 3.6553955078125, 3.92816162109375, 4.200927734375, 4.47369384765625, 4.7464599609375, 5.01922607421875, 5.2919921875, 5.56475830078125, 5.8375244140625, 6.11029052734375, 6.383056640625, 6.65582275390625, 6.9285888671875, 7.20135498046875, 7.47412109375, 7.74688720703125, 8.0196533203125, 8.29241943359375, 8.565185546875, 8.83795166015625, 9.1107177734375, 9.38348388671875, 9.65625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 11.0, 19.0, 49.0, 100.0, 280.0, 302.0, 132.0, 49.0, 22.0, 11.0, 11.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.92098045349121, -25.890653610229492, -24.860328674316406, -23.830001831054688, -22.79967498779297, -21.76934814453125, -20.73902130126953, -19.708696365356445, -18.678369522094727, -17.648042678833008, -16.617717742919922, -15.587390899658203, -14.557064056396484, -13.526737213134766, -12.496411323547363, -11.466085433959961, -10.435758590698242, -9.405431747436523, -8.375105857849121, -7.3447794914245605, -6.314453125, -5.2841267585754395, -4.253800392150879, -3.2234740257263184, -2.193147659301758, -1.1628212928771973, -0.13249492645263672, 0.8978314399719238, 1.9281578063964844, 2.958484172821045, 3.9888105392456055, 5.019136905670166, 6.049465179443359, 7.07979154586792, 8.11011791229248, 9.140443801879883, 10.170770645141602, 11.20109748840332, 12.231423377990723, 13.261749267578125, 14.292076110839844, 15.322402954101562, 16.35272979736328, 17.383054733276367, 18.413381576538086, 19.443708419799805, 20.47403335571289, 21.50436019897461, 22.534687042236328, 23.565013885498047, 24.595340728759766, 25.62566566467285, 26.65599250793457, 27.68631935119629, 28.716644287109375, 29.746971130371094, 30.777297973632812, 31.80762481689453, 32.83795166015625, 33.86827850341797, 34.89860534667969, 35.92892837524414, 36.95925521850586, 37.98958206176758, 39.0199089050293]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 6.0, 5.0, 8.0, 11.0, 15.0, 25.0, 28.0, 36.0, 41.0, 54.0, 77.0, 95.0, 102.0, 111.0, 94.0, 63.0, 51.0, 29.0, 25.0, 19.0, 23.0, 16.0, 10.0, 10.0, 7.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.89131164550781, -36.70288848876953, -35.514469146728516, -34.326045989990234, -33.13762664794922, -31.949203491210938, -30.760780334472656, -29.572359085083008, -28.38393783569336, -27.19551658630371, -26.007095336914062, -24.81867218017578, -23.630250930786133, -22.441829681396484, -21.253406524658203, -20.064985275268555, -18.876564025878906, -17.688142776489258, -16.49972152709961, -15.311298370361328, -14.12287712097168, -12.934455871582031, -11.746033668518066, -10.557611465454102, -9.369190216064453, -8.180768966674805, -6.99234676361084, -5.803925037384033, -4.615503311157227, -3.42708158493042, -2.2386598587036133, -1.0502376556396484, 0.13818359375, 1.3266053199768066, 2.5150270462036133, 3.70344877243042, 4.891870498657227, 6.080292224884033, 7.26871395111084, 8.457136154174805, 9.645557403564453, 10.833978652954102, 12.022400856018066, 13.210823059082031, 14.39924430847168, 15.587665557861328, 16.77608871459961, 17.964509963989258, 19.152931213378906, 20.341352462768555, 21.529773712158203, 22.718196868896484, 23.906618118286133, 25.09503936767578, 26.283462524414062, 27.47188377380371, 28.66030502319336, 29.848726272583008, 31.037147521972656, 32.22557067871094, 33.41399383544922, 34.602413177490234, 35.790836334228516, 36.97925567626953, 38.16767883300781]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 3.0, 2.0, 7.0, 9.0, 6.0, 7.0, 12.0, 17.0, 30.0, 45.0, 47.0, 92.0, 141.0, 225.0, 363.0, 612.0, 983.0, 1657.0, 3410.0, 7133.0, 22565.0, 639471.0, 3477702.0, 24569.0, 7503.0, 3331.0, 1713.0, 1010.0, 578.0, 343.0, 216.0, 146.0, 97.0, 59.0, 45.0, 40.0, 27.0, 15.0, 16.0, 12.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.143798828125, -0.13866806030273438, -0.13353729248046875, -0.12840652465820312, -0.1232757568359375, -0.11814498901367188, -0.11301422119140625, -0.10788345336914062, -0.102752685546875, -0.09762191772460938, -0.09249114990234375, -0.08736038208007812, -0.0822296142578125, -0.07709884643554688, -0.07196807861328125, -0.06683731079101562, -0.06170654296875, -0.056575775146484375, -0.05144500732421875, -0.046314239501953125, -0.0411834716796875, -0.036052703857421875, -0.03092193603515625, -0.025791168212890625, -0.020660400390625, -0.015529632568359375, -0.01039886474609375, -0.005268096923828125, -0.0001373291015625, 0.004993438720703125, 0.01012420654296875, 0.015254974365234375, 0.0203857421875, 0.025516510009765625, 0.03064727783203125, 0.035778045654296875, 0.0409088134765625, 0.046039581298828125, 0.05117034912109375, 0.056301116943359375, 0.061431884765625, 0.06656265258789062, 0.07169342041015625, 0.07682418823242188, 0.0819549560546875, 0.08708572387695312, 0.09221649169921875, 0.09734725952148438, 0.10247802734375, 0.10760879516601562, 0.11273956298828125, 0.11787033081054688, 0.1230010986328125, 0.12813186645507812, 0.13326263427734375, 0.13839340209960938, 0.143524169921875, 0.14865493774414062, 0.15378570556640625, 0.15891647338867188, 0.1640472412109375, 0.16917800903320312, 0.17430877685546875, 0.17943954467773438, 0.1845703125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 5.0, 3.0, 11.0, 3.0, 13.0, 11.0, 14.0, 20.0, 43.0, 555.0, 142.0, 43.0, 13.0, 6.0, 12.0, 10.0, 13.0, 8.0, 8.0, 7.0, 7.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06463623046875, -0.06247138977050781, -0.060306549072265625, -0.05814170837402344, -0.05597686767578125, -0.05381202697753906, -0.051647186279296875, -0.04948234558105469, -0.0473175048828125, -0.04515266418457031, -0.042987823486328125, -0.04082298278808594, -0.03865814208984375, -0.03649330139160156, -0.034328460693359375, -0.03216361999511719, -0.029998779296875, -0.027833938598632812, -0.025669097900390625, -0.023504257202148438, -0.02133941650390625, -0.019174575805664062, -0.017009735107421875, -0.014844894409179688, -0.0126800537109375, -0.010515213012695312, -0.008350372314453125, -0.0061855316162109375, -0.00402069091796875, -0.0018558502197265625, 0.000308990478515625, 0.0024738311767578125, 0.004638671875, 0.0068035125732421875, 0.008968353271484375, 0.011133193969726562, 0.01329803466796875, 0.015462875366210938, 0.017627716064453125, 0.019792556762695312, 0.0219573974609375, 0.024122238159179688, 0.026287078857421875, 0.028451919555664062, 0.03061676025390625, 0.03278160095214844, 0.034946441650390625, 0.03711128234863281, 0.039276123046875, 0.04144096374511719, 0.043605804443359375, 0.04577064514160156, 0.04793548583984375, 0.05010032653808594, 0.052265167236328125, 0.05443000793457031, 0.0565948486328125, 0.05875968933105469, 0.060924530029296875, 0.06308937072753906, 0.06525421142578125, 0.06741905212402344, 0.06958389282226562, 0.07174873352050781, 0.07391357421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 5.0, 8.0, 7.0, 7.0, 12.0, 19.0, 37.0, 61.0, 162.0, 385.0, 898.0, 2628.0, 10303.0, 76534.0, 3835437.0, 243155.0, 18806.0, 4011.0, 1144.0, 384.0, 117.0, 54.0, 44.0, 14.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256103515625, -0.2487201690673828, -0.24133682250976562, -0.23395347595214844, -0.22657012939453125, -0.21918678283691406, -0.21180343627929688, -0.2044200897216797, -0.1970367431640625, -0.1896533966064453, -0.18227005004882812, -0.17488670349121094, -0.16750335693359375, -0.16012001037597656, -0.15273666381835938, -0.1453533172607422, -0.137969970703125, -0.1305866241455078, -0.12320327758789062, -0.11581993103027344, -0.10843658447265625, -0.10105323791503906, -0.09366989135742188, -0.08628654479980469, -0.0789031982421875, -0.07151985168457031, -0.06413650512695312, -0.05675315856933594, -0.04936981201171875, -0.04198646545410156, -0.034603118896484375, -0.027219772338867188, -0.01983642578125, -0.012453079223632812, -0.005069732666015625, 0.0023136138916015625, 0.00969696044921875, 0.017080307006835938, 0.024463653564453125, 0.03184700012207031, 0.0392303466796875, 0.04661369323730469, 0.053997039794921875, 0.06138038635253906, 0.06876373291015625, 0.07614707946777344, 0.08353042602539062, 0.09091377258300781, 0.098297119140625, 0.10568046569824219, 0.11306381225585938, 0.12044715881347656, 0.12783050537109375, 0.13521385192871094, 0.14259719848632812, 0.1499805450439453, 0.1573638916015625, 0.1647472381591797, 0.17213058471679688, 0.17951393127441406, 0.18689727783203125, 0.19428062438964844, 0.20166397094726562, 0.2090473175048828, 0.2164306640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 11.0, 13.0, 15.0, 16.0, 17.0, 31.0, 37.0, 64.0, 95.0, 190.0, 497.0, 1629.0, 848.0, 237.0, 131.0, 66.0, 42.0, 26.0, 25.0, 18.0, 14.0, 14.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.0864400863647461, -0.08395195007324219, -0.08146381378173828, -0.07897567749023438, -0.07648754119873047, -0.07399940490722656, -0.07151126861572266, -0.06902313232421875, -0.06653499603271484, -0.06404685974121094, -0.06155872344970703, -0.059070587158203125, -0.05658245086669922, -0.05409431457519531, -0.051606178283691406, -0.0491180419921875, -0.046629905700683594, -0.04414176940917969, -0.04165363311767578, -0.039165496826171875, -0.03667736053466797, -0.03418922424316406, -0.031701087951660156, -0.02921295166015625, -0.026724815368652344, -0.024236679077148438, -0.02174854278564453, -0.019260406494140625, -0.01677227020263672, -0.014284133911132812, -0.011795997619628906, -0.009307861328125, -0.006819725036621094, -0.0043315887451171875, -0.0018434524536132812, 0.000644683837890625, 0.0031328201293945312, 0.0056209564208984375, 0.008109092712402344, 0.01059722900390625, 0.013085365295410156, 0.015573501586914062, 0.01806163787841797, 0.020549774169921875, 0.02303791046142578, 0.025526046752929688, 0.028014183044433594, 0.0305023193359375, 0.032990455627441406, 0.03547859191894531, 0.03796672821044922, 0.040454864501953125, 0.04294300079345703, 0.04543113708496094, 0.047919273376464844, 0.05040740966796875, 0.052895545959472656, 0.05538368225097656, 0.05787181854248047, 0.060359954833984375, 0.06284809112548828, 0.06533622741699219, 0.0678243637084961, 0.0703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 9.0, 45.0, 321.0, 552.0, 60.0, 10.0, 4.0, 1.0, 1.0], "bins": [-2.028738260269165, -1.9939026832580566, -1.9590669870376587, -1.9242314100265503, -1.8893957138061523, -1.854560136795044, -1.819724440574646, -1.7848888635635376, -1.7500531673431396, -1.7152175903320312, -1.6803818941116333, -1.645546317100525, -1.610710620880127, -1.5758750438690186, -1.5410393476486206, -1.5062037706375122, -1.4713681936264038, -1.4365326166152954, -1.4016969203948975, -1.366861343383789, -1.3320256471633911, -1.2971900701522827, -1.2623543739318848, -1.2275187969207764, -1.192683219909668, -1.1578476428985596, -1.1230119466781616, -1.0881763696670532, -1.0533406734466553, -1.0185050964355469, -0.9836694598197937, -0.9488338232040405, -0.9139982461929321, -0.879162609577179, -0.8443269729614258, -0.8094913363456726, -0.7746556997299194, -0.739820122718811, -0.7049844861030579, -0.6701488494873047, -0.6353132128715515, -0.6004775762557983, -0.5656419396400452, -0.530806303024292, -0.4959706962108612, -0.46113505959510803, -0.42629945278167725, -0.3914638161659241, -0.3566281795501709, -0.3217925429344177, -0.28695690631866455, -0.25212129950523376, -0.2172856628894806, -0.18245002627372742, -0.14761440455913544, -0.11277878284454346, -0.07794314622879028, -0.043107517063617706, -0.00827188789844513, 0.026563741266727448, 0.061399370431900024, 0.0962350070476532, 0.13107062876224518, 0.16590625047683716, 0.20074188709259033]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 11.0, 17.0, 16.0, 26.0, 26.0, 26.0, 45.0, 45.0, 48.0, 42.0, 51.0, 70.0, 57.0, 59.0, 61.0, 59.0, 54.0, 42.0, 36.0, 40.0, 29.0, 30.0, 25.0, 10.0, 14.0, 15.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548907995223999, -0.2457183450460434, -0.2365458905696869, -0.22737343609333038, -0.21820098161697388, -0.20902852714061737, -0.19985607266426086, -0.19068363308906555, -0.18151116371154785, -0.17233870923519135, -0.16316625475883484, -0.15399380028247833, -0.14482134580612183, -0.13564889132976532, -0.1264764368534088, -0.1173039898276329, -0.108131542801857, -0.09895908832550049, -0.08978663384914398, -0.08061417937278748, -0.07144172489643097, -0.06226927414536476, -0.05309682339429855, -0.04392436891794205, -0.03475191444158554, -0.025579459965229034, -0.016407007351517677, -0.00723455473780632, 0.0019378997385501862, 0.011110354214906693, 0.0202828049659729, 0.029455259442329407, 0.03862771391868591, 0.04780016839504242, 0.056972622871398926, 0.06614507734775543, 0.07531753182411194, 0.08448998630046844, 0.09366243332624435, 0.10283488780260086, 0.11200734227895737, 0.12117979675531387, 0.13035224378108978, 0.1395246982574463, 0.1486971527338028, 0.1578696072101593, 0.1670420616865158, 0.17621451616287231, 0.18538697063922882, 0.19455942511558533, 0.20373187959194183, 0.21290433406829834, 0.22207678854465485, 0.23124924302101135, 0.24042168259620667, 0.24959415197372437, 0.2587665915489197, 0.267939031124115, 0.2771115005016327, 0.286283940076828, 0.2954564094543457, 0.304628849029541, 0.3138013184070587, 0.32297375798225403, 0.33214622735977173]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 8.0, 14.0, 22.0, 20.0, 24.0, 31.0, 71.0, 85.0, 132.0, 152.0, 246.0, 378.0, 480.0, 699.0, 1135.0, 1628.0, 2450.0, 3811.0, 6190.0, 10296.0, 19216.0, 44230.0, 804667.0, 90915.0, 26485.0, 13639.0, 7797.0, 4742.0, 2901.0, 1959.0, 1311.0, 845.0, 605.0, 397.0, 284.0, 201.0, 143.0, 91.0, 70.0, 51.0, 51.0, 19.0, 18.0, 12.0, 10.0, 8.0, 9.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2327880859375, -0.2254505157470703, -0.21811294555664062, -0.21077537536621094, -0.20343780517578125, -0.19610023498535156, -0.18876266479492188, -0.1814250946044922, -0.1740875244140625, -0.1667499542236328, -0.15941238403320312, -0.15207481384277344, -0.14473724365234375, -0.13739967346191406, -0.13006210327148438, -0.12272453308105469, -0.115386962890625, -0.10804939270019531, -0.10071182250976562, -0.09337425231933594, -0.08603668212890625, -0.07869911193847656, -0.07136154174804688, -0.06402397155761719, -0.0566864013671875, -0.04934883117675781, -0.042011260986328125, -0.03467369079589844, -0.02733612060546875, -0.019998550415039062, -0.012660980224609375, -0.0053234100341796875, 0.00201416015625, 0.009351730346679688, 0.016689300537109375, 0.024026870727539062, 0.03136444091796875, 0.03870201110839844, 0.046039581298828125, 0.05337715148925781, 0.0607147216796875, 0.06805229187011719, 0.07538986206054688, 0.08272743225097656, 0.09006500244140625, 0.09740257263183594, 0.10474014282226562, 0.11207771301269531, 0.119415283203125, 0.1267528533935547, 0.13409042358398438, 0.14142799377441406, 0.14876556396484375, 0.15610313415527344, 0.16344070434570312, 0.1707782745361328, 0.1781158447265625, 0.1854534149169922, 0.19279098510742188, 0.20012855529785156, 0.20746612548828125, 0.21480369567871094, 0.22214126586914062, 0.2294788360595703, 0.23681640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 8.0, 4.0, 4.0, 7.0, 2.0, 5.0, 12.0, 11.0, 14.0, 14.0, 23.0, 53.0, 437.0, 243.0, 40.0, 19.0, 8.0, 11.0, 14.0, 9.0, 10.0, 5.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.06182289123535156, -0.059680938720703125, -0.05753898620605469, -0.05539703369140625, -0.05325508117675781, -0.051113128662109375, -0.04897117614746094, -0.0468292236328125, -0.04468727111816406, -0.042545318603515625, -0.04040336608886719, -0.03826141357421875, -0.03611946105957031, -0.033977508544921875, -0.03183555603027344, -0.029693603515625, -0.027551651000976562, -0.025409698486328125, -0.023267745971679688, -0.02112579345703125, -0.018983840942382812, -0.016841888427734375, -0.014699935913085938, -0.0125579833984375, -0.010416030883789062, -0.008274078369140625, -0.0061321258544921875, -0.00399017333984375, -0.0018482208251953125, 0.000293731689453125, 0.0024356842041015625, 0.00457763671875, 0.0067195892333984375, 0.008861541748046875, 0.011003494262695312, 0.01314544677734375, 0.015287399291992188, 0.017429351806640625, 0.019571304321289062, 0.0217132568359375, 0.023855209350585938, 0.025997161865234375, 0.028139114379882812, 0.03028106689453125, 0.03242301940917969, 0.034564971923828125, 0.03670692443847656, 0.038848876953125, 0.04099082946777344, 0.043132781982421875, 0.04527473449707031, 0.04741668701171875, 0.04955863952636719, 0.051700592041015625, 0.05384254455566406, 0.0559844970703125, 0.05812644958496094, 0.060268402099609375, 0.06241035461425781, 0.06455230712890625, 0.06669425964355469, 0.06883621215820312, 0.07097816467285156, 0.0731201171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 8.0, 16.0, 15.0, 21.0, 20.0, 36.0, 45.0, 70.0, 61.0, 95.0, 132.0, 206.0, 371.0, 728.0, 1555.0, 3538.0, 8115.0, 23018.0, 79520.0, 406666.0, 407787.0, 78802.0, 23000.0, 8146.0, 3308.0, 1481.0, 715.0, 353.0, 203.0, 139.0, 83.0, 63.0, 51.0, 42.0, 42.0, 19.0, 26.0, 15.0, 9.0, 8.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15586090087890625, -0.1508331298828125, -0.14580535888671875, -0.140777587890625, -0.13574981689453125, -0.1307220458984375, -0.12569427490234375, -0.12066650390625, -0.11563873291015625, -0.1106109619140625, -0.10558319091796875, -0.100555419921875, -0.09552764892578125, -0.0904998779296875, -0.08547210693359375, -0.0804443359375, -0.07541656494140625, -0.0703887939453125, -0.06536102294921875, -0.060333251953125, -0.05530548095703125, -0.0502777099609375, -0.04524993896484375, -0.04022216796875, -0.03519439697265625, -0.0301666259765625, -0.02513885498046875, -0.020111083984375, -0.01508331298828125, -0.0100555419921875, -0.00502777099609375, 0.0, 0.00502777099609375, 0.0100555419921875, 0.01508331298828125, 0.020111083984375, 0.02513885498046875, 0.0301666259765625, 0.03519439697265625, 0.04022216796875, 0.04524993896484375, 0.0502777099609375, 0.05530548095703125, 0.060333251953125, 0.06536102294921875, 0.0703887939453125, 0.07541656494140625, 0.0804443359375, 0.08547210693359375, 0.0904998779296875, 0.09552764892578125, 0.100555419921875, 0.10558319091796875, 0.1106109619140625, 0.11563873291015625, 0.12066650390625, 0.12569427490234375, 0.1307220458984375, 0.13574981689453125, 0.140777587890625, 0.14580535888671875, 0.1508331298828125, 0.15586090087890625, 0.160888671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 7.0, 7.0, 7.0, 10.0, 17.0, 15.0, 10.0, 7.0, 26.0, 31.0, 35.0, 21.0, 45.0, 46.0, 42.0, 38.0, 47.0, 46.0, 42.0, 50.0, 47.0, 47.0, 57.0, 39.0, 31.0, 41.0, 20.0, 26.0, 31.0, 18.0, 12.0, 17.0, 20.0, 11.0, 6.0, 6.0, 4.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24152374267578125, -0.2340240478515625, -0.22652435302734375, -0.219024658203125, -0.21152496337890625, -0.2040252685546875, -0.19652557373046875, -0.18902587890625, -0.18152618408203125, -0.1740264892578125, -0.16652679443359375, -0.159027099609375, -0.15152740478515625, -0.1440277099609375, -0.13652801513671875, -0.1290283203125, -0.12152862548828125, -0.1140289306640625, -0.10652923583984375, -0.099029541015625, -0.09152984619140625, -0.0840301513671875, -0.07653045654296875, -0.06903076171875, -0.06153106689453125, -0.0540313720703125, -0.04653167724609375, -0.039031982421875, -0.03153228759765625, -0.0240325927734375, -0.01653289794921875, -0.009033203125, -0.00153350830078125, 0.0059661865234375, 0.01346588134765625, 0.020965576171875, 0.02846527099609375, 0.0359649658203125, 0.04346466064453125, 0.05096435546875, 0.05846405029296875, 0.0659637451171875, 0.07346343994140625, 0.080963134765625, 0.08846282958984375, 0.0959625244140625, 0.10346221923828125, 0.1109619140625, 0.11846160888671875, 0.1259613037109375, 0.13346099853515625, 0.140960693359375, 0.14846038818359375, 0.1559600830078125, 0.16345977783203125, 0.17095947265625, 0.17845916748046875, 0.1859588623046875, 0.19345855712890625, 0.200958251953125, 0.20845794677734375, 0.2159576416015625, 0.22345733642578125, 0.23095703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 9.0, 12.0, 21.0, 22.0, 39.0, 63.0, 113.0, 167.0, 318.0, 604.0, 1379.0, 3385.0, 10342.0, 47908.0, 487145.0, 437328.0, 44059.0, 9766.0, 3245.0, 1310.0, 565.0, 299.0, 178.0, 93.0, 70.0, 34.0, 17.0, 13.0, 9.0, 11.0, 7.0, 6.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086669921875, -0.08395957946777344, -0.08124923706054688, -0.07853889465332031, -0.07582855224609375, -0.07311820983886719, -0.07040786743164062, -0.06769752502441406, -0.0649871826171875, -0.06227684020996094, -0.059566497802734375, -0.05685615539550781, -0.05414581298828125, -0.05143547058105469, -0.048725128173828125, -0.04601478576660156, -0.043304443359375, -0.04059410095214844, -0.037883758544921875, -0.03517341613769531, -0.03246307373046875, -0.029752731323242188, -0.027042388916015625, -0.024332046508789062, -0.0216217041015625, -0.018911361694335938, -0.016201019287109375, -0.013490676879882812, -0.01078033447265625, -0.008069992065429688, -0.005359649658203125, -0.0026493072509765625, 6.103515625e-05, 0.0027713775634765625, 0.005481719970703125, 0.008192062377929688, 0.01090240478515625, 0.013612747192382812, 0.016323089599609375, 0.019033432006835938, 0.0217437744140625, 0.024454116821289062, 0.027164459228515625, 0.029874801635742188, 0.03258514404296875, 0.03529548645019531, 0.038005828857421875, 0.04071617126464844, 0.043426513671875, 0.04613685607910156, 0.048847198486328125, 0.05155754089355469, 0.05426788330078125, 0.05697822570800781, 0.059688568115234375, 0.06239891052246094, 0.0651092529296875, 0.06781959533691406, 0.07052993774414062, 0.07324028015136719, 0.07595062255859375, 0.07866096496582031, 0.08137130737304688, 0.08408164978027344, 0.0867919921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 11.0, 6.0, 15.0, 11.0, 14.0, 16.0, 22.0, 29.0, 35.0, 38.0, 65.0, 58.0, 63.0, 63.0, 71.0, 64.0, 57.0, 57.0, 44.0, 28.0, 41.0, 31.0, 30.0, 14.0, 18.0, 13.0, 16.0, 10.0, 6.0, 9.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.430511474609375e-05, -1.3804063200950623e-05, -1.3303011655807495e-05, -1.2801960110664368e-05, -1.230090856552124e-05, -1.1799857020378113e-05, -1.1298805475234985e-05, -1.0797753930091858e-05, -1.029670238494873e-05, -9.795650839805603e-06, -9.294599294662476e-06, -8.793547749519348e-06, -8.29249620437622e-06, -7.791444659233093e-06, -7.290393114089966e-06, -6.789341568946838e-06, -6.288290023803711e-06, -5.7872384786605835e-06, -5.286186933517456e-06, -4.785135388374329e-06, -4.284083843231201e-06, -3.7830322980880737e-06, -3.2819807529449463e-06, -2.780929207801819e-06, -2.2798776626586914e-06, -1.778826117515564e-06, -1.2777745723724365e-06, -7.767230272293091e-07, -2.7567148208618164e-07, 2.253800630569458e-07, 7.264316082000732e-07, 1.2274831533432007e-06, 1.7285346984863281e-06, 2.2295862436294556e-06, 2.730637788772583e-06, 3.2316893339157104e-06, 3.732740879058838e-06, 4.233792424201965e-06, 4.734843969345093e-06, 5.23589551448822e-06, 5.736947059631348e-06, 6.237998604774475e-06, 6.7390501499176025e-06, 7.24010169506073e-06, 7.741153240203857e-06, 8.242204785346985e-06, 8.743256330490112e-06, 9.24430787563324e-06, 9.745359420776367e-06, 1.0246410965919495e-05, 1.0747462511062622e-05, 1.124851405620575e-05, 1.1749565601348877e-05, 1.2250617146492004e-05, 1.2751668691635132e-05, 1.325272023677826e-05, 1.3753771781921387e-05, 1.4254823327064514e-05, 1.4755874872207642e-05, 1.5256926417350769e-05, 1.5757977962493896e-05, 1.6259029507637024e-05, 1.676008105278015e-05, 1.726113259792328e-05, 1.7762184143066406e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 8.0, 9.0, 13.0, 17.0, 20.0, 59.0, 90.0, 138.0, 240.0, 602.0, 1592.0, 4777.0, 21573.0, 178881.0, 719144.0, 101171.0, 14390.0, 3657.0, 1199.0, 471.0, 224.0, 115.0, 66.0, 40.0, 16.0, 12.0, 14.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.08754253387451172, -0.08475303649902344, -0.08196353912353516, -0.07917404174804688, -0.0763845443725586, -0.07359504699707031, -0.07080554962158203, -0.06801605224609375, -0.06522655487060547, -0.06243705749511719, -0.059647560119628906, -0.056858062744140625, -0.054068565368652344, -0.05127906799316406, -0.04848957061767578, -0.0457000732421875, -0.04291057586669922, -0.04012107849121094, -0.037331581115722656, -0.034542083740234375, -0.031752586364746094, -0.028963088989257812, -0.02617359161376953, -0.02338409423828125, -0.02059459686279297, -0.017805099487304688, -0.015015602111816406, -0.012226104736328125, -0.009436607360839844, -0.0066471099853515625, -0.0038576126098632812, -0.001068115234375, 0.0017213821411132812, 0.0045108795166015625, 0.007300376892089844, 0.010089874267578125, 0.012879371643066406, 0.015668869018554688, 0.01845836639404297, 0.02124786376953125, 0.02403736114501953, 0.026826858520507812, 0.029616355895996094, 0.032405853271484375, 0.035195350646972656, 0.03798484802246094, 0.04077434539794922, 0.0435638427734375, 0.04635334014892578, 0.04914283752441406, 0.051932334899902344, 0.054721832275390625, 0.057511329650878906, 0.06030082702636719, 0.06309032440185547, 0.06587982177734375, 0.06866931915283203, 0.07145881652832031, 0.0742483139038086, 0.07703781127929688, 0.07982730865478516, 0.08261680603027344, 0.08540630340576172, 0.08819580078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 14.0, 25.0, 24.0, 28.0, 31.0, 37.0, 56.0, 64.0, 73.0, 70.0, 80.0, 90.0, 87.0, 66.0, 52.0, 40.0, 39.0, 32.0, 24.0, 10.0, 10.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06884765625, -0.06633663177490234, -0.06382560729980469, -0.06131458282470703, -0.058803558349609375, -0.05629253387451172, -0.05378150939941406, -0.051270484924316406, -0.04875946044921875, -0.046248435974121094, -0.04373741149902344, -0.04122638702392578, -0.038715362548828125, -0.03620433807373047, -0.03369331359863281, -0.031182289123535156, -0.0286712646484375, -0.026160240173339844, -0.023649215698242188, -0.02113819122314453, -0.018627166748046875, -0.01611614227294922, -0.013605117797851562, -0.011094093322753906, -0.00858306884765625, -0.006072044372558594, -0.0035610198974609375, -0.0010499954223632812, 0.001461029052734375, 0.003972053527832031, 0.0064830780029296875, 0.008994102478027344, 0.011505126953125, 0.014016151428222656, 0.016527175903320312, 0.01903820037841797, 0.021549224853515625, 0.02406024932861328, 0.026571273803710938, 0.029082298278808594, 0.03159332275390625, 0.034104347229003906, 0.03661537170410156, 0.03912639617919922, 0.041637420654296875, 0.04414844512939453, 0.04665946960449219, 0.049170494079589844, 0.0516815185546875, 0.054192543029785156, 0.05670356750488281, 0.05921459197998047, 0.061725616455078125, 0.06423664093017578, 0.06674766540527344, 0.0692586898803711, 0.07176971435546875, 0.0742807388305664, 0.07679176330566406, 0.07930278778076172, 0.08181381225585938, 0.08432483673095703, 0.08683586120605469, 0.08934688568115234, 0.09185791015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 4.0, 15.0, 35.0, 177.0, 576.0, 146.0, 40.0, 11.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6978521943092346, -0.5693410038948059, -0.4408298134803772, -0.3123186230659485, -0.18380743265151978, -0.055296242237091064, 0.07321494817733765, 0.20172613859176636, 0.33023732900619507, 0.4587485194206238, 0.5872597098350525, 0.7157709002494812, 0.8442820906639099, 0.9727932810783386, 1.101304531097412, 1.2298157215118408, 1.3583269119262695, 1.4868381023406982, 1.615349292755127, 1.7438604831695557, 1.8723716735839844, 2.000882863998413, 2.129394054412842, 2.2579052448272705, 2.386416435241699, 2.514927625656128, 2.6434388160705566, 2.7719500064849854, 2.900461196899414, 3.0289723873138428, 3.1574835777282715, 3.2859947681427, 3.414505958557129, 3.5430171489715576, 3.6715283393859863, 3.800039529800415, 3.9285507202148438, 4.057062149047852, 4.185573101043701, 4.314084053039551, 4.442595481872559, 4.571106910705566, 4.699617862701416, 4.828128814697266, 4.956640243530273, 5.085151672363281, 5.213662624359131, 5.3421735763549805, 5.470685005187988, 5.599196434020996, 5.727707386016846, 5.856218338012695, 5.984729766845703, 6.113241195678711, 6.2417521476745605, 6.37026309967041, 6.498774528503418, 6.627285957336426, 6.755796909332275, 6.884307861328125, 7.012819290161133, 7.141330718994141, 7.26984167098999, 7.39835262298584, 7.526864051818848]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 2.0, 5.0, 3.0, 7.0, 9.0, 13.0, 20.0, 34.0, 51.0, 79.0, 108.0, 133.0, 140.0, 118.0, 83.0, 58.0, 39.0, 12.0, 16.0, 13.0, 6.0, 4.0, 7.0, 2.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.230095386505127, -4.105755805969238, -3.9814162254333496, -3.857076644897461, -3.7327370643615723, -3.6083974838256836, -3.484057903289795, -3.3597183227539062, -3.2353787422180176, -3.111039161682129, -2.9866995811462402, -2.8623600006103516, -2.738020420074463, -2.613680839538574, -2.4893412590026855, -2.365001678466797, -2.240662097930908, -2.1163225173950195, -1.9919829368591309, -1.8676433563232422, -1.7433037757873535, -1.6189641952514648, -1.4946246147155762, -1.3702850341796875, -1.245945692062378, -1.1216061115264893, -0.9972665309906006, -0.8729269504547119, -0.7485873699188232, -0.6242478489875793, -0.4999082684516907, -0.375568687915802, -0.25122904777526855, -0.12688946723937988, -0.002549901604652405, 0.12178966403007507, 0.24612924456596375, 0.37046879529953003, 0.4948083758354187, 0.6191479563713074, 0.743487536907196, 0.8678271174430847, 0.9921666979789734, 1.1165062189102173, 1.240845799446106, 1.3651853799819946, 1.4895249605178833, 1.613864541053772, 1.7382041215896606, 1.8625437021255493, 1.986883282661438, 2.111222743988037, 2.235562324523926, 2.3599019050598145, 2.484241485595703, 2.608581066131592, 2.7329206466674805, 2.857260227203369, 2.981599807739258, 3.1059393882751465, 3.230278968811035, 3.354618549346924, 3.4789581298828125, 3.603297710418701, 3.72763729095459]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 7.0, 10.0, 14.0, 20.0, 24.0, 43.0, 60.0, 74.0, 98.0, 136.0, 218.0, 298.0, 432.0, 654.0, 968.0, 1613.0, 2574.0, 4730.0, 10664.0, 32215.0, 807588.0, 3277268.0, 32567.0, 10307.0, 4837.0, 2609.0, 1473.0, 936.0, 576.0, 404.0, 269.0, 174.0, 114.0, 81.0, 60.0, 42.0, 38.0, 28.0, 7.0, 12.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431640625, -0.41815948486328125, -0.4046783447265625, -0.39119720458984375, -0.377716064453125, -0.36423492431640625, -0.3507537841796875, -0.33727264404296875, -0.32379150390625, -0.31031036376953125, -0.2968292236328125, -0.28334808349609375, -0.269866943359375, -0.25638580322265625, -0.2429046630859375, -0.22942352294921875, -0.2159423828125, -0.20246124267578125, -0.1889801025390625, -0.17549896240234375, -0.162017822265625, -0.14853668212890625, -0.1350555419921875, -0.12157440185546875, -0.10809326171875, -0.09461212158203125, -0.0811309814453125, -0.06764984130859375, -0.054168701171875, -0.04068756103515625, -0.0272064208984375, -0.01372528076171875, -0.000244140625, 0.01323699951171875, 0.0267181396484375, 0.04019927978515625, 0.053680419921875, 0.06716156005859375, 0.0806427001953125, 0.09412384033203125, 0.10760498046875, 0.12108612060546875, 0.1345672607421875, 0.14804840087890625, 0.161529541015625, 0.17501068115234375, 0.1884918212890625, 0.20197296142578125, 0.2154541015625, 0.22893524169921875, 0.2424163818359375, 0.25589752197265625, 0.269378662109375, 0.28285980224609375, 0.2963409423828125, 0.30982208251953125, 0.32330322265625, 0.33678436279296875, 0.3502655029296875, 0.36374664306640625, 0.377227783203125, 0.39070892333984375, 0.4041900634765625, 0.41767120361328125, 0.43115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 3.0, 8.0, 6.0, 8.0, 16.0, 20.0, 19.0, 39.0, 123.0, 374.0, 197.0, 60.0, 19.0, 13.0, 16.0, 9.0, 8.0, 12.0, 6.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06637763977050781, -0.06427383422851562, -0.06217002868652344, -0.06006622314453125, -0.05796241760253906, -0.055858612060546875, -0.05375480651855469, -0.0516510009765625, -0.04954719543457031, -0.047443389892578125, -0.04533958435058594, -0.04323577880859375, -0.04113197326660156, -0.039028167724609375, -0.03692436218261719, -0.034820556640625, -0.03271675109863281, -0.030612945556640625, -0.028509140014648438, -0.02640533447265625, -0.024301528930664062, -0.022197723388671875, -0.020093917846679688, -0.0179901123046875, -0.015886306762695312, -0.013782501220703125, -0.011678695678710938, -0.00957489013671875, -0.0074710845947265625, -0.005367279052734375, -0.0032634735107421875, -0.00115966796875, 0.0009441375732421875, 0.003047943115234375, 0.0051517486572265625, 0.00725555419921875, 0.009359359741210938, 0.011463165283203125, 0.013566970825195312, 0.0156707763671875, 0.017774581909179688, 0.019878387451171875, 0.021982192993164062, 0.02408599853515625, 0.026189804077148438, 0.028293609619140625, 0.030397415161132812, 0.032501220703125, 0.03460502624511719, 0.036708831787109375, 0.03881263732910156, 0.04091644287109375, 0.04302024841308594, 0.045124053955078125, 0.04722785949707031, 0.0493316650390625, 0.05143547058105469, 0.053539276123046875, 0.05564308166503906, 0.05774688720703125, 0.05985069274902344, 0.061954498291015625, 0.06405830383300781, 0.066162109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 8.0, 21.0, 21.0, 42.0, 82.0, 141.0, 343.0, 895.0, 3087.0, 15300.0, 168753.0, 3893035.0, 96939.0, 11388.0, 2675.0, 832.0, 351.0, 153.0, 74.0, 32.0, 25.0, 22.0, 12.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.380859375, -0.36525726318359375, -0.3496551513671875, -0.33405303955078125, -0.318450927734375, -0.30284881591796875, -0.2872467041015625, -0.27164459228515625, -0.25604248046875, -0.24044036865234375, -0.2248382568359375, -0.20923614501953125, -0.193634033203125, -0.17803192138671875, -0.1624298095703125, -0.14682769775390625, -0.1312255859375, -0.11562347412109375, -0.1000213623046875, -0.08441925048828125, -0.068817138671875, -0.05321502685546875, -0.0376129150390625, -0.02201080322265625, -0.00640869140625, 0.00919342041015625, 0.0247955322265625, 0.04039764404296875, 0.055999755859375, 0.07160186767578125, 0.0872039794921875, 0.10280609130859375, 0.118408203125, 0.13401031494140625, 0.1496124267578125, 0.16521453857421875, 0.180816650390625, 0.19641876220703125, 0.2120208740234375, 0.22762298583984375, 0.24322509765625, 0.25882720947265625, 0.2744293212890625, 0.29003143310546875, 0.305633544921875, 0.32123565673828125, 0.3368377685546875, 0.35243988037109375, 0.3680419921875, 0.38364410400390625, 0.3992462158203125, 0.41484832763671875, 0.430450439453125, 0.44605255126953125, 0.4616546630859375, 0.47725677490234375, 0.49285888671875, 0.5084609985351562, 0.5240631103515625, 0.5396652221679688, 0.555267333984375, 0.5708694458007812, 0.5864715576171875, 0.6020736694335938, 0.61767578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 3.0, 4.0, 4.0, 7.0, 7.0, 10.0, 17.0, 11.0, 23.0, 30.0, 43.0, 69.0, 93.0, 196.0, 368.0, 2101.0, 524.0, 192.0, 102.0, 72.0, 50.0, 30.0, 27.0, 18.0, 17.0, 13.0, 7.0, 8.0, 4.0, 3.0, 5.0, 4.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050872802734375, -0.04871988296508789, -0.04656696319580078, -0.04441404342651367, -0.04226112365722656, -0.04010820388793945, -0.037955284118652344, -0.035802364349365234, -0.033649444580078125, -0.031496524810791016, -0.029343605041503906, -0.027190685272216797, -0.025037765502929688, -0.022884845733642578, -0.02073192596435547, -0.01857900619506836, -0.01642608642578125, -0.01427316665649414, -0.012120246887207031, -0.009967327117919922, -0.007814407348632812, -0.005661487579345703, -0.0035085678100585938, -0.0013556480407714844, 0.000797271728515625, 0.0029501914978027344, 0.005103111267089844, 0.007256031036376953, 0.009408950805664062, 0.011561870574951172, 0.013714790344238281, 0.01586771011352539, 0.0180206298828125, 0.02017354965209961, 0.02232646942138672, 0.024479389190673828, 0.026632308959960938, 0.028785228729248047, 0.030938148498535156, 0.033091068267822266, 0.035243988037109375, 0.037396907806396484, 0.039549827575683594, 0.0417027473449707, 0.04385566711425781, 0.04600858688354492, 0.04816150665283203, 0.05031442642211914, 0.05246734619140625, 0.05462026596069336, 0.05677318572998047, 0.05892610549926758, 0.06107902526855469, 0.0632319450378418, 0.0653848648071289, 0.06753778457641602, 0.06969070434570312, 0.07184362411499023, 0.07399654388427734, 0.07614946365356445, 0.07830238342285156, 0.08045530319213867, 0.08260822296142578, 0.08476114273071289, 0.0869140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 30.0, 603.0, 342.0, 17.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39007556438446045, -0.3403872549533844, -0.29069894552230835, -0.2410106658935547, -0.19132235646247864, -0.1416340470314026, -0.09194576740264893, -0.042257457971572876, 0.007430851459503174, 0.05711915343999863, 0.10680745542049408, 0.15649574995040894, 0.20618405938148499, 0.25587236881256104, 0.3055606484413147, 0.35524895787239075, 0.4049372673034668, 0.45462557673454285, 0.5043138861656189, 0.5540021657943726, 0.603690505027771, 0.6533787846565247, 0.7030670642852783, 0.7527554035186768, 0.8024436831474304, 0.8521319627761841, 0.9018203020095825, 0.9515085816383362, 1.0011968612670898, 1.0508852005004883, 1.1005735397338867, 1.1502617597579956, 1.1999499797821045, 1.249638319015503, 1.2993265390396118, 1.3490148782730103, 1.3987032175064087, 1.4483914375305176, 1.498079776763916, 1.5477681159973145, 1.597456455230713, 1.6471447944641113, 1.6968330144882202, 1.7465213537216187, 1.796209692955017, 1.845897912979126, 1.8955862522125244, 1.9452745914459229, 1.9949628114700317, 2.0446510314941406, 2.094339370727539, 2.1440277099609375, 2.193716049194336, 2.2434043884277344, 2.293092727661133, 2.342780828475952, 2.3924691677093506, 2.442157506942749, 2.4918458461761475, 2.541533946990967, 2.5912222862243652, 2.6409106254577637, 2.690598964691162, 2.7402873039245605, 2.789975643157959]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 10.0, 7.0, 13.0, 14.0, 30.0, 34.0, 28.0, 34.0, 50.0, 57.0, 66.0, 74.0, 75.0, 74.0, 61.0, 78.0, 56.0, 40.0, 48.0, 36.0, 21.0, 23.0, 19.0, 12.0, 9.0, 7.0, 3.0, 6.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37470340728759766, -0.3640134930610657, -0.3533235788345337, -0.3426336646080017, -0.3319437801837921, -0.32125386595726013, -0.31056395173072815, -0.29987403750419617, -0.2891841530799866, -0.2784942388534546, -0.2678043246269226, -0.2571144104003906, -0.24642452597618103, -0.23573461174964905, -0.22504469752311707, -0.21435478329658508, -0.2036648690700531, -0.19297495484352112, -0.18228505551815033, -0.17159514129161835, -0.16090524196624756, -0.15021532773971558, -0.1395254135131836, -0.1288354992866516, -0.11814559996128082, -0.10745569318532944, -0.09676578640937805, -0.08607587218284607, -0.07538596540689468, -0.0646960586309433, -0.054006144404411316, -0.04331623762845993, -0.032626330852508545, -0.02193642221391201, -0.011246513575315475, -0.0005566030740737915, 0.010133303701877594, 0.02082321047782898, 0.03151312470436096, 0.04220303148031235, 0.05289293825626373, 0.06358284503221512, 0.0742727518081665, 0.08496266603469849, 0.09565257281064987, 0.10634247958660126, 0.11703239381313324, 0.12772229313850403, 0.138412207365036, 0.149102121591568, 0.15979202091693878, 0.17048193514347076, 0.18117183446884155, 0.19186174869537354, 0.20255166292190552, 0.2132415771484375, 0.2239314764738083, 0.23462139070034027, 0.24531129002571106, 0.25600120425224304, 0.266691118478775, 0.2773810029029846, 0.2880709171295166, 0.2987608313560486, 0.30945074558258057]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 16.0, 24.0, 25.0, 47.0, 65.0, 85.0, 149.0, 251.0, 384.0, 681.0, 1264.0, 2439.0, 5247.0, 13232.0, 45199.0, 799595.0, 140698.0, 23171.0, 8301.0, 3567.0, 1829.0, 913.0, 494.0, 285.0, 207.0, 117.0, 76.0, 56.0, 38.0, 16.0, 23.0, 11.0, 8.0, 6.0, 5.0, 1.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.3802146911621094, -0.36785125732421875, -0.3554878234863281, -0.3431243896484375, -0.3307609558105469, -0.31839752197265625, -0.3060340881347656, -0.293670654296875, -0.2813072204589844, -0.26894378662109375, -0.2565803527832031, -0.2442169189453125, -0.23185348510742188, -0.21949005126953125, -0.20712661743164062, -0.19476318359375, -0.18239974975585938, -0.17003631591796875, -0.15767288208007812, -0.1453094482421875, -0.13294601440429688, -0.12058258056640625, -0.10821914672851562, -0.095855712890625, -0.08349227905273438, -0.07112884521484375, -0.058765411376953125, -0.0464019775390625, -0.034038543701171875, -0.02167510986328125, -0.009311676025390625, 0.0030517578125, 0.015415191650390625, 0.02777862548828125, 0.040142059326171875, 0.0525054931640625, 0.06486892700195312, 0.07723236083984375, 0.08959579467773438, 0.101959228515625, 0.11432266235351562, 0.12668609619140625, 0.13904953002929688, 0.1514129638671875, 0.16377639770507812, 0.17613983154296875, 0.18850326538085938, 0.20086669921875, 0.21323013305664062, 0.22559356689453125, 0.23795700073242188, 0.2503204345703125, 0.2626838684082031, 0.27504730224609375, 0.2874107360839844, 0.299774169921875, 0.3121376037597656, 0.32450103759765625, 0.3368644714355469, 0.3492279052734375, 0.3615913391113281, 0.37395477294921875, 0.3863182067871094, 0.398681640625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 3.0, 9.0, 10.0, 12.0, 12.0, 23.0, 41.0, 110.0, 268.0, 245.0, 98.0, 51.0, 19.0, 15.0, 11.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06549072265625, -0.06343650817871094, -0.061382293701171875, -0.05932807922363281, -0.05727386474609375, -0.05521965026855469, -0.053165435791015625, -0.05111122131347656, -0.0490570068359375, -0.04700279235839844, -0.044948577880859375, -0.04289436340332031, -0.04084014892578125, -0.03878593444824219, -0.036731719970703125, -0.03467750549316406, -0.032623291015625, -0.030569076538085938, -0.028514862060546875, -0.026460647583007812, -0.02440643310546875, -0.022352218627929688, -0.020298004150390625, -0.018243789672851562, -0.0161895751953125, -0.014135360717773438, -0.012081146240234375, -0.010026931762695312, -0.00797271728515625, -0.0059185028076171875, -0.003864288330078125, -0.0018100738525390625, 0.000244140625, 0.0022983551025390625, 0.004352569580078125, 0.0064067840576171875, 0.00846099853515625, 0.010515213012695312, 0.012569427490234375, 0.014623641967773438, 0.0166778564453125, 0.018732070922851562, 0.020786285400390625, 0.022840499877929688, 0.02489471435546875, 0.026948928833007812, 0.029003143310546875, 0.031057357788085938, 0.033111572265625, 0.03516578674316406, 0.037220001220703125, 0.03927421569824219, 0.04132843017578125, 0.04338264465332031, 0.045436859130859375, 0.04749107360839844, 0.0495452880859375, 0.05159950256347656, 0.053653717041015625, 0.05570793151855469, 0.05776214599609375, 0.05981636047363281, 0.061870574951171875, 0.06392478942871094, 0.06597900390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 13.0, 17.0, 14.0, 32.0, 31.0, 49.0, 73.0, 141.0, 217.0, 500.0, 1278.0, 3590.0, 12762.0, 65192.0, 573668.0, 336304.0, 41212.0, 8938.0, 2550.0, 954.0, 436.0, 223.0, 87.0, 54.0, 57.0, 34.0, 25.0, 15.0, 20.0, 12.0, 6.0, 6.0, 8.0, 7.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2415771484375, -0.23399734497070312, -0.22641754150390625, -0.21883773803710938, -0.2112579345703125, -0.20367813110351562, -0.19609832763671875, -0.18851852416992188, -0.180938720703125, -0.17335891723632812, -0.16577911376953125, -0.15819931030273438, -0.1506195068359375, -0.14303970336914062, -0.13545989990234375, -0.12788009643554688, -0.12030029296875, -0.11272048950195312, -0.10514068603515625, -0.09756088256835938, -0.0899810791015625, -0.08240127563476562, -0.07482147216796875, -0.06724166870117188, -0.059661865234375, -0.052082061767578125, -0.04450225830078125, -0.036922454833984375, -0.0293426513671875, -0.021762847900390625, -0.01418304443359375, -0.006603240966796875, 0.0009765625, 0.008556365966796875, 0.01613616943359375, 0.023715972900390625, 0.0312957763671875, 0.038875579833984375, 0.04645538330078125, 0.054035186767578125, 0.061614990234375, 0.06919479370117188, 0.07677459716796875, 0.08435440063476562, 0.0919342041015625, 0.09951400756835938, 0.10709381103515625, 0.11467361450195312, 0.12225341796875, 0.12983322143554688, 0.13741302490234375, 0.14499282836914062, 0.1525726318359375, 0.16015243530273438, 0.16773223876953125, 0.17531204223632812, 0.182891845703125, 0.19047164916992188, 0.19805145263671875, 0.20563125610351562, 0.2132110595703125, 0.22079086303710938, 0.22837066650390625, 0.23595046997070312, 0.2435302734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 13.0, 13.0, 13.0, 14.0, 22.0, 21.0, 19.0, 30.0, 31.0, 35.0, 31.0, 37.0, 50.0, 54.0, 60.0, 50.0, 51.0, 50.0, 56.0, 38.0, 41.0, 29.0, 41.0, 22.0, 16.0, 28.0, 25.0, 21.0, 9.0, 18.0, 12.0, 9.0, 7.0, 7.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.14720726013183594, -0.14207077026367188, -0.1369342803955078, -0.13179779052734375, -0.1266613006591797, -0.12152481079101562, -0.11638832092285156, -0.1112518310546875, -0.10611534118652344, -0.10097885131835938, -0.09584236145019531, -0.09070587158203125, -0.08556938171386719, -0.08043289184570312, -0.07529640197753906, -0.070159912109375, -0.06502342224121094, -0.059886932373046875, -0.05475044250488281, -0.04961395263671875, -0.04447746276855469, -0.039340972900390625, -0.03420448303222656, -0.0290679931640625, -0.023931503295898438, -0.018795013427734375, -0.013658523559570312, -0.00852203369140625, -0.0033855438232421875, 0.001750946044921875, 0.0068874359130859375, 0.01202392578125, 0.017160415649414062, 0.022296905517578125, 0.027433395385742188, 0.03256988525390625, 0.03770637512207031, 0.042842864990234375, 0.04797935485839844, 0.0531158447265625, 0.05825233459472656, 0.06338882446289062, 0.06852531433105469, 0.07366180419921875, 0.07879829406738281, 0.08393478393554688, 0.08907127380371094, 0.094207763671875, 0.09934425354003906, 0.10448074340820312, 0.10961723327636719, 0.11475372314453125, 0.11989021301269531, 0.12502670288085938, 0.13016319274902344, 0.1352996826171875, 0.14043617248535156, 0.14557266235351562, 0.1507091522216797, 0.15584564208984375, 0.1609821319580078, 0.16611862182617188, 0.17125511169433594, 0.1763916015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 12.0, 14.0, 9.0, 27.0, 64.0, 90.0, 133.0, 276.0, 630.0, 1937.0, 10080.0, 291906.0, 721612.0, 17500.0, 2706.0, 840.0, 325.0, 172.0, 89.0, 47.0, 28.0, 18.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.52294921875, -0.5113582611083984, -0.4997673034667969, -0.4881763458251953, -0.47658538818359375, -0.4649944305419922, -0.4534034729003906, -0.44181251525878906, -0.4302215576171875, -0.41863059997558594, -0.4070396423339844, -0.3954486846923828, -0.38385772705078125, -0.3722667694091797, -0.3606758117675781, -0.34908485412597656, -0.337493896484375, -0.32590293884277344, -0.3143119812011719, -0.3027210235595703, -0.29113006591796875, -0.2795391082763672, -0.2679481506347656, -0.25635719299316406, -0.2447662353515625, -0.23317527770996094, -0.22158432006835938, -0.2099933624267578, -0.19840240478515625, -0.1868114471435547, -0.17522048950195312, -0.16362953186035156, -0.15203857421875, -0.14044761657714844, -0.12885665893554688, -0.11726570129394531, -0.10567474365234375, -0.09408378601074219, -0.08249282836914062, -0.07090187072753906, -0.0593109130859375, -0.04771995544433594, -0.036128997802734375, -0.024538040161132812, -0.01294708251953125, -0.0013561248779296875, 0.010234832763671875, 0.021825790405273438, 0.033416748046875, 0.04500770568847656, 0.056598663330078125, 0.06818962097167969, 0.07978057861328125, 0.09137153625488281, 0.10296249389648438, 0.11455345153808594, 0.1261444091796875, 0.13773536682128906, 0.14932632446289062, 0.1609172821044922, 0.17250823974609375, 0.1840991973876953, 0.19569015502929688, 0.20728111267089844, 0.2188720703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 11.0, 9.0, 5.0, 11.0, 20.0, 27.0, 47.0, 46.0, 53.0, 77.0, 96.0, 84.0, 100.0, 95.0, 66.0, 64.0, 42.0, 42.0, 30.0, 11.0, 14.0, 6.0, 15.0, 6.0, 3.0, 1.0, 5.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.546476364135742e-05, -3.448314964771271e-05, -3.350153565406799e-05, -3.251992166042328e-05, -3.1538307666778564e-05, -3.055669367313385e-05, -2.9575079679489136e-05, -2.859346568584442e-05, -2.7611851692199707e-05, -2.6630237698554993e-05, -2.564862370491028e-05, -2.4667009711265564e-05, -2.368539571762085e-05, -2.2703781723976135e-05, -2.172216773033142e-05, -2.0740553736686707e-05, -1.9758939743041992e-05, -1.8777325749397278e-05, -1.7795711755752563e-05, -1.681409776210785e-05, -1.5832483768463135e-05, -1.485086977481842e-05, -1.3869255781173706e-05, -1.2887641787528992e-05, -1.1906027793884277e-05, -1.0924413800239563e-05, -9.942799806594849e-06, -8.961185812950134e-06, -7.97957181930542e-06, -6.9979578256607056e-06, -6.016343832015991e-06, -5.034729838371277e-06, -4.0531158447265625e-06, -3.071501851081848e-06, -2.089887857437134e-06, -1.1082738637924194e-06, -1.2665987014770508e-07, 8.549541234970093e-07, 1.8365681171417236e-06, 2.818182110786438e-06, 3.7997961044311523e-06, 4.781410098075867e-06, 5.763024091720581e-06, 6.744638085365295e-06, 7.72625207901001e-06, 8.707866072654724e-06, 9.689480066299438e-06, 1.0671094059944153e-05, 1.1652708053588867e-05, 1.2634322047233582e-05, 1.3615936040878296e-05, 1.459755003452301e-05, 1.5579164028167725e-05, 1.656077802181244e-05, 1.7542392015457153e-05, 1.8524006009101868e-05, 1.9505620002746582e-05, 2.0487233996391296e-05, 2.146884799003601e-05, 2.2450461983680725e-05, 2.343207597732544e-05, 2.4413689970970154e-05, 2.5395303964614868e-05, 2.6376917958259583e-05, 2.7358531951904297e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 14.0, 13.0, 16.0, 32.0, 50.0, 97.0, 211.0, 401.0, 990.0, 3615.0, 21476.0, 489862.0, 504561.0, 21887.0, 3615.0, 985.0, 329.0, 167.0, 77.0, 58.0, 41.0, 15.0, 7.0, 5.0, 6.0, 3.0, 6.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3465614318847656, -0.33789825439453125, -0.3292350769042969, -0.3205718994140625, -0.3119087219238281, -0.30324554443359375, -0.2945823669433594, -0.285919189453125, -0.2772560119628906, -0.26859283447265625, -0.2599296569824219, -0.2512664794921875, -0.24260330200195312, -0.23394012451171875, -0.22527694702148438, -0.21661376953125, -0.20795059204101562, -0.19928741455078125, -0.19062423706054688, -0.1819610595703125, -0.17329788208007812, -0.16463470458984375, -0.15597152709960938, -0.147308349609375, -0.13864517211914062, -0.12998199462890625, -0.12131881713867188, -0.1126556396484375, -0.10399246215820312, -0.09532928466796875, -0.08666610717773438, -0.0780029296875, -0.06933975219726562, -0.06067657470703125, -0.052013397216796875, -0.0433502197265625, -0.034687042236328125, -0.02602386474609375, -0.017360687255859375, -0.008697509765625, -3.4332275390625e-05, 0.00862884521484375, 0.017292022705078125, 0.0259552001953125, 0.034618377685546875, 0.04328155517578125, 0.051944732666015625, 0.06060791015625, 0.06927108764648438, 0.07793426513671875, 0.08659744262695312, 0.0952606201171875, 0.10392379760742188, 0.11258697509765625, 0.12125015258789062, 0.129913330078125, 0.13857650756835938, 0.14723968505859375, 0.15590286254882812, 0.1645660400390625, 0.17322921752929688, 0.18189239501953125, 0.19055557250976562, 0.19921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 6.0, 3.0, 14.0, 18.0, 40.0, 36.0, 44.0, 89.0, 136.0, 168.0, 161.0, 102.0, 62.0, 35.0, 15.0, 22.0, 14.0, 12.0, 10.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2457275390625, -0.2398223876953125, -0.233917236328125, -0.2280120849609375, -0.22210693359375, -0.2162017822265625, -0.210296630859375, -0.2043914794921875, -0.198486328125, -0.1925811767578125, -0.186676025390625, -0.1807708740234375, -0.17486572265625, -0.1689605712890625, -0.163055419921875, -0.1571502685546875, -0.1512451171875, -0.1453399658203125, -0.139434814453125, -0.1335296630859375, -0.12762451171875, -0.1217193603515625, -0.115814208984375, -0.1099090576171875, -0.10400390625, -0.0980987548828125, -0.092193603515625, -0.0862884521484375, -0.08038330078125, -0.0744781494140625, -0.068572998046875, -0.0626678466796875, -0.0567626953125, -0.0508575439453125, -0.044952392578125, -0.0390472412109375, -0.03314208984375, -0.0272369384765625, -0.021331787109375, -0.0154266357421875, -0.009521484375, -0.0036163330078125, 0.002288818359375, 0.0081939697265625, 0.01409912109375, 0.0200042724609375, 0.025909423828125, 0.0318145751953125, 0.0377197265625, 0.0436248779296875, 0.049530029296875, 0.0554351806640625, 0.06134033203125, 0.0672454833984375, 0.073150634765625, 0.0790557861328125, 0.0849609375, 0.0908660888671875, 0.096771240234375, 0.1026763916015625, 0.10858154296875, 0.1144866943359375, 0.120391845703125, 0.1262969970703125, 0.1322021484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 12.0, 91.0, 746.0, 134.0, 17.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4037139415740967, -2.2271244525909424, -2.050535202026367, -1.873945713043213, -1.6973564624786377, -1.5207669734954834, -1.3441776037216187, -1.167588233947754, -0.9909988641738892, -0.8144094944000244, -0.6378201246261597, -0.46123069524765015, -0.2846413254737854, -0.10805195569992065, 0.06853747367858887, 0.2451268434524536, 0.42171621322631836, 0.5983055830001831, 0.7748949527740479, 0.9514843821525574, 1.1280736923217773, 1.3046631813049316, 1.4812525510787964, 1.6578419208526611, 1.8344312906265259, 2.0110206604003906, 2.187610149383545, 2.36419939994812, 2.5407888889312744, 2.7173781394958496, 2.893967628479004, 3.070557117462158, 3.2471461296081543, 3.4237356185913086, 3.600324869155884, 3.776914358139038, 3.9535036087036133, 4.130093097686768, 4.306682586669922, 4.483271598815918, 4.659861087799072, 4.836450576782227, 5.013040065765381, 5.189629077911377, 5.366218566894531, 5.5428080558776855, 5.71939754486084, 5.895986557006836, 6.072576522827148, 6.249166011810303, 6.425755500793457, 6.602344512939453, 6.778934001922607, 6.955523490905762, 7.132112979888916, 7.30870246887207, 7.485291481018066, 7.661880970001221, 7.838470458984375, 8.015059471130371, 8.191649436950684, 8.36823844909668, 8.544827461242676, 8.721417427062988, 8.898006439208984]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 8.0, 11.0, 16.0, 19.0, 21.0, 25.0, 34.0, 74.0, 62.0, 83.0, 97.0, 102.0, 69.0, 86.0, 73.0, 57.0, 34.0, 31.0, 26.0, 18.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.964937448501587, -1.9055211544036865, -1.8461049795150757, -1.7866886854171753, -1.7272725105285645, -1.667856216430664, -1.6084399223327637, -1.5490236282348633, -1.4896074533462524, -1.430191159248352, -1.3707749843597412, -1.3113586902618408, -1.2519423961639404, -1.1925262212753296, -1.1331099271774292, -1.0736937522888184, -1.014277458190918, -0.9548612236976624, -0.8954449892044067, -0.8360286951065063, -0.7766124606132507, -0.7171962261199951, -0.6577799320220947, -0.5983636975288391, -0.5389474630355835, -0.4795312285423279, -0.4201149642467499, -0.3606986999511719, -0.30128246545791626, -0.24186623096466064, -0.18244996666908264, -0.12303370237350464, -0.06361734867095947, -0.004201099276542664, 0.055215150117874146, 0.11463139951229095, 0.17404764890670776, 0.23346388339996338, 0.2928801476955414, 0.3522964119911194, 0.411712646484375, 0.4711288809776306, 0.5305451154708862, 0.5899614095687866, 0.6493776440620422, 0.7087938785552979, 0.7682101726531982, 0.8276264071464539, 0.8870426416397095, 0.9464588761329651, 1.0058751106262207, 1.065291404724121, 1.1247076988220215, 1.1841238737106323, 1.2435401678085327, 1.3029563426971436, 1.362372636795044, 1.4217889308929443, 1.4812051057815552, 1.5406213998794556, 1.6000375747680664, 1.6594538688659668, 1.7188701629638672, 1.7782864570617676, 1.8377026319503784]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 6.0, 6.0, 2.0, 3.0, 3.0, 13.0, 10.0, 15.0, 14.0, 22.0, 24.0, 29.0, 41.0, 69.0, 72.0, 89.0, 139.0, 188.0, 222.0, 370.0, 515.0, 814.0, 1201.0, 1973.0, 3632.0, 8720.0, 36898.0, 3933959.0, 175413.0, 17911.0, 5356.0, 2506.0, 1422.0, 880.0, 569.0, 404.0, 261.0, 174.0, 112.0, 69.0, 42.0, 32.0, 24.0, 14.0, 8.0, 9.0, 7.0, 5.0, 7.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6591796875, -0.6384353637695312, -0.6176910400390625, -0.5969467163085938, -0.576202392578125, -0.5554580688476562, -0.5347137451171875, -0.5139694213867188, -0.49322509765625, -0.47248077392578125, -0.4517364501953125, -0.43099212646484375, -0.410247802734375, -0.38950347900390625, -0.3687591552734375, -0.34801483154296875, -0.3272705078125, -0.30652618408203125, -0.2857818603515625, -0.26503753662109375, -0.244293212890625, -0.22354888916015625, -0.2028045654296875, -0.18206024169921875, -0.16131591796875, -0.14057159423828125, -0.1198272705078125, -0.09908294677734375, -0.078338623046875, -0.05759429931640625, -0.0368499755859375, -0.01610565185546875, 0.004638671875, 0.02538299560546875, 0.0461273193359375, 0.06687164306640625, 0.087615966796875, 0.10836029052734375, 0.1291046142578125, 0.14984893798828125, 0.17059326171875, 0.19133758544921875, 0.2120819091796875, 0.23282623291015625, 0.253570556640625, 0.27431488037109375, 0.2950592041015625, 0.31580352783203125, 0.3365478515625, 0.35729217529296875, 0.3780364990234375, 0.39878082275390625, 0.419525146484375, 0.44026947021484375, 0.4610137939453125, 0.48175811767578125, 0.50250244140625, 0.5232467651367188, 0.5439910888671875, 0.5647354125976562, 0.585479736328125, 0.6062240600585938, 0.6269683837890625, 0.6477127075195312, 0.66845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 10.0, 6.0, 12.0, 7.0, 15.0, 26.0, 65.0, 121.0, 238.0, 220.0, 122.0, 57.0, 22.0, 8.0, 12.0, 10.0, 10.0, 8.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.0672750473022461, -0.06509208679199219, -0.06290912628173828, -0.060726165771484375, -0.05854320526123047, -0.05636024475097656, -0.054177284240722656, -0.05199432373046875, -0.049811363220214844, -0.04762840270996094, -0.04544544219970703, -0.043262481689453125, -0.04107952117919922, -0.03889656066894531, -0.036713600158691406, -0.0345306396484375, -0.032347679138183594, -0.030164718627929688, -0.02798175811767578, -0.025798797607421875, -0.02361583709716797, -0.021432876586914062, -0.019249916076660156, -0.01706695556640625, -0.014883995056152344, -0.012701034545898438, -0.010518074035644531, -0.008335113525390625, -0.006152153015136719, -0.0039691925048828125, -0.0017862319946289062, 0.000396728515625, 0.0025796890258789062, 0.0047626495361328125, 0.006945610046386719, 0.009128570556640625, 0.011311531066894531, 0.013494491577148438, 0.015677452087402344, 0.01786041259765625, 0.020043373107910156, 0.022226333618164062, 0.02440929412841797, 0.026592254638671875, 0.02877521514892578, 0.030958175659179688, 0.033141136169433594, 0.0353240966796875, 0.037507057189941406, 0.03969001770019531, 0.04187297821044922, 0.044055938720703125, 0.04623889923095703, 0.04842185974121094, 0.050604820251464844, 0.05278778076171875, 0.054970741271972656, 0.05715370178222656, 0.05933666229248047, 0.061519622802734375, 0.06370258331298828, 0.06588554382324219, 0.0680685043334961, 0.07025146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 5.0, 8.0, 8.0, 7.0, 7.0, 12.0, 15.0, 27.0, 47.0, 66.0, 139.0, 328.0, 1158.0, 4772.0, 29905.0, 3692246.0, 443837.0, 17197.0, 3117.0, 854.0, 256.0, 92.0, 47.0, 38.0, 15.0, 13.0, 15.0, 11.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6919403076171875, -0.669525146484375, -0.6471099853515625, -0.62469482421875, -0.6022796630859375, -0.579864501953125, -0.5574493408203125, -0.5350341796875, -0.5126190185546875, -0.490203857421875, -0.4677886962890625, -0.44537353515625, -0.4229583740234375, -0.400543212890625, -0.3781280517578125, -0.355712890625, -0.3332977294921875, -0.310882568359375, -0.2884674072265625, -0.26605224609375, -0.2436370849609375, -0.221221923828125, -0.1988067626953125, -0.1763916015625, -0.1539764404296875, -0.131561279296875, -0.1091461181640625, -0.08673095703125, -0.0643157958984375, -0.041900634765625, -0.0194854736328125, 0.0029296875, 0.0253448486328125, 0.047760009765625, 0.0701751708984375, 0.09259033203125, 0.1150054931640625, 0.137420654296875, 0.1598358154296875, 0.1822509765625, 0.2046661376953125, 0.227081298828125, 0.2494964599609375, 0.27191162109375, 0.2943267822265625, 0.316741943359375, 0.3391571044921875, 0.361572265625, 0.3839874267578125, 0.406402587890625, 0.4288177490234375, 0.45123291015625, 0.4736480712890625, 0.496063232421875, 0.5184783935546875, 0.5408935546875, 0.5633087158203125, 0.585723876953125, 0.6081390380859375, 0.63055419921875, 0.6529693603515625, 0.675384521484375, 0.6977996826171875, 0.72021484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 11.0, 8.0, 8.0, 16.0, 37.0, 68.0, 114.0, 218.0, 710.0, 2140.0, 334.0, 159.0, 84.0, 40.0, 27.0, 21.0, 17.0, 5.0, 9.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07810592651367188, -0.07534027099609375, -0.07257461547851562, -0.0698089599609375, -0.06704330444335938, -0.06427764892578125, -0.061511993408203125, -0.058746337890625, -0.055980682373046875, -0.05321502685546875, -0.050449371337890625, -0.0476837158203125, -0.044918060302734375, -0.04215240478515625, -0.039386749267578125, -0.03662109375, -0.033855438232421875, -0.03108978271484375, -0.028324127197265625, -0.0255584716796875, -0.022792816162109375, -0.02002716064453125, -0.017261505126953125, -0.014495849609375, -0.011730194091796875, -0.00896453857421875, -0.006198883056640625, -0.0034332275390625, -0.000667572021484375, 0.00209808349609375, 0.004863739013671875, 0.00762939453125, 0.010395050048828125, 0.01316070556640625, 0.015926361083984375, 0.0186920166015625, 0.021457672119140625, 0.02422332763671875, 0.026988983154296875, 0.029754638671875, 0.032520294189453125, 0.03528594970703125, 0.038051605224609375, 0.0408172607421875, 0.043582916259765625, 0.04634857177734375, 0.049114227294921875, 0.0518798828125, 0.054645538330078125, 0.05741119384765625, 0.060176849365234375, 0.0629425048828125, 0.06570816040039062, 0.06847381591796875, 0.07123947143554688, 0.074005126953125, 0.07677078247070312, 0.07953643798828125, 0.08230209350585938, 0.0850677490234375, 0.08783340454101562, 0.09059906005859375, 0.09336471557617188, 0.09613037109375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 8.0, 14.0, 39.0, 84.0, 236.0, 267.0, 204.0, 89.0, 35.0, 13.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25120946764945984, -0.23506291210651398, -0.21891635656356812, -0.20276981592178345, -0.1866232454776764, -0.17047670483589172, -0.15433014929294586, -0.13818359375, -0.12203703820705414, -0.10589048266410828, -0.08974392712116241, -0.07359737902879715, -0.05745082348585129, -0.041304267942905426, -0.02515771985054016, -0.0090111643075943, 0.0071353912353515625, 0.023281944915652275, 0.03942849859595299, 0.05557505041360855, 0.07172160595655441, 0.08786816149950027, 0.10401470959186554, 0.1201612651348114, 0.13630782067775726, 0.15245437622070312, 0.168600931763649, 0.18474748730659485, 0.20089402794837952, 0.21704059839248657, 0.23318713903427124, 0.2493336945772171, 0.26548027992248535, 0.28162682056427, 0.2977733910083771, 0.31391993165016174, 0.3300665020942688, 0.34621304273605347, 0.36235958337783813, 0.3785061538219452, 0.39465272426605225, 0.4107992649078369, 0.42694583535194397, 0.44309237599372864, 0.4592389464378357, 0.47538548707962036, 0.49153202772140503, 0.5076786279678345, 0.5238251686096191, 0.5399717092514038, 0.5561182498931885, 0.5722648501396179, 0.5884113907814026, 0.6045579314231873, 0.6207044720649719, 0.6368510723114014, 0.6529975533485413, 0.6691440939903259, 0.6852906346321106, 0.70143723487854, 0.7175837755203247, 0.7337303161621094, 0.749876856803894, 0.7660233974456787, 0.7821699976921082]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 11.0, 13.0, 11.0, 21.0, 24.0, 27.0, 41.0, 50.0, 44.0, 79.0, 77.0, 78.0, 74.0, 64.0, 73.0, 66.0, 54.0, 50.0, 35.0, 29.0, 23.0, 8.0, 6.0, 9.0, 13.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3986917734146118, -0.3883019685745239, -0.37791216373443604, -0.36752235889434814, -0.35713255405426025, -0.34674274921417236, -0.3363529443740845, -0.3259631097316742, -0.3155733048915863, -0.3051835000514984, -0.2947936952114105, -0.28440389037132263, -0.27401408553123474, -0.26362425088882446, -0.2532344460487366, -0.24284464120864868, -0.23245485126972198, -0.2220650464296341, -0.2116752415895462, -0.20128542184829712, -0.19089561700820923, -0.18050581216812134, -0.17011600732803345, -0.15972620248794556, -0.14933639764785767, -0.13894659280776978, -0.12855678796768188, -0.1181669756770134, -0.10777716338634491, -0.09738735854625702, -0.08699755370616913, -0.07660774141550064, -0.06621792912483215, -0.055828120559453964, -0.045438311994075775, -0.035048507153987885, -0.024658698588609695, -0.014268890023231506, -0.0038790851831436157, 0.006510727107524872, 0.016900531947612762, 0.02729034051299095, 0.03768014907836914, 0.04806995391845703, 0.05845976248383522, 0.06884957104921341, 0.0792393758893013, 0.08962918817996979, 0.10001899302005768, 0.11040879786014557, 0.12079861015081406, 0.13118842244148254, 0.14157822728157043, 0.15196803212165833, 0.16235783696174622, 0.1727476418018341, 0.183137446641922, 0.1935272514820099, 0.20391705632209778, 0.21430686116218567, 0.22469668090343475, 0.23508648574352264, 0.24547629058361053, 0.2558661103248596, 0.2662559151649475]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 10.0, 9.0, 15.0, 13.0, 21.0, 38.0, 44.0, 76.0, 109.0, 142.0, 272.0, 503.0, 801.0, 1654.0, 3404.0, 9290.0, 32667.0, 444039.0, 504265.0, 34259.0, 9567.0, 3617.0, 1622.0, 818.0, 495.0, 276.0, 176.0, 107.0, 66.0, 41.0, 42.0, 26.0, 19.0, 15.0, 13.0, 11.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4345703125, -0.41959381103515625, -0.4046173095703125, -0.38964080810546875, -0.374664306640625, -0.35968780517578125, -0.3447113037109375, -0.32973480224609375, -0.31475830078125, -0.29978179931640625, -0.2848052978515625, -0.26982879638671875, -0.254852294921875, -0.23987579345703125, -0.2248992919921875, -0.20992279052734375, -0.1949462890625, -0.17996978759765625, -0.1649932861328125, -0.15001678466796875, -0.135040283203125, -0.12006378173828125, -0.1050872802734375, -0.09011077880859375, -0.07513427734375, -0.06015777587890625, -0.0451812744140625, -0.03020477294921875, -0.015228271484375, -0.00025177001953125, 0.0147247314453125, 0.02970123291015625, 0.044677734375, 0.05965423583984375, 0.0746307373046875, 0.08960723876953125, 0.104583740234375, 0.11956024169921875, 0.1345367431640625, 0.14951324462890625, 0.16448974609375, 0.17946624755859375, 0.1944427490234375, 0.20941925048828125, 0.224395751953125, 0.23937225341796875, 0.2543487548828125, 0.26932525634765625, 0.2843017578125, 0.29927825927734375, 0.3142547607421875, 0.32923126220703125, 0.344207763671875, 0.35918426513671875, 0.3741607666015625, 0.38913726806640625, 0.40411376953125, 0.41909027099609375, 0.4340667724609375, 0.44904327392578125, 0.464019775390625, 0.47899627685546875, 0.4939727783203125, 0.5089492797851562, 0.52392578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 15.0, 12.0, 22.0, 55.0, 108.0, 187.0, 218.0, 162.0, 71.0, 43.0, 14.0, 20.0, 13.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07061767578125, -0.06855344772338867, -0.06648921966552734, -0.06442499160766602, -0.06236076354980469, -0.06029653549194336, -0.05823230743408203, -0.0561680793762207, -0.054103851318359375, -0.05203962326049805, -0.04997539520263672, -0.04791116714477539, -0.04584693908691406, -0.043782711029052734, -0.041718482971191406, -0.03965425491333008, -0.03759002685546875, -0.03552579879760742, -0.033461570739746094, -0.031397342681884766, -0.029333114624023438, -0.02726888656616211, -0.02520465850830078, -0.023140430450439453, -0.021076202392578125, -0.019011974334716797, -0.01694774627685547, -0.01488351821899414, -0.012819290161132812, -0.010755062103271484, -0.008690834045410156, -0.006626605987548828, -0.0045623779296875, -0.002498149871826172, -0.00043392181396484375, 0.0016303062438964844, 0.0036945343017578125, 0.005758762359619141, 0.007822990417480469, 0.009887218475341797, 0.011951446533203125, 0.014015674591064453, 0.01607990264892578, 0.01814413070678711, 0.020208358764648438, 0.022272586822509766, 0.024336814880371094, 0.026401042938232422, 0.02846527099609375, 0.030529499053955078, 0.032593727111816406, 0.034657955169677734, 0.03672218322753906, 0.03878641128540039, 0.04085063934326172, 0.04291486740112305, 0.044979095458984375, 0.0470433235168457, 0.04910755157470703, 0.05117177963256836, 0.05323600769042969, 0.055300235748291016, 0.057364463806152344, 0.05942869186401367, 0.061492919921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 9.0, 13.0, 10.0, 21.0, 19.0, 35.0, 48.0, 72.0, 110.0, 175.0, 299.0, 597.0, 1414.0, 5209.0, 34093.0, 492698.0, 473079.0, 32940.0, 4905.0, 1372.0, 607.0, 296.0, 162.0, 95.0, 71.0, 47.0, 30.0, 21.0, 20.0, 17.0, 10.0, 7.0, 10.0, 7.0, 3.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.51806640625, -0.5032615661621094, -0.48845672607421875, -0.4736518859863281, -0.4588470458984375, -0.4440422058105469, -0.42923736572265625, -0.4144325256347656, -0.399627685546875, -0.3848228454589844, -0.37001800537109375, -0.3552131652832031, -0.3404083251953125, -0.3256034851074219, -0.31079864501953125, -0.2959938049316406, -0.28118896484375, -0.2663841247558594, -0.25157928466796875, -0.23677444458007812, -0.2219696044921875, -0.20716476440429688, -0.19235992431640625, -0.17755508422851562, -0.162750244140625, -0.14794540405273438, -0.13314056396484375, -0.11833572387695312, -0.1035308837890625, -0.08872604370117188, -0.07392120361328125, -0.059116363525390625, -0.0443115234375, -0.029506683349609375, -0.01470184326171875, 0.000102996826171875, 0.0149078369140625, 0.029712677001953125, 0.04451751708984375, 0.059322357177734375, 0.074127197265625, 0.08893203735351562, 0.10373687744140625, 0.11854171752929688, 0.1333465576171875, 0.14815139770507812, 0.16295623779296875, 0.17776107788085938, 0.19256591796875, 0.20737075805664062, 0.22217559814453125, 0.23698043823242188, 0.2517852783203125, 0.2665901184082031, 0.28139495849609375, 0.2961997985839844, 0.311004638671875, 0.3258094787597656, 0.34061431884765625, 0.3554191589355469, 0.3702239990234375, 0.3850288391113281, 0.39983367919921875, 0.4146385192871094, 0.429443359375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 6.0, 7.0, 6.0, 9.0, 16.0, 13.0, 13.0, 30.0, 26.0, 20.0, 30.0, 38.0, 36.0, 29.0, 36.0, 47.0, 50.0, 54.0, 50.0, 35.0, 42.0, 56.0, 40.0, 34.0, 32.0, 42.0, 25.0, 28.0, 21.0, 16.0, 16.0, 19.0, 10.0, 17.0, 6.0, 5.0, 10.0, 6.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.193603515625, -0.18836593627929688, -0.18312835693359375, -0.17789077758789062, -0.1726531982421875, -0.16741561889648438, -0.16217803955078125, -0.15694046020507812, -0.151702880859375, -0.14646530151367188, -0.14122772216796875, -0.13599014282226562, -0.1307525634765625, -0.12551498413085938, -0.12027740478515625, -0.11503982543945312, -0.10980224609375, -0.10456466674804688, -0.09932708740234375, -0.09408950805664062, -0.0888519287109375, -0.08361434936523438, -0.07837677001953125, -0.07313919067382812, -0.067901611328125, -0.06266403198242188, -0.05742645263671875, -0.052188873291015625, -0.0469512939453125, -0.041713714599609375, -0.03647613525390625, -0.031238555908203125, -0.0260009765625, -0.020763397216796875, -0.01552581787109375, -0.010288238525390625, -0.0050506591796875, 0.000186920166015625, 0.00542449951171875, 0.010662078857421875, 0.015899658203125, 0.021137237548828125, 0.02637481689453125, 0.031612396240234375, 0.0368499755859375, 0.042087554931640625, 0.04732513427734375, 0.052562713623046875, 0.05780029296875, 0.06303787231445312, 0.06827545166015625, 0.07351303100585938, 0.0787506103515625, 0.08398818969726562, 0.08922576904296875, 0.09446334838867188, 0.099700927734375, 0.10493850708007812, 0.11017608642578125, 0.11541366577148438, 0.1206512451171875, 0.12588882446289062, 0.13112640380859375, 0.13636398315429688, 0.1416015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 7.0, 11.0, 25.0, 31.0, 48.0, 79.0, 141.0, 222.0, 464.0, 984.0, 2176.0, 5498.0, 16982.0, 64715.0, 321303.0, 490534.0, 106177.0, 25782.0, 7963.0, 2917.0, 1247.0, 571.0, 260.0, 148.0, 82.0, 52.0, 45.0, 30.0, 13.0, 9.0, 11.0, 4.0, 9.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143798828125, -0.1393280029296875, -0.134857177734375, -0.1303863525390625, -0.12591552734375, -0.1214447021484375, -0.116973876953125, -0.1125030517578125, -0.1080322265625, -0.1035614013671875, -0.099090576171875, -0.0946197509765625, -0.09014892578125, -0.0856781005859375, -0.081207275390625, -0.0767364501953125, -0.072265625, -0.0677947998046875, -0.063323974609375, -0.0588531494140625, -0.05438232421875, -0.0499114990234375, -0.045440673828125, -0.0409698486328125, -0.0364990234375, -0.0320281982421875, -0.027557373046875, -0.0230865478515625, -0.01861572265625, -0.0141448974609375, -0.009674072265625, -0.0052032470703125, -0.000732421875, 0.0037384033203125, 0.008209228515625, 0.0126800537109375, 0.01715087890625, 0.0216217041015625, 0.026092529296875, 0.0305633544921875, 0.0350341796875, 0.0395050048828125, 0.043975830078125, 0.0484466552734375, 0.05291748046875, 0.0573883056640625, 0.061859130859375, 0.0663299560546875, 0.07080078125, 0.0752716064453125, 0.079742431640625, 0.0842132568359375, 0.08868408203125, 0.0931549072265625, 0.097625732421875, 0.1020965576171875, 0.1065673828125, 0.1110382080078125, 0.115509033203125, 0.1199798583984375, 0.12445068359375, 0.1289215087890625, 0.133392333984375, 0.1378631591796875, 0.142333984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 7.0, 11.0, 13.0, 4.0, 18.0, 15.0, 11.0, 23.0, 21.0, 24.0, 28.0, 46.0, 51.0, 53.0, 44.0, 49.0, 61.0, 45.0, 49.0, 62.0, 54.0, 39.0, 28.0, 44.0, 37.0, 30.0, 29.0, 22.0, 20.0, 13.0, 9.0, 9.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24249267578125e-05, -3.15103679895401e-05, -3.05958092212677e-05, -2.96812504529953e-05, -2.87666916847229e-05, -2.78521329164505e-05, -2.69375741481781e-05, -2.60230153799057e-05, -2.51084566116333e-05, -2.41938978433609e-05, -2.32793390750885e-05, -2.23647803068161e-05, -2.14502215385437e-05, -2.05356627702713e-05, -1.96211040019989e-05, -1.87065452337265e-05, -1.77919864654541e-05, -1.68774276971817e-05, -1.5962868928909302e-05, -1.5048310160636902e-05, -1.4133751392364502e-05, -1.3219192624092102e-05, -1.2304633855819702e-05, -1.1390075087547302e-05, -1.0475516319274902e-05, -9.560957551002502e-06, -8.646398782730103e-06, -7.731840014457703e-06, -6.817281246185303e-06, -5.902722477912903e-06, -4.988163709640503e-06, -4.073604941368103e-06, -3.159046173095703e-06, -2.2444874048233032e-06, -1.3299286365509033e-06, -4.153698682785034e-07, 4.991888999938965e-07, 1.4137476682662964e-06, 2.3283064365386963e-06, 3.242865204811096e-06, 4.157423973083496e-06, 5.071982741355896e-06, 5.986541509628296e-06, 6.901100277900696e-06, 7.815659046173096e-06, 8.730217814445496e-06, 9.644776582717896e-06, 1.0559335350990295e-05, 1.1473894119262695e-05, 1.2388452887535095e-05, 1.3303011655807495e-05, 1.4217570424079895e-05, 1.5132129192352295e-05, 1.6046687960624695e-05, 1.6961246728897095e-05, 1.7875805497169495e-05, 1.8790364265441895e-05, 1.9704923033714294e-05, 2.0619481801986694e-05, 2.1534040570259094e-05, 2.2448599338531494e-05, 2.3363158106803894e-05, 2.4277716875076294e-05, 2.5192275643348694e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 5.0, 12.0, 18.0, 12.0, 31.0, 43.0, 67.0, 97.0, 201.0, 401.0, 990.0, 3451.0, 20010.0, 250674.0, 702202.0, 60061.0, 7279.0, 1725.0, 604.0, 253.0, 149.0, 79.0, 48.0, 42.0, 14.0, 12.0, 13.0, 12.0, 5.0, 11.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23291015625, -0.22545433044433594, -0.21799850463867188, -0.2105426788330078, -0.20308685302734375, -0.1956310272216797, -0.18817520141601562, -0.18071937561035156, -0.1732635498046875, -0.16580772399902344, -0.15835189819335938, -0.1508960723876953, -0.14344024658203125, -0.1359844207763672, -0.12852859497070312, -0.12107276916503906, -0.113616943359375, -0.10616111755371094, -0.09870529174804688, -0.09124946594238281, -0.08379364013671875, -0.07633781433105469, -0.06888198852539062, -0.06142616271972656, -0.0539703369140625, -0.04651451110839844, -0.039058685302734375, -0.03160285949707031, -0.02414703369140625, -0.016691207885742188, -0.009235382080078125, -0.0017795562744140625, 0.00567626953125, 0.013132095336914062, 0.020587921142578125, 0.028043746948242188, 0.03549957275390625, 0.04295539855957031, 0.050411224365234375, 0.05786705017089844, 0.0653228759765625, 0.07277870178222656, 0.08023452758789062, 0.08769035339355469, 0.09514617919921875, 0.10260200500488281, 0.11005783081054688, 0.11751365661621094, 0.124969482421875, 0.13242530822753906, 0.13988113403320312, 0.1473369598388672, 0.15479278564453125, 0.1622486114501953, 0.16970443725585938, 0.17716026306152344, 0.1846160888671875, 0.19207191467285156, 0.19952774047851562, 0.2069835662841797, 0.21443939208984375, 0.2218952178955078, 0.22935104370117188, 0.23680686950683594, 0.2442626953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 11.0, 12.0, 9.0, 11.0, 11.0, 15.0, 28.0, 29.0, 37.0, 42.0, 45.0, 52.0, 67.0, 67.0, 81.0, 84.0, 65.0, 52.0, 53.0, 37.0, 30.0, 28.0, 21.0, 18.0, 17.0, 12.0, 8.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07537841796875, -0.07311534881591797, -0.07085227966308594, -0.0685892105102539, -0.06632614135742188, -0.06406307220458984, -0.06180000305175781, -0.05953693389892578, -0.05727386474609375, -0.05501079559326172, -0.05274772644042969, -0.050484657287597656, -0.048221588134765625, -0.045958518981933594, -0.04369544982910156, -0.04143238067626953, -0.0391693115234375, -0.03690624237060547, -0.03464317321777344, -0.032380104064941406, -0.030117034912109375, -0.027853965759277344, -0.025590896606445312, -0.02332782745361328, -0.02106475830078125, -0.01880168914794922, -0.016538619995117188, -0.014275550842285156, -0.012012481689453125, -0.009749412536621094, -0.0074863433837890625, -0.005223274230957031, -0.002960205078125, -0.0006971359252929688, 0.0015659332275390625, 0.0038290023803710938, 0.006092071533203125, 0.008355140686035156, 0.010618209838867188, 0.012881278991699219, 0.01514434814453125, 0.01740741729736328, 0.019670486450195312, 0.021933555603027344, 0.024196624755859375, 0.026459693908691406, 0.028722763061523438, 0.03098583221435547, 0.0332489013671875, 0.03551197052001953, 0.03777503967285156, 0.040038108825683594, 0.042301177978515625, 0.044564247131347656, 0.04682731628417969, 0.04909038543701172, 0.05135345458984375, 0.05361652374267578, 0.05587959289550781, 0.058142662048339844, 0.060405731201171875, 0.0626688003540039, 0.06493186950683594, 0.06719493865966797, 0.0694580078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 23.0, 119.0, 474.0, 302.0, 56.0, 21.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.012691020965576, -1.855126142501831, -1.697561264038086, -1.5399965047836304, -1.3824316263198853, -1.2248667478561401, -1.0673019886016846, -0.9097371101379395, -0.7521722316741943, -0.5946073532104492, -0.4370425343513489, -0.27947768568992615, -0.12191283702850342, 0.0356520414352417, 0.19321686029434204, 0.3507816791534424, 0.5083465576171875, 0.6659114360809326, 0.823476254940033, 0.9810410737991333, 1.1386059522628784, 1.2961708307266235, 1.453735589981079, 1.6113004684448242, 1.7688653469085693, 1.9264302253723145, 2.0839951038360596, 2.2415599822998047, 2.3991246223449707, 2.556689739227295, 2.714254379272461, 2.871819257736206, 3.029383659362793, 3.186948537826538, 3.344513416290283, 3.5020782947540283, 3.6596431732177734, 3.8172078132629395, 3.9747726917266846, 4.13233757019043, 4.289902687072754, 4.44746732711792, 4.605032444000244, 4.76259708404541, 4.920162200927734, 5.0777268409729, 5.235291957855225, 5.392856597900391, 5.550421237945557, 5.707985877990723, 5.865550994873047, 6.023115634918213, 6.180680751800537, 6.338245391845703, 6.495810508728027, 6.653375148773193, 6.810939788818359, 6.968504428863525, 7.12606954574585, 7.283634185791016, 7.44119930267334, 7.598763942718506, 7.75632905960083, 7.913893699645996, 8.07145881652832]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 8.0, 11.0, 10.0, 20.0, 25.0, 24.0, 32.0, 40.0, 44.0, 38.0, 61.0, 67.0, 57.0, 66.0, 72.0, 51.0, 80.0, 42.0, 35.0, 40.0, 42.0, 33.0, 22.0, 17.0, 11.0, 12.0, 9.0, 7.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9406133890151978, -1.8857911825180054, -1.8309688568115234, -1.776146650314331, -1.7213244438171387, -1.6665022373199463, -1.611680030822754, -1.556857705116272, -1.5020354986190796, -1.4472132921218872, -1.3923909664154053, -1.337568759918213, -1.2827465534210205, -1.2279243469238281, -1.1731021404266357, -1.1182798147201538, -1.0634576082229614, -1.008635401725769, -0.9538131356239319, -0.8989908695220947, -0.8441686630249023, -0.78934645652771, -0.7345241904258728, -0.6797019243240356, -0.6248797178268433, -0.5700575113296509, -0.5152352452278137, -0.46041300892829895, -0.4055907726287842, -0.3507685363292694, -0.29594630002975464, -0.24112406373023987, -0.18630194664001465, -0.13147971034049988, -0.07665747404098511, -0.021835237741470337, 0.032986998558044434, 0.0878092348575592, 0.14263147115707397, 0.19745370745658875, 0.2522759437561035, 0.3070981800556183, 0.36192041635513306, 0.4167426526546478, 0.4715648889541626, 0.526387095451355, 0.5812093615531921, 0.6360316276550293, 0.6908538341522217, 0.7456760406494141, 0.8004983067512512, 0.8553205728530884, 0.9101427793502808, 0.9649649858474731, 1.019787311553955, 1.0746095180511475, 1.1294317245483398, 1.1842539310455322, 1.2390761375427246, 1.2938984632492065, 1.348720669746399, 1.4035428762435913, 1.4583652019500732, 1.5131874084472656, 1.568009614944458]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 11.0, 15.0, 23.0, 38.0, 86.0, 164.0, 377.0, 1260.0, 9295.0, 4110605.0, 69112.0, 2482.0, 483.0, 155.0, 87.0, 26.0, 20.0, 12.0, 9.0, 5.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5185546875, -1.467529296875, -1.41650390625, -1.365478515625, -1.314453125, -1.263427734375, -1.21240234375, -1.161376953125, -1.1103515625, -1.059326171875, -1.00830078125, -0.957275390625, -0.90625, -0.855224609375, -0.80419921875, -0.753173828125, -0.7021484375, -0.651123046875, -0.60009765625, -0.549072265625, -0.498046875, -0.447021484375, -0.39599609375, -0.344970703125, -0.2939453125, -0.242919921875, -0.19189453125, -0.140869140625, -0.08984375, -0.038818359375, 0.01220703125, 0.063232421875, 0.1142578125, 0.165283203125, 0.21630859375, 0.267333984375, 0.318359375, 0.369384765625, 0.42041015625, 0.471435546875, 0.5224609375, 0.573486328125, 0.62451171875, 0.675537109375, 0.7265625, 0.777587890625, 0.82861328125, 0.879638671875, 0.9306640625, 0.981689453125, 1.03271484375, 1.083740234375, 1.134765625, 1.185791015625, 1.23681640625, 1.287841796875, 1.3388671875, 1.389892578125, 1.44091796875, 1.491943359375, 1.54296875, 1.593994140625, 1.64501953125, 1.696044921875, 1.7470703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 8.0, 10.0, 9.0, 17.0, 42.0, 42.0, 83.0, 132.0, 182.0, 155.0, 121.0, 61.0, 47.0, 29.0, 19.0, 10.0, 6.0, 9.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06628894805908203, -0.06397438049316406, -0.061659812927246094, -0.059345245361328125, -0.057030677795410156, -0.05471611022949219, -0.05240154266357422, -0.05008697509765625, -0.04777240753173828, -0.04545783996582031, -0.043143272399902344, -0.040828704833984375, -0.038514137268066406, -0.03619956970214844, -0.03388500213623047, -0.0315704345703125, -0.02925586700439453, -0.026941299438476562, -0.024626731872558594, -0.022312164306640625, -0.019997596740722656, -0.017683029174804688, -0.015368461608886719, -0.01305389404296875, -0.010739326477050781, -0.008424758911132812, -0.006110191345214844, -0.003795623779296875, -0.0014810562133789062, 0.0008335113525390625, 0.0031480789184570312, 0.005462646484375, 0.007777214050292969, 0.010091781616210938, 0.012406349182128906, 0.014720916748046875, 0.017035484313964844, 0.019350051879882812, 0.02166461944580078, 0.02397918701171875, 0.02629375457763672, 0.028608322143554688, 0.030922889709472656, 0.033237457275390625, 0.035552024841308594, 0.03786659240722656, 0.04018115997314453, 0.0424957275390625, 0.04481029510498047, 0.04712486267089844, 0.049439430236816406, 0.051753997802734375, 0.054068565368652344, 0.05638313293457031, 0.05869770050048828, 0.06101226806640625, 0.06332683563232422, 0.06564140319824219, 0.06795597076416016, 0.07027053833007812, 0.0725851058959961, 0.07489967346191406, 0.07721424102783203, 0.07952880859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 8.0, 9.0, 30.0, 43.0, 85.0, 162.0, 320.0, 780.0, 2637.0, 11211.0, 80389.0, 3740875.0, 323037.0, 26662.0, 5431.0, 1479.0, 529.0, 239.0, 119.0, 68.0, 49.0, 29.0, 23.0, 17.0, 12.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4329261779785156, -0.41785430908203125, -0.4027824401855469, -0.3877105712890625, -0.3726387023925781, -0.35756683349609375, -0.3424949645996094, -0.327423095703125, -0.3123512268066406, -0.29727935791015625, -0.2822074890136719, -0.2671356201171875, -0.2520637512207031, -0.23699188232421875, -0.22192001342773438, -0.20684814453125, -0.19177627563476562, -0.17670440673828125, -0.16163253784179688, -0.1465606689453125, -0.13148880004882812, -0.11641693115234375, -0.10134506225585938, -0.086273193359375, -0.07120132446289062, -0.05612945556640625, -0.041057586669921875, -0.0259857177734375, -0.010913848876953125, 0.00415802001953125, 0.019229888916015625, 0.0343017578125, 0.049373626708984375, 0.06444549560546875, 0.07951736450195312, 0.0945892333984375, 0.10966110229492188, 0.12473297119140625, 0.13980484008789062, 0.154876708984375, 0.16994857788085938, 0.18502044677734375, 0.20009231567382812, 0.2151641845703125, 0.23023605346679688, 0.24530792236328125, 0.2603797912597656, 0.27545166015625, 0.2905235290527344, 0.30559539794921875, 0.3206672668457031, 0.3357391357421875, 0.3508110046386719, 0.36588287353515625, 0.3809547424316406, 0.396026611328125, 0.4110984802246094, 0.42617034912109375, 0.4412422180175781, 0.4563140869140625, 0.4713859558105469, 0.48645782470703125, 0.5015296936035156, 0.5166015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 6.0, 14.0, 16.0, 22.0, 31.0, 42.0, 76.0, 84.0, 156.0, 327.0, 1228.0, 1235.0, 294.0, 156.0, 89.0, 65.0, 48.0, 28.0, 25.0, 20.0, 19.0, 15.0, 12.0, 8.0, 6.0, 10.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.07440185546875, -0.07221412658691406, -0.07002639770507812, -0.06783866882324219, -0.06565093994140625, -0.06346321105957031, -0.061275482177734375, -0.05908775329589844, -0.0569000244140625, -0.05471229553222656, -0.052524566650390625, -0.05033683776855469, -0.04814910888671875, -0.04596138000488281, -0.043773651123046875, -0.04158592224121094, -0.039398193359375, -0.03721046447753906, -0.035022735595703125, -0.03283500671386719, -0.03064727783203125, -0.028459548950195312, -0.026271820068359375, -0.024084091186523438, -0.0218963623046875, -0.019708633422851562, -0.017520904541015625, -0.015333175659179688, -0.01314544677734375, -0.010957717895507812, -0.008769989013671875, -0.0065822601318359375, -0.00439453125, -0.0022068023681640625, -1.9073486328125e-05, 0.0021686553955078125, 0.00435638427734375, 0.0065441131591796875, 0.008731842041015625, 0.010919570922851562, 0.0131072998046875, 0.015295028686523438, 0.017482757568359375, 0.019670486450195312, 0.02185821533203125, 0.024045944213867188, 0.026233673095703125, 0.028421401977539062, 0.030609130859375, 0.03279685974121094, 0.034984588623046875, 0.03717231750488281, 0.03936004638671875, 0.04154777526855469, 0.043735504150390625, 0.04592323303222656, 0.0481109619140625, 0.05029869079589844, 0.052486419677734375, 0.05467414855957031, 0.05686187744140625, 0.05904960632324219, 0.061237335205078125, 0.06342506408691406, 0.06561279296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 13.0, 68.0, 322.0, 442.0, 134.0, 23.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2751205265522003, -0.23692554235458374, -0.19873055815696716, -0.1605355590581894, -0.12234057486057281, -0.08414559066295624, -0.04595059156417847, -0.00775560736656189, 0.030439376831054688, 0.06863436102867126, 0.10682935267686844, 0.1450243443250656, 0.1832193285226822, 0.22141431272029877, 0.25960931181907654, 0.2978042960166931, 0.3359992802143097, 0.37419426441192627, 0.41238924860954285, 0.4505842328071594, 0.4887792468070984, 0.5269742012023926, 0.5651692152023315, 0.6033642292022705, 0.6415591835975647, 0.6797541975975037, 0.7179491519927979, 0.7561441659927368, 0.794339120388031, 0.83253413438797, 0.8707290887832642, 0.9089241027832031, 0.9471191167831421, 0.985314130783081, 1.02350914478302, 1.0617040395736694, 1.0998990535736084, 1.1380940675735474, 1.1762890815734863, 1.2144839763641357, 1.2526789903640747, 1.2908740043640137, 1.3290690183639526, 1.367263913154602, 1.405458927154541, 1.44365394115448, 1.481848955154419, 1.5200438499450684, 1.5582389831542969, 1.5964339971542358, 1.6346290111541748, 1.6728239059448242, 1.7110189199447632, 1.7492139339447021, 1.7874089479446411, 1.82560396194458, 1.8637988567352295, 1.9019938707351685, 1.9401888847351074, 1.9783837795257568, 2.0165789127349854, 2.0547738075256348, 2.092968702316284, 2.1311638355255127, 2.169358730316162]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 6.0, 13.0, 10.0, 6.0, 17.0, 18.0, 16.0, 19.0, 26.0, 28.0, 26.0, 28.0, 38.0, 32.0, 39.0, 43.0, 42.0, 49.0, 47.0, 43.0, 34.0, 50.0, 39.0, 28.0, 39.0, 29.0, 21.0, 26.0, 30.0, 28.0, 21.0, 23.0, 12.0, 9.0, 16.0, 10.0, 14.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.21693402528762817, -0.20960736274719238, -0.2022807002067566, -0.1949540376663208, -0.187627375125885, -0.18030071258544922, -0.17297405004501343, -0.16564738750457764, -0.15832072496414185, -0.15099406242370605, -0.14366739988327026, -0.13634073734283447, -0.12901407480239868, -0.12168741226196289, -0.1143607497215271, -0.10703408718109131, -0.09970742464065552, -0.09238076210021973, -0.08505409955978394, -0.07772743701934814, -0.07040077447891235, -0.06307411193847656, -0.05574744939804077, -0.04842078685760498, -0.04109412431716919, -0.0337674617767334, -0.026440799236297607, -0.019114136695861816, -0.011787474155426025, -0.004460811614990234, 0.0028658509254455566, 0.010192513465881348, 0.01751917600631714, 0.02484583854675293, 0.03217250108718872, 0.03949916362762451, 0.0468258261680603, 0.054152488708496094, 0.061479151248931885, 0.06880581378936768, 0.07613247632980347, 0.08345913887023926, 0.09078580141067505, 0.09811246395111084, 0.10543912649154663, 0.11276578903198242, 0.12009245157241821, 0.127419114112854, 0.1347457766532898, 0.14207243919372559, 0.14939910173416138, 0.15672576427459717, 0.16405242681503296, 0.17137908935546875, 0.17870575189590454, 0.18603241443634033, 0.19335907697677612, 0.20068573951721191, 0.2080124020576477, 0.2153390645980835, 0.2226657271385193, 0.22999238967895508, 0.23731905221939087, 0.24464571475982666, 0.25197237730026245]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 9.0, 9.0, 6.0, 17.0, 17.0, 25.0, 32.0, 57.0, 61.0, 111.0, 150.0, 213.0, 356.0, 571.0, 1154.0, 2165.0, 4723.0, 13110.0, 52276.0, 385229.0, 495137.0, 66677.0, 15653.0, 5542.0, 2386.0, 1141.0, 640.0, 383.0, 215.0, 154.0, 97.0, 66.0, 44.0, 32.0, 25.0, 15.0, 12.0, 6.0, 5.0, 12.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.339111328125, -0.3285369873046875, -0.317962646484375, -0.3073883056640625, -0.29681396484375, -0.2862396240234375, -0.275665283203125, -0.2650909423828125, -0.2545166015625, -0.2439422607421875, -0.233367919921875, -0.2227935791015625, -0.21221923828125, -0.2016448974609375, -0.191070556640625, -0.1804962158203125, -0.169921875, -0.1593475341796875, -0.148773193359375, -0.1381988525390625, -0.12762451171875, -0.1170501708984375, -0.106475830078125, -0.0959014892578125, -0.0853271484375, -0.0747528076171875, -0.064178466796875, -0.0536041259765625, -0.04302978515625, -0.0324554443359375, -0.021881103515625, -0.0113067626953125, -0.000732421875, 0.0098419189453125, 0.020416259765625, 0.0309906005859375, 0.04156494140625, 0.0521392822265625, 0.062713623046875, 0.0732879638671875, 0.0838623046875, 0.0944366455078125, 0.105010986328125, 0.1155853271484375, 0.12615966796875, 0.1367340087890625, 0.147308349609375, 0.1578826904296875, 0.16845703125, 0.1790313720703125, 0.189605712890625, 0.2001800537109375, 0.21075439453125, 0.2213287353515625, 0.231903076171875, 0.2424774169921875, 0.2530517578125, 0.2636260986328125, 0.274200439453125, 0.2847747802734375, 0.29534912109375, 0.3059234619140625, 0.316497802734375, 0.3270721435546875, 0.337646484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 22.0, 29.0, 51.0, 81.0, 131.0, 140.0, 147.0, 122.0, 75.0, 71.0, 36.0, 23.0, 18.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07018089294433594, -0.06791305541992188, -0.06564521789550781, -0.06337738037109375, -0.06110954284667969, -0.058841705322265625, -0.05657386779785156, -0.0543060302734375, -0.05203819274902344, -0.049770355224609375, -0.04750251770019531, -0.04523468017578125, -0.04296684265136719, -0.040699005126953125, -0.03843116760253906, -0.036163330078125, -0.03389549255371094, -0.031627655029296875, -0.029359817504882812, -0.02709197998046875, -0.024824142456054688, -0.022556304931640625, -0.020288467407226562, -0.0180206298828125, -0.015752792358398438, -0.013484954833984375, -0.011217117309570312, -0.00894927978515625, -0.0066814422607421875, -0.004413604736328125, -0.0021457672119140625, 0.0001220703125, 0.0023899078369140625, 0.004657745361328125, 0.0069255828857421875, 0.00919342041015625, 0.011461257934570312, 0.013729095458984375, 0.015996932983398438, 0.0182647705078125, 0.020532608032226562, 0.022800445556640625, 0.025068283081054688, 0.02733612060546875, 0.029603958129882812, 0.031871795654296875, 0.03413963317871094, 0.036407470703125, 0.03867530822753906, 0.040943145751953125, 0.04321098327636719, 0.04547882080078125, 0.04774665832519531, 0.050014495849609375, 0.05228233337402344, 0.0545501708984375, 0.05681800842285156, 0.059085845947265625, 0.06135368347167969, 0.06362152099609375, 0.06588935852050781, 0.06815719604492188, 0.07042503356933594, 0.07269287109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 8.0, 4.0, 8.0, 7.0, 7.0, 14.0, 15.0, 26.0, 24.0, 37.0, 51.0, 90.0, 122.0, 218.0, 337.0, 650.0, 1420.0, 4443.0, 21404.0, 171660.0, 708476.0, 117052.0, 16297.0, 3491.0, 1174.0, 589.0, 302.0, 214.0, 119.0, 90.0, 47.0, 40.0, 26.0, 19.0, 10.0, 12.0, 12.0, 4.0, 5.0, 8.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3681640625, -0.354736328125, -0.34130859375, -0.327880859375, -0.314453125, -0.301025390625, -0.28759765625, -0.274169921875, -0.2607421875, -0.247314453125, -0.23388671875, -0.220458984375, -0.20703125, -0.193603515625, -0.18017578125, -0.166748046875, -0.1533203125, -0.139892578125, -0.12646484375, -0.113037109375, -0.099609375, -0.086181640625, -0.07275390625, -0.059326171875, -0.0458984375, -0.032470703125, -0.01904296875, -0.005615234375, 0.0078125, 0.021240234375, 0.03466796875, 0.048095703125, 0.0615234375, 0.074951171875, 0.08837890625, 0.101806640625, 0.115234375, 0.128662109375, 0.14208984375, 0.155517578125, 0.1689453125, 0.182373046875, 0.19580078125, 0.209228515625, 0.22265625, 0.236083984375, 0.24951171875, 0.262939453125, 0.2763671875, 0.289794921875, 0.30322265625, 0.316650390625, 0.330078125, 0.343505859375, 0.35693359375, 0.370361328125, 0.3837890625, 0.397216796875, 0.41064453125, 0.424072265625, 0.4375, 0.450927734375, 0.46435546875, 0.477783203125, 0.4912109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 11.0, 13.0, 6.0, 6.0, 9.0, 16.0, 15.0, 19.0, 26.0, 34.0, 31.0, 34.0, 36.0, 39.0, 44.0, 44.0, 51.0, 59.0, 61.0, 47.0, 52.0, 57.0, 45.0, 36.0, 26.0, 38.0, 20.0, 21.0, 16.0, 12.0, 20.0, 13.0, 8.0, 10.0, 7.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2279052734375, -0.22083282470703125, -0.2137603759765625, -0.20668792724609375, -0.199615478515625, -0.19254302978515625, -0.1854705810546875, -0.17839813232421875, -0.17132568359375, -0.16425323486328125, -0.1571807861328125, -0.15010833740234375, -0.143035888671875, -0.13596343994140625, -0.1288909912109375, -0.12181854248046875, -0.11474609375, -0.10767364501953125, -0.1006011962890625, -0.09352874755859375, -0.086456298828125, -0.07938385009765625, -0.0723114013671875, -0.06523895263671875, -0.05816650390625, -0.05109405517578125, -0.0440216064453125, -0.03694915771484375, -0.029876708984375, -0.02280426025390625, -0.0157318115234375, -0.00865936279296875, -0.0015869140625, 0.00548553466796875, 0.0125579833984375, 0.01963043212890625, 0.026702880859375, 0.03377532958984375, 0.0408477783203125, 0.04792022705078125, 0.05499267578125, 0.06206512451171875, 0.0691375732421875, 0.07621002197265625, 0.083282470703125, 0.09035491943359375, 0.0974273681640625, 0.10449981689453125, 0.111572265625, 0.11864471435546875, 0.1257171630859375, 0.13278961181640625, 0.139862060546875, 0.14693450927734375, 0.1540069580078125, 0.16107940673828125, 0.16815185546875, 0.17522430419921875, 0.1822967529296875, 0.18936920166015625, 0.196441650390625, 0.20351409912109375, 0.2105865478515625, 0.21765899658203125, 0.2247314453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 17.0, 20.0, 27.0, 47.0, 55.0, 92.0, 133.0, 265.0, 435.0, 791.0, 1402.0, 2868.0, 6339.0, 14871.0, 44134.0, 197044.0, 583623.0, 138573.0, 34778.0, 12472.0, 5219.0, 2467.0, 1274.0, 635.0, 376.0, 205.0, 133.0, 80.0, 58.0, 33.0, 21.0, 15.0, 10.0, 7.0, 1.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1424560546875, -0.13743972778320312, -0.13242340087890625, -0.12740707397460938, -0.1223907470703125, -0.11737442016601562, -0.11235809326171875, -0.10734176635742188, -0.102325439453125, -0.09730911254882812, -0.09229278564453125, -0.08727645874023438, -0.0822601318359375, -0.07724380493164062, -0.07222747802734375, -0.06721115112304688, -0.06219482421875, -0.057178497314453125, -0.05216217041015625, -0.047145843505859375, -0.0421295166015625, -0.037113189697265625, -0.03209686279296875, -0.027080535888671875, -0.022064208984375, -0.017047882080078125, -0.01203155517578125, -0.007015228271484375, -0.0019989013671875, 0.003017425537109375, 0.00803375244140625, 0.013050079345703125, 0.01806640625, 0.023082733154296875, 0.02809906005859375, 0.033115386962890625, 0.0381317138671875, 0.043148040771484375, 0.04816436767578125, 0.053180694580078125, 0.058197021484375, 0.06321334838867188, 0.06822967529296875, 0.07324600219726562, 0.0782623291015625, 0.08327865600585938, 0.08829498291015625, 0.09331130981445312, 0.09832763671875, 0.10334396362304688, 0.10836029052734375, 0.11337661743164062, 0.1183929443359375, 0.12340927124023438, 0.12842559814453125, 0.13344192504882812, 0.138458251953125, 0.14347457885742188, 0.14849090576171875, 0.15350723266601562, 0.1585235595703125, 0.16353988647460938, 0.16855621337890625, 0.17357254028320312, 0.1785888671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 8.0, 13.0, 21.0, 30.0, 45.0, 43.0, 47.0, 66.0, 75.0, 90.0, 93.0, 105.0, 87.0, 73.0, 60.0, 37.0, 27.0, 21.0, 14.0, 8.0, 9.0, 8.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.297494888305664e-05, -4.1513703763484955e-05, -4.005245864391327e-05, -3.859121352434158e-05, -3.71299684047699e-05, -3.566872328519821e-05, -3.4207478165626526e-05, -3.274623304605484e-05, -3.1284987926483154e-05, -2.982374280691147e-05, -2.8362497687339783e-05, -2.6901252567768097e-05, -2.544000744819641e-05, -2.3978762328624725e-05, -2.251751720905304e-05, -2.1056272089481354e-05, -1.9595026969909668e-05, -1.8133781850337982e-05, -1.6672536730766296e-05, -1.521129161119461e-05, -1.3750046491622925e-05, -1.2288801372051239e-05, -1.0827556252479553e-05, -9.366311132907867e-06, -7.905066013336182e-06, -6.443820893764496e-06, -4.98257577419281e-06, -3.5213306546211243e-06, -2.0600855350494385e-06, -5.988404154777527e-07, 8.624047040939331e-07, 2.323649823665619e-06, 3.7848949432373047e-06, 5.2461400628089905e-06, 6.707385182380676e-06, 8.168630301952362e-06, 9.629875421524048e-06, 1.1091120541095734e-05, 1.255236566066742e-05, 1.4013610780239105e-05, 1.547485589981079e-05, 1.6936101019382477e-05, 1.8397346138954163e-05, 1.985859125852585e-05, 2.1319836378097534e-05, 2.278108149766922e-05, 2.4242326617240906e-05, 2.570357173681259e-05, 2.7164816856384277e-05, 2.8626061975955963e-05, 3.008730709552765e-05, 3.1548552215099335e-05, 3.300979733467102e-05, 3.4471042454242706e-05, 3.593228757381439e-05, 3.739353269338608e-05, 3.8854777812957764e-05, 4.031602293252945e-05, 4.1777268052101135e-05, 4.323851317167282e-05, 4.469975829124451e-05, 4.616100341081619e-05, 4.762224853038788e-05, 4.9083493649959564e-05, 5.054473876953125e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 10.0, 14.0, 21.0, 24.0, 49.0, 85.0, 162.0, 376.0, 1036.0, 3798.0, 28192.0, 801304.0, 198810.0, 11333.0, 2145.0, 641.0, 261.0, 108.0, 66.0, 31.0, 21.0, 12.0, 13.0, 7.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.43119049072265625, -0.4180450439453125, -0.40489959716796875, -0.391754150390625, -0.37860870361328125, -0.3654632568359375, -0.35231781005859375, -0.33917236328125, -0.32602691650390625, -0.3128814697265625, -0.29973602294921875, -0.286590576171875, -0.27344512939453125, -0.2602996826171875, -0.24715423583984375, -0.2340087890625, -0.22086334228515625, -0.2077178955078125, -0.19457244873046875, -0.181427001953125, -0.16828155517578125, -0.1551361083984375, -0.14199066162109375, -0.12884521484375, -0.11569976806640625, -0.1025543212890625, -0.08940887451171875, -0.076263427734375, -0.06311798095703125, -0.0499725341796875, -0.03682708740234375, -0.023681640625, -0.01053619384765625, 0.0026092529296875, 0.01575469970703125, 0.028900146484375, 0.04204559326171875, 0.0551910400390625, 0.06833648681640625, 0.08148193359375, 0.09462738037109375, 0.1077728271484375, 0.12091827392578125, 0.134063720703125, 0.14720916748046875, 0.1603546142578125, 0.17350006103515625, 0.1866455078125, 0.19979095458984375, 0.2129364013671875, 0.22608184814453125, 0.239227294921875, 0.25237274169921875, 0.2655181884765625, 0.27866363525390625, 0.29180908203125, 0.30495452880859375, 0.3180999755859375, 0.33124542236328125, 0.344390869140625, 0.35753631591796875, 0.3706817626953125, 0.38382720947265625, 0.39697265625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 7.0, 11.0, 9.0, 9.0, 12.0, 15.0, 29.0, 32.0, 51.0, 71.0, 77.0, 111.0, 151.0, 128.0, 79.0, 57.0, 31.0, 27.0, 18.0, 21.0, 11.0, 6.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.16032028198242188, -0.15547943115234375, -0.15063858032226562, -0.1457977294921875, -0.14095687866210938, -0.13611602783203125, -0.13127517700195312, -0.126434326171875, -0.12159347534179688, -0.11675262451171875, -0.11191177368164062, -0.1070709228515625, -0.10223007202148438, -0.09738922119140625, -0.09254837036132812, -0.08770751953125, -0.08286666870117188, -0.07802581787109375, -0.07318496704101562, -0.0683441162109375, -0.06350326538085938, -0.05866241455078125, -0.053821563720703125, -0.048980712890625, -0.044139862060546875, -0.03929901123046875, -0.034458160400390625, -0.0296173095703125, -0.024776458740234375, -0.01993560791015625, -0.015094757080078125, -0.01025390625, -0.005413055419921875, -0.00057220458984375, 0.004268646240234375, 0.0091094970703125, 0.013950347900390625, 0.01879119873046875, 0.023632049560546875, 0.028472900390625, 0.033313751220703125, 0.03815460205078125, 0.042995452880859375, 0.0478363037109375, 0.052677154541015625, 0.05751800537109375, 0.062358856201171875, 0.06719970703125, 0.07204055786132812, 0.07688140869140625, 0.08172225952148438, 0.0865631103515625, 0.09140396118164062, 0.09624481201171875, 0.10108566284179688, 0.105926513671875, 0.11076736450195312, 0.11560821533203125, 0.12044906616210938, 0.1252899169921875, 0.13013076782226562, 0.13497161865234375, 0.13981246948242188, 0.1446533203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 14.0, 86.0, 442.0, 394.0, 58.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3341137170791626, -1.1095914840698242, -0.8850691914558411, -0.6605468988418579, -0.43602466583251953, -0.21150243282318115, 0.013019919395446777, 0.23754215240478516, 0.46206438541412354, 0.6865866184234619, 0.9111089110374451, 1.1356312036514282, 1.3601534366607666, 1.584675669670105, 1.809198021888733, 2.0337202548980713, 2.258242607116699, 2.482764959335327, 2.707287073135376, 2.931809425354004, 3.1563315391540527, 3.3808538913726807, 3.6053762435913086, 3.8298983573913574, 4.054420471191406, 4.278942584991455, 4.503465175628662, 4.727987289428711, 4.95250940322876, 5.177031517028809, 5.401554107666016, 5.6260762214660645, 5.850598335266113, 6.075120449066162, 6.299643039703369, 6.524165153503418, 6.748687267303467, 6.973209381103516, 7.197731971740723, 7.4222540855407715, 7.64677619934082, 7.871298313140869, 8.095820426940918, 8.320343017578125, 8.544865608215332, 8.769387245178223, 8.99390983581543, 9.218432426452637, 9.442955017089844, 9.66747760772705, 9.891999244689941, 10.116521835327148, 10.341044425964355, 10.565566062927246, 10.790088653564453, 11.01461124420166, 11.23913288116455, 11.463655471801758, 11.688177108764648, 11.912699699401855, 12.137222290039062, 12.361743927001953, 12.58626651763916, 12.810789108276367, 13.035310745239258]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 7.0, 8.0, 9.0, 17.0, 20.0, 15.0, 16.0, 31.0, 27.0, 28.0, 34.0, 35.0, 29.0, 43.0, 31.0, 39.0, 42.0, 59.0, 40.0, 50.0, 44.0, 29.0, 45.0, 35.0, 38.0, 26.0, 36.0, 23.0, 18.0, 19.0, 15.0, 18.0, 15.0, 10.0, 9.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2969822883605957, -1.2545192241668701, -1.2120561599731445, -1.1695929765701294, -1.1271299123764038, -1.0846668481826782, -1.042203664779663, -0.9997406005859375, -0.9572775363922119, -0.9148144721984863, -0.872351348400116, -0.8298882246017456, -0.78742516040802, -0.7449620962142944, -0.7024989724159241, -0.6600358486175537, -0.6175727844238281, -0.5751097202301025, -0.5326465964317322, -0.4901835024356842, -0.44772040843963623, -0.40525731444358826, -0.3627942204475403, -0.3203311264514923, -0.27786803245544434, -0.23540493845939636, -0.1929418444633484, -0.15047875046730042, -0.10801565647125244, -0.06555256247520447, -0.023089468479156494, 0.01937362551689148, 0.061836838722229004, 0.10429993271827698, 0.14676302671432495, 0.18922612071037292, 0.2316892147064209, 0.27415230870246887, 0.31661540269851685, 0.3590784966945648, 0.4015415906906128, 0.44400468468666077, 0.48646777868270874, 0.5289309024810791, 0.5713939666748047, 0.6138570308685303, 0.6563201546669006, 0.698783278465271, 0.7412463426589966, 0.7837094068527222, 0.8261725306510925, 0.8686356544494629, 0.9110987186431885, 0.9535617828369141, 0.9960249066352844, 1.0384880304336548, 1.0809510946273804, 1.123414158821106, 1.165877342224121, 1.2083404064178467, 1.2508034706115723, 1.2932665348052979, 1.3357295989990234, 1.3781927824020386, 1.4206558465957642]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 3.0, 8.0, 12.0, 13.0, 20.0, 33.0, 50.0, 61.0, 122.0, 242.0, 437.0, 953.0, 2437.0, 8017.0, 58453.0, 3979016.0, 127187.0, 12173.0, 2938.0, 1036.0, 509.0, 212.0, 137.0, 81.0, 47.0, 23.0, 16.0, 12.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5166015625, -0.49973297119140625, -0.4828643798828125, -0.46599578857421875, -0.449127197265625, -0.43225860595703125, -0.4153900146484375, -0.39852142333984375, -0.38165283203125, -0.36478424072265625, -0.3479156494140625, -0.33104705810546875, -0.314178466796875, -0.29730987548828125, -0.2804412841796875, -0.26357269287109375, -0.2467041015625, -0.22983551025390625, -0.2129669189453125, -0.19609832763671875, -0.179229736328125, -0.16236114501953125, -0.1454925537109375, -0.12862396240234375, -0.11175537109375, -0.09488677978515625, -0.0780181884765625, -0.06114959716796875, -0.044281005859375, -0.02741241455078125, -0.0105438232421875, 0.00632476806640625, 0.023193359375, 0.04006195068359375, 0.0569305419921875, 0.07379913330078125, 0.090667724609375, 0.10753631591796875, 0.1244049072265625, 0.14127349853515625, 0.15814208984375, 0.17501068115234375, 0.1918792724609375, 0.20874786376953125, 0.225616455078125, 0.24248504638671875, 0.2593536376953125, 0.27622222900390625, 0.2930908203125, 0.30995941162109375, 0.3268280029296875, 0.34369659423828125, 0.360565185546875, 0.37743377685546875, 0.3943023681640625, 0.41117095947265625, 0.42803955078125, 0.44490814208984375, 0.4617767333984375, 0.47864532470703125, 0.495513916015625, 0.5123825073242188, 0.5292510986328125, 0.5461196899414062, 0.56298828125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 6.0, 15.0, 22.0, 24.0, 52.0, 76.0, 93.0, 118.0, 109.0, 94.0, 96.0, 74.0, 69.0, 42.0, 39.0, 11.0, 11.0, 12.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06891059875488281, -0.06659317016601562, -0.06427574157714844, -0.06195831298828125, -0.05964088439941406, -0.057323455810546875, -0.05500602722167969, -0.0526885986328125, -0.05037117004394531, -0.048053741455078125, -0.04573631286621094, -0.04341888427734375, -0.04110145568847656, -0.038784027099609375, -0.03646659851074219, -0.034149169921875, -0.03183174133300781, -0.029514312744140625, -0.027196884155273438, -0.02487945556640625, -0.022562026977539062, -0.020244598388671875, -0.017927169799804688, -0.0156097412109375, -0.013292312622070312, -0.010974884033203125, -0.008657455444335938, -0.00634002685546875, -0.0040225982666015625, -0.001705169677734375, 0.0006122589111328125, 0.0029296875, 0.0052471160888671875, 0.007564544677734375, 0.009881973266601562, 0.01219940185546875, 0.014516830444335938, 0.016834259033203125, 0.019151687622070312, 0.0214691162109375, 0.023786544799804688, 0.026103973388671875, 0.028421401977539062, 0.03073883056640625, 0.03305625915527344, 0.035373687744140625, 0.03769111633300781, 0.040008544921875, 0.04232597351074219, 0.044643402099609375, 0.04696083068847656, 0.04927825927734375, 0.05159568786621094, 0.053913116455078125, 0.05623054504394531, 0.0585479736328125, 0.06086540222167969, 0.06318283081054688, 0.06550025939941406, 0.06781768798828125, 0.07013511657714844, 0.07245254516601562, 0.07476997375488281, 0.07708740234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 6.0, 6.0, 13.0, 26.0, 42.0, 75.0, 154.0, 294.0, 583.0, 1470.0, 3704.0, 11461.0, 49159.0, 605717.0, 3405345.0, 90489.0, 16936.0, 5258.0, 1930.0, 814.0, 377.0, 192.0, 89.0, 30.0, 22.0, 20.0, 8.0, 9.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3195762634277344, -0.30931854248046875, -0.2990608215332031, -0.2888031005859375, -0.2785453796386719, -0.26828765869140625, -0.2580299377441406, -0.247772216796875, -0.23751449584960938, -0.22725677490234375, -0.21699905395507812, -0.2067413330078125, -0.19648361206054688, -0.18622589111328125, -0.17596817016601562, -0.16571044921875, -0.15545272827148438, -0.14519500732421875, -0.13493728637695312, -0.1246795654296875, -0.11442184448242188, -0.10416412353515625, -0.09390640258789062, -0.083648681640625, -0.07339096069335938, -0.06313323974609375, -0.052875518798828125, -0.0426177978515625, -0.032360076904296875, -0.02210235595703125, -0.011844635009765625, -0.0015869140625, 0.008670806884765625, 0.01892852783203125, 0.029186248779296875, 0.0394439697265625, 0.049701690673828125, 0.05995941162109375, 0.07021713256835938, 0.080474853515625, 0.09073257446289062, 0.10099029541015625, 0.11124801635742188, 0.1215057373046875, 0.13176345825195312, 0.14202117919921875, 0.15227890014648438, 0.16253662109375, 0.17279434204101562, 0.18305206298828125, 0.19330978393554688, 0.2035675048828125, 0.21382522583007812, 0.22408294677734375, 0.23434066772460938, 0.244598388671875, 0.2548561096191406, 0.26511383056640625, 0.2753715515136719, 0.2856292724609375, 0.2958869934082031, 0.30614471435546875, 0.3164024353027344, 0.32666015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 7.0, 4.0, 7.0, 16.0, 20.0, 30.0, 30.0, 47.0, 91.0, 158.0, 325.0, 1703.0, 913.0, 289.0, 117.0, 95.0, 61.0, 37.0, 28.0, 21.0, 12.0, 7.0, 11.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06473255157470703, -0.06232643127441406, -0.059920310974121094, -0.057514190673828125, -0.055108070373535156, -0.05270195007324219, -0.05029582977294922, -0.04788970947265625, -0.04548358917236328, -0.04307746887207031, -0.040671348571777344, -0.038265228271484375, -0.035859107971191406, -0.03345298767089844, -0.03104686737060547, -0.0286407470703125, -0.02623462677001953, -0.023828506469726562, -0.021422386169433594, -0.019016265869140625, -0.016610145568847656, -0.014204025268554688, -0.011797904968261719, -0.00939178466796875, -0.006985664367675781, -0.0045795440673828125, -0.0021734237670898438, 0.000232696533203125, 0.0026388168334960938, 0.0050449371337890625, 0.007451057434082031, 0.009857177734375, 0.012263298034667969, 0.014669418334960938, 0.017075538635253906, 0.019481658935546875, 0.021887779235839844, 0.024293899536132812, 0.02670001983642578, 0.02910614013671875, 0.03151226043701172, 0.03391838073730469, 0.036324501037597656, 0.038730621337890625, 0.041136741638183594, 0.04354286193847656, 0.04594898223876953, 0.0483551025390625, 0.05076122283935547, 0.05316734313964844, 0.055573463439941406, 0.057979583740234375, 0.060385704040527344, 0.06279182434082031, 0.06519794464111328, 0.06760406494140625, 0.07001018524169922, 0.07241630554199219, 0.07482242584228516, 0.07722854614257812, 0.0796346664428711, 0.08204078674316406, 0.08444690704345703, 0.08685302734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 8.0, 19.0, 154.0, 569.0, 229.0, 32.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7553646564483643, -2.6998515129089355, -2.644338369369507, -2.588825225830078, -2.5333120822906494, -2.4777989387512207, -2.422285795211792, -2.3667726516723633, -2.3112595081329346, -2.255746364593506, -2.200233221054077, -2.1447200775146484, -2.0892069339752197, -2.033693790435791, -1.9781806468963623, -1.9226675033569336, -1.8671542406082153, -1.8116410970687866, -1.756127953529358, -1.7006148099899292, -1.6451016664505005, -1.5895885229110718, -1.5340752601623535, -1.4785621166229248, -1.423048973083496, -1.3675358295440674, -1.3120226860046387, -1.25650954246521, -1.2009963989257812, -1.1454832553863525, -1.0899701118469238, -1.0344569683074951, -0.9789438247680664, -0.9234306812286377, -0.867917537689209, -0.8124043941497803, -0.7568912506103516, -0.7013781070709229, -0.6458649039268494, -0.5903517603874207, -0.5348386168479919, -0.47932547330856323, -0.4238123297691345, -0.3682991564273834, -0.3127860128879547, -0.257272869348526, -0.2017596960067749, -0.1462465524673462, -0.09073340892791748, -0.03522025793790817, 0.020292893052101135, 0.07580605149269104, 0.13131919503211975, 0.18683233857154846, 0.24234551191329956, 0.29785865545272827, 0.353371798992157, 0.4088849425315857, 0.4643980860710144, 0.5199112892150879, 0.5754244327545166, 0.6309375762939453, 0.686450719833374, 0.7419638633728027, 0.7974770069122314]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 6.0, 9.0, 8.0, 14.0, 16.0, 21.0, 32.0, 28.0, 15.0, 34.0, 36.0, 48.0, 39.0, 24.0, 42.0, 32.0, 58.0, 42.0, 34.0, 51.0, 45.0, 45.0, 39.0, 31.0, 29.0, 29.0, 27.0, 23.0, 18.0, 18.0, 14.0, 16.0, 12.0, 9.0, 11.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2598996162414551, -0.2520107626914978, -0.24412190914154053, -0.23623305559158325, -0.22834420204162598, -0.2204553484916687, -0.21256649494171143, -0.20467764139175415, -0.19678878784179688, -0.1888999342918396, -0.18101108074188232, -0.17312222719192505, -0.16523337364196777, -0.1573445200920105, -0.14945566654205322, -0.14156681299209595, -0.13367794454097748, -0.1257890909910202, -0.11790023744106293, -0.11001138389110565, -0.10212253034114838, -0.0942336767911911, -0.08634481579065323, -0.07845596224069595, -0.07056710869073868, -0.0626782551407814, -0.05478940159082413, -0.04690054431557655, -0.03901169076561928, -0.031122837215662003, -0.02323397994041443, -0.015345126390457153, -0.007456272840499878, 0.0004325816407799721, 0.008321436122059822, 0.016210291534662247, 0.024099145084619522, 0.0319879986345768, 0.03987685590982437, 0.04776570945978165, 0.05565456300973892, 0.0635434165596962, 0.07143227010965347, 0.07932113111019135, 0.08720998466014862, 0.0950988382101059, 0.10298769176006317, 0.11087654531002045, 0.11876539885997772, 0.126654252409935, 0.13454310595989227, 0.14243195950984955, 0.15032081305980682, 0.1582096666097641, 0.16609853506088257, 0.17398738861083984, 0.18187624216079712, 0.1897650957107544, 0.19765394926071167, 0.20554280281066895, 0.21343165636062622, 0.2213205099105835, 0.22920936346054077, 0.23709821701049805, 0.24498707056045532]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 8.0, 9.0, 17.0, 22.0, 32.0, 31.0, 56.0, 74.0, 106.0, 129.0, 182.0, 225.0, 324.0, 579.0, 869.0, 1458.0, 2628.0, 5153.0, 11095.0, 25648.0, 66025.0, 193083.0, 409245.0, 208730.0, 71008.0, 27548.0, 11653.0, 5515.0, 2819.0, 1518.0, 897.0, 575.0, 365.0, 256.0, 171.0, 130.0, 106.0, 62.0, 45.0, 38.0, 28.0, 29.0, 17.0, 13.0, 10.0, 4.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.189453125, -0.18396759033203125, -0.1784820556640625, -0.17299652099609375, -0.167510986328125, -0.16202545166015625, -0.1565399169921875, -0.15105438232421875, -0.14556884765625, -0.14008331298828125, -0.1345977783203125, -0.12911224365234375, -0.123626708984375, -0.11814117431640625, -0.1126556396484375, -0.10717010498046875, -0.1016845703125, -0.09619903564453125, -0.0907135009765625, -0.08522796630859375, -0.079742431640625, -0.07425689697265625, -0.0687713623046875, -0.06328582763671875, -0.05780029296875, -0.05231475830078125, -0.0468292236328125, -0.04134368896484375, -0.035858154296875, -0.03037261962890625, -0.0248870849609375, -0.01940155029296875, -0.013916015625, -0.00843048095703125, -0.0029449462890625, 0.00254058837890625, 0.008026123046875, 0.01351165771484375, 0.0189971923828125, 0.02448272705078125, 0.02996826171875, 0.03545379638671875, 0.0409393310546875, 0.04642486572265625, 0.051910400390625, 0.05739593505859375, 0.0628814697265625, 0.06836700439453125, 0.0738525390625, 0.07933807373046875, 0.0848236083984375, 0.09030914306640625, 0.095794677734375, 0.10128021240234375, 0.1067657470703125, 0.11225128173828125, 0.11773681640625, 0.12322235107421875, 0.1287078857421875, 0.13419342041015625, 0.139678955078125, 0.14516448974609375, 0.1506500244140625, 0.15613555908203125, 0.16162109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 16.0, 21.0, 19.0, 39.0, 59.0, 65.0, 76.0, 103.0, 102.0, 103.0, 86.0, 89.0, 59.0, 57.0, 29.0, 12.0, 13.0, 14.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07379150390625, -0.07160377502441406, -0.06941604614257812, -0.06722831726074219, -0.06504058837890625, -0.06285285949707031, -0.060665130615234375, -0.05847740173339844, -0.0562896728515625, -0.05410194396972656, -0.051914215087890625, -0.04972648620605469, -0.04753875732421875, -0.04535102844238281, -0.043163299560546875, -0.04097557067871094, -0.038787841796875, -0.03660011291503906, -0.034412384033203125, -0.03222465515136719, -0.03003692626953125, -0.027849197387695312, -0.025661468505859375, -0.023473739624023438, -0.0212860107421875, -0.019098281860351562, -0.016910552978515625, -0.014722824096679688, -0.01253509521484375, -0.010347366333007812, -0.008159637451171875, -0.0059719085693359375, -0.0037841796875, -0.0015964508056640625, 0.000591278076171875, 0.0027790069580078125, 0.00496673583984375, 0.0071544647216796875, 0.009342193603515625, 0.011529922485351562, 0.0137176513671875, 0.015905380249023438, 0.018093109130859375, 0.020280838012695312, 0.02246856689453125, 0.024656295776367188, 0.026844024658203125, 0.029031753540039062, 0.031219482421875, 0.03340721130371094, 0.035594940185546875, 0.03778266906738281, 0.03997039794921875, 0.04215812683105469, 0.044345855712890625, 0.04653358459472656, 0.0487213134765625, 0.05090904235839844, 0.053096771240234375, 0.05528450012207031, 0.05747222900390625, 0.05965995788574219, 0.061847686767578125, 0.06403541564941406, 0.06622314453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 12.0, 18.0, 28.0, 30.0, 61.0, 84.0, 122.0, 228.0, 410.0, 805.0, 2125.0, 8448.0, 64309.0, 685742.0, 257273.0, 22138.0, 4105.0, 1251.0, 585.0, 313.0, 169.0, 96.0, 62.0, 39.0, 33.0, 18.0, 14.0, 10.0, 6.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.3442878723144531, -0.33188629150390625, -0.3194847106933594, -0.3070831298828125, -0.2946815490722656, -0.28227996826171875, -0.2698783874511719, -0.257476806640625, -0.24507522583007812, -0.23267364501953125, -0.22027206420898438, -0.2078704833984375, -0.19546890258789062, -0.18306732177734375, -0.17066574096679688, -0.15826416015625, -0.14586257934570312, -0.13346099853515625, -0.12105941772460938, -0.1086578369140625, -0.09625625610351562, -0.08385467529296875, -0.07145309448242188, -0.059051513671875, -0.046649932861328125, -0.03424835205078125, -0.021846771240234375, -0.0094451904296875, 0.002956390380859375, 0.01535797119140625, 0.027759552001953125, 0.0401611328125, 0.052562713623046875, 0.06496429443359375, 0.07736587524414062, 0.0897674560546875, 0.10216903686523438, 0.11457061767578125, 0.12697219848632812, 0.139373779296875, 0.15177536010742188, 0.16417694091796875, 0.17657852172851562, 0.1889801025390625, 0.20138168334960938, 0.21378326416015625, 0.22618484497070312, 0.23858642578125, 0.2509880065917969, 0.26338958740234375, 0.2757911682128906, 0.2881927490234375, 0.3005943298339844, 0.31299591064453125, 0.3253974914550781, 0.337799072265625, 0.3502006530761719, 0.36260223388671875, 0.3750038146972656, 0.3874053955078125, 0.3998069763183594, 0.41220855712890625, 0.4246101379394531, 0.43701171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 7.0, 10.0, 23.0, 28.0, 41.0, 50.0, 38.0, 53.0, 55.0, 60.0, 72.0, 76.0, 77.0, 64.0, 75.0, 48.0, 43.0, 30.0, 32.0, 33.0, 15.0, 8.0, 13.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.2376537322998047, -0.22835922241210938, -0.21906471252441406, -0.20977020263671875, -0.20047569274902344, -0.19118118286132812, -0.1818866729736328, -0.1725921630859375, -0.1632976531982422, -0.15400314331054688, -0.14470863342285156, -0.13541412353515625, -0.12611961364746094, -0.11682510375976562, -0.10753059387207031, -0.098236083984375, -0.08894157409667969, -0.07964706420898438, -0.07035255432128906, -0.06105804443359375, -0.05176353454589844, -0.042469024658203125, -0.03317451477050781, -0.0238800048828125, -0.014585494995117188, -0.005290985107421875, 0.0040035247802734375, 0.01329803466796875, 0.022592544555664062, 0.031887054443359375, 0.04118156433105469, 0.05047607421875, 0.05977058410644531, 0.06906509399414062, 0.07835960388183594, 0.08765411376953125, 0.09694862365722656, 0.10624313354492188, 0.11553764343261719, 0.1248321533203125, 0.1341266632080078, 0.14342117309570312, 0.15271568298339844, 0.16201019287109375, 0.17130470275878906, 0.18059921264648438, 0.1898937225341797, 0.199188232421875, 0.2084827423095703, 0.21777725219726562, 0.22707176208496094, 0.23636627197265625, 0.24566078186035156, 0.2549552917480469, 0.2642498016357422, 0.2735443115234375, 0.2828388214111328, 0.2921333312988281, 0.30142784118652344, 0.31072235107421875, 0.32001686096191406, 0.3293113708496094, 0.3386058807373047, 0.347900390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 17.0, 10.0, 23.0, 23.0, 36.0, 57.0, 76.0, 97.0, 189.0, 300.0, 536.0, 1075.0, 1975.0, 4657.0, 12494.0, 47591.0, 345682.0, 537505.0, 68983.0, 16321.0, 5626.0, 2496.0, 1201.0, 627.0, 335.0, 198.0, 117.0, 96.0, 67.0, 37.0, 21.0, 17.0, 16.0, 10.0, 9.0, 4.0, 12.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1746826171875, -0.17009925842285156, -0.16551589965820312, -0.1609325408935547, -0.15634918212890625, -0.1517658233642578, -0.14718246459960938, -0.14259910583496094, -0.1380157470703125, -0.13343238830566406, -0.12884902954101562, -0.12426567077636719, -0.11968231201171875, -0.11509895324707031, -0.11051559448242188, -0.10593223571777344, -0.101348876953125, -0.09676551818847656, -0.09218215942382812, -0.08759880065917969, -0.08301544189453125, -0.07843208312988281, -0.07384872436523438, -0.06926536560058594, -0.0646820068359375, -0.06009864807128906, -0.055515289306640625, -0.05093193054199219, -0.04634857177734375, -0.04176521301269531, -0.037181854248046875, -0.03259849548339844, -0.02801513671875, -0.023431777954101562, -0.018848419189453125, -0.014265060424804688, -0.00968170166015625, -0.0050983428955078125, -0.000514984130859375, 0.0040683746337890625, 0.0086517333984375, 0.013235092163085938, 0.017818450927734375, 0.022401809692382812, 0.02698516845703125, 0.03156852722167969, 0.036151885986328125, 0.04073524475097656, 0.045318603515625, 0.04990196228027344, 0.054485321044921875, 0.05906867980957031, 0.06365203857421875, 0.06823539733886719, 0.07281875610351562, 0.07740211486816406, 0.0819854736328125, 0.08656883239746094, 0.09115219116210938, 0.09573554992675781, 0.10031890869140625, 0.10490226745605469, 0.10948562622070312, 0.11406898498535156, 0.11865234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 11.0, 13.0, 14.0, 13.0, 29.0, 33.0, 44.0, 55.0, 71.0, 82.0, 84.0, 82.0, 93.0, 66.0, 74.0, 50.0, 42.0, 31.0, 13.0, 26.0, 17.0, 10.0, 8.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9114227294921875e-05, -4.783552139997482e-05, -4.655681550502777e-05, -4.527810961008072e-05, -4.399940371513367e-05, -4.2720697820186615e-05, -4.144199192523956e-05, -4.016328603029251e-05, -3.888458013534546e-05, -3.760587424039841e-05, -3.6327168345451355e-05, -3.50484624505043e-05, -3.376975655555725e-05, -3.24910506606102e-05, -3.121234476566315e-05, -2.9933638870716095e-05, -2.8654932975769043e-05, -2.737622708082199e-05, -2.609752118587494e-05, -2.4818815290927887e-05, -2.3540109395980835e-05, -2.2261403501033783e-05, -2.098269760608673e-05, -1.970399171113968e-05, -1.8425285816192627e-05, -1.7146579921245575e-05, -1.5867874026298523e-05, -1.4589168131351471e-05, -1.3310462236404419e-05, -1.2031756341457367e-05, -1.0753050446510315e-05, -9.474344551563263e-06, -8.195638656616211e-06, -6.916932761669159e-06, -5.638226866722107e-06, -4.359520971775055e-06, -3.080815076828003e-06, -1.802109181880951e-06, -5.234032869338989e-07, 7.553026080131531e-07, 2.034008502960205e-06, 3.312714397907257e-06, 4.591420292854309e-06, 5.870126187801361e-06, 7.148832082748413e-06, 8.427537977695465e-06, 9.706243872642517e-06, 1.0984949767589569e-05, 1.2263655662536621e-05, 1.3542361557483673e-05, 1.4821067452430725e-05, 1.6099773347377777e-05, 1.737847924232483e-05, 1.865718513727188e-05, 1.9935891032218933e-05, 2.1214596927165985e-05, 2.2493302822113037e-05, 2.377200871706009e-05, 2.505071461200714e-05, 2.6329420506954193e-05, 2.7608126401901245e-05, 2.8886832296848297e-05, 3.016553819179535e-05, 3.14442440867424e-05, 3.272294998168945e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 14.0, 13.0, 21.0, 27.0, 74.0, 108.0, 172.0, 354.0, 691.0, 1867.0, 6039.0, 29380.0, 381784.0, 577290.0, 39444.0, 7369.0, 2154.0, 862.0, 381.0, 206.0, 98.0, 72.0, 38.0, 28.0, 13.0, 8.0, 10.0, 5.0, 3.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.217529296875, -0.21114540100097656, -0.20476150512695312, -0.1983776092529297, -0.19199371337890625, -0.1856098175048828, -0.17922592163085938, -0.17284202575683594, -0.1664581298828125, -0.16007423400878906, -0.15369033813476562, -0.1473064422607422, -0.14092254638671875, -0.1345386505126953, -0.12815475463867188, -0.12177085876464844, -0.115386962890625, -0.10900306701660156, -0.10261917114257812, -0.09623527526855469, -0.08985137939453125, -0.08346748352050781, -0.07708358764648438, -0.07069969177246094, -0.0643157958984375, -0.05793190002441406, -0.051548004150390625, -0.04516410827636719, -0.03878021240234375, -0.03239631652832031, -0.026012420654296875, -0.019628524780273438, -0.01324462890625, -0.0068607330322265625, -0.000476837158203125, 0.0059070587158203125, 0.01229095458984375, 0.018674850463867188, 0.025058746337890625, 0.03144264221191406, 0.0378265380859375, 0.04421043395996094, 0.050594329833984375, 0.05697822570800781, 0.06336212158203125, 0.06974601745605469, 0.07612991333007812, 0.08251380920410156, 0.088897705078125, 0.09528160095214844, 0.10166549682617188, 0.10804939270019531, 0.11443328857421875, 0.12081718444824219, 0.12720108032226562, 0.13358497619628906, 0.1399688720703125, 0.14635276794433594, 0.15273666381835938, 0.1591205596923828, 0.16550445556640625, 0.1718883514404297, 0.17827224731445312, 0.18465614318847656, 0.1910400390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 11.0, 6.0, 6.0, 6.0, 16.0, 14.0, 26.0, 26.0, 26.0, 45.0, 80.0, 80.0, 105.0, 95.0, 110.0, 78.0, 59.0, 41.0, 40.0, 18.0, 27.0, 16.0, 8.0, 6.0, 10.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.08046150207519531, -0.07779312133789062, -0.07512474060058594, -0.07245635986328125, -0.06978797912597656, -0.06711959838867188, -0.06445121765136719, -0.0617828369140625, -0.05911445617675781, -0.056446075439453125, -0.05377769470214844, -0.05110931396484375, -0.04844093322753906, -0.045772552490234375, -0.04310417175292969, -0.040435791015625, -0.03776741027832031, -0.035099029541015625, -0.03243064880371094, -0.02976226806640625, -0.027093887329101562, -0.024425506591796875, -0.021757125854492188, -0.0190887451171875, -0.016420364379882812, -0.013751983642578125, -0.011083602905273438, -0.00841522216796875, -0.0057468414306640625, -0.003078460693359375, -0.0004100799560546875, 0.00225830078125, 0.0049266815185546875, 0.007595062255859375, 0.010263442993164062, 0.01293182373046875, 0.015600204467773438, 0.018268585205078125, 0.020936965942382812, 0.0236053466796875, 0.026273727416992188, 0.028942108154296875, 0.03161048889160156, 0.03427886962890625, 0.03694725036621094, 0.039615631103515625, 0.04228401184082031, 0.044952392578125, 0.04762077331542969, 0.050289154052734375, 0.05295753479003906, 0.05562591552734375, 0.05829429626464844, 0.060962677001953125, 0.06363105773925781, 0.0662994384765625, 0.06896781921386719, 0.07163619995117188, 0.07430458068847656, 0.07697296142578125, 0.07964134216308594, 0.08230972290039062, 0.08497810363769531, 0.087646484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 10.0, 19.0, 25.0, 53.0, 89.0, 139.0, 149.0, 151.0, 129.0, 86.0, 63.0, 31.0, 21.0, 7.0, 9.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.450547218322754, -1.4065881967544556, -1.3626291751861572, -1.3186701536178589, -1.2747111320495605, -1.2307521104812622, -1.1867930889129639, -1.1428340673446655, -1.0988750457763672, -1.0549160242080688, -1.0109570026397705, -0.9669979810714722, -0.9230389595031738, -0.8790799379348755, -0.8351209163665771, -0.7911618947982788, -0.7472028136253357, -0.7032437920570374, -0.659284770488739, -0.6153257489204407, -0.5713667273521423, -0.527407705783844, -0.48344865441322327, -0.4394896328449249, -0.3955306112766266, -0.35157158970832825, -0.3076125681400299, -0.2636535167694092, -0.21969451010227203, -0.1757354885339737, -0.13177645206451416, -0.08781743049621582, -0.04385840892791748, 0.00010061636567115784, 0.044059641659259796, 0.08801867067813873, 0.13197769224643707, 0.1759367138147354, 0.21989575028419495, 0.2638547718524933, 0.3078137934207916, 0.35177281498908997, 0.3957318365573883, 0.43969088792800903, 0.4836499094963074, 0.5276089310646057, 0.571567952632904, 0.6155269742012024, 0.6594859957695007, 0.7034450173377991, 0.7474040389060974, 0.7913630604743958, 0.8353220820426941, 0.8792811036109924, 0.9232401847839355, 0.9671992063522339, 1.0111582279205322, 1.0551172494888306, 1.099076271057129, 1.1430352926254272, 1.1869943141937256, 1.230953335762024, 1.2749123573303223, 1.3188713788986206, 1.362830400466919]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 10.0, 14.0, 12.0, 14.0, 16.0, 22.0, 20.0, 21.0, 26.0, 29.0, 39.0, 32.0, 31.0, 39.0, 33.0, 40.0, 32.0, 44.0, 50.0, 38.0, 43.0, 41.0, 38.0, 42.0, 31.0, 33.0, 36.0, 18.0, 12.0, 20.0, 22.0, 13.0, 15.0, 12.0, 9.0, 14.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0191164016723633, -0.9862051010131836, -0.9532938599586487, -0.9203826189041138, -0.8874713182449341, -0.8545600175857544, -0.8216487765312195, -0.7887375354766846, -0.7558262348175049, -0.7229149341583252, -0.6900036931037903, -0.6570924520492554, -0.6241811513900757, -0.591269850730896, -0.5583586096763611, -0.5254473686218262, -0.4925360679626465, -0.4596247971057892, -0.4267135262489319, -0.3938022553920746, -0.3608909845352173, -0.32797971367836, -0.2950684428215027, -0.2621571719646454, -0.22924590110778809, -0.1963346302509308, -0.1634233593940735, -0.1305120885372162, -0.09760081768035889, -0.06468954682350159, -0.03177827596664429, 0.0011329948902130127, 0.03404414653778076, 0.06695541739463806, 0.09986668825149536, 0.13277795910835266, 0.16568922996520996, 0.19860050082206726, 0.23151177167892456, 0.26442304253578186, 0.29733431339263916, 0.33024558424949646, 0.36315685510635376, 0.39606812596321106, 0.42897939682006836, 0.46189066767692566, 0.49480193853378296, 0.5277131795883179, 0.5606244802474976, 0.5935357809066772, 0.6264470219612122, 0.6593582630157471, 0.6922695636749268, 0.7251808643341064, 0.7580921053886414, 0.7910033464431763, 0.823914647102356, 0.8568259477615356, 0.8897371888160706, 0.9226484298706055, 0.9555597305297852, 0.9884710311889648, 1.0213823318481445, 1.0542935132980347, 1.0872048139572144]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 14.0, 7.0, 12.0, 19.0, 26.0, 47.0, 67.0, 153.0, 239.0, 531.0, 1253.0, 3712.0, 18489.0, 440281.0, 3693445.0, 28827.0, 4653.0, 1349.0, 563.0, 260.0, 135.0, 61.0, 50.0, 28.0, 20.0, 12.0, 9.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.494873046875, -0.4799232482910156, -0.46497344970703125, -0.4500236511230469, -0.4350738525390625, -0.4201240539550781, -0.40517425537109375, -0.3902244567871094, -0.375274658203125, -0.3603248596191406, -0.34537506103515625, -0.3304252624511719, -0.3154754638671875, -0.3005256652832031, -0.28557586669921875, -0.2706260681152344, -0.25567626953125, -0.24072647094726562, -0.22577667236328125, -0.21082687377929688, -0.1958770751953125, -0.18092727661132812, -0.16597747802734375, -0.15102767944335938, -0.136077880859375, -0.12112808227539062, -0.10617828369140625, -0.09122848510742188, -0.0762786865234375, -0.061328887939453125, -0.04637908935546875, -0.031429290771484375, -0.0164794921875, -0.001529693603515625, 0.01342010498046875, 0.028369903564453125, 0.0433197021484375, 0.058269500732421875, 0.07321929931640625, 0.08816909790039062, 0.103118896484375, 0.11806869506835938, 0.13301849365234375, 0.14796829223632812, 0.1629180908203125, 0.17786788940429688, 0.19281768798828125, 0.20776748657226562, 0.22271728515625, 0.23766708374023438, 0.25261688232421875, 0.2675666809082031, 0.2825164794921875, 0.2974662780761719, 0.31241607666015625, 0.3273658752441406, 0.342315673828125, 0.3572654724121094, 0.37221527099609375, 0.3871650695800781, 0.4021148681640625, 0.4170646667480469, 0.43201446533203125, 0.4469642639160156, 0.4619140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 10.0, 11.0, 11.0, 12.0, 27.0, 37.0, 55.0, 52.0, 71.0, 80.0, 78.0, 86.0, 96.0, 76.0, 81.0, 57.0, 50.0, 37.0, 21.0, 16.0, 11.0, 4.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.0672616958618164, -0.06518745422363281, -0.06311321258544922, -0.061038970947265625, -0.05896472930908203, -0.05689048767089844, -0.054816246032714844, -0.05274200439453125, -0.050667762756347656, -0.04859352111816406, -0.04651927947998047, -0.044445037841796875, -0.04237079620361328, -0.04029655456542969, -0.038222312927246094, -0.0361480712890625, -0.034073829650878906, -0.03199958801269531, -0.02992534637451172, -0.027851104736328125, -0.02577686309814453, -0.023702621459960938, -0.021628379821777344, -0.01955413818359375, -0.017479896545410156, -0.015405654907226562, -0.013331413269042969, -0.011257171630859375, -0.009182929992675781, -0.0071086883544921875, -0.005034446716308594, -0.002960205078125, -0.0008859634399414062, 0.0011882781982421875, 0.0032625198364257812, 0.005336761474609375, 0.007411003112792969, 0.009485244750976562, 0.011559486389160156, 0.01363372802734375, 0.015707969665527344, 0.017782211303710938, 0.01985645294189453, 0.021930694580078125, 0.02400493621826172, 0.026079177856445312, 0.028153419494628906, 0.0302276611328125, 0.032301902770996094, 0.03437614440917969, 0.03645038604736328, 0.038524627685546875, 0.04059886932373047, 0.04267311096191406, 0.044747352600097656, 0.04682159423828125, 0.048895835876464844, 0.05097007751464844, 0.05304431915283203, 0.055118560791015625, 0.05719280242919922, 0.05926704406738281, 0.061341285705566406, 0.06341552734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 11.0, 16.0, 40.0, 64.0, 153.0, 397.0, 1304.0, 5820.0, 45254.0, 3848256.0, 275038.0, 14260.0, 2510.0, 686.0, 240.0, 97.0, 58.0, 28.0, 14.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.409912109375, -0.3933601379394531, -0.37680816650390625, -0.3602561950683594, -0.3437042236328125, -0.3271522521972656, -0.31060028076171875, -0.2940483093261719, -0.277496337890625, -0.2609443664550781, -0.24439239501953125, -0.22784042358398438, -0.2112884521484375, -0.19473648071289062, -0.17818450927734375, -0.16163253784179688, -0.14508056640625, -0.12852859497070312, -0.11197662353515625, -0.09542465209960938, -0.0788726806640625, -0.062320709228515625, -0.04576873779296875, -0.029216766357421875, -0.012664794921875, 0.003887176513671875, 0.02043914794921875, 0.036991119384765625, 0.0535430908203125, 0.07009506225585938, 0.08664703369140625, 0.10319900512695312, 0.1197509765625, 0.13630294799804688, 0.15285491943359375, 0.16940689086914062, 0.1859588623046875, 0.20251083374023438, 0.21906280517578125, 0.23561477661132812, 0.252166748046875, 0.2687187194824219, 0.28527069091796875, 0.3018226623535156, 0.3183746337890625, 0.3349266052246094, 0.35147857666015625, 0.3680305480957031, 0.38458251953125, 0.4011344909667969, 0.41768646240234375, 0.4342384338378906, 0.4507904052734375, 0.4673423767089844, 0.48389434814453125, 0.5004463195800781, 0.516998291015625, 0.5335502624511719, 0.5501022338867188, 0.5666542053222656, 0.5832061767578125, 0.5997581481933594, 0.6163101196289062, 0.6328620910644531, 0.6494140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 8.0, 10.0, 14.0, 8.0, 21.0, 30.0, 32.0, 66.0, 124.0, 187.0, 609.0, 2155.0, 382.0, 169.0, 88.0, 59.0, 39.0, 18.0, 17.0, 7.0, 3.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.0759744644165039, -0.07309150695800781, -0.07020854949951172, -0.06732559204101562, -0.06444263458251953, -0.06155967712402344, -0.058676719665527344, -0.05579376220703125, -0.052910804748535156, -0.05002784729003906, -0.04714488983154297, -0.044261932373046875, -0.04137897491455078, -0.03849601745605469, -0.035613059997558594, -0.0327301025390625, -0.029847145080566406, -0.026964187622070312, -0.02408123016357422, -0.021198272705078125, -0.01831531524658203, -0.015432357788085938, -0.012549400329589844, -0.00966644287109375, -0.006783485412597656, -0.0039005279541015625, -0.0010175704956054688, 0.001865386962890625, 0.004748344421386719, 0.0076313018798828125, 0.010514259338378906, 0.013397216796875, 0.016280174255371094, 0.019163131713867188, 0.02204608917236328, 0.024929046630859375, 0.02781200408935547, 0.030694961547851562, 0.033577919006347656, 0.03646087646484375, 0.039343833923339844, 0.04222679138183594, 0.04510974884033203, 0.047992706298828125, 0.05087566375732422, 0.05375862121582031, 0.056641578674316406, 0.0595245361328125, 0.062407493591308594, 0.06529045104980469, 0.06817340850830078, 0.07105636596679688, 0.07393932342529297, 0.07682228088378906, 0.07970523834228516, 0.08258819580078125, 0.08547115325927734, 0.08835411071777344, 0.09123706817626953, 0.09412002563476562, 0.09700298309326172, 0.09988594055175781, 0.1027688980102539, 0.10565185546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 46.0, 115.0, 291.0, 356.0, 141.0, 35.0, 12.0, 6.0, 0.0, 1.0, 2.0], "bins": [-1.8550047874450684, -1.8219696283340454, -1.788934588432312, -1.755899429321289, -1.7228642702102661, -1.6898291110992432, -1.6567940711975098, -1.6237589120864868, -1.5907237529754639, -1.557688593864441, -1.5246535539627075, -1.4916183948516846, -1.4585832357406616, -1.4255480766296387, -1.3925130367279053, -1.3594778776168823, -1.3264427185058594, -1.2934075593948364, -1.260372519493103, -1.22733736038208, -1.1943022012710571, -1.1612670421600342, -1.1282320022583008, -1.0951968431472778, -1.0621618032455444, -1.0291266441345215, -0.9960915446281433, -0.9630564451217651, -0.9300212860107422, -0.896986186504364, -0.8639510869979858, -0.8309159278869629, -0.7978808283805847, -0.7648457288742065, -0.7318105697631836, -0.6987754702568054, -0.6657403111457825, -0.6327052116394043, -0.5996700525283813, -0.5666349530220032, -0.533599853515625, -0.5005647540092468, -0.4675295948982239, -0.4344944953918457, -0.40145933628082275, -0.3684242367744446, -0.335389107465744, -0.30235397815704346, -0.2693188190460205, -0.23628368973731995, -0.20324856042861938, -0.17021344602108002, -0.13717831671237946, -0.1041431874036789, -0.07110807299613953, -0.038072943687438965, -0.005037814378738403, 0.02799731120467186, 0.06103243678808212, 0.09406755864620209, 0.12710268795490265, 0.1601378172636032, 0.19317293167114258, 0.22620806097984314, 0.2592431902885437]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 8.0, 25.0, 13.0, 16.0, 19.0, 29.0, 20.0, 27.0, 46.0, 33.0, 35.0, 51.0, 46.0, 46.0, 52.0, 52.0, 57.0, 50.0, 44.0, 45.0, 31.0, 37.0, 33.0, 29.0, 20.0, 19.0, 16.0, 14.0, 11.0, 10.0, 10.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2625809907913208, -0.25440624356269836, -0.24623146653175354, -0.2380567193031311, -0.22988195717334747, -0.22170719504356384, -0.2135324329137802, -0.20535767078399658, -0.19718292355537415, -0.18900816142559052, -0.18083339929580688, -0.17265865206718445, -0.16448388993740082, -0.1563091278076172, -0.14813436567783356, -0.13995960354804993, -0.1317848414182663, -0.12361007928848267, -0.11543532460927963, -0.107260562479496, -0.09908580780029297, -0.09091104567050934, -0.08273628354072571, -0.07456152141094208, -0.06638676673173904, -0.05821200832724571, -0.05003724992275238, -0.04186248779296875, -0.03368772938847542, -0.025512970983982086, -0.017338208854198456, -0.009163450449705124, -0.000988692045211792, 0.0071860672906041145, 0.015360826626420021, 0.023535586893558502, 0.031710345298051834, 0.039885103702545166, 0.048059865832328796, 0.05623462423682213, 0.06440938264131546, 0.07258414477109909, 0.08075889945030212, 0.08893366158008575, 0.09710842370986938, 0.10528317838907242, 0.11345794051885605, 0.12163269519805908, 0.1298074573278427, 0.13798221945762634, 0.14615698158740997, 0.1543317437171936, 0.16250649094581604, 0.17068125307559967, 0.1788560152053833, 0.18703077733516693, 0.19520553946495056, 0.2033803015947342, 0.21155506372451782, 0.21972981095314026, 0.2279045730829239, 0.23607933521270752, 0.24425409734249115, 0.2524288594722748, 0.2606036067008972]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 12.0, 12.0, 11.0, 31.0, 37.0, 67.0, 126.0, 191.0, 358.0, 620.0, 1297.0, 3346.0, 9480.0, 33091.0, 156531.0, 555692.0, 223254.0, 45103.0, 12038.0, 3908.0, 1608.0, 755.0, 384.0, 229.0, 145.0, 87.0, 46.0, 30.0, 26.0, 13.0, 14.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.26387977600097656, -0.2557868957519531, -0.2476940155029297, -0.23960113525390625, -0.2315082550048828, -0.22341537475585938, -0.21532249450683594, -0.2072296142578125, -0.19913673400878906, -0.19104385375976562, -0.1829509735107422, -0.17485809326171875, -0.1667652130126953, -0.15867233276367188, -0.15057945251464844, -0.142486572265625, -0.13439369201660156, -0.12630081176757812, -0.11820793151855469, -0.11011505126953125, -0.10202217102050781, -0.09392929077148438, -0.08583641052246094, -0.0777435302734375, -0.06965065002441406, -0.061557769775390625, -0.05346488952636719, -0.04537200927734375, -0.03727912902832031, -0.029186248779296875, -0.021093368530273438, -0.01300048828125, -0.0049076080322265625, 0.003185272216796875, 0.011278152465820312, 0.01937103271484375, 0.027463912963867188, 0.035556793212890625, 0.04364967346191406, 0.0517425537109375, 0.05983543395996094, 0.06792831420898438, 0.07602119445800781, 0.08411407470703125, 0.09220695495605469, 0.10029983520507812, 0.10839271545410156, 0.116485595703125, 0.12457847595214844, 0.13267135620117188, 0.1407642364501953, 0.14885711669921875, 0.1569499969482422, 0.16504287719726562, 0.17313575744628906, 0.1812286376953125, 0.18932151794433594, 0.19741439819335938, 0.2055072784423828, 0.21360015869140625, 0.2216930389404297, 0.22978591918945312, 0.23787879943847656, 0.2459716796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 17.0, 14.0, 22.0, 32.0, 48.0, 56.0, 58.0, 68.0, 77.0, 67.0, 80.0, 95.0, 67.0, 73.0, 63.0, 37.0, 42.0, 23.0, 9.0, 9.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07159423828125, -0.06954240798950195, -0.0674905776977539, -0.06543874740600586, -0.06338691711425781, -0.061335086822509766, -0.05928325653076172, -0.05723142623901367, -0.055179595947265625, -0.05312776565551758, -0.05107593536376953, -0.049024105072021484, -0.04697227478027344, -0.04492044448852539, -0.042868614196777344, -0.0408167839050293, -0.03876495361328125, -0.0367131233215332, -0.034661293029785156, -0.03260946273803711, -0.030557632446289062, -0.028505802154541016, -0.02645397186279297, -0.024402141571044922, -0.022350311279296875, -0.020298480987548828, -0.01824665069580078, -0.016194820404052734, -0.014142990112304688, -0.01209115982055664, -0.010039329528808594, -0.007987499237060547, -0.0059356689453125, -0.003883838653564453, -0.0018320083618164062, 0.00021982192993164062, 0.0022716522216796875, 0.004323482513427734, 0.006375312805175781, 0.008427143096923828, 0.010478973388671875, 0.012530803680419922, 0.014582633972167969, 0.016634464263916016, 0.018686294555664062, 0.02073812484741211, 0.022789955139160156, 0.024841785430908203, 0.02689361572265625, 0.028945446014404297, 0.030997276306152344, 0.03304910659790039, 0.03510093688964844, 0.037152767181396484, 0.03920459747314453, 0.04125642776489258, 0.043308258056640625, 0.04536008834838867, 0.04741191864013672, 0.049463748931884766, 0.05151557922363281, 0.05356740951538086, 0.055619239807128906, 0.05767107009887695, 0.059722900390625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 13.0, 16.0, 18.0, 29.0, 55.0, 52.0, 99.0, 155.0, 259.0, 563.0, 1263.0, 3984.0, 21539.0, 239689.0, 691469.0, 76038.0, 9291.0, 2200.0, 842.0, 395.0, 194.0, 124.0, 71.0, 50.0, 35.0, 26.0, 14.0, 17.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.2946929931640625, -0.283477783203125, -0.2722625732421875, -0.26104736328125, -0.2498321533203125, -0.238616943359375, -0.2274017333984375, -0.2161865234375, -0.2049713134765625, -0.193756103515625, -0.1825408935546875, -0.17132568359375, -0.1601104736328125, -0.148895263671875, -0.1376800537109375, -0.12646484375, -0.1152496337890625, -0.104034423828125, -0.0928192138671875, -0.08160400390625, -0.0703887939453125, -0.059173583984375, -0.0479583740234375, -0.0367431640625, -0.0255279541015625, -0.014312744140625, -0.0030975341796875, 0.00811767578125, 0.0193328857421875, 0.030548095703125, 0.0417633056640625, 0.052978515625, 0.0641937255859375, 0.075408935546875, 0.0866241455078125, 0.09783935546875, 0.1090545654296875, 0.120269775390625, 0.1314849853515625, 0.1427001953125, 0.1539154052734375, 0.165130615234375, 0.1763458251953125, 0.18756103515625, 0.1987762451171875, 0.209991455078125, 0.2212066650390625, 0.232421875, 0.2436370849609375, 0.254852294921875, 0.2660675048828125, 0.27728271484375, 0.2884979248046875, 0.299713134765625, 0.3109283447265625, 0.3221435546875, 0.3333587646484375, 0.344573974609375, 0.3557891845703125, 0.36700439453125, 0.3782196044921875, 0.389434814453125, 0.4006500244140625, 0.411865234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 0.0, 4.0, 4.0, 9.0, 9.0, 11.0, 7.0, 15.0, 21.0, 17.0, 25.0, 30.0, 37.0, 30.0, 45.0, 48.0, 48.0, 51.0, 45.0, 51.0, 49.0, 42.0, 44.0, 53.0, 42.0, 45.0, 36.0, 38.0, 19.0, 23.0, 18.0, 24.0, 18.0, 15.0, 4.0, 9.0, 6.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18701171875, -0.18027687072753906, -0.17354202270507812, -0.1668071746826172, -0.16007232666015625, -0.1533374786376953, -0.14660263061523438, -0.13986778259277344, -0.1331329345703125, -0.12639808654785156, -0.11966323852539062, -0.11292839050292969, -0.10619354248046875, -0.09945869445800781, -0.09272384643554688, -0.08598899841308594, -0.079254150390625, -0.07251930236816406, -0.06578445434570312, -0.05904960632324219, -0.05231475830078125, -0.04557991027832031, -0.038845062255859375, -0.03211021423339844, -0.0253753662109375, -0.018640518188476562, -0.011905670166015625, -0.0051708221435546875, 0.00156402587890625, 0.008298873901367188, 0.015033721923828125, 0.021768569946289062, 0.02850341796875, 0.03523826599121094, 0.041973114013671875, 0.04870796203613281, 0.05544281005859375, 0.06217765808105469, 0.06891250610351562, 0.07564735412597656, 0.0823822021484375, 0.08911705017089844, 0.09585189819335938, 0.10258674621582031, 0.10932159423828125, 0.11605644226074219, 0.12279129028320312, 0.12952613830566406, 0.136260986328125, 0.14299583435058594, 0.14973068237304688, 0.1564655303955078, 0.16320037841796875, 0.1699352264404297, 0.17667007446289062, 0.18340492248535156, 0.1901397705078125, 0.19687461853027344, 0.20360946655273438, 0.2103443145751953, 0.21707916259765625, 0.2238140106201172, 0.23054885864257812, 0.23728370666503906, 0.2440185546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 11.0, 23.0, 28.0, 47.0, 86.0, 113.0, 192.0, 351.0, 598.0, 1073.0, 2314.0, 5140.0, 13962.0, 48854.0, 276784.0, 557283.0, 102850.0, 23993.0, 8082.0, 3337.0, 1540.0, 758.0, 441.0, 259.0, 160.0, 96.0, 49.0, 30.0, 21.0, 23.0, 11.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.11199951171875, -0.1084136962890625, -0.104827880859375, -0.1012420654296875, -0.09765625, -0.0940704345703125, -0.090484619140625, -0.0868988037109375, -0.08331298828125, -0.0797271728515625, -0.076141357421875, -0.0725555419921875, -0.0689697265625, -0.0653839111328125, -0.061798095703125, -0.0582122802734375, -0.05462646484375, -0.0510406494140625, -0.047454833984375, -0.0438690185546875, -0.040283203125, -0.0366973876953125, -0.033111572265625, -0.0295257568359375, -0.02593994140625, -0.0223541259765625, -0.018768310546875, -0.0151824951171875, -0.0115966796875, -0.0080108642578125, -0.004425048828125, -0.0008392333984375, 0.00274658203125, 0.0063323974609375, 0.009918212890625, 0.0135040283203125, 0.01708984375, 0.0206756591796875, 0.024261474609375, 0.0278472900390625, 0.03143310546875, 0.0350189208984375, 0.038604736328125, 0.0421905517578125, 0.0457763671875, 0.0493621826171875, 0.052947998046875, 0.0565338134765625, 0.06011962890625, 0.0637054443359375, 0.067291259765625, 0.0708770751953125, 0.074462890625, 0.0780487060546875, 0.081634521484375, 0.0852203369140625, 0.08880615234375, 0.0923919677734375, 0.095977783203125, 0.0995635986328125, 0.1031494140625, 0.1067352294921875, 0.110321044921875, 0.1139068603515625, 0.11749267578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 17.0, 30.0, 47.0, 83.0, 108.0, 141.0, 163.0, 116.0, 101.0, 60.0, 43.0, 30.0, 23.0, 9.0, 13.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073713302612305e-05, -5.8677978813648224e-05, -5.66188246011734e-05, -5.455967038869858e-05, -5.2500516176223755e-05, -5.044136196374893e-05, -4.838220775127411e-05, -4.6323053538799286e-05, -4.426389932632446e-05, -4.220474511384964e-05, -4.014559090137482e-05, -3.8086436688899994e-05, -3.602728247642517e-05, -3.396812826395035e-05, -3.1908974051475525e-05, -2.9849819839000702e-05, -2.779066562652588e-05, -2.5731511414051056e-05, -2.3672357201576233e-05, -2.161320298910141e-05, -1.9554048776626587e-05, -1.7494894564151764e-05, -1.543574035167694e-05, -1.3376586139202118e-05, -1.1317431926727295e-05, -9.258277714252472e-06, -7.199123501777649e-06, -5.139969289302826e-06, -3.080815076828003e-06, -1.02166086435318e-06, 1.037493348121643e-06, 3.096647560596466e-06, 5.155801773071289e-06, 7.214955985546112e-06, 9.274110198020935e-06, 1.1333264410495758e-05, 1.3392418622970581e-05, 1.5451572835445404e-05, 1.7510727047920227e-05, 1.956988126039505e-05, 2.1629035472869873e-05, 2.3688189685344696e-05, 2.574734389781952e-05, 2.7806498110294342e-05, 2.9865652322769165e-05, 3.192480653524399e-05, 3.398396074771881e-05, 3.6043114960193634e-05, 3.810226917266846e-05, 4.016142338514328e-05, 4.22205775976181e-05, 4.4279731810092926e-05, 4.633888602256775e-05, 4.839804023504257e-05, 5.0457194447517395e-05, 5.251634865999222e-05, 5.457550287246704e-05, 5.6634657084941864e-05, 5.869381129741669e-05, 6.075296550989151e-05, 6.281211972236633e-05, 6.487127393484116e-05, 6.693042814731598e-05, 6.89895823597908e-05, 7.104873657226562e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 5.0, 15.0, 12.0, 24.0, 46.0, 61.0, 147.0, 304.0, 876.0, 3620.0, 32883.0, 789359.0, 207528.0, 10901.0, 1779.0, 560.0, 202.0, 92.0, 54.0, 30.0, 21.0, 7.0, 5.0, 10.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.236572265625, -0.22888565063476562, -0.22119903564453125, -0.21351242065429688, -0.2058258056640625, -0.19813919067382812, -0.19045257568359375, -0.18276596069335938, -0.175079345703125, -0.16739273071289062, -0.15970611572265625, -0.15201950073242188, -0.1443328857421875, -0.13664627075195312, -0.12895965576171875, -0.12127304077148438, -0.11358642578125, -0.10589981079101562, -0.09821319580078125, -0.09052658081054688, -0.0828399658203125, -0.07515335083007812, -0.06746673583984375, -0.059780120849609375, -0.052093505859375, -0.044406890869140625, -0.03672027587890625, -0.029033660888671875, -0.0213470458984375, -0.013660430908203125, -0.00597381591796875, 0.001712799072265625, 0.0093994140625, 0.017086029052734375, 0.02477264404296875, 0.032459259033203125, 0.0401458740234375, 0.047832489013671875, 0.05551910400390625, 0.06320571899414062, 0.070892333984375, 0.07857894897460938, 0.08626556396484375, 0.09395217895507812, 0.1016387939453125, 0.10932540893554688, 0.11701202392578125, 0.12469863891601562, 0.13238525390625, 0.14007186889648438, 0.14775848388671875, 0.15544509887695312, 0.1631317138671875, 0.17081832885742188, 0.17850494384765625, 0.18619155883789062, 0.193878173828125, 0.20156478881835938, 0.20925140380859375, 0.21693801879882812, 0.2246246337890625, 0.23231124877929688, 0.23999786376953125, 0.24768447875976562, 0.25537109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 14.0, 17.0, 14.0, 34.0, 30.0, 42.0, 76.0, 86.0, 96.0, 105.0, 116.0, 90.0, 66.0, 50.0, 52.0, 27.0, 28.0, 17.0, 7.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10187721252441406, -0.09846878051757812, -0.09506034851074219, -0.09165191650390625, -0.08824348449707031, -0.08483505249023438, -0.08142662048339844, -0.0780181884765625, -0.07460975646972656, -0.07120132446289062, -0.06779289245605469, -0.06438446044921875, -0.06097602844238281, -0.057567596435546875, -0.05415916442871094, -0.050750732421875, -0.04734230041503906, -0.043933868408203125, -0.04052543640136719, -0.03711700439453125, -0.03370857238769531, -0.030300140380859375, -0.026891708374023438, -0.0234832763671875, -0.020074844360351562, -0.016666412353515625, -0.013257980346679688, -0.00984954833984375, -0.0064411163330078125, -0.003032684326171875, 0.0003757476806640625, 0.0037841796875, 0.0071926116943359375, 0.010601043701171875, 0.014009475708007812, 0.01741790771484375, 0.020826339721679688, 0.024234771728515625, 0.027643203735351562, 0.0310516357421875, 0.03446006774902344, 0.037868499755859375, 0.04127693176269531, 0.04468536376953125, 0.04809379577636719, 0.051502227783203125, 0.05491065979003906, 0.058319091796875, 0.06172752380371094, 0.06513595581054688, 0.06854438781738281, 0.07195281982421875, 0.07536125183105469, 0.07876968383789062, 0.08217811584472656, 0.0855865478515625, 0.08899497985839844, 0.09240341186523438, 0.09581184387207031, 0.09922027587890625, 0.10262870788574219, 0.10603713989257812, 0.10944557189941406, 0.11285400390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 49.0, 188.0, 385.0, 270.0, 84.0, 19.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1447193622589111, -1.0274990797042847, -0.9102786779403687, -0.7930583953857422, -0.675838053226471, -0.5586177110671997, -0.44139742851257324, -0.324177086353302, -0.20695674419403076, -0.08973641693592072, 0.02748391032218933, 0.14470422267913818, 0.2619245648384094, 0.37914490699768066, 0.49636518955230713, 0.6135855317115784, 0.7308058738708496, 0.8480262160301208, 0.9652465581893921, 1.0824668407440186, 1.1996872425079346, 1.316907525062561, 1.4341278076171875, 1.5513482093811035, 1.66856849193573, 1.7857887744903564, 1.9030091762542725, 2.0202293395996094, 2.1374497413635254, 2.2546701431274414, 2.3718905448913574, 2.4891107082366943, 2.6063313484191895, 2.7235517501831055, 2.8407719135284424, 2.9579923152923584, 3.0752127170562744, 3.1924328804016113, 3.3096532821655273, 3.4268736839294434, 3.5440940856933594, 3.6613144874572754, 3.7785346508026123, 3.8957550525665283, 4.012975215911865, 4.130195617675781, 4.247416019439697, 4.364636421203613, 4.481856346130371, 4.599076747894287, 4.716297149658203, 4.833517074584961, 4.950737476348877, 5.067957878112793, 5.185178279876709, 5.302398681640625, 5.419619083404541, 5.536839485168457, 5.654059886932373, 5.771280288696289, 5.888500213623047, 6.005720615386963, 6.122941017150879, 6.240161418914795, 6.357381820678711]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 7.0, 6.0, 6.0, 13.0, 14.0, 16.0, 21.0, 20.0, 19.0, 29.0, 28.0, 29.0, 36.0, 42.0, 34.0, 40.0, 58.0, 58.0, 49.0, 44.0, 42.0, 42.0, 42.0, 35.0, 38.0, 29.0, 40.0, 27.0, 22.0, 30.0, 17.0, 13.0, 7.0, 7.0, 9.0, 11.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1114375591278076, -1.0776102542877197, -1.0437829494476318, -1.009955644607544, -0.976128339767456, -0.9423010349273682, -0.9084737300872803, -0.8746464252471924, -0.8408191204071045, -0.8069918155670166, -0.7731645107269287, -0.7393372058868408, -0.7055099010467529, -0.671682596206665, -0.6378552913665771, -0.6040279865264893, -0.5702007412910461, -0.5363734364509583, -0.5025461316108704, -0.46871882677078247, -0.4348915219306946, -0.4010642170906067, -0.3672369420528412, -0.3334096372127533, -0.2995823323726654, -0.2657550275325775, -0.23192772269248962, -0.19810043275356293, -0.16427312791347504, -0.13044582307338715, -0.09661853313446045, -0.06279122829437256, -0.028963923454284668, 0.004863377660512924, 0.038690678775310516, 0.07251797616481781, 0.1063452810049057, 0.1401725858449936, 0.1739998757839203, 0.20782718062400818, 0.24165448546409607, 0.27548179030418396, 0.30930909514427185, 0.34313637018203735, 0.37696367502212524, 0.41079097986221313, 0.444618284702301, 0.4784455895423889, 0.5122728943824768, 0.5461001992225647, 0.5799275040626526, 0.6137548089027405, 0.6475821137428284, 0.6814094185829163, 0.7152366638183594, 0.7490639686584473, 0.7828912734985352, 0.816718578338623, 0.8505458831787109, 0.8843731880187988, 0.9182004928588867, 0.9520277976989746, 0.9858551025390625, 1.0196824073791504, 1.0535097122192383]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 1.0, 5.0, 4.0, 7.0, 4.0, 4.0, 10.0, 17.0, 12.0, 25.0, 37.0, 40.0, 72.0, 115.0, 157.0, 285.0, 493.0, 860.0, 1689.0, 3745.0, 9583.0, 30725.0, 157313.0, 3653209.0, 272545.0, 42615.0, 12082.0, 4505.0, 1967.0, 944.0, 490.0, 246.0, 178.0, 99.0, 62.0, 33.0, 30.0, 20.0, 18.0, 11.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24280738830566406, -0.23512649536132812, -0.2274456024169922, -0.21976470947265625, -0.2120838165283203, -0.20440292358398438, -0.19672203063964844, -0.1890411376953125, -0.18136024475097656, -0.17367935180664062, -0.1659984588623047, -0.15831756591796875, -0.1506366729736328, -0.14295578002929688, -0.13527488708496094, -0.127593994140625, -0.11991310119628906, -0.11223220825195312, -0.10455131530761719, -0.09687042236328125, -0.08918952941894531, -0.08150863647460938, -0.07382774353027344, -0.0661468505859375, -0.05846595764160156, -0.050785064697265625, -0.04310417175292969, -0.03542327880859375, -0.027742385864257812, -0.020061492919921875, -0.012380599975585938, -0.00469970703125, 0.0029811859130859375, 0.010662078857421875, 0.018342971801757812, 0.02602386474609375, 0.03370475769042969, 0.041385650634765625, 0.04906654357910156, 0.0567474365234375, 0.06442832946777344, 0.07210922241210938, 0.07979011535644531, 0.08747100830078125, 0.09515190124511719, 0.10283279418945312, 0.11051368713378906, 0.118194580078125, 0.12587547302246094, 0.13355636596679688, 0.1412372589111328, 0.14891815185546875, 0.1565990447998047, 0.16427993774414062, 0.17196083068847656, 0.1796417236328125, 0.18732261657714844, 0.19500350952148438, 0.2026844024658203, 0.21036529541015625, 0.2180461883544922, 0.22572708129882812, 0.23340797424316406, 0.2410888671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 10.0, 11.0, 8.0, 18.0, 18.0, 23.0, 40.0, 40.0, 66.0, 69.0, 57.0, 65.0, 64.0, 74.0, 70.0, 65.0, 63.0, 55.0, 48.0, 49.0, 24.0, 15.0, 12.0, 12.0, 10.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0616455078125, -0.059771060943603516, -0.05789661407470703, -0.05602216720581055, -0.05414772033691406, -0.05227327346801758, -0.050398826599121094, -0.04852437973022461, -0.046649932861328125, -0.04477548599243164, -0.042901039123535156, -0.04102659225463867, -0.03915214538574219, -0.0372776985168457, -0.03540325164794922, -0.033528804779052734, -0.03165435791015625, -0.029779911041259766, -0.02790546417236328, -0.026031017303466797, -0.024156570434570312, -0.022282123565673828, -0.020407676696777344, -0.01853322982788086, -0.016658782958984375, -0.01478433609008789, -0.012909889221191406, -0.011035442352294922, -0.009160995483398438, -0.007286548614501953, -0.005412101745605469, -0.0035376548767089844, -0.0016632080078125, 0.00021123886108398438, 0.0020856857299804688, 0.003960132598876953, 0.0058345794677734375, 0.007709026336669922, 0.009583473205566406, 0.01145792007446289, 0.013332366943359375, 0.01520681381225586, 0.017081260681152344, 0.018955707550048828, 0.020830154418945312, 0.022704601287841797, 0.02457904815673828, 0.026453495025634766, 0.02832794189453125, 0.030202388763427734, 0.03207683563232422, 0.0339512825012207, 0.03582572937011719, 0.03770017623901367, 0.039574623107910156, 0.04144906997680664, 0.043323516845703125, 0.04519796371459961, 0.047072410583496094, 0.04894685745239258, 0.05082130432128906, 0.05269575119018555, 0.05457019805908203, 0.056444644927978516, 0.058319091796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 11.0, 12.0, 7.0, 16.0, 21.0, 69.0, 101.0, 185.0, 486.0, 1645.0, 7485.0, 58951.0, 3463896.0, 625782.0, 29355.0, 4460.0, 1117.0, 323.0, 152.0, 71.0, 35.0, 27.0, 21.0, 10.0, 6.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3215217590332031, -0.30954742431640625, -0.2975730895996094, -0.2855987548828125, -0.2736244201660156, -0.26165008544921875, -0.24967575073242188, -0.237701416015625, -0.22572708129882812, -0.21375274658203125, -0.20177841186523438, -0.1898040771484375, -0.17782974243164062, -0.16585540771484375, -0.15388107299804688, -0.14190673828125, -0.12993240356445312, -0.11795806884765625, -0.10598373413085938, -0.0940093994140625, -0.08203506469726562, -0.07006072998046875, -0.058086395263671875, -0.046112060546875, -0.034137725830078125, -0.02216339111328125, -0.010189056396484375, 0.0017852783203125, 0.013759613037109375, 0.02573394775390625, 0.037708282470703125, 0.0496826171875, 0.061656951904296875, 0.07363128662109375, 0.08560562133789062, 0.0975799560546875, 0.10955429077148438, 0.12152862548828125, 0.13350296020507812, 0.145477294921875, 0.15745162963867188, 0.16942596435546875, 0.18140029907226562, 0.1933746337890625, 0.20534896850585938, 0.21732330322265625, 0.22929763793945312, 0.24127197265625, 0.2532463073730469, 0.26522064208984375, 0.2771949768066406, 0.2891693115234375, 0.3011436462402344, 0.31311798095703125, 0.3250923156738281, 0.337066650390625, 0.3490409851074219, 0.36101531982421875, 0.3729896545410156, 0.3849639892578125, 0.3969383239746094, 0.40891265869140625, 0.4208869934082031, 0.432861328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 12.0, 14.0, 20.0, 34.0, 44.0, 61.0, 124.0, 184.0, 441.0, 1699.0, 745.0, 279.0, 158.0, 77.0, 51.0, 37.0, 18.0, 14.0, 9.0, 10.0, 8.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1416015625, -0.13812732696533203, -0.13465309143066406, -0.1311788558959961, -0.12770462036132812, -0.12423038482666016, -0.12075614929199219, -0.11728191375732422, -0.11380767822265625, -0.11033344268798828, -0.10685920715332031, -0.10338497161865234, -0.09991073608398438, -0.0964365005493164, -0.09296226501464844, -0.08948802947998047, -0.0860137939453125, -0.08253955841064453, -0.07906532287597656, -0.0755910873413086, -0.07211685180664062, -0.06864261627197266, -0.06516838073730469, -0.06169414520263672, -0.05821990966796875, -0.05474567413330078, -0.05127143859863281, -0.047797203063964844, -0.044322967529296875, -0.040848731994628906, -0.03737449645996094, -0.03390026092529297, -0.030426025390625, -0.02695178985595703, -0.023477554321289062, -0.020003318786621094, -0.016529083251953125, -0.013054847717285156, -0.009580612182617188, -0.006106376647949219, -0.00263214111328125, 0.0008420944213867188, 0.0043163299560546875, 0.007790565490722656, 0.011264801025390625, 0.014739036560058594, 0.018213272094726562, 0.02168750762939453, 0.0251617431640625, 0.02863597869873047, 0.03211021423339844, 0.035584449768066406, 0.039058685302734375, 0.042532920837402344, 0.04600715637207031, 0.04948139190673828, 0.05295562744140625, 0.05642986297607422, 0.05990409851074219, 0.06337833404541016, 0.06685256958007812, 0.0703268051147461, 0.07380104064941406, 0.07727527618408203, 0.08074951171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 17.0, 44.0, 64.0, 101.0, 151.0, 154.0, 160.0, 132.0, 83.0, 44.0, 21.0, 11.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9112545847892761, -0.8900306224822998, -0.8688066601753235, -0.8475827574729919, -0.8263587951660156, -0.8051348328590393, -0.783910870552063, -0.7626869678497314, -0.7414630055427551, -0.7202390432357788, -0.6990150809288025, -0.677791178226471, -0.6565672159194946, -0.6353432536125183, -0.614119291305542, -0.5928953886032104, -0.5716713666915894, -0.550447404384613, -0.5292234420776367, -0.5079995393753052, -0.48677557706832886, -0.46555161476135254, -0.4443276524543762, -0.4231037199497223, -0.40187978744506836, -0.38065582513809204, -0.3594318926334381, -0.3382079303264618, -0.31698399782180786, -0.29576003551483154, -0.2745360732078552, -0.2533121407032013, -0.23208820819854736, -0.21086426079273224, -0.18964031338691711, -0.1684163510799408, -0.14719241857528687, -0.12596845626831055, -0.10474450886249542, -0.0835205614566803, -0.06229661405086517, -0.04107266664505005, -0.019848715513944626, 0.0013752356171607971, 0.02259918302297592, 0.043823130428791046, 0.06504708528518677, 0.08627103269100189, 0.10749498009681702, 0.12871892750263214, 0.14994287490844727, 0.17116683721542358, 0.19239076972007751, 0.21361473202705383, 0.23483867943286896, 0.2560626268386841, 0.2772865891456604, 0.2985105514526367, 0.31973448395729065, 0.34095844626426697, 0.3621823787689209, 0.3834063410758972, 0.40463030338287354, 0.42585423588752747, 0.4470781683921814]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 11.0, 6.0, 6.0, 14.0, 10.0, 13.0, 14.0, 26.0, 29.0, 25.0, 41.0, 19.0, 27.0, 47.0, 32.0, 45.0, 45.0, 52.0, 41.0, 47.0, 51.0, 29.0, 53.0, 33.0, 35.0, 36.0, 31.0, 27.0, 19.0, 24.0, 25.0, 27.0, 11.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27719610929489136, -0.26700854301452637, -0.25682100653648376, -0.24663344025611877, -0.23644588887691498, -0.22625833749771118, -0.21607078611850739, -0.2058832347393036, -0.1956956684589386, -0.1855081170797348, -0.175320565700531, -0.16513299942016602, -0.15494544804096222, -0.14475789666175842, -0.13457034528255463, -0.12438278645277023, -0.11419524252414703, -0.10400769114494324, -0.09382013231515884, -0.08363258093595505, -0.07344502210617065, -0.06325747072696686, -0.05306991934776306, -0.04288236051797867, -0.03269480913877487, -0.022507254034280777, -0.012319700792431831, -0.0021321475505828857, 0.008055407553911209, 0.018242962658405304, 0.0284305140376091, 0.038618072867393494, 0.04880562424659729, 0.058993179351091385, 0.06918073445558548, 0.07936828583478928, 0.08955584466457367, 0.09974339604377747, 0.10993094742298126, 0.12011850625276566, 0.13030606508255005, 0.14049361646175385, 0.15068116784095764, 0.16086873412132263, 0.17105628550052643, 0.18124383687973022, 0.19143138825893402, 0.20161893963813782, 0.2118064910173416, 0.2219940423965454, 0.2321815937757492, 0.242369145154953, 0.252556711435318, 0.2627442479133606, 0.2729318141937256, 0.2831193804740906, 0.2933069169521332, 0.30349448323249817, 0.31368201971054077, 0.32386958599090576, 0.33405712246894836, 0.34424468874931335, 0.35443222522735596, 0.36461979150772095, 0.37480735778808594]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 14.0, 8.0, 11.0, 15.0, 28.0, 45.0, 71.0, 141.0, 236.0, 436.0, 850.0, 1739.0, 4264.0, 11946.0, 40904.0, 163083.0, 580005.0, 179512.0, 44124.0, 12952.0, 4453.0, 1820.0, 865.0, 461.0, 227.0, 126.0, 74.0, 48.0, 31.0, 19.0, 14.0, 15.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2890625, -0.28069114685058594, -0.2723197937011719, -0.2639484405517578, -0.25557708740234375, -0.2472057342529297, -0.23883438110351562, -0.23046302795410156, -0.2220916748046875, -0.21372032165527344, -0.20534896850585938, -0.1969776153564453, -0.18860626220703125, -0.1802349090576172, -0.17186355590820312, -0.16349220275878906, -0.155120849609375, -0.14674949645996094, -0.13837814331054688, -0.1300067901611328, -0.12163543701171875, -0.11326408386230469, -0.10489273071289062, -0.09652137756347656, -0.0881500244140625, -0.07977867126464844, -0.07140731811523438, -0.06303596496582031, -0.05466461181640625, -0.04629325866699219, -0.037921905517578125, -0.029550552368164062, -0.02117919921875, -0.012807846069335938, -0.004436492919921875, 0.0039348602294921875, 0.01230621337890625, 0.020677566528320312, 0.029048919677734375, 0.03742027282714844, 0.0457916259765625, 0.05416297912597656, 0.06253433227539062, 0.07090568542480469, 0.07927703857421875, 0.08764839172363281, 0.09601974487304688, 0.10439109802246094, 0.112762451171875, 0.12113380432128906, 0.12950515747070312, 0.1378765106201172, 0.14624786376953125, 0.1546192169189453, 0.16299057006835938, 0.17136192321777344, 0.1797332763671875, 0.18810462951660156, 0.19647598266601562, 0.2048473358154297, 0.21321868896484375, 0.2215900421142578, 0.22996139526367188, 0.23833274841308594, 0.2467041015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 17.0, 20.0, 16.0, 32.0, 46.0, 39.0, 55.0, 66.0, 75.0, 83.0, 65.0, 73.0, 71.0, 66.0, 70.0, 56.0, 37.0, 21.0, 26.0, 21.0, 8.0, 11.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05675458908081055, -0.054823875427246094, -0.05289316177368164, -0.05096244812011719, -0.049031734466552734, -0.04710102081298828, -0.04517030715942383, -0.043239593505859375, -0.04130887985229492, -0.03937816619873047, -0.037447452545166016, -0.03551673889160156, -0.03358602523803711, -0.031655311584472656, -0.029724597930908203, -0.02779388427734375, -0.025863170623779297, -0.023932456970214844, -0.02200174331665039, -0.020071029663085938, -0.018140316009521484, -0.01620960235595703, -0.014278888702392578, -0.012348175048828125, -0.010417461395263672, -0.008486747741699219, -0.006556034088134766, -0.0046253204345703125, -0.0026946067810058594, -0.0007638931274414062, 0.0011668205261230469, 0.0030975341796875, 0.005028247833251953, 0.006958961486816406, 0.00888967514038086, 0.010820388793945312, 0.012751102447509766, 0.014681816101074219, 0.016612529754638672, 0.018543243408203125, 0.020473957061767578, 0.02240467071533203, 0.024335384368896484, 0.026266098022460938, 0.02819681167602539, 0.030127525329589844, 0.0320582389831543, 0.03398895263671875, 0.0359196662902832, 0.037850379943847656, 0.03978109359741211, 0.04171180725097656, 0.043642520904541016, 0.04557323455810547, 0.04750394821166992, 0.049434661865234375, 0.05136537551879883, 0.05329608917236328, 0.055226802825927734, 0.05715751647949219, 0.05908823013305664, 0.061018943786621094, 0.06294965744018555, 0.06488037109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 17.0, 24.0, 33.0, 41.0, 68.0, 108.0, 166.0, 332.0, 702.0, 1580.0, 4837.0, 22859.0, 173923.0, 720651.0, 101464.0, 15456.0, 3722.0, 1265.0, 533.0, 290.0, 182.0, 103.0, 57.0, 42.0, 25.0, 12.0, 7.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.378173828125, -0.36748504638671875, -0.3567962646484375, -0.34610748291015625, -0.335418701171875, -0.32472991943359375, -0.3140411376953125, -0.30335235595703125, -0.29266357421875, -0.28197479248046875, -0.2712860107421875, -0.26059722900390625, -0.249908447265625, -0.23921966552734375, -0.2285308837890625, -0.21784210205078125, -0.2071533203125, -0.19646453857421875, -0.1857757568359375, -0.17508697509765625, -0.164398193359375, -0.15370941162109375, -0.1430206298828125, -0.13233184814453125, -0.12164306640625, -0.11095428466796875, -0.1002655029296875, -0.08957672119140625, -0.078887939453125, -0.06819915771484375, -0.0575103759765625, -0.04682159423828125, -0.0361328125, -0.02544403076171875, -0.0147552490234375, -0.00406646728515625, 0.006622314453125, 0.01731109619140625, 0.0279998779296875, 0.03868865966796875, 0.04937744140625, 0.06006622314453125, 0.0707550048828125, 0.08144378662109375, 0.092132568359375, 0.10282135009765625, 0.1135101318359375, 0.12419891357421875, 0.1348876953125, 0.14557647705078125, 0.1562652587890625, 0.16695404052734375, 0.177642822265625, 0.18833160400390625, 0.1990203857421875, 0.20970916748046875, 0.22039794921875, 0.23108673095703125, 0.2417755126953125, 0.25246429443359375, 0.263153076171875, 0.27384185791015625, 0.2845306396484375, 0.29521942138671875, 0.305908203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 8.0, 8.0, 7.0, 12.0, 18.0, 22.0, 26.0, 25.0, 30.0, 29.0, 42.0, 45.0, 45.0, 46.0, 50.0, 66.0, 65.0, 54.0, 53.0, 55.0, 45.0, 39.0, 30.0, 30.0, 25.0, 28.0, 17.0, 22.0, 12.0, 11.0, 11.0, 7.0, 5.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.24191856384277344, -0.23469161987304688, -0.2274646759033203, -0.22023773193359375, -0.2130107879638672, -0.20578384399414062, -0.19855690002441406, -0.1913299560546875, -0.18410301208496094, -0.17687606811523438, -0.1696491241455078, -0.16242218017578125, -0.1551952362060547, -0.14796829223632812, -0.14074134826660156, -0.133514404296875, -0.12628746032714844, -0.11906051635742188, -0.11183357238769531, -0.10460662841796875, -0.09737968444824219, -0.09015274047851562, -0.08292579650878906, -0.0756988525390625, -0.06847190856933594, -0.061244964599609375, -0.05401802062988281, -0.04679107666015625, -0.03956413269042969, -0.032337188720703125, -0.025110244750976562, -0.01788330078125, -0.010656356811523438, -0.003429412841796875, 0.0037975311279296875, 0.01102447509765625, 0.018251419067382812, 0.025478363037109375, 0.03270530700683594, 0.0399322509765625, 0.04715919494628906, 0.054386138916015625, 0.06161308288574219, 0.06884002685546875, 0.07606697082519531, 0.08329391479492188, 0.09052085876464844, 0.097747802734375, 0.10497474670410156, 0.11220169067382812, 0.11942863464355469, 0.12665557861328125, 0.1338825225830078, 0.14110946655273438, 0.14833641052246094, 0.1555633544921875, 0.16279029846191406, 0.17001724243164062, 0.1772441864013672, 0.18447113037109375, 0.1916980743408203, 0.19892501831054688, 0.20615196228027344, 0.21337890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 5.0, 8.0, 10.0, 5.0, 16.0, 12.0, 33.0, 45.0, 65.0, 120.0, 224.0, 364.0, 616.0, 1260.0, 2518.0, 6015.0, 17809.0, 83403.0, 744466.0, 152019.0, 25216.0, 7768.0, 3122.0, 1580.0, 783.0, 430.0, 232.0, 138.0, 87.0, 59.0, 35.0, 23.0, 22.0, 12.0, 7.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2413330078125, -0.23393821716308594, -0.22654342651367188, -0.2191486358642578, -0.21175384521484375, -0.2043590545654297, -0.19696426391601562, -0.18956947326660156, -0.1821746826171875, -0.17477989196777344, -0.16738510131835938, -0.1599903106689453, -0.15259552001953125, -0.1452007293701172, -0.13780593872070312, -0.13041114807128906, -0.123016357421875, -0.11562156677246094, -0.10822677612304688, -0.10083198547363281, -0.09343719482421875, -0.08604240417480469, -0.07864761352539062, -0.07125282287597656, -0.0638580322265625, -0.05646324157714844, -0.049068450927734375, -0.04167366027832031, -0.03427886962890625, -0.026884078979492188, -0.019489288330078125, -0.012094497680664062, -0.00469970703125, 0.0026950836181640625, 0.010089874267578125, 0.017484664916992188, 0.02487945556640625, 0.03227424621582031, 0.039669036865234375, 0.04706382751464844, 0.0544586181640625, 0.06185340881347656, 0.06924819946289062, 0.07664299011230469, 0.08403778076171875, 0.09143257141113281, 0.09882736206054688, 0.10622215270996094, 0.113616943359375, 0.12101173400878906, 0.12840652465820312, 0.1358013153076172, 0.14319610595703125, 0.1505908966064453, 0.15798568725585938, 0.16538047790527344, 0.1727752685546875, 0.18017005920410156, 0.18756484985351562, 0.1949596405029297, 0.20235443115234375, 0.2097492218017578, 0.21714401245117188, 0.22453880310058594, 0.23193359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 11.0, 7.0, 8.0, 15.0, 21.0, 28.0, 29.0, 56.0, 63.0, 104.0, 87.0, 106.0, 120.0, 102.0, 70.0, 46.0, 46.0, 24.0, 19.0, 15.0, 9.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3451786041259766e-05, -4.1754916310310364e-05, -4.005804657936096e-05, -3.836117684841156e-05, -3.666430711746216e-05, -3.4967437386512756e-05, -3.3270567655563354e-05, -3.157369792461395e-05, -2.987682819366455e-05, -2.817995846271515e-05, -2.6483088731765747e-05, -2.4786219000816345e-05, -2.3089349269866943e-05, -2.139247953891754e-05, -1.969560980796814e-05, -1.7998740077018738e-05, -1.6301870346069336e-05, -1.4605000615119934e-05, -1.2908130884170532e-05, -1.121126115322113e-05, -9.514391422271729e-06, -7.817521691322327e-06, -6.120651960372925e-06, -4.423782229423523e-06, -2.726912498474121e-06, -1.0300427675247192e-06, 6.668269634246826e-07, 2.3636966943740845e-06, 4.060566425323486e-06, 5.757436156272888e-06, 7.45430588722229e-06, 9.151175618171692e-06, 1.0848045349121094e-05, 1.2544915080070496e-05, 1.4241784811019897e-05, 1.59386545419693e-05, 1.76355242729187e-05, 1.9332394003868103e-05, 2.1029263734817505e-05, 2.2726133465766907e-05, 2.442300319671631e-05, 2.611987292766571e-05, 2.7816742658615112e-05, 2.9513612389564514e-05, 3.1210482120513916e-05, 3.290735185146332e-05, 3.460422158241272e-05, 3.630109131336212e-05, 3.7997961044311523e-05, 3.9694830775260925e-05, 4.139170050621033e-05, 4.308857023715973e-05, 4.478543996810913e-05, 4.648230969905853e-05, 4.8179179430007935e-05, 4.9876049160957336e-05, 5.157291889190674e-05, 5.326978862285614e-05, 5.496665835380554e-05, 5.6663528084754944e-05, 5.8360397815704346e-05, 6.005726754665375e-05, 6.175413727760315e-05, 6.345100700855255e-05, 6.514787673950195e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 12.0, 19.0, 31.0, 53.0, 101.0, 222.0, 491.0, 1307.0, 5123.0, 46469.0, 931137.0, 55520.0, 5735.0, 1356.0, 493.0, 233.0, 114.0, 54.0, 30.0, 12.0, 16.0, 7.0, 0.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.45703125, -0.442535400390625, -0.42803955078125, -0.413543701171875, -0.3990478515625, -0.384552001953125, -0.37005615234375, -0.355560302734375, -0.341064453125, -0.326568603515625, -0.31207275390625, -0.297576904296875, -0.2830810546875, -0.268585205078125, -0.25408935546875, -0.239593505859375, -0.22509765625, -0.210601806640625, -0.19610595703125, -0.181610107421875, -0.1671142578125, -0.152618408203125, -0.13812255859375, -0.123626708984375, -0.109130859375, -0.094635009765625, -0.08013916015625, -0.065643310546875, -0.0511474609375, -0.036651611328125, -0.02215576171875, -0.007659912109375, 0.0068359375, 0.021331787109375, 0.03582763671875, 0.050323486328125, 0.0648193359375, 0.079315185546875, 0.09381103515625, 0.108306884765625, 0.122802734375, 0.137298583984375, 0.15179443359375, 0.166290283203125, 0.1807861328125, 0.195281982421875, 0.20977783203125, 0.224273681640625, 0.23876953125, 0.253265380859375, 0.26776123046875, 0.282257080078125, 0.2967529296875, 0.311248779296875, 0.32574462890625, 0.340240478515625, 0.354736328125, 0.369232177734375, 0.38372802734375, 0.398223876953125, 0.4127197265625, 0.427215576171875, 0.44171142578125, 0.456207275390625, 0.470703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 9.0, 7.0, 16.0, 23.0, 33.0, 33.0, 91.0, 163.0, 224.0, 182.0, 83.0, 39.0, 29.0, 14.0, 17.0, 7.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23779296875, -0.23044395446777344, -0.22309494018554688, -0.2157459259033203, -0.20839691162109375, -0.2010478973388672, -0.19369888305664062, -0.18634986877441406, -0.1790008544921875, -0.17165184020996094, -0.16430282592773438, -0.1569538116455078, -0.14960479736328125, -0.1422557830810547, -0.13490676879882812, -0.12755775451660156, -0.120208740234375, -0.11285972595214844, -0.10551071166992188, -0.09816169738769531, -0.09081268310546875, -0.08346366882324219, -0.07611465454101562, -0.06876564025878906, -0.0614166259765625, -0.05406761169433594, -0.046718597412109375, -0.03936958312988281, -0.03202056884765625, -0.024671554565429688, -0.017322540283203125, -0.009973526000976562, -0.00262451171875, 0.0047245025634765625, 0.012073516845703125, 0.019422531127929688, 0.02677154541015625, 0.03412055969238281, 0.041469573974609375, 0.04881858825683594, 0.0561676025390625, 0.06351661682128906, 0.07086563110351562, 0.07821464538574219, 0.08556365966796875, 0.09291267395019531, 0.10026168823242188, 0.10761070251464844, 0.114959716796875, 0.12230873107910156, 0.12965774536132812, 0.1370067596435547, 0.14435577392578125, 0.1517047882080078, 0.15905380249023438, 0.16640281677246094, 0.1737518310546875, 0.18110084533691406, 0.18844985961914062, 0.1957988739013672, 0.20314788818359375, 0.2104969024658203, 0.21784591674804688, 0.22519493103027344, 0.2325439453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 15.0, 70.0, 262.0, 377.0, 207.0, 54.0, 15.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4786880016326904, -1.3231526613235474, -1.1676174402236938, -1.0120820999145508, -0.8565468192100525, -0.7010115385055542, -0.5454761981964111, -0.3899409770965576, -0.23440563678741455, -0.07887034118175507, 0.07666495442390442, 0.2322002649307251, 0.3877355456352234, 0.5432708263397217, 0.6988061666488647, 0.8543413877487183, 1.0098767280578613, 1.1654120683670044, 1.320947289466858, 1.476482629776001, 1.6320178508758545, 1.7875531911849976, 1.9430885314941406, 2.098623752593994, 2.2541589736938477, 2.409694194793701, 2.565229654312134, 2.7207648754119873, 2.876300096511841, 3.0318355560302734, 3.187370777130127, 3.3429059982299805, 3.498441219329834, 3.6539764404296875, 3.80951189994812, 3.9650471210479736, 4.120582580566406, 4.27611780166626, 4.431653022766113, 4.587188243865967, 4.74272346496582, 4.898258686065674, 5.053793907165527, 5.209329605102539, 5.364864826202393, 5.520400047302246, 5.6759352684021, 5.831470489501953, 5.987006187438965, 6.142541408538818, 6.298076629638672, 6.453612327575684, 6.609147548675537, 6.764682769775391, 6.920217990875244, 7.075753211975098, 7.231288433074951, 7.386823654174805, 7.542358875274658, 7.697894096374512, 7.853429794311523, 8.008964538574219, 8.16450023651123, 8.320035934448242, 8.475570678710938]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 3.0, 9.0, 8.0, 12.0, 11.0, 14.0, 24.0, 19.0, 22.0, 24.0, 13.0, 21.0, 20.0, 37.0, 26.0, 41.0, 35.0, 37.0, 48.0, 41.0, 38.0, 40.0, 35.0, 42.0, 41.0, 42.0, 23.0, 26.0, 21.0, 31.0, 29.0, 34.0, 8.0, 18.0, 11.0, 15.0, 15.0, 9.0, 11.0, 6.0, 9.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0830885171890259, -1.0505239963531494, -1.0179593563079834, -0.9853948354721069, -0.9528303146362305, -0.920265793800354, -0.8877012133598328, -0.8551366329193115, -0.8225721120834351, -0.7900075912475586, -0.7574430108070374, -0.7248784303665161, -0.6923139095306396, -0.6597493886947632, -0.6271848082542419, -0.5946202278137207, -0.5620557069778442, -0.5294911861419678, -0.49692660570144653, -0.4643620550632477, -0.43179750442504883, -0.39923295378685, -0.3666684031486511, -0.33410385251045227, -0.3015393018722534, -0.26897475123405457, -0.2364102005958557, -0.20384564995765686, -0.171281099319458, -0.13871654868125916, -0.1061519980430603, -0.07358744740486145, -0.04102301597595215, -0.008458465337753296, 0.024106085300445557, 0.05667063593864441, 0.08923518657684326, 0.12179973721504211, 0.15436428785324097, 0.18692883849143982, 0.21949338912963867, 0.2520579397678375, 0.2846224904060364, 0.31718704104423523, 0.3497515916824341, 0.38231614232063293, 0.4148806929588318, 0.44744524359703064, 0.4800097942352295, 0.512574315071106, 0.5451388955116272, 0.5777034759521484, 0.6102679967880249, 0.6428325176239014, 0.6753970980644226, 0.7079616785049438, 0.7405261993408203, 0.7730907201766968, 0.805655300617218, 0.8382198810577393, 0.8707844018936157, 0.9033489227294922, 0.9359135031700134, 0.9684780836105347, 1.0010426044464111]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 16.0, 10.0, 19.0, 27.0, 37.0, 47.0, 89.0, 132.0, 227.0, 413.0, 744.0, 1411.0, 2945.0, 7122.0, 20595.0, 81087.0, 3133046.0, 851121.0, 65734.0, 17679.0, 6376.0, 2665.0, 1330.0, 604.0, 324.0, 177.0, 89.0, 84.0, 42.0, 39.0, 20.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548828125, -0.24714279174804688, -0.23940277099609375, -0.23166275024414062, -0.2239227294921875, -0.21618270874023438, -0.20844268798828125, -0.20070266723632812, -0.192962646484375, -0.18522262573242188, -0.17748260498046875, -0.16974258422851562, -0.1620025634765625, -0.15426254272460938, -0.14652252197265625, -0.13878250122070312, -0.13104248046875, -0.12330245971679688, -0.11556243896484375, -0.10782241821289062, -0.1000823974609375, -0.09234237670898438, -0.08460235595703125, -0.07686233520507812, -0.069122314453125, -0.061382293701171875, -0.05364227294921875, -0.045902252197265625, -0.0381622314453125, -0.030422210693359375, -0.02268218994140625, -0.014942169189453125, -0.0072021484375, 0.000537872314453125, 0.00827789306640625, 0.016017913818359375, 0.0237579345703125, 0.031497955322265625, 0.03923797607421875, 0.046977996826171875, 0.054718017578125, 0.062458038330078125, 0.07019805908203125, 0.07793807983398438, 0.0856781005859375, 0.09341812133789062, 0.10115814208984375, 0.10889816284179688, 0.11663818359375, 0.12437820434570312, 0.13211822509765625, 0.13985824584960938, 0.1475982666015625, 0.15533828735351562, 0.16307830810546875, 0.17081832885742188, 0.178558349609375, 0.18629837036132812, 0.19403839111328125, 0.20177841186523438, 0.2095184326171875, 0.21725845336914062, 0.22499847412109375, 0.23273849487304688, 0.240478515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 3.0, 9.0, 14.0, 11.0, 24.0, 30.0, 26.0, 25.0, 42.0, 61.0, 64.0, 65.0, 65.0, 59.0, 56.0, 52.0, 65.0, 75.0, 38.0, 42.0, 41.0, 41.0, 23.0, 16.0, 10.0, 11.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0625, -0.06059408187866211, -0.05868816375732422, -0.05678224563598633, -0.05487632751464844, -0.05297040939331055, -0.051064491271972656, -0.049158573150634766, -0.047252655029296875, -0.045346736907958984, -0.043440818786621094, -0.0415349006652832, -0.03962898254394531, -0.03772306442260742, -0.03581714630126953, -0.03391122817993164, -0.03200531005859375, -0.03009939193725586, -0.02819347381591797, -0.026287555694580078, -0.024381637573242188, -0.022475719451904297, -0.020569801330566406, -0.018663883209228516, -0.016757965087890625, -0.014852046966552734, -0.012946128845214844, -0.011040210723876953, -0.009134292602539062, -0.007228374481201172, -0.005322456359863281, -0.0034165382385253906, -0.0015106201171875, 0.0003952980041503906, 0.0023012161254882812, 0.004207134246826172, 0.0061130523681640625, 0.008018970489501953, 0.009924888610839844, 0.011830806732177734, 0.013736724853515625, 0.015642642974853516, 0.017548561096191406, 0.019454479217529297, 0.021360397338867188, 0.023266315460205078, 0.02517223358154297, 0.02707815170288086, 0.02898406982421875, 0.03088998794555664, 0.03279590606689453, 0.03470182418823242, 0.03660774230957031, 0.0385136604309082, 0.040419578552246094, 0.042325496673583984, 0.044231414794921875, 0.046137332916259766, 0.048043251037597656, 0.04994916915893555, 0.05185508728027344, 0.05376100540161133, 0.05566692352294922, 0.05757284164428711, 0.059478759765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 7.0, 9.0, 18.0, 15.0, 36.0, 60.0, 85.0, 186.0, 353.0, 669.0, 1488.0, 3589.0, 9920.0, 34471.0, 219669.0, 3698399.0, 178694.0, 30853.0, 9491.0, 3480.0, 1394.0, 652.0, 340.0, 159.0, 97.0, 52.0, 32.0, 21.0, 20.0, 12.0, 3.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3510017395019531, -0.34018707275390625, -0.3293724060058594, -0.3185577392578125, -0.3077430725097656, -0.29692840576171875, -0.2861137390136719, -0.275299072265625, -0.2644844055175781, -0.25366973876953125, -0.24285507202148438, -0.2320404052734375, -0.22122573852539062, -0.21041107177734375, -0.19959640502929688, -0.18878173828125, -0.17796707153320312, -0.16715240478515625, -0.15633773803710938, -0.1455230712890625, -0.13470840454101562, -0.12389373779296875, -0.11307907104492188, -0.102264404296875, -0.09144973754882812, -0.08063507080078125, -0.06982040405273438, -0.0590057373046875, -0.048191070556640625, -0.03737640380859375, -0.026561737060546875, -0.0157470703125, -0.004932403564453125, 0.00588226318359375, 0.016696929931640625, 0.0275115966796875, 0.038326263427734375, 0.04914093017578125, 0.059955596923828125, 0.070770263671875, 0.08158493041992188, 0.09239959716796875, 0.10321426391601562, 0.1140289306640625, 0.12484359741210938, 0.13565826416015625, 0.14647293090820312, 0.15728759765625, 0.16810226440429688, 0.17891693115234375, 0.18973159790039062, 0.2005462646484375, 0.21136093139648438, 0.22217559814453125, 0.23299026489257812, 0.243804931640625, 0.2546195983886719, 0.26543426513671875, 0.2762489318847656, 0.2870635986328125, 0.2978782653808594, 0.30869293212890625, 0.3195075988769531, 0.330322265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 14.0, 6.0, 16.0, 18.0, 31.0, 56.0, 82.0, 128.0, 301.0, 1533.0, 1168.0, 290.0, 141.0, 82.0, 43.0, 36.0, 23.0, 21.0, 21.0, 11.0, 15.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12143707275390625, -0.1177520751953125, -0.11406707763671875, -0.110382080078125, -0.10669708251953125, -0.1030120849609375, -0.09932708740234375, -0.09564208984375, -0.09195709228515625, -0.0882720947265625, -0.08458709716796875, -0.080902099609375, -0.07721710205078125, -0.0735321044921875, -0.06984710693359375, -0.066162109375, -0.06247711181640625, -0.0587921142578125, -0.05510711669921875, -0.051422119140625, -0.04773712158203125, -0.0440521240234375, -0.04036712646484375, -0.03668212890625, -0.03299713134765625, -0.0293121337890625, -0.02562713623046875, -0.021942138671875, -0.01825714111328125, -0.0145721435546875, -0.01088714599609375, -0.0072021484375, -0.00351715087890625, 0.0001678466796875, 0.00385284423828125, 0.007537841796875, 0.01122283935546875, 0.0149078369140625, 0.01859283447265625, 0.02227783203125, 0.02596282958984375, 0.0296478271484375, 0.03333282470703125, 0.037017822265625, 0.04070281982421875, 0.0443878173828125, 0.04807281494140625, 0.0517578125, 0.05544281005859375, 0.0591278076171875, 0.06281280517578125, 0.066497802734375, 0.07018280029296875, 0.0738677978515625, 0.07755279541015625, 0.08123779296875, 0.08492279052734375, 0.0886077880859375, 0.09229278564453125, 0.095977783203125, 0.09966278076171875, 0.1033477783203125, 0.10703277587890625, 0.1107177734375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 10.0, 18.0, 33.0, 85.0, 160.0, 197.0, 215.0, 144.0, 82.0, 35.0, 15.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5483378171920776, -0.5134613513946533, -0.4785849153995514, -0.4437084496021271, -0.40883201360702515, -0.37395554780960083, -0.3390790820121765, -0.3042026162147522, -0.26932618021965027, -0.23444972932338715, -0.19957327842712402, -0.1646968126296997, -0.12982036173343658, -0.09494391083717346, -0.060067445039749146, -0.025190994143486023, 0.0096854567527771, 0.04456191137433052, 0.07943836599588394, 0.11431482434272766, 0.14919127523899078, 0.1840677261352539, 0.21894419193267822, 0.25382065773010254, 0.28869709372520447, 0.3235735595226288, 0.3584499955177307, 0.39332646131515503, 0.42820292711257935, 0.4630793631076813, 0.4979558289051056, 0.5328322649002075, 0.5677087306976318, 0.6025851964950562, 0.6374616622924805, 0.6723381280899048, 0.7072145342826843, 0.7420910000801086, 0.776967465877533, 0.8118439316749573, 0.8467203378677368, 0.8815968036651611, 0.9164732694625854, 0.9513497352600098, 0.9862261414527893, 1.0211026668548584, 1.0559790134429932, 1.0908554792404175, 1.1257319450378418, 1.1606084108352661, 1.1954848766326904, 1.2303613424301147, 1.265237808227539, 1.3001141548156738, 1.3349907398223877, 1.3698670864105225, 1.4047436714172363, 1.4396201372146606, 1.474496603012085, 1.5093730688095093, 1.5442495346069336, 1.5791258811950684, 1.6140024662017822, 1.648878812789917, 1.6837552785873413]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 4.0, 11.0, 5.0, 9.0, 10.0, 14.0, 18.0, 26.0, 32.0, 32.0, 22.0, 34.0, 33.0, 33.0, 45.0, 47.0, 51.0, 39.0, 37.0, 47.0, 31.0, 56.0, 38.0, 40.0, 39.0, 34.0, 32.0, 28.0, 22.0, 21.0, 18.0, 21.0, 11.0, 14.0, 10.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.37145864963531494, -0.3599833846092224, -0.3485080897808075, -0.33703282475471497, -0.32555752992630005, -0.3140822649002075, -0.302606999874115, -0.2911317050457001, -0.27965644001960754, -0.268181174993515, -0.2567058801651001, -0.24523061513900757, -0.23375533521175385, -0.22228005528450012, -0.2108047753572464, -0.19932949542999268, -0.18785421550273895, -0.17637893557548523, -0.1649036556482315, -0.15342837572097778, -0.14195311069488525, -0.13047783076763153, -0.11900255084037781, -0.10752727836370468, -0.09605199843645096, -0.08457671850919724, -0.07310144603252411, -0.061626166105270386, -0.05015088990330696, -0.038675613701343536, -0.027200333774089813, -0.015725061297416687, -0.004249781370162964, 0.007225495763123035, 0.018700772896409035, 0.03017605096101761, 0.04165132716298103, 0.05312660336494446, 0.06460188329219818, 0.07607715576887131, 0.08755243569612503, 0.09902771562337875, 0.11050298810005188, 0.1219782680273056, 0.13345354795455933, 0.14492881298065186, 0.15640410780906677, 0.1678793728351593, 0.17935465276241302, 0.19082993268966675, 0.20230521261692047, 0.2137804925441742, 0.22525575757026672, 0.23673103749752045, 0.24820631742477417, 0.2596815824508667, 0.2711568772792816, 0.28263214230537415, 0.29410743713378906, 0.3055827021598816, 0.3170579969882965, 0.32853326201438904, 0.34000855684280396, 0.3514838218688965, 0.362959086894989]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 11.0, 25.0, 32.0, 40.0, 66.0, 96.0, 165.0, 260.0, 465.0, 746.0, 1374.0, 2547.0, 5176.0, 11158.0, 25411.0, 65155.0, 189160.0, 443216.0, 189920.0, 65793.0, 25719.0, 10900.0, 5176.0, 2557.0, 1403.0, 776.0, 435.0, 261.0, 180.0, 101.0, 81.0, 45.0, 40.0, 27.0, 8.0, 8.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2462158203125, -0.23928070068359375, -0.2323455810546875, -0.22541046142578125, -0.218475341796875, -0.21154022216796875, -0.2046051025390625, -0.19766998291015625, -0.19073486328125, -0.18379974365234375, -0.1768646240234375, -0.16992950439453125, -0.162994384765625, -0.15605926513671875, -0.1491241455078125, -0.14218902587890625, -0.13525390625, -0.12831878662109375, -0.1213836669921875, -0.11444854736328125, -0.107513427734375, -0.10057830810546875, -0.0936431884765625, -0.08670806884765625, -0.07977294921875, -0.07283782958984375, -0.0659027099609375, -0.05896759033203125, -0.052032470703125, -0.04509735107421875, -0.0381622314453125, -0.03122711181640625, -0.0242919921875, -0.01735687255859375, -0.0104217529296875, -0.00348663330078125, 0.003448486328125, 0.01038360595703125, 0.0173187255859375, 0.02425384521484375, 0.03118896484375, 0.03812408447265625, 0.0450592041015625, 0.05199432373046875, 0.058929443359375, 0.06586456298828125, 0.0727996826171875, 0.07973480224609375, 0.086669921875, 0.09360504150390625, 0.1005401611328125, 0.10747528076171875, 0.114410400390625, 0.12134552001953125, 0.1282806396484375, 0.13521575927734375, 0.14215087890625, 0.14908599853515625, 0.1560211181640625, 0.16295623779296875, 0.169891357421875, 0.17682647705078125, 0.1837615966796875, 0.19069671630859375, 0.1976318359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 7.0, 7.0, 7.0, 8.0, 16.0, 16.0, 23.0, 21.0, 21.0, 31.0, 39.0, 58.0, 46.0, 63.0, 60.0, 59.0, 57.0, 46.0, 50.0, 49.0, 61.0, 46.0, 48.0, 31.0, 30.0, 23.0, 18.0, 11.0, 11.0, 12.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.062255859375, -0.060442447662353516, -0.05862903594970703, -0.05681562423706055, -0.05500221252441406, -0.05318880081176758, -0.051375389099121094, -0.04956197738647461, -0.047748565673828125, -0.04593515396118164, -0.044121742248535156, -0.04230833053588867, -0.04049491882324219, -0.0386815071105957, -0.03686809539794922, -0.035054683685302734, -0.03324127197265625, -0.031427860260009766, -0.02961444854736328, -0.027801036834716797, -0.025987625122070312, -0.024174213409423828, -0.022360801696777344, -0.02054738998413086, -0.018733978271484375, -0.01692056655883789, -0.015107154846191406, -0.013293743133544922, -0.011480331420898438, -0.009666919708251953, -0.007853507995605469, -0.006040096282958984, -0.0042266845703125, -0.0024132728576660156, -0.0005998611450195312, 0.0012135505676269531, 0.0030269622802734375, 0.004840373992919922, 0.006653785705566406, 0.00846719741821289, 0.010280609130859375, 0.01209402084350586, 0.013907432556152344, 0.015720844268798828, 0.017534255981445312, 0.019347667694091797, 0.02116107940673828, 0.022974491119384766, 0.02478790283203125, 0.026601314544677734, 0.02841472625732422, 0.030228137969970703, 0.03204154968261719, 0.03385496139526367, 0.035668373107910156, 0.03748178482055664, 0.039295196533203125, 0.04110860824584961, 0.042922019958496094, 0.04473543167114258, 0.04654884338378906, 0.04836225509643555, 0.05017566680908203, 0.051989078521728516, 0.053802490234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 24.0, 41.0, 51.0, 98.0, 196.0, 311.0, 630.0, 1662.0, 5582.0, 37622.0, 536430.0, 427184.0, 31050.0, 4848.0, 1455.0, 589.0, 317.0, 179.0, 105.0, 61.0, 35.0, 30.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59326171875, -0.5784149169921875, -0.563568115234375, -0.5487213134765625, -0.53387451171875, -0.5190277099609375, -0.504180908203125, -0.4893341064453125, -0.4744873046875, -0.4596405029296875, -0.444793701171875, -0.4299468994140625, -0.41510009765625, -0.4002532958984375, -0.385406494140625, -0.3705596923828125, -0.355712890625, -0.3408660888671875, -0.326019287109375, -0.3111724853515625, -0.29632568359375, -0.2814788818359375, -0.266632080078125, -0.2517852783203125, -0.2369384765625, -0.2220916748046875, -0.207244873046875, -0.1923980712890625, -0.17755126953125, -0.1627044677734375, -0.147857666015625, -0.1330108642578125, -0.1181640625, -0.1033172607421875, -0.088470458984375, -0.0736236572265625, -0.05877685546875, -0.0439300537109375, -0.029083251953125, -0.0142364501953125, 0.0006103515625, 0.0154571533203125, 0.030303955078125, 0.0451507568359375, 0.05999755859375, 0.0748443603515625, 0.089691162109375, 0.1045379638671875, 0.119384765625, 0.1342315673828125, 0.149078369140625, 0.1639251708984375, 0.17877197265625, 0.1936187744140625, 0.208465576171875, 0.2233123779296875, 0.2381591796875, 0.2530059814453125, 0.267852783203125, 0.2826995849609375, 0.29754638671875, 0.3123931884765625, 0.327239990234375, 0.3420867919921875, 0.35693359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 13.0, 13.0, 18.0, 18.0, 21.0, 24.0, 33.0, 40.0, 41.0, 62.0, 53.0, 68.0, 64.0, 78.0, 73.0, 62.0, 63.0, 61.0, 36.0, 32.0, 24.0, 27.0, 22.0, 13.0, 17.0, 8.0, 1.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39111328125, -0.38060760498046875, -0.3701019287109375, -0.35959625244140625, -0.349090576171875, -0.33858489990234375, -0.3280792236328125, -0.31757354736328125, -0.30706787109375, -0.29656219482421875, -0.2860565185546875, -0.27555084228515625, -0.265045166015625, -0.25453948974609375, -0.2440338134765625, -0.23352813720703125, -0.2230224609375, -0.21251678466796875, -0.2020111083984375, -0.19150543212890625, -0.180999755859375, -0.17049407958984375, -0.1599884033203125, -0.14948272705078125, -0.13897705078125, -0.12847137451171875, -0.1179656982421875, -0.10746002197265625, -0.096954345703125, -0.08644866943359375, -0.0759429931640625, -0.06543731689453125, -0.054931640625, -0.04442596435546875, -0.0339202880859375, -0.02341461181640625, -0.012908935546875, -0.00240325927734375, 0.0081024169921875, 0.01860809326171875, 0.02911376953125, 0.03961944580078125, 0.0501251220703125, 0.06063079833984375, 0.071136474609375, 0.08164215087890625, 0.0921478271484375, 0.10265350341796875, 0.1131591796875, 0.12366485595703125, 0.1341705322265625, 0.14467620849609375, 0.155181884765625, 0.16568756103515625, 0.1761932373046875, 0.18669891357421875, 0.19720458984375, 0.20771026611328125, 0.2182159423828125, 0.22872161865234375, 0.239227294921875, 0.24973297119140625, 0.2602386474609375, 0.27074432373046875, 0.28125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 12.0, 9.0, 19.0, 16.0, 27.0, 46.0, 53.0, 86.0, 157.0, 222.0, 376.0, 645.0, 1117.0, 2098.0, 4073.0, 8570.0, 20785.0, 59727.0, 255209.0, 528501.0, 108666.0, 33256.0, 12731.0, 5771.0, 2797.0, 1462.0, 790.0, 459.0, 299.0, 186.0, 125.0, 72.0, 56.0, 41.0, 26.0, 15.0, 19.0, 8.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1690673828125, -0.16365432739257812, -0.15824127197265625, -0.15282821655273438, -0.1474151611328125, -0.14200210571289062, -0.13658905029296875, -0.13117599487304688, -0.125762939453125, -0.12034988403320312, -0.11493682861328125, -0.10952377319335938, -0.1041107177734375, -0.09869766235351562, -0.09328460693359375, -0.08787155151367188, -0.08245849609375, -0.07704544067382812, -0.07163238525390625, -0.06621932983398438, -0.0608062744140625, -0.055393218994140625, -0.04998016357421875, -0.044567108154296875, -0.039154052734375, -0.033740997314453125, -0.02832794189453125, -0.022914886474609375, -0.0175018310546875, -0.012088775634765625, -0.00667572021484375, -0.001262664794921875, 0.004150390625, 0.009563446044921875, 0.01497650146484375, 0.020389556884765625, 0.0258026123046875, 0.031215667724609375, 0.03662872314453125, 0.042041778564453125, 0.047454833984375, 0.052867889404296875, 0.05828094482421875, 0.06369400024414062, 0.0691070556640625, 0.07452011108398438, 0.07993316650390625, 0.08534622192382812, 0.09075927734375, 0.09617233276367188, 0.10158538818359375, 0.10699844360351562, 0.1124114990234375, 0.11782455444335938, 0.12323760986328125, 0.12865066528320312, 0.134063720703125, 0.13947677612304688, 0.14488983154296875, 0.15030288696289062, 0.1557159423828125, 0.16112899780273438, 0.16654205322265625, 0.17195510864257812, 0.1773681640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 11.0, 14.0, 14.0, 15.0, 34.0, 27.0, 37.0, 45.0, 65.0, 89.0, 78.0, 93.0, 73.0, 81.0, 57.0, 46.0, 45.0, 38.0, 29.0, 16.0, 17.0, 8.0, 8.0, 5.0, 4.0, 8.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6253204345703125e-05, -4.484318196773529e-05, -4.3433159589767456e-05, -4.202313721179962e-05, -4.061311483383179e-05, -3.920309245586395e-05, -3.779307007789612e-05, -3.6383047699928284e-05, -3.497302532196045e-05, -3.3563002943992615e-05, -3.215298056602478e-05, -3.0742958188056946e-05, -2.933293581008911e-05, -2.7922913432121277e-05, -2.6512891054153442e-05, -2.5102868676185608e-05, -2.3692846298217773e-05, -2.228282392024994e-05, -2.0872801542282104e-05, -1.946277916431427e-05, -1.8052756786346436e-05, -1.66427344083786e-05, -1.5232712030410767e-05, -1.3822689652442932e-05, -1.2412667274475098e-05, -1.1002644896507263e-05, -9.592622518539429e-06, -8.182600140571594e-06, -6.77257776260376e-06, -5.362555384635925e-06, -3.952533006668091e-06, -2.5425106287002563e-06, -1.1324882507324219e-06, 2.775341272354126e-07, 1.687556505203247e-06, 3.0975788831710815e-06, 4.507601261138916e-06, 5.9176236391067505e-06, 7.327646017074585e-06, 8.73766839504242e-06, 1.0147690773010254e-05, 1.1557713150978088e-05, 1.2967735528945923e-05, 1.4377757906913757e-05, 1.5787780284881592e-05, 1.7197802662849426e-05, 1.860782504081726e-05, 2.0017847418785095e-05, 2.142786979675293e-05, 2.2837892174720764e-05, 2.42479145526886e-05, 2.5657936930656433e-05, 2.7067959308624268e-05, 2.8477981686592102e-05, 2.9888004064559937e-05, 3.129802644252777e-05, 3.2708048820495605e-05, 3.411807119846344e-05, 3.5528093576431274e-05, 3.693811595439911e-05, 3.834813833236694e-05, 3.975816071033478e-05, 4.116818308830261e-05, 4.257820546627045e-05, 4.398822784423828e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 15.0, 12.0, 33.0, 45.0, 69.0, 128.0, 247.0, 538.0, 1144.0, 3510.0, 13660.0, 82022.0, 768987.0, 149718.0, 20816.0, 4770.0, 1505.0, 628.0, 300.0, 164.0, 78.0, 66.0, 39.0, 16.0, 7.0, 2.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.26918792724609375, -0.2590789794921875, -0.24897003173828125, -0.238861083984375, -0.22875213623046875, -0.2186431884765625, -0.20853424072265625, -0.19842529296875, -0.18831634521484375, -0.1782073974609375, -0.16809844970703125, -0.157989501953125, -0.14788055419921875, -0.1377716064453125, -0.12766265869140625, -0.1175537109375, -0.10744476318359375, -0.0973358154296875, -0.08722686767578125, -0.077117919921875, -0.06700897216796875, -0.0569000244140625, -0.04679107666015625, -0.03668212890625, -0.02657318115234375, -0.0164642333984375, -0.00635528564453125, 0.003753662109375, 0.01386260986328125, 0.0239715576171875, 0.03408050537109375, 0.044189453125, 0.05429840087890625, 0.0644073486328125, 0.07451629638671875, 0.084625244140625, 0.09473419189453125, 0.1048431396484375, 0.11495208740234375, 0.12506103515625, 0.13516998291015625, 0.1452789306640625, 0.15538787841796875, 0.165496826171875, 0.17560577392578125, 0.1857147216796875, 0.19582366943359375, 0.2059326171875, 0.21604156494140625, 0.2261505126953125, 0.23625946044921875, 0.246368408203125, 0.25647735595703125, 0.2665863037109375, 0.27669525146484375, 0.28680419921875, 0.29691314697265625, 0.3070220947265625, 0.31713104248046875, 0.327239990234375, 0.33734893798828125, 0.3474578857421875, 0.35756683349609375, 0.36767578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 3.0, 9.0, 13.0, 10.0, 8.0, 24.0, 10.0, 26.0, 30.0, 54.0, 66.0, 107.0, 130.0, 111.0, 79.0, 67.0, 45.0, 39.0, 26.0, 20.0, 16.0, 11.0, 14.0, 12.0, 11.0, 10.0, 5.0, 0.0, 2.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142822265625, -0.13818931579589844, -0.13355636596679688, -0.1289234161376953, -0.12429046630859375, -0.11965751647949219, -0.11502456665039062, -0.11039161682128906, -0.1057586669921875, -0.10112571716308594, -0.09649276733398438, -0.09185981750488281, -0.08722686767578125, -0.08259391784667969, -0.07796096801757812, -0.07332801818847656, -0.068695068359375, -0.06406211853027344, -0.059429168701171875, -0.05479621887207031, -0.05016326904296875, -0.04553031921386719, -0.040897369384765625, -0.03626441955566406, -0.0316314697265625, -0.026998519897460938, -0.022365570068359375, -0.017732620239257812, -0.01309967041015625, -0.008466720581054688, -0.003833770751953125, 0.0007991790771484375, 0.00543212890625, 0.010065078735351562, 0.014698028564453125, 0.019330978393554688, 0.02396392822265625, 0.028596878051757812, 0.033229827880859375, 0.03786277770996094, 0.0424957275390625, 0.04712867736816406, 0.051761627197265625, 0.05639457702636719, 0.06102752685546875, 0.06566047668457031, 0.07029342651367188, 0.07492637634277344, 0.079559326171875, 0.08419227600097656, 0.08882522583007812, 0.09345817565917969, 0.09809112548828125, 0.10272407531738281, 0.10735702514648438, 0.11198997497558594, 0.1166229248046875, 0.12125587463378906, 0.12588882446289062, 0.1305217742919922, 0.13515472412109375, 0.1397876739501953, 0.14442062377929688, 0.14905357360839844, 0.1536865234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 11.0, 16.0, 19.0, 47.0, 67.0, 85.0, 139.0, 140.0, 141.0, 116.0, 93.0, 46.0, 38.0, 21.0, 8.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.738926649093628, -1.6743013858795166, -1.6096762418746948, -1.5450509786605835, -1.4804257154464722, -1.4158005714416504, -1.351175308227539, -1.2865500450134277, -1.2219247817993164, -1.157299518585205, -1.0926743745803833, -1.028049111366272, -0.9634238481521606, -0.8987986445426941, -0.8341734409332275, -0.7695481777191162, -0.7049230337142944, -0.6402978301048279, -0.5756725668907166, -0.51104736328125, -0.44642212986946106, -0.3817968964576721, -0.31717169284820557, -0.2525464594364166, -0.18792122602462769, -0.12329600006341934, -0.058670774102211, 0.005954444408416748, 0.07057967782020569, 0.13520491123199463, 0.19983011484146118, 0.2644553482532501, 0.32908058166503906, 0.393705815076828, 0.45833104848861694, 0.5229562520980835, 0.5875815153121948, 0.6522067189216614, 0.7168319225311279, 0.7814571857452393, 0.8460823893547058, 0.9107075929641724, 0.9753328561782837, 1.0399580001831055, 1.1045832633972168, 1.1692085266113281, 1.2338337898254395, 1.2984589338302612, 1.3630841970443726, 1.4277094602584839, 1.4923346042633057, 1.556959867477417, 1.6215851306915283, 1.6862103939056396, 1.7508355379104614, 1.8154608011245728, 1.8800859451293945, 1.9447112083435059, 2.009336471557617, 2.0739617347717285, 2.1385867595672607, 2.203212022781372, 2.2678372859954834, 2.3324625492095947, 2.397087812423706]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 7.0, 7.0, 10.0, 11.0, 19.0, 21.0, 21.0, 19.0, 27.0, 24.0, 49.0, 41.0, 50.0, 40.0, 56.0, 54.0, 48.0, 52.0, 44.0, 37.0, 58.0, 32.0, 49.0, 36.0, 35.0, 26.0, 23.0, 18.0, 20.0, 14.0, 6.0, 4.0, 4.0, 9.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6430422067642212, -1.598127841949463, -1.5532134771347046, -1.5082991123199463, -1.4633848667144775, -1.4184705018997192, -1.373556137084961, -1.3286417722702026, -1.2837274074554443, -1.238813042640686, -1.1938986778259277, -1.1489843130111694, -1.1040699481964111, -1.0591557025909424, -1.014241337776184, -0.9693269729614258, -0.9244126081466675, -0.8794982433319092, -0.8345838785171509, -0.7896695733070374, -0.744755208492279, -0.6998408436775208, -0.6549265384674072, -0.6100121736526489, -0.5650978088378906, -0.5201834440231323, -0.4752691090106964, -0.4303547739982605, -0.3854404091835022, -0.3405260443687439, -0.295611709356308, -0.25069737434387207, -0.20578312873840332, -0.1608687788248062, -0.1159544289112091, -0.071040078997612, -0.026125729084014893, 0.018788620829582214, 0.06370297074317932, 0.10861730575561523, 0.15353167057037354, 0.19844602048397064, 0.24336037039756775, 0.28827470541000366, 0.33318907022476196, 0.37810343503952026, 0.4230177700519562, 0.4679321050643921, 0.5128464698791504, 0.5577608346939087, 0.602675199508667, 0.6475895047187805, 0.6925038695335388, 0.7374182343482971, 0.7823325395584106, 0.827246904373169, 0.8721612691879272, 0.9170756340026855, 0.9619899988174438, 1.0069043636322021, 1.051818609237671, 1.0967329740524292, 1.1416473388671875, 1.1865617036819458, 1.231476068496704]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 10.0, 11.0, 15.0, 23.0, 35.0, 49.0, 84.0, 128.0, 211.0, 324.0, 555.0, 1033.0, 1958.0, 4029.0, 9137.0, 25165.0, 91019.0, 2496218.0, 1437920.0, 85717.0, 23669.0, 8874.0, 3799.0, 1866.0, 978.0, 557.0, 303.0, 182.0, 125.0, 81.0, 58.0, 36.0, 31.0, 19.0, 15.0, 13.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2452392578125, -0.2370586395263672, -0.22887802124023438, -0.22069740295410156, -0.21251678466796875, -0.20433616638183594, -0.19615554809570312, -0.1879749298095703, -0.1797943115234375, -0.1716136932373047, -0.16343307495117188, -0.15525245666503906, -0.14707183837890625, -0.13889122009277344, -0.13071060180664062, -0.12252998352050781, -0.114349365234375, -0.10616874694824219, -0.09798812866210938, -0.08980751037597656, -0.08162689208984375, -0.07344627380371094, -0.06526565551757812, -0.05708503723144531, -0.0489044189453125, -0.04072380065917969, -0.032543182373046875, -0.024362564086914062, -0.01618194580078125, -0.008001327514648438, 0.000179290771484375, 0.008359909057617188, 0.01654052734375, 0.024721145629882812, 0.032901763916015625, 0.04108238220214844, 0.04926300048828125, 0.05744361877441406, 0.06562423706054688, 0.07380485534667969, 0.0819854736328125, 0.09016609191894531, 0.09834671020507812, 0.10652732849121094, 0.11470794677734375, 0.12288856506347656, 0.13106918334960938, 0.1392498016357422, 0.147430419921875, 0.1556110382080078, 0.16379165649414062, 0.17197227478027344, 0.18015289306640625, 0.18833351135253906, 0.19651412963867188, 0.2046947479248047, 0.2128753662109375, 0.2210559844970703, 0.22923660278320312, 0.23741722106933594, 0.24559783935546875, 0.25377845764160156, 0.2619590759277344, 0.2701396942138672, 0.2783203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 17.0, 14.0, 18.0, 22.0, 24.0, 25.0, 32.0, 49.0, 47.0, 54.0, 55.0, 77.0, 58.0, 63.0, 68.0, 60.0, 53.0, 58.0, 46.0, 29.0, 25.0, 29.0, 21.0, 13.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06298828125, -0.06085777282714844, -0.058727264404296875, -0.05659675598144531, -0.05446624755859375, -0.05233573913574219, -0.050205230712890625, -0.04807472229003906, -0.0459442138671875, -0.04381370544433594, -0.041683197021484375, -0.03955268859863281, -0.03742218017578125, -0.03529167175292969, -0.033161163330078125, -0.031030654907226562, -0.028900146484375, -0.026769638061523438, -0.024639129638671875, -0.022508621215820312, -0.02037811279296875, -0.018247604370117188, -0.016117095947265625, -0.013986587524414062, -0.0118560791015625, -0.009725570678710938, -0.007595062255859375, -0.0054645538330078125, -0.00333404541015625, -0.0012035369873046875, 0.000926971435546875, 0.0030574798583984375, 0.00518798828125, 0.0073184967041015625, 0.009449005126953125, 0.011579513549804688, 0.01371002197265625, 0.015840530395507812, 0.017971038818359375, 0.020101547241210938, 0.0222320556640625, 0.024362564086914062, 0.026493072509765625, 0.028623580932617188, 0.03075408935546875, 0.03288459777832031, 0.035015106201171875, 0.03714561462402344, 0.039276123046875, 0.04140663146972656, 0.043537139892578125, 0.04566764831542969, 0.04779815673828125, 0.04992866516113281, 0.052059173583984375, 0.05418968200683594, 0.0563201904296875, 0.05845069885253906, 0.060581207275390625, 0.06271171569824219, 0.06484222412109375, 0.06697273254394531, 0.06910324096679688, 0.07123374938964844, 0.0733642578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 16.0, 11.0, 17.0, 36.0, 46.0, 66.0, 86.0, 183.0, 391.0, 783.0, 1946.0, 5259.0, 16393.0, 67744.0, 599282.0, 3329645.0, 131783.0, 27636.0, 8037.0, 2818.0, 1079.0, 431.0, 225.0, 139.0, 71.0, 46.0, 35.0, 24.0, 10.0, 11.0, 6.0, 5.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.430908203125, -0.41991424560546875, -0.4089202880859375, -0.39792633056640625, -0.386932373046875, -0.37593841552734375, -0.3649444580078125, -0.35395050048828125, -0.34295654296875, -0.33196258544921875, -0.3209686279296875, -0.30997467041015625, -0.298980712890625, -0.28798675537109375, -0.2769927978515625, -0.26599884033203125, -0.2550048828125, -0.24401092529296875, -0.2330169677734375, -0.22202301025390625, -0.211029052734375, -0.20003509521484375, -0.1890411376953125, -0.17804718017578125, -0.16705322265625, -0.15605926513671875, -0.1450653076171875, -0.13407135009765625, -0.123077392578125, -0.11208343505859375, -0.1010894775390625, -0.09009552001953125, -0.0791015625, -0.06810760498046875, -0.0571136474609375, -0.04611968994140625, -0.035125732421875, -0.02413177490234375, -0.0131378173828125, -0.00214385986328125, 0.00885009765625, 0.01984405517578125, 0.0308380126953125, 0.04183197021484375, 0.052825927734375, 0.06381988525390625, 0.0748138427734375, 0.08580780029296875, 0.0968017578125, 0.10779571533203125, 0.1187896728515625, 0.12978363037109375, 0.140777587890625, 0.15177154541015625, 0.1627655029296875, 0.17375946044921875, 0.18475341796875, 0.19574737548828125, 0.2067413330078125, 0.21773529052734375, 0.228729248046875, 0.23972320556640625, 0.2507171630859375, 0.26171112060546875, 0.272705078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 4.0, 8.0, 6.0, 10.0, 15.0, 14.0, 34.0, 38.0, 72.0, 102.0, 163.0, 369.0, 1721.0, 845.0, 288.0, 114.0, 88.0, 58.0, 34.0, 21.0, 25.0, 16.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2093505859375, -0.20434284210205078, -0.19933509826660156, -0.19432735443115234, -0.18931961059570312, -0.1843118667602539, -0.1793041229248047, -0.17429637908935547, -0.16928863525390625, -0.16428089141845703, -0.1592731475830078, -0.1542654037475586, -0.14925765991210938, -0.14424991607666016, -0.13924217224121094, -0.13423442840576172, -0.1292266845703125, -0.12421894073486328, -0.11921119689941406, -0.11420345306396484, -0.10919570922851562, -0.1041879653930664, -0.09918022155761719, -0.09417247772216797, -0.08916473388671875, -0.08415699005126953, -0.07914924621582031, -0.0741415023803711, -0.06913375854492188, -0.06412601470947266, -0.05911827087402344, -0.05411052703857422, -0.049102783203125, -0.04409503936767578, -0.03908729553222656, -0.034079551696777344, -0.029071807861328125, -0.024064064025878906, -0.019056320190429688, -0.014048576354980469, -0.00904083251953125, -0.004033088684082031, 0.0009746551513671875, 0.005982398986816406, 0.010990142822265625, 0.015997886657714844, 0.021005630493164062, 0.02601337432861328, 0.0310211181640625, 0.03602886199951172, 0.04103660583496094, 0.046044349670410156, 0.051052093505859375, 0.056059837341308594, 0.06106758117675781, 0.06607532501220703, 0.07108306884765625, 0.07609081268310547, 0.08109855651855469, 0.0861063003540039, 0.09111404418945312, 0.09612178802490234, 0.10112953186035156, 0.10613727569580078, 0.11114501953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 11.0, 16.0, 55.0, 148.0, 283.0, 251.0, 156.0, 54.0, 23.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.73797869682312, -2.681168556213379, -2.6243584156036377, -2.5675482749938965, -2.5107381343841553, -2.453927993774414, -2.397117853164673, -2.3403077125549316, -2.2834973335266113, -2.22668719291687, -2.169877052307129, -2.1130669116973877, -2.0562567710876465, -1.9994466304779053, -1.9426363706588745, -1.8858262300491333, -1.8290162086486816, -1.7722060680389404, -1.7153959274291992, -1.658585786819458, -1.6017756462097168, -1.5449655055999756, -1.4881552457809448, -1.4313451051712036, -1.3745349645614624, -1.3177248239517212, -1.26091468334198, -1.2041045427322388, -1.147294282913208, -1.0904841423034668, -1.0336740016937256, -0.9768638610839844, -0.9200537800788879, -0.8632436394691467, -0.8064334392547607, -0.7496232986450195, -0.6928131580352783, -0.6360030174255371, -0.5791928768157959, -0.5223826766014099, -0.4655725359916687, -0.4087623953819275, -0.3519522249698639, -0.2951420545578003, -0.23833191394805908, -0.18152177333831787, -0.12471160292625427, -0.06790143251419067, -0.011091291904449463, 0.04571886360645294, 0.10252901911735535, 0.15933917462825775, 0.21614933013916016, 0.27295947074890137, 0.32976964116096497, 0.38657981157302856, 0.4433899521827698, 0.500200092792511, 0.557010293006897, 0.6138204336166382, 0.6706305742263794, 0.7274407148361206, 0.7842508554458618, 0.8410610556602478, 0.897871196269989]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 22.0, 33.0, 42.0, 41.0, 54.0, 58.0, 70.0, 70.0, 65.0, 64.0, 68.0, 63.0, 59.0, 56.0, 48.0, 42.0, 24.0, 31.0, 28.0, 11.0, 11.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8174375295639038, -0.7941892743110657, -0.7709410190582275, -0.7476927042007446, -0.7244444489479065, -0.7011961936950684, -0.6779479384422302, -0.6546996831893921, -0.6314513683319092, -0.608203113079071, -0.5849548578262329, -0.56170654296875, -0.5384582877159119, -0.5152100324630737, -0.4919617772102356, -0.46871352195739746, -0.4454652667045593, -0.4222170114517212, -0.39896872639656067, -0.37572047114372253, -0.352472186088562, -0.3292239308357239, -0.30597567558288574, -0.2827274203300476, -0.2594791352748871, -0.23623086512088776, -0.21298259496688843, -0.1897343397140503, -0.16648606956005096, -0.14323779940605164, -0.1199895441532135, -0.09674127399921417, -0.07349306344985962, -0.05024479702115059, -0.02699653059244156, -0.003748267889022827, 0.0195000022649765, 0.04274827241897583, 0.06599652767181396, 0.0892447978258133, 0.11249306797981262, 0.13574133813381195, 0.15898960828781128, 0.18223786354064941, 0.20548613369464874, 0.22873440384864807, 0.2519826591014862, 0.27523094415664673, 0.29847919940948486, 0.321727454662323, 0.3449757397174835, 0.36822399497032166, 0.3914722800254822, 0.4147205352783203, 0.43796879053115845, 0.4612170457839966, 0.4844653308391571, 0.5077136158943176, 0.5309618711471558, 0.5542101263999939, 0.577458381652832, 0.6007066965103149, 0.6239548921585083, 0.6472032070159912, 0.6704514622688293]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 15.0, 31.0, 27.0, 56.0, 90.0, 114.0, 163.0, 292.0, 446.0, 800.0, 1294.0, 2353.0, 4379.0, 8584.0, 17701.0, 38781.0, 102292.0, 524241.0, 233138.0, 61435.0, 26391.0, 12223.0, 6098.0, 3234.0, 1790.0, 987.0, 567.0, 361.0, 246.0, 124.0, 84.0, 63.0, 51.0, 34.0, 19.0, 5.0, 12.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21329116821289062, -0.20612335205078125, -0.19895553588867188, -0.1917877197265625, -0.18461990356445312, -0.17745208740234375, -0.17028427124023438, -0.163116455078125, -0.15594863891601562, -0.14878082275390625, -0.14161300659179688, -0.1344451904296875, -0.12727737426757812, -0.12010955810546875, -0.11294174194335938, -0.10577392578125, -0.09860610961914062, -0.09143829345703125, -0.08427047729492188, -0.0771026611328125, -0.06993484497070312, -0.06276702880859375, -0.055599212646484375, -0.048431396484375, -0.041263580322265625, -0.03409576416015625, -0.026927947998046875, -0.0197601318359375, -0.012592315673828125, -0.00542449951171875, 0.001743316650390625, 0.0089111328125, 0.016078948974609375, 0.02324676513671875, 0.030414581298828125, 0.0375823974609375, 0.044750213623046875, 0.05191802978515625, 0.059085845947265625, 0.066253662109375, 0.07342147827148438, 0.08058929443359375, 0.08775711059570312, 0.0949249267578125, 0.10209274291992188, 0.10926055908203125, 0.11642837524414062, 0.12359619140625, 0.13076400756835938, 0.13793182373046875, 0.14509963989257812, 0.1522674560546875, 0.15943527221679688, 0.16660308837890625, 0.17377090454101562, 0.180938720703125, 0.18810653686523438, 0.19527435302734375, 0.20244216918945312, 0.2096099853515625, 0.21677780151367188, 0.22394561767578125, 0.23111343383789062, 0.23828125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 8.0, 6.0, 16.0, 10.0, 23.0, 14.0, 19.0, 25.0, 32.0, 27.0, 31.0, 34.0, 41.0, 50.0, 42.0, 46.0, 47.0, 66.0, 43.0, 39.0, 53.0, 45.0, 40.0, 49.0, 35.0, 26.0, 30.0, 17.0, 13.0, 15.0, 10.0, 10.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.056243896484375, -0.0545191764831543, -0.052794456481933594, -0.05106973648071289, -0.04934501647949219, -0.047620296478271484, -0.04589557647705078, -0.04417085647583008, -0.042446136474609375, -0.04072141647338867, -0.03899669647216797, -0.037271976470947266, -0.03554725646972656, -0.03382253646850586, -0.032097816467285156, -0.030373096466064453, -0.02864837646484375, -0.026923656463623047, -0.025198936462402344, -0.02347421646118164, -0.021749496459960938, -0.020024776458740234, -0.01830005645751953, -0.016575336456298828, -0.014850616455078125, -0.013125896453857422, -0.011401176452636719, -0.009676456451416016, -0.007951736450195312, -0.006227016448974609, -0.004502296447753906, -0.002777576446533203, -0.0010528564453125, 0.0006718635559082031, 0.0023965835571289062, 0.004121303558349609, 0.0058460235595703125, 0.007570743560791016, 0.009295463562011719, 0.011020183563232422, 0.012744903564453125, 0.014469623565673828, 0.01619434356689453, 0.017919063568115234, 0.019643783569335938, 0.02136850357055664, 0.023093223571777344, 0.024817943572998047, 0.02654266357421875, 0.028267383575439453, 0.029992103576660156, 0.03171682357788086, 0.03344154357910156, 0.035166263580322266, 0.03689098358154297, 0.03861570358276367, 0.040340423583984375, 0.04206514358520508, 0.04378986358642578, 0.045514583587646484, 0.04723930358886719, 0.04896402359008789, 0.050688743591308594, 0.0524134635925293, 0.05413818359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 9.0, 16.0, 18.0, 43.0, 58.0, 92.0, 173.0, 344.0, 617.0, 1440.0, 5368.0, 30667.0, 480709.0, 489801.0, 30995.0, 5350.0, 1374.0, 688.0, 322.0, 183.0, 127.0, 57.0, 32.0, 23.0, 17.0, 13.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5108909606933594, -0.49492645263671875, -0.4789619445800781, -0.4629974365234375, -0.4470329284667969, -0.43106842041015625, -0.4151039123535156, -0.399139404296875, -0.3831748962402344, -0.36721038818359375, -0.3512458801269531, -0.3352813720703125, -0.3193168640136719, -0.30335235595703125, -0.2873878479003906, -0.27142333984375, -0.2554588317871094, -0.23949432373046875, -0.22352981567382812, -0.2075653076171875, -0.19160079956054688, -0.17563629150390625, -0.15967178344726562, -0.143707275390625, -0.12774276733398438, -0.11177825927734375, -0.09581375122070312, -0.0798492431640625, -0.06388473510742188, -0.04792022705078125, -0.031955718994140625, -0.0159912109375, -2.6702880859375e-05, 0.01593780517578125, 0.031902313232421875, 0.0478668212890625, 0.06383132934570312, 0.07979583740234375, 0.09576034545898438, 0.111724853515625, 0.12768936157226562, 0.14365386962890625, 0.15961837768554688, 0.1755828857421875, 0.19154739379882812, 0.20751190185546875, 0.22347640991210938, 0.23944091796875, 0.2554054260253906, 0.27136993408203125, 0.2873344421386719, 0.3032989501953125, 0.3192634582519531, 0.33522796630859375, 0.3511924743652344, 0.367156982421875, 0.3831214904785156, 0.39908599853515625, 0.4150505065917969, 0.4310150146484375, 0.4469795227050781, 0.46294403076171875, 0.4789085388183594, 0.494873046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 5.0, 5.0, 7.0, 14.0, 18.0, 18.0, 21.0, 26.0, 41.0, 62.0, 56.0, 74.0, 70.0, 70.0, 79.0, 72.0, 72.0, 52.0, 66.0, 40.0, 30.0, 23.0, 17.0, 16.0, 12.0, 11.0, 10.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.423828125, -0.4123382568359375, -0.400848388671875, -0.3893585205078125, -0.37786865234375, -0.3663787841796875, -0.354888916015625, -0.3433990478515625, -0.3319091796875, -0.3204193115234375, -0.308929443359375, -0.2974395751953125, -0.28594970703125, -0.2744598388671875, -0.262969970703125, -0.2514801025390625, -0.239990234375, -0.2285003662109375, -0.217010498046875, -0.2055206298828125, -0.19403076171875, -0.1825408935546875, -0.171051025390625, -0.1595611572265625, -0.1480712890625, -0.1365814208984375, -0.125091552734375, -0.1136016845703125, -0.10211181640625, -0.0906219482421875, -0.079132080078125, -0.0676422119140625, -0.05615234375, -0.0446624755859375, -0.033172607421875, -0.0216827392578125, -0.01019287109375, 0.0012969970703125, 0.012786865234375, 0.0242767333984375, 0.0357666015625, 0.0472564697265625, 0.058746337890625, 0.0702362060546875, 0.08172607421875, 0.0932159423828125, 0.104705810546875, 0.1161956787109375, 0.127685546875, 0.1391754150390625, 0.150665283203125, 0.1621551513671875, 0.17364501953125, 0.1851348876953125, 0.196624755859375, 0.2081146240234375, 0.2196044921875, 0.2310943603515625, 0.242584228515625, 0.2540740966796875, 0.26556396484375, 0.2770538330078125, 0.288543701171875, 0.3000335693359375, 0.3115234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 17.0, 16.0, 30.0, 69.0, 111.0, 163.0, 339.0, 757.0, 1920.0, 5371.0, 19654.0, 590198.0, 403358.0, 18164.0, 5005.0, 1809.0, 732.0, 351.0, 190.0, 109.0, 59.0, 26.0, 43.0, 15.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52001953125, -0.5047149658203125, -0.489410400390625, -0.4741058349609375, -0.45880126953125, -0.4434967041015625, -0.428192138671875, -0.4128875732421875, -0.3975830078125, -0.3822784423828125, -0.366973876953125, -0.3516693115234375, -0.33636474609375, -0.3210601806640625, -0.305755615234375, -0.2904510498046875, -0.275146484375, -0.2598419189453125, -0.244537353515625, -0.2292327880859375, -0.21392822265625, -0.1986236572265625, -0.183319091796875, -0.1680145263671875, -0.1527099609375, -0.1374053955078125, -0.122100830078125, -0.1067962646484375, -0.09149169921875, -0.0761871337890625, -0.060882568359375, -0.0455780029296875, -0.0302734375, -0.0149688720703125, 0.000335693359375, 0.0156402587890625, 0.03094482421875, 0.0462493896484375, 0.061553955078125, 0.0768585205078125, 0.0921630859375, 0.1074676513671875, 0.122772216796875, 0.1380767822265625, 0.15338134765625, 0.1686859130859375, 0.183990478515625, 0.1992950439453125, 0.214599609375, 0.2299041748046875, 0.245208740234375, 0.2605133056640625, 0.27581787109375, 0.2911224365234375, 0.306427001953125, 0.3217315673828125, 0.3370361328125, 0.3523406982421875, 0.367645263671875, 0.3829498291015625, 0.39825439453125, 0.4135589599609375, 0.428863525390625, 0.4441680908203125, 0.45947265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 11.0, 18.0, 31.0, 61.0, 117.0, 218.0, 213.0, 148.0, 73.0, 43.0, 21.0, 13.0, 11.0, 9.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.161233901977539e-05, -8.811336010694504e-05, -8.461438119411469e-05, -8.111540228128433e-05, -7.761642336845398e-05, -7.411744445562363e-05, -7.061846554279327e-05, -6.711948662996292e-05, -6.362050771713257e-05, -6.0121528804302216e-05, -5.662254989147186e-05, -5.312357097864151e-05, -4.962459206581116e-05, -4.6125613152980804e-05, -4.262663424015045e-05, -3.91276553273201e-05, -3.5628676414489746e-05, -3.212969750165939e-05, -2.863071858882904e-05, -2.5131739675998688e-05, -2.1632760763168335e-05, -1.8133781850337982e-05, -1.463480293750763e-05, -1.1135824024677277e-05, -7.636845111846924e-06, -4.137866199016571e-06, -6.388872861862183e-07, 2.8600916266441345e-06, 6.359070539474487e-06, 9.85804945230484e-06, 1.3357028365135193e-05, 1.6856007277965546e-05, 2.03549861907959e-05, 2.385396510362625e-05, 2.7352944016456604e-05, 3.085192292928696e-05, 3.435090184211731e-05, 3.784988075494766e-05, 4.1348859667778015e-05, 4.484783858060837e-05, 4.834681749343872e-05, 5.1845796406269073e-05, 5.5344775319099426e-05, 5.884375423192978e-05, 6.234273314476013e-05, 6.584171205759048e-05, 6.934069097042084e-05, 7.283966988325119e-05, 7.633864879608154e-05, 7.98376277089119e-05, 8.333660662174225e-05, 8.68355855345726e-05, 9.033456444740295e-05, 9.383354336023331e-05, 9.733252227306366e-05, 0.00010083150118589401, 0.00010433048009872437, 0.00010782945901155472, 0.00011132843792438507, 0.00011482741683721542, 0.00011832639575004578, 0.00012182537466287613, 0.00012532435357570648, 0.00012882333248853683, 0.0001323223114013672]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 8.0, 7.0, 11.0, 12.0, 27.0, 27.0, 58.0, 71.0, 127.0, 223.0, 419.0, 795.0, 1909.0, 5176.0, 17029.0, 225274.0, 764033.0, 22752.0, 6262.0, 2294.0, 945.0, 447.0, 261.0, 135.0, 86.0, 45.0, 33.0, 25.0, 24.0, 7.0, 8.0, 5.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5543899536132812, -0.5394439697265625, -0.5244979858398438, -0.509552001953125, -0.49460601806640625, -0.4796600341796875, -0.46471405029296875, -0.44976806640625, -0.43482208251953125, -0.4198760986328125, -0.40493011474609375, -0.389984130859375, -0.37503814697265625, -0.3600921630859375, -0.34514617919921875, -0.3302001953125, -0.31525421142578125, -0.3003082275390625, -0.28536224365234375, -0.270416259765625, -0.25547027587890625, -0.2405242919921875, -0.22557830810546875, -0.21063232421875, -0.19568634033203125, -0.1807403564453125, -0.16579437255859375, -0.150848388671875, -0.13590240478515625, -0.1209564208984375, -0.10601043701171875, -0.091064453125, -0.07611846923828125, -0.0611724853515625, -0.04622650146484375, -0.031280517578125, -0.01633453369140625, -0.0013885498046875, 0.01355743408203125, 0.02850341796875, 0.04344940185546875, 0.0583953857421875, 0.07334136962890625, 0.088287353515625, 0.10323333740234375, 0.1181793212890625, 0.13312530517578125, 0.1480712890625, 0.16301727294921875, 0.1779632568359375, 0.19290924072265625, 0.207855224609375, 0.22280120849609375, 0.2377471923828125, 0.25269317626953125, 0.26763916015625, 0.28258514404296875, 0.2975311279296875, 0.31247711181640625, 0.327423095703125, 0.34236907958984375, 0.3573150634765625, 0.37226104736328125, 0.38720703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 4.0, 3.0, 11.0, 11.0, 14.0, 21.0, 27.0, 49.0, 122.0, 444.0, 139.0, 54.0, 38.0, 18.0, 12.0, 6.0, 8.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.3944816589355469, -0.38368988037109375, -0.3728981018066406, -0.3621063232421875, -0.3513145446777344, -0.34052276611328125, -0.3297309875488281, -0.318939208984375, -0.3081474304199219, -0.29735565185546875, -0.2865638732910156, -0.2757720947265625, -0.2649803161621094, -0.25418853759765625, -0.24339675903320312, -0.23260498046875, -0.22181320190429688, -0.21102142333984375, -0.20022964477539062, -0.1894378662109375, -0.17864608764648438, -0.16785430908203125, -0.15706253051757812, -0.146270751953125, -0.13547897338867188, -0.12468719482421875, -0.11389541625976562, -0.1031036376953125, -0.09231185913085938, -0.08152008056640625, -0.07072830200195312, -0.0599365234375, -0.049144744873046875, -0.03835296630859375, -0.027561187744140625, -0.0167694091796875, -0.005977630615234375, 0.00481414794921875, 0.015605926513671875, 0.026397705078125, 0.037189483642578125, 0.04798126220703125, 0.058773040771484375, 0.0695648193359375, 0.08035659790039062, 0.09114837646484375, 0.10194015502929688, 0.11273193359375, 0.12352371215820312, 0.13431549072265625, 0.14510726928710938, 0.1558990478515625, 0.16669082641601562, 0.17748260498046875, 0.18827438354492188, 0.199066162109375, 0.20985794067382812, 0.22064971923828125, 0.23144149780273438, 0.2422332763671875, 0.2530250549316406, 0.26381683349609375, 0.2746086120605469, 0.285400390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 14.0, 23.0, 79.0, 121.0, 255.0, 217.0, 168.0, 77.0, 29.0, 10.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.621408939361572, -5.481589317321777, -5.341769695281982, -5.201949596405029, -5.062129974365234, -4.9223103523254395, -4.7824907302856445, -4.64267110824585, -4.502851486206055, -4.36303186416626, -4.223212242126465, -4.083392143249512, -3.943572521209717, -3.803752899169922, -3.663933277130127, -3.524113655090332, -3.384293556213379, -3.244473934173584, -3.10465407371521, -2.964834451675415, -2.825014591217041, -2.685194969177246, -2.545375347137451, -2.4055557250976562, -2.2657358646392822, -2.1259162425994873, -1.9860963821411133, -1.8462767601013184, -1.7064570188522339, -1.5666372776031494, -1.4268176555633545, -1.28699791431427, -1.1471786499023438, -1.0073589086532593, -0.8675392270088196, -0.7277195453643799, -0.5878998041152954, -0.44808006286621094, -0.30826038122177124, -0.16844069957733154, -0.02862095832824707, 0.11119875311851501, 0.2510184645652771, 0.3908381760120392, 0.5306578874588013, 0.6704776287078857, 0.8102973103523254, 0.9501169919967651, 1.0899367332458496, 1.229756474494934, 1.3695762157440186, 1.5093958377838135, 1.649215579032898, 1.7890353202819824, 1.9288549423217773, 2.0686745643615723, 2.2084944248199463, 2.348314046859741, 2.4881339073181152, 2.62795352935791, 2.767773151397705, 2.907593011856079, 3.047412633895874, 3.187232494354248, 3.327052116394043]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 7.0, 6.0, 12.0, 6.0, 8.0, 15.0, 15.0, 16.0, 20.0, 27.0, 21.0, 21.0, 27.0, 40.0, 28.0, 38.0, 39.0, 46.0, 48.0, 29.0, 50.0, 38.0, 37.0, 33.0, 38.0, 35.0, 39.0, 36.0, 34.0, 31.0, 15.0, 23.0, 9.0, 17.0, 13.0, 13.0, 23.0, 10.0, 5.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2642617225646973, -1.2237061262130737, -1.1831506490707397, -1.1425950527191162, -1.1020395755767822, -1.0614839792251587, -1.0209285020828247, -0.9803729057312012, -0.9398173689842224, -0.8992618322372437, -0.8587062954902649, -0.8181507587432861, -0.7775951623916626, -0.7370396852493286, -0.6964840888977051, -0.6559285521507263, -0.6153730154037476, -0.5748174786567688, -0.53426194190979, -0.4937063753604889, -0.45315083861351013, -0.41259530186653137, -0.3720397353172302, -0.33148419857025146, -0.2909286618232727, -0.25037312507629395, -0.209817573428154, -0.16926202178001404, -0.12870648503303528, -0.08815094828605652, -0.047595396637916565, -0.007039844989776611, 0.03351569175720215, 0.0740712359547615, 0.11462678015232086, 0.15518233180046082, 0.19573786854743958, 0.23629340529441833, 0.2768489718437195, 0.31740450859069824, 0.357960045337677, 0.39851558208465576, 0.4390711188316345, 0.47962668538093567, 0.5201822519302368, 0.5607377290725708, 0.6012933254241943, 0.6418488621711731, 0.6824043989181519, 0.7229599356651306, 0.7635154724121094, 0.8040710091590881, 0.8446265459060669, 0.8851821422576904, 0.9257376790046692, 0.966293215751648, 1.0068488121032715, 1.047404408454895, 1.087959885597229, 1.1285154819488525, 1.1690709590911865, 1.20962655544281, 1.250182032585144, 1.2907376289367676, 1.3312931060791016]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 13.0, 9.0, 11.0, 14.0, 17.0, 27.0, 42.0, 51.0, 59.0, 96.0, 115.0, 210.0, 371.0, 546.0, 843.0, 1457.0, 2537.0, 4800.0, 10310.0, 24374.0, 75655.0, 810517.0, 3114533.0, 94877.0, 28500.0, 11608.0, 5564.0, 2919.0, 1621.0, 947.0, 556.0, 371.0, 229.0, 151.0, 100.0, 60.0, 35.0, 40.0, 21.0, 29.0, 10.0, 8.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.279541015625, -0.2715721130371094, -0.26360321044921875, -0.2556343078613281, -0.2476654052734375, -0.23969650268554688, -0.23172760009765625, -0.22375869750976562, -0.215789794921875, -0.20782089233398438, -0.19985198974609375, -0.19188308715820312, -0.1839141845703125, -0.17594528198242188, -0.16797637939453125, -0.16000747680664062, -0.15203857421875, -0.14406967163085938, -0.13610076904296875, -0.12813186645507812, -0.1201629638671875, -0.11219406127929688, -0.10422515869140625, -0.09625625610351562, -0.088287353515625, -0.08031845092773438, -0.07234954833984375, -0.06438064575195312, -0.0564117431640625, -0.048442840576171875, -0.04047393798828125, -0.032505035400390625, -0.0245361328125, -0.016567230224609375, -0.00859832763671875, -0.000629425048828125, 0.0073394775390625, 0.015308380126953125, 0.02327728271484375, 0.031246185302734375, 0.039215087890625, 0.047183990478515625, 0.05515289306640625, 0.06312179565429688, 0.0710906982421875, 0.07905960083007812, 0.08702850341796875, 0.09499740600585938, 0.10296630859375, 0.11093521118164062, 0.11890411376953125, 0.12687301635742188, 0.1348419189453125, 0.14281082153320312, 0.15077972412109375, 0.15874862670898438, 0.166717529296875, 0.17468643188476562, 0.18265533447265625, 0.19062423706054688, 0.1985931396484375, 0.20656204223632812, 0.21453094482421875, 0.22249984741210938, 0.23046875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 5.0, 10.0, 9.0, 8.0, 17.0, 17.0, 20.0, 16.0, 26.0, 28.0, 34.0, 44.0, 41.0, 39.0, 48.0, 52.0, 47.0, 46.0, 32.0, 51.0, 39.0, 58.0, 45.0, 40.0, 32.0, 31.0, 31.0, 36.0, 22.0, 13.0, 14.0, 6.0, 10.0, 7.0, 8.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06640625, -0.06442022323608398, -0.06243419647216797, -0.06044816970825195, -0.05846214294433594, -0.05647611618041992, -0.054490089416503906, -0.05250406265258789, -0.050518035888671875, -0.04853200912475586, -0.046545982360839844, -0.04455995559692383, -0.04257392883300781, -0.0405879020690918, -0.03860187530517578, -0.036615848541259766, -0.03462982177734375, -0.032643795013427734, -0.03065776824951172, -0.028671741485595703, -0.026685714721679688, -0.024699687957763672, -0.022713661193847656, -0.02072763442993164, -0.018741607666015625, -0.01675558090209961, -0.014769554138183594, -0.012783527374267578, -0.010797500610351562, -0.008811473846435547, -0.006825447082519531, -0.004839420318603516, -0.0028533935546875, -0.0008673667907714844, 0.0011186599731445312, 0.003104686737060547, 0.0050907135009765625, 0.007076740264892578, 0.009062767028808594, 0.01104879379272461, 0.013034820556640625, 0.01502084732055664, 0.017006874084472656, 0.018992900848388672, 0.020978927612304688, 0.022964954376220703, 0.02495098114013672, 0.026937007904052734, 0.02892303466796875, 0.030909061431884766, 0.03289508819580078, 0.0348811149597168, 0.03686714172363281, 0.03885316848754883, 0.040839195251464844, 0.04282522201538086, 0.044811248779296875, 0.04679727554321289, 0.048783302307128906, 0.05076932907104492, 0.05275535583496094, 0.05474138259887695, 0.05672740936279297, 0.058713436126708984, 0.060699462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 22.0, 32.0, 45.0, 76.0, 103.0, 125.0, 232.0, 357.0, 616.0, 1223.0, 2294.0, 5417.0, 14938.0, 51274.0, 342935.0, 3589827.0, 137256.0, 30023.0, 9574.0, 3787.0, 1772.0, 947.0, 523.0, 303.0, 177.0, 112.0, 71.0, 62.0, 34.0, 19.0, 12.0, 18.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.457275390625, -0.44467926025390625, -0.4320831298828125, -0.41948699951171875, -0.406890869140625, -0.39429473876953125, -0.3816986083984375, -0.36910247802734375, -0.35650634765625, -0.34391021728515625, -0.3313140869140625, -0.31871795654296875, -0.306121826171875, -0.29352569580078125, -0.2809295654296875, -0.26833343505859375, -0.2557373046875, -0.24314117431640625, -0.2305450439453125, -0.21794891357421875, -0.205352783203125, -0.19275665283203125, -0.1801605224609375, -0.16756439208984375, -0.15496826171875, -0.14237213134765625, -0.1297760009765625, -0.11717987060546875, -0.104583740234375, -0.09198760986328125, -0.0793914794921875, -0.06679534912109375, -0.05419921875, -0.04160308837890625, -0.0290069580078125, -0.01641082763671875, -0.003814697265625, 0.00878143310546875, 0.0213775634765625, 0.03397369384765625, 0.04656982421875, 0.05916595458984375, 0.0717620849609375, 0.08435821533203125, 0.096954345703125, 0.10955047607421875, 0.1221466064453125, 0.13474273681640625, 0.1473388671875, 0.15993499755859375, 0.1725311279296875, 0.18512725830078125, 0.197723388671875, 0.21031951904296875, 0.2229156494140625, 0.23551177978515625, 0.24810791015625, 0.26070404052734375, 0.2733001708984375, 0.28589630126953125, 0.298492431640625, 0.31108856201171875, 0.3236846923828125, 0.33628082275390625, 0.348876953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 4.0, 10.0, 14.0, 30.0, 33.0, 60.0, 84.0, 154.0, 580.0, 2321.0, 381.0, 153.0, 82.0, 50.0, 36.0, 21.0, 21.0, 4.0, 6.0, 4.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21848106384277344, -0.21247482299804688, -0.2064685821533203, -0.20046234130859375, -0.1944561004638672, -0.18844985961914062, -0.18244361877441406, -0.1764373779296875, -0.17043113708496094, -0.16442489624023438, -0.1584186553955078, -0.15241241455078125, -0.1464061737060547, -0.14039993286132812, -0.13439369201660156, -0.128387451171875, -0.12238121032714844, -0.11637496948242188, -0.11036872863769531, -0.10436248779296875, -0.09835624694824219, -0.09235000610351562, -0.08634376525878906, -0.0803375244140625, -0.07433128356933594, -0.06832504272460938, -0.06231880187988281, -0.05631256103515625, -0.05030632019042969, -0.044300079345703125, -0.03829383850097656, -0.03228759765625, -0.026281356811523438, -0.020275115966796875, -0.014268875122070312, -0.00826263427734375, -0.0022563934326171875, 0.003749847412109375, 0.009756088256835938, 0.0157623291015625, 0.021768569946289062, 0.027774810791015625, 0.03378105163574219, 0.03978729248046875, 0.04579353332519531, 0.051799774169921875, 0.05780601501464844, 0.063812255859375, 0.06981849670410156, 0.07582473754882812, 0.08183097839355469, 0.08783721923828125, 0.09384346008300781, 0.09984970092773438, 0.10585594177246094, 0.1118621826171875, 0.11786842346191406, 0.12387466430664062, 0.1298809051513672, 0.13588714599609375, 0.1418933868408203, 0.14789962768554688, 0.15390586853027344, 0.159912109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 36.0, 42.0, 56.0, 113.0, 103.0, 129.0, 110.0, 125.0, 96.0, 51.0, 40.0, 18.0, 26.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0710904598236084, -1.042158603668213, -1.0132266283035278, -0.9842947125434875, -0.9553627967834473, -0.9264309406280518, -0.8974990248680115, -0.8685671091079712, -0.8396351933479309, -0.8107032775878906, -0.7817713618278503, -0.7528394460678101, -0.7239075899124146, -0.6949756145477295, -0.666043758392334, -0.6371118426322937, -0.6081799268722534, -0.5792480111122131, -0.5503160953521729, -0.5213841795921326, -0.4924522936344147, -0.4635203778743744, -0.4345884919166565, -0.4056565761566162, -0.3767246603965759, -0.34779274463653564, -0.31886082887649536, -0.28992894291877747, -0.2609970271587372, -0.2320651113986969, -0.2031332105398178, -0.17420130968093872, -0.14526933431625366, -0.11633742600679398, -0.08740551769733429, -0.0584736093878746, -0.029541701078414917, -0.0006097853183746338, 0.028322115540504456, 0.057254016399383545, 0.08618593215942383, 0.11511784046888351, 0.1440497487783432, 0.1729816496372223, 0.20191356539726257, 0.23084548115730286, 0.25977736711502075, 0.28870928287506104, 0.3176411986351013, 0.3465731143951416, 0.3755050301551819, 0.4044369161128998, 0.43336883187294006, 0.46230074763298035, 0.49123263359069824, 0.5201645493507385, 0.5490964651107788, 0.5780283808708191, 0.6069602966308594, 0.6358922123908997, 0.6648241281509399, 0.6937559843063354, 0.7226879000663757, 0.751619815826416, 0.7805517315864563]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 9.0, 10.0, 12.0, 10.0, 14.0, 29.0, 23.0, 24.0, 20.0, 27.0, 30.0, 29.0, 30.0, 30.0, 34.0, 28.0, 40.0, 38.0, 44.0, 40.0, 30.0, 45.0, 34.0, 35.0, 26.0, 25.0, 30.0, 25.0, 26.0, 15.0, 25.0, 19.0, 28.0, 19.0, 18.0, 11.0, 8.0, 10.0, 7.0, 8.0, 7.0, 4.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.42418307065963745, -0.41092607378959656, -0.3976690471172333, -0.3844120502471924, -0.3711550533771515, -0.3578980267047882, -0.3446410298347473, -0.33138400316238403, -0.31812700629234314, -0.30487000942230225, -0.29161298274993896, -0.27835598587989807, -0.2650989890098572, -0.2518419623374939, -0.238584965467453, -0.22532795369625092, -0.21207095682621002, -0.19881394505500793, -0.18555694818496704, -0.17229993641376495, -0.15904292464256287, -0.14578592777252197, -0.13252891600131989, -0.1192719042301178, -0.10601489990949631, -0.09275789558887482, -0.07950088381767273, -0.06624387949705124, -0.05298687145113945, -0.03972986340522766, -0.02647285908460617, -0.013215847313404083, 4.1157007217407227e-05, 0.013298164121806622, 0.026555171236395836, 0.039812177419662476, 0.053069185465574265, 0.06632619351148605, 0.07958319783210754, 0.09284020960330963, 0.10609721392393112, 0.11935421824455261, 0.1326112300157547, 0.1458682417869568, 0.15912523865699768, 0.17238225042819977, 0.18563926219940186, 0.19889625906944275, 0.21215327084064484, 0.22541028261184692, 0.23866727948188782, 0.2519242763519287, 0.265181303024292, 0.2784382998943329, 0.2916952967643738, 0.30495232343673706, 0.31820932030677795, 0.33146631717681885, 0.34472334384918213, 0.357980340719223, 0.3712373375892639, 0.3844943642616272, 0.3977513611316681, 0.411008358001709, 0.42426538467407227]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 10.0, 12.0, 15.0, 14.0, 27.0, 44.0, 60.0, 94.0, 135.0, 212.0, 372.0, 598.0, 994.0, 1760.0, 3241.0, 6365.0, 12656.0, 26285.0, 61200.0, 219200.0, 493876.0, 134307.0, 45022.0, 20501.0, 10103.0, 5020.0, 2801.0, 1449.0, 767.0, 505.0, 293.0, 196.0, 113.0, 95.0, 55.0, 45.0, 23.0, 24.0, 16.0, 12.0, 11.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.23486328125, -0.22873687744140625, -0.2226104736328125, -0.21648406982421875, -0.210357666015625, -0.20423126220703125, -0.1981048583984375, -0.19197845458984375, -0.18585205078125, -0.17972564697265625, -0.1735992431640625, -0.16747283935546875, -0.161346435546875, -0.15522003173828125, -0.1490936279296875, -0.14296722412109375, -0.1368408203125, -0.13071441650390625, -0.1245880126953125, -0.11846160888671875, -0.112335205078125, -0.10620880126953125, -0.1000823974609375, -0.09395599365234375, -0.08782958984375, -0.08170318603515625, -0.0755767822265625, -0.06945037841796875, -0.063323974609375, -0.05719757080078125, -0.0510711669921875, -0.04494476318359375, -0.038818359375, -0.03269195556640625, -0.0265655517578125, -0.02043914794921875, -0.014312744140625, -0.00818634033203125, -0.0020599365234375, 0.00406646728515625, 0.01019287109375, 0.01631927490234375, 0.0224456787109375, 0.02857208251953125, 0.034698486328125, 0.04082489013671875, 0.0469512939453125, 0.05307769775390625, 0.0592041015625, 0.06533050537109375, 0.0714569091796875, 0.07758331298828125, 0.083709716796875, 0.08983612060546875, 0.0959625244140625, 0.10208892822265625, 0.10821533203125, 0.11434173583984375, 0.1204681396484375, 0.12659454345703125, 0.132720947265625, 0.13884735107421875, 0.1449737548828125, 0.15110015869140625, 0.1572265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 9.0, 8.0, 14.0, 19.0, 15.0, 26.0, 25.0, 31.0, 35.0, 39.0, 31.0, 46.0, 45.0, 50.0, 47.0, 61.0, 50.0, 49.0, 41.0, 42.0, 51.0, 38.0, 47.0, 31.0, 33.0, 18.0, 31.0, 11.0, 9.0, 13.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07811260223388672, -0.07584190368652344, -0.07357120513916016, -0.07130050659179688, -0.0690298080444336, -0.06675910949707031, -0.06448841094970703, -0.06221771240234375, -0.05994701385498047, -0.05767631530761719, -0.055405616760253906, -0.053134918212890625, -0.050864219665527344, -0.04859352111816406, -0.04632282257080078, -0.0440521240234375, -0.04178142547607422, -0.03951072692871094, -0.037240028381347656, -0.034969329833984375, -0.032698631286621094, -0.030427932739257812, -0.02815723419189453, -0.02588653564453125, -0.02361583709716797, -0.021345138549804688, -0.019074440002441406, -0.016803741455078125, -0.014533042907714844, -0.012262344360351562, -0.009991645812988281, -0.007720947265625, -0.005450248718261719, -0.0031795501708984375, -0.0009088516235351562, 0.001361846923828125, 0.0036325454711914062, 0.0059032440185546875, 0.008173942565917969, 0.01044464111328125, 0.012715339660644531, 0.014986038208007812, 0.017256736755371094, 0.019527435302734375, 0.021798133850097656, 0.024068832397460938, 0.02633953094482422, 0.0286102294921875, 0.03088092803955078, 0.03315162658691406, 0.035422325134277344, 0.037693023681640625, 0.039963722229003906, 0.04223442077636719, 0.04450511932373047, 0.04677581787109375, 0.04904651641845703, 0.05131721496582031, 0.053587913513183594, 0.055858612060546875, 0.058129310607910156, 0.06040000915527344, 0.06267070770263672, 0.06494140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 12.0, 17.0, 24.0, 28.0, 57.0, 78.0, 202.0, 301.0, 608.0, 1536.0, 4370.0, 13719.0, 53823.0, 783424.0, 152811.0, 25639.0, 7392.0, 2545.0, 980.0, 439.0, 221.0, 117.0, 65.0, 41.0, 23.0, 29.0, 15.0, 10.0, 3.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54345703125, -0.5273513793945312, -0.5112457275390625, -0.49514007568359375, -0.479034423828125, -0.46292877197265625, -0.4468231201171875, -0.43071746826171875, -0.41461181640625, -0.39850616455078125, -0.3824005126953125, -0.36629486083984375, -0.350189208984375, -0.33408355712890625, -0.3179779052734375, -0.30187225341796875, -0.2857666015625, -0.26966094970703125, -0.2535552978515625, -0.23744964599609375, -0.221343994140625, -0.20523834228515625, -0.1891326904296875, -0.17302703857421875, -0.15692138671875, -0.14081573486328125, -0.1247100830078125, -0.10860443115234375, -0.092498779296875, -0.07639312744140625, -0.0602874755859375, -0.04418182373046875, -0.028076171875, -0.01197052001953125, 0.0041351318359375, 0.02024078369140625, 0.036346435546875, 0.05245208740234375, 0.0685577392578125, 0.08466339111328125, 0.10076904296875, 0.11687469482421875, 0.1329803466796875, 0.14908599853515625, 0.165191650390625, 0.18129730224609375, 0.1974029541015625, 0.21350860595703125, 0.2296142578125, 0.24571990966796875, 0.2618255615234375, 0.27793121337890625, 0.294036865234375, 0.31014251708984375, 0.3262481689453125, 0.34235382080078125, 0.35845947265625, 0.37456512451171875, 0.3906707763671875, 0.40677642822265625, 0.422882080078125, 0.43898773193359375, 0.4550933837890625, 0.47119903564453125, 0.4873046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 4.0, 7.0, 12.0, 17.0, 19.0, 36.0, 52.0, 55.0, 60.0, 89.0, 73.0, 93.0, 93.0, 80.0, 64.0, 54.0, 45.0, 38.0, 27.0, 20.0, 10.0, 5.0, 12.0, 6.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.65087890625, -0.6347808837890625, -0.618682861328125, -0.6025848388671875, -0.58648681640625, -0.5703887939453125, -0.554290771484375, -0.5381927490234375, -0.5220947265625, -0.5059967041015625, -0.489898681640625, -0.4738006591796875, -0.45770263671875, -0.4416046142578125, -0.425506591796875, -0.4094085693359375, -0.393310546875, -0.3772125244140625, -0.361114501953125, -0.3450164794921875, -0.32891845703125, -0.3128204345703125, -0.296722412109375, -0.2806243896484375, -0.2645263671875, -0.2484283447265625, -0.232330322265625, -0.2162322998046875, -0.20013427734375, -0.1840362548828125, -0.167938232421875, -0.1518402099609375, -0.1357421875, -0.1196441650390625, -0.103546142578125, -0.0874481201171875, -0.07135009765625, -0.0552520751953125, -0.039154052734375, -0.0230560302734375, -0.0069580078125, 0.0091400146484375, 0.025238037109375, 0.0413360595703125, 0.05743408203125, 0.0735321044921875, 0.089630126953125, 0.1057281494140625, 0.121826171875, 0.1379241943359375, 0.154022216796875, 0.1701202392578125, 0.18621826171875, 0.2023162841796875, 0.218414306640625, 0.2345123291015625, 0.2506103515625, 0.2667083740234375, 0.282806396484375, 0.2989044189453125, 0.31500244140625, 0.3311004638671875, 0.347198486328125, 0.3632965087890625, 0.37939453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 21.0, 13.0, 36.0, 45.0, 46.0, 87.0, 119.0, 157.0, 267.0, 401.0, 609.0, 1069.0, 1887.0, 3883.0, 10519.0, 37420.0, 688278.0, 258670.0, 28580.0, 8676.0, 3415.0, 1688.0, 931.0, 566.0, 371.0, 247.0, 158.0, 115.0, 87.0, 49.0, 38.0, 27.0, 14.0, 11.0, 7.0, 9.0, 11.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369384765625, -0.358489990234375, -0.34759521484375, -0.336700439453125, -0.3258056640625, -0.314910888671875, -0.30401611328125, -0.293121337890625, -0.2822265625, -0.271331787109375, -0.26043701171875, -0.249542236328125, -0.2386474609375, -0.227752685546875, -0.21685791015625, -0.205963134765625, -0.195068359375, -0.184173583984375, -0.17327880859375, -0.162384033203125, -0.1514892578125, -0.140594482421875, -0.12969970703125, -0.118804931640625, -0.10791015625, -0.097015380859375, -0.08612060546875, -0.075225830078125, -0.0643310546875, -0.053436279296875, -0.04254150390625, -0.031646728515625, -0.020751953125, -0.009857177734375, 0.00103759765625, 0.011932373046875, 0.0228271484375, 0.033721923828125, 0.04461669921875, 0.055511474609375, 0.06640625, 0.077301025390625, 0.08819580078125, 0.099090576171875, 0.1099853515625, 0.120880126953125, 0.13177490234375, 0.142669677734375, 0.153564453125, 0.164459228515625, 0.17535400390625, 0.186248779296875, 0.1971435546875, 0.208038330078125, 0.21893310546875, 0.229827880859375, 0.24072265625, 0.251617431640625, 0.26251220703125, 0.273406982421875, 0.2843017578125, 0.295196533203125, 0.30609130859375, 0.316986083984375, 0.327880859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 4.0, 11.0, 16.0, 26.0, 34.0, 109.0, 311.0, 288.0, 89.0, 39.0, 18.0, 14.0, 13.0, 8.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001456737518310547, -0.00014095008373260498, -0.00013622641563415527, -0.00013150274753570557, -0.00012677907943725586, -0.00012205541133880615, -0.00011733174324035645, -0.00011260807514190674, -0.00010788440704345703, -0.00010316073894500732, -9.843707084655762e-05, -9.371340274810791e-05, -8.89897346496582e-05, -8.42660665512085e-05, -7.954239845275879e-05, -7.481873035430908e-05, -7.009506225585938e-05, -6.537139415740967e-05, -6.064772605895996e-05, -5.5924057960510254e-05, -5.120038986206055e-05, -4.647672176361084e-05, -4.175305366516113e-05, -3.7029385566711426e-05, -3.230571746826172e-05, -2.7582049369812012e-05, -2.2858381271362305e-05, -1.8134713172912598e-05, -1.341104507446289e-05, -8.687376976013184e-06, -3.9637088775634766e-06, 7.599592208862305e-07, 5.4836273193359375e-06, 1.0207295417785645e-05, 1.4930963516235352e-05, 1.965463161468506e-05, 2.4378299713134766e-05, 2.9101967811584473e-05, 3.382563591003418e-05, 3.854930400848389e-05, 4.3272972106933594e-05, 4.79966402053833e-05, 5.272030830383301e-05, 5.7443976402282715e-05, 6.216764450073242e-05, 6.689131259918213e-05, 7.161498069763184e-05, 7.633864879608154e-05, 8.106231689453125e-05, 8.578598499298096e-05, 9.050965309143066e-05, 9.523332118988037e-05, 9.995698928833008e-05, 0.00010468065738677979, 0.00010940432548522949, 0.0001141279935836792, 0.0001188516616821289, 0.0001235753297805786, 0.00012829899787902832, 0.00013302266597747803, 0.00013774633407592773, 0.00014247000217437744, 0.00014719367027282715, 0.00015191733837127686, 0.00015664100646972656]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 2.0, 6.0, 3.0, 6.0, 10.0, 12.0, 12.0, 32.0, 34.0, 88.0, 84.0, 154.0, 238.0, 362.0, 512.0, 740.0, 1026.0, 1720.0, 3059.0, 6684.0, 17857.0, 74302.0, 829378.0, 78661.0, 18521.0, 6735.0, 3167.0, 1743.0, 1088.0, 699.0, 500.0, 368.0, 202.0, 175.0, 102.0, 83.0, 49.0, 44.0, 16.0, 18.0, 20.0, 10.0, 4.0, 0.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34033203125, -0.3295326232910156, -0.31873321533203125, -0.3079338073730469, -0.2971343994140625, -0.2863349914550781, -0.27553558349609375, -0.2647361755371094, -0.253936767578125, -0.24313735961914062, -0.23233795166015625, -0.22153854370117188, -0.2107391357421875, -0.19993972778320312, -0.18914031982421875, -0.17834091186523438, -0.16754150390625, -0.15674209594726562, -0.14594268798828125, -0.13514328002929688, -0.1243438720703125, -0.11354446411132812, -0.10274505615234375, -0.09194564819335938, -0.081146240234375, -0.07034683227539062, -0.05954742431640625, -0.048748016357421875, -0.0379486083984375, -0.027149200439453125, -0.01634979248046875, -0.005550384521484375, 0.0052490234375, 0.016048431396484375, 0.02684783935546875, 0.037647247314453125, 0.0484466552734375, 0.059246063232421875, 0.07004547119140625, 0.08084487915039062, 0.091644287109375, 0.10244369506835938, 0.11324310302734375, 0.12404251098632812, 0.1348419189453125, 0.14564132690429688, 0.15644073486328125, 0.16724014282226562, 0.17803955078125, 0.18883895874023438, 0.19963836669921875, 0.21043777465820312, 0.2212371826171875, 0.23203659057617188, 0.24283599853515625, 0.2536354064941406, 0.264434814453125, 0.2752342224121094, 0.28603363037109375, 0.2968330383300781, 0.3076324462890625, 0.3184318542480469, 0.32923126220703125, 0.3400306701660156, 0.350830078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 10.0, 14.0, 14.0, 14.0, 32.0, 62.0, 178.0, 328.0, 139.0, 62.0, 35.0, 17.0, 16.0, 10.0, 14.0, 4.0, 5.0, 4.0, 8.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.36865234375, -0.3587989807128906, -0.34894561767578125, -0.3390922546386719, -0.3292388916015625, -0.3193855285644531, -0.30953216552734375, -0.2996788024902344, -0.289825439453125, -0.2799720764160156, -0.27011871337890625, -0.2602653503417969, -0.2504119873046875, -0.24055862426757812, -0.23070526123046875, -0.22085189819335938, -0.21099853515625, -0.20114517211914062, -0.19129180908203125, -0.18143844604492188, -0.1715850830078125, -0.16173171997070312, -0.15187835693359375, -0.14202499389648438, -0.132171630859375, -0.12231826782226562, -0.11246490478515625, -0.10261154174804688, -0.0927581787109375, -0.08290481567382812, -0.07305145263671875, -0.06319808959960938, -0.0533447265625, -0.043491363525390625, -0.03363800048828125, -0.023784637451171875, -0.0139312744140625, -0.004077911376953125, 0.00577545166015625, 0.015628814697265625, 0.025482177734375, 0.035335540771484375, 0.04518890380859375, 0.055042266845703125, 0.0648956298828125, 0.07474899291992188, 0.08460235595703125, 0.09445571899414062, 0.10430908203125, 0.11416244506835938, 0.12401580810546875, 0.13386917114257812, 0.1437225341796875, 0.15357589721679688, 0.16342926025390625, 0.17328262329101562, 0.183135986328125, 0.19298934936523438, 0.20284271240234375, 0.21269607543945312, 0.2225494384765625, 0.23240280151367188, 0.24225616455078125, 0.2521095275878906, 0.261962890625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 5.0, 28.0, 37.0, 90.0, 139.0, 206.0, 215.0, 141.0, 74.0, 29.0, 26.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.804680109024048, -3.663499355316162, -3.5223186016082764, -3.3811378479003906, -3.239956855773926, -3.098776340484619, -2.9575953483581543, -2.8164145946502686, -2.675233840942383, -2.534053087234497, -2.3928723335266113, -2.2516915798187256, -2.11051082611084, -1.9693299531936646, -1.8281490802764893, -1.6869683265686035, -1.5457875728607178, -1.404606819152832, -1.2634260654449463, -1.122245192527771, -0.9810644388198853, -0.8398836851119995, -0.698702871799469, -0.5575220584869385, -0.41634130477905273, -0.2751605212688446, -0.13397973775863647, 0.007201045751571655, 0.14838182926177979, 0.2895625829696655, 0.43074339628219604, 0.5719242095947266, 0.7131052017211914, 0.8542859554290771, 0.9954667687416077, 1.1366475820541382, 1.277828335762024, 1.4190090894699097, 1.560189962387085, 1.7013707160949707, 1.8425514698028564, 1.9837322235107422, 2.124912977218628, 2.2660937309265137, 2.4072747230529785, 2.548455238342285, 2.68963623046875, 2.8308169841766357, 2.9719977378845215, 3.1131784915924072, 3.254359245300293, 3.3955399990081787, 3.5367207527160645, 3.6779017448425293, 3.819082498550415, 3.960263252258301, 4.101444244384766, 4.2426252365112305, 4.383805751800537, 4.524986743927002, 4.666167259216309, 4.807348251342773, 4.94852876663208, 5.089709758758545, 5.230890274047852]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 11.0, 8.0, 12.0, 16.0, 22.0, 27.0, 24.0, 22.0, 30.0, 35.0, 37.0, 33.0, 31.0, 38.0, 47.0, 41.0, 58.0, 42.0, 42.0, 38.0, 49.0, 35.0, 34.0, 33.0, 33.0, 28.0, 26.0, 18.0, 11.0, 22.0, 12.0, 15.0, 5.0, 10.0, 6.0, 4.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5043754577636719, -1.4553288221359253, -1.4062821865081787, -1.3572355508804321, -1.3081889152526855, -1.259142279624939, -1.2100956439971924, -1.1610491275787354, -1.1120023727416992, -1.0629557371139526, -1.013909101486206, -0.9648624658584595, -0.9158158302307129, -0.8667691946029663, -0.8177226185798645, -0.7686759829521179, -0.7196294069290161, -0.6705827713012695, -0.621536135673523, -0.5724895000457764, -0.5234428644180298, -0.4743962585926056, -0.4253496527671814, -0.3763030171394348, -0.32725638151168823, -0.27820974588394165, -0.22916312515735626, -0.18011650443077087, -0.1310698688030243, -0.08202323317527771, -0.032976627349853516, 0.016070008277893066, 0.06511664390563965, 0.11416327208280563, 0.16320990025997162, 0.212256520986557, 0.2613031566143036, 0.31034979224205017, 0.35939639806747437, 0.40844303369522095, 0.45748966932296753, 0.5065363049507141, 0.5555829405784607, 0.6046295166015625, 0.6536761522293091, 0.7027227878570557, 0.7517694234848022, 0.8008160591125488, 0.8498626947402954, 0.898909330368042, 0.9479559659957886, 0.9970026016235352, 1.0460492372512817, 1.0950958728790283, 1.1441423892974854, 1.1931891441345215, 1.2422356605529785, 1.291282296180725, 1.3403289318084717, 1.3893755674362183, 1.4384222030639648, 1.4874688386917114, 1.536515474319458, 1.585561990737915, 1.6346087455749512]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 11.0, 10.0, 14.0, 23.0, 26.0, 37.0, 65.0, 83.0, 156.0, 215.0, 354.0, 674.0, 1249.0, 2543.0, 5499.0, 14515.0, 51157.0, 692791.0, 3331799.0, 64389.0, 16950.0, 6213.0, 2601.0, 1332.0, 651.0, 357.0, 191.0, 136.0, 81.0, 53.0, 39.0, 23.0, 12.0, 7.0, 11.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.525390625, -0.5108261108398438, -0.4962615966796875, -0.48169708251953125, -0.467132568359375, -0.45256805419921875, -0.4380035400390625, -0.42343902587890625, -0.40887451171875, -0.39430999755859375, -0.3797454833984375, -0.36518096923828125, -0.350616455078125, -0.33605194091796875, -0.3214874267578125, -0.30692291259765625, -0.2923583984375, -0.27779388427734375, -0.2632293701171875, -0.24866485595703125, -0.234100341796875, -0.21953582763671875, -0.2049713134765625, -0.19040679931640625, -0.17584228515625, -0.16127777099609375, -0.1467132568359375, -0.13214874267578125, -0.117584228515625, -0.10301971435546875, -0.0884552001953125, -0.07389068603515625, -0.059326171875, -0.04476165771484375, -0.0301971435546875, -0.01563262939453125, -0.001068115234375, 0.01349639892578125, 0.0280609130859375, 0.04262542724609375, 0.05718994140625, 0.07175445556640625, 0.0863189697265625, 0.10088348388671875, 0.115447998046875, 0.13001251220703125, 0.1445770263671875, 0.15914154052734375, 0.1737060546875, 0.18827056884765625, 0.2028350830078125, 0.21739959716796875, 0.231964111328125, 0.24652862548828125, 0.2610931396484375, 0.27565765380859375, 0.29022216796875, 0.30478668212890625, 0.3193511962890625, 0.33391571044921875, 0.348480224609375, 0.36304473876953125, 0.3776092529296875, 0.39217376708984375, 0.40673828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 8.0, 14.0, 15.0, 12.0, 13.0, 21.0, 25.0, 25.0, 38.0, 36.0, 38.0, 51.0, 55.0, 44.0, 45.0, 40.0, 56.0, 36.0, 58.0, 39.0, 46.0, 49.0, 38.0, 30.0, 38.0, 23.0, 22.0, 23.0, 13.0, 4.0, 11.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08831787109375, -0.08587169647216797, -0.08342552185058594, -0.0809793472290039, -0.07853317260742188, -0.07608699798583984, -0.07364082336425781, -0.07119464874267578, -0.06874847412109375, -0.06630229949951172, -0.06385612487792969, -0.061409950256347656, -0.058963775634765625, -0.056517601013183594, -0.05407142639160156, -0.05162525177001953, -0.0491790771484375, -0.04673290252685547, -0.04428672790527344, -0.041840553283691406, -0.039394378662109375, -0.036948204040527344, -0.03450202941894531, -0.03205585479736328, -0.02960968017578125, -0.02716350555419922, -0.024717330932617188, -0.022271156311035156, -0.019824981689453125, -0.017378807067871094, -0.014932632446289062, -0.012486457824707031, -0.010040283203125, -0.007594108581542969, -0.0051479339599609375, -0.0027017593383789062, -0.000255584716796875, 0.0021905899047851562, 0.0046367645263671875, 0.007082939147949219, 0.00952911376953125, 0.011975288391113281, 0.014421463012695312, 0.016867637634277344, 0.019313812255859375, 0.021759986877441406, 0.024206161499023438, 0.02665233612060547, 0.0290985107421875, 0.03154468536376953, 0.03399085998535156, 0.036437034606933594, 0.038883209228515625, 0.041329383850097656, 0.04377555847167969, 0.04622173309326172, 0.04866790771484375, 0.05111408233642578, 0.05356025695800781, 0.056006431579589844, 0.058452606201171875, 0.060898780822753906, 0.06334495544433594, 0.06579113006591797, 0.0682373046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 14.0, 20.0, 23.0, 28.0, 48.0, 62.0, 76.0, 121.0, 200.0, 286.0, 448.0, 639.0, 972.0, 1637.0, 2577.0, 4430.0, 8439.0, 18132.0, 48368.0, 219672.0, 3604008.0, 200659.0, 46226.0, 17715.0, 8248.0, 4358.0, 2551.0, 1518.0, 966.0, 551.0, 400.0, 288.0, 170.0, 125.0, 93.0, 73.0, 45.0, 39.0, 22.0, 14.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44970703125, -0.4349517822265625, -0.420196533203125, -0.4054412841796875, -0.39068603515625, -0.3759307861328125, -0.361175537109375, -0.3464202880859375, -0.3316650390625, -0.3169097900390625, -0.302154541015625, -0.2873992919921875, -0.27264404296875, -0.2578887939453125, -0.243133544921875, -0.2283782958984375, -0.213623046875, -0.1988677978515625, -0.184112548828125, -0.1693572998046875, -0.15460205078125, -0.1398468017578125, -0.125091552734375, -0.1103363037109375, -0.0955810546875, -0.0808258056640625, -0.066070556640625, -0.0513153076171875, -0.03656005859375, -0.0218048095703125, -0.007049560546875, 0.0077056884765625, 0.0224609375, 0.0372161865234375, 0.051971435546875, 0.0667266845703125, 0.08148193359375, 0.0962371826171875, 0.110992431640625, 0.1257476806640625, 0.1405029296875, 0.1552581787109375, 0.170013427734375, 0.1847686767578125, 0.19952392578125, 0.2142791748046875, 0.229034423828125, 0.2437896728515625, 0.258544921875, 0.2733001708984375, 0.288055419921875, 0.3028106689453125, 0.31756591796875, 0.3323211669921875, 0.347076416015625, 0.3618316650390625, 0.3765869140625, 0.3913421630859375, 0.406097412109375, 0.4208526611328125, 0.43560791015625, 0.4503631591796875, 0.465118408203125, 0.4798736572265625, 0.49462890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 9.0, 10.0, 9.0, 12.0, 22.0, 30.0, 33.0, 61.0, 108.0, 304.0, 2340.0, 643.0, 196.0, 96.0, 55.0, 37.0, 23.0, 15.0, 14.0, 12.0, 8.0, 2.0, 3.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21198463439941406, -0.20460891723632812, -0.1972332000732422, -0.18985748291015625, -0.1824817657470703, -0.17510604858398438, -0.16773033142089844, -0.1603546142578125, -0.15297889709472656, -0.14560317993164062, -0.1382274627685547, -0.13085174560546875, -0.12347602844238281, -0.11610031127929688, -0.10872459411621094, -0.101348876953125, -0.09397315979003906, -0.08659744262695312, -0.07922172546386719, -0.07184600830078125, -0.06447029113769531, -0.057094573974609375, -0.04971885681152344, -0.0423431396484375, -0.03496742248535156, -0.027591705322265625, -0.020215988159179688, -0.01284027099609375, -0.0054645538330078125, 0.001911163330078125, 0.009286880493164062, 0.01666259765625, 0.024038314819335938, 0.031414031982421875, 0.03878974914550781, 0.04616546630859375, 0.05354118347167969, 0.060916900634765625, 0.06829261779785156, 0.0756683349609375, 0.08304405212402344, 0.09041976928710938, 0.09779548645019531, 0.10517120361328125, 0.11254692077636719, 0.11992263793945312, 0.12729835510253906, 0.134674072265625, 0.14204978942871094, 0.14942550659179688, 0.1568012237548828, 0.16417694091796875, 0.1715526580810547, 0.17892837524414062, 0.18630409240722656, 0.1936798095703125, 0.20105552673339844, 0.20843124389648438, 0.2158069610595703, 0.22318267822265625, 0.2305583953857422, 0.23793411254882812, 0.24530982971191406, 0.252685546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 21.0, 41.0, 69.0, 87.0, 124.0, 144.0, 156.0, 110.0, 86.0, 62.0, 34.0, 25.0, 14.0, 5.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8972572684288025, -0.8539426922798157, -0.8106281757354736, -0.7673135995864868, -0.7239990234375, -0.6806844472885132, -0.6373698711395264, -0.5940553545951843, -0.5507407784461975, -0.5074262022972107, -0.46411165595054626, -0.42079710960388184, -0.377482533454895, -0.3341679573059082, -0.2908534109592438, -0.24753886461257935, -0.20422428846359253, -0.1609097272157669, -0.11759516596794128, -0.07428060472011566, -0.03096604347229004, 0.012348517775535583, 0.055663079023361206, 0.09897762537002563, 0.14229220151901245, 0.18560676276683807, 0.2289213240146637, 0.2722358703613281, 0.31555044651031494, 0.35886502265930176, 0.4021795690059662, 0.4454941153526306, 0.48880863189697266, 0.5321232080459595, 0.5754377841949463, 0.6187523007392883, 0.6620668768882751, 0.705381453037262, 0.748695969581604, 0.7920105457305908, 0.8353251218795776, 0.8786396980285645, 0.9219542741775513, 0.9652687907218933, 1.0085833072662354, 1.0518978834152222, 1.095212459564209, 1.1385270357131958, 1.1818416118621826, 1.2251561880111694, 1.2684707641601562, 1.311785340309143, 1.3550999164581299, 1.3984143733978271, 1.441728949546814, 1.4850435256958008, 1.5283581018447876, 1.5716726779937744, 1.6149872541427612, 1.658301830291748, 1.7016162872314453, 1.7449308633804321, 1.788245439529419, 1.8315600156784058, 1.8748745918273926]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 7.0, 9.0, 11.0, 11.0, 11.0, 12.0, 10.0, 16.0, 20.0, 11.0, 25.0, 21.0, 30.0, 33.0, 27.0, 30.0, 53.0, 39.0, 40.0, 39.0, 45.0, 48.0, 32.0, 35.0, 33.0, 35.0, 35.0, 36.0, 19.0, 27.0, 26.0, 30.0, 17.0, 19.0, 23.0, 16.0, 13.0, 16.0, 10.0, 5.0, 8.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5524599552154541, -0.5349141359329224, -0.5173683166503906, -0.4998224973678589, -0.48227664828300476, -0.464730829000473, -0.4471850097179413, -0.42963919043540955, -0.4120933413505554, -0.3945475220680237, -0.37700170278549194, -0.3594558835029602, -0.3419100344181061, -0.32436421513557434, -0.3068183958530426, -0.28927257657051086, -0.2717267572879791, -0.2541809380054474, -0.23663510382175446, -0.21908928453922272, -0.20154345035552979, -0.18399763107299805, -0.1664518117904663, -0.14890599250793457, -0.13136015832424164, -0.1138143315911293, -0.09626850485801697, -0.07872268557548523, -0.061176858842372894, -0.04363103210926056, -0.02608521282672882, -0.008539386093616486, 0.00900644063949585, 0.026552265509963036, 0.04409809038043022, 0.06164391338825226, 0.0791897401213646, 0.09673556685447693, 0.11428138613700867, 0.1318272054195404, 0.14937303960323334, 0.16691885888576508, 0.184464693069458, 0.20201051235198975, 0.21955633163452148, 0.23710216581821442, 0.25464797019958496, 0.2721938192844391, 0.2897396385669708, 0.30728545784950256, 0.3248312771320343, 0.3423771262168884, 0.35992294549942017, 0.3774687647819519, 0.39501458406448364, 0.4125604033470154, 0.4301062226295471, 0.44765204191207886, 0.4651978611946106, 0.48274368047714233, 0.5002894997596741, 0.5178353786468506, 0.5353811979293823, 0.5529270172119141, 0.5704728364944458]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 7.0, 6.0, 14.0, 24.0, 19.0, 46.0, 49.0, 93.0, 91.0, 185.0, 257.0, 436.0, 651.0, 1039.0, 1705.0, 2930.0, 4793.0, 8325.0, 14451.0, 25542.0, 46654.0, 88678.0, 190621.0, 312192.0, 169476.0, 80725.0, 43242.0, 23781.0, 13584.0, 7601.0, 4408.0, 2596.0, 1556.0, 973.0, 647.0, 372.0, 269.0, 164.0, 103.0, 80.0, 43.0, 46.0, 22.0, 18.0, 10.0, 9.0, 3.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1846923828125, -0.17862319946289062, -0.17255401611328125, -0.16648483276367188, -0.1604156494140625, -0.15434646606445312, -0.14827728271484375, -0.14220809936523438, -0.136138916015625, -0.13006973266601562, -0.12400054931640625, -0.11793136596679688, -0.1118621826171875, -0.10579299926757812, -0.09972381591796875, -0.09365463256835938, -0.08758544921875, -0.08151626586914062, -0.07544708251953125, -0.06937789916992188, -0.0633087158203125, -0.057239532470703125, -0.05117034912109375, -0.045101165771484375, -0.039031982421875, -0.032962799072265625, -0.02689361572265625, -0.020824432373046875, -0.0147552490234375, -0.008686065673828125, -0.00261688232421875, 0.003452301025390625, 0.009521484375, 0.015590667724609375, 0.02165985107421875, 0.027729034423828125, 0.0337982177734375, 0.039867401123046875, 0.04593658447265625, 0.052005767822265625, 0.058074951171875, 0.06414413452148438, 0.07021331787109375, 0.07628250122070312, 0.0823516845703125, 0.08842086791992188, 0.09449005126953125, 0.10055923461914062, 0.10662841796875, 0.11269760131835938, 0.11876678466796875, 0.12483596801757812, 0.1309051513671875, 0.13697433471679688, 0.14304351806640625, 0.14911270141601562, 0.155181884765625, 0.16125106811523438, 0.16732025146484375, 0.17338943481445312, 0.1794586181640625, 0.18552780151367188, 0.19159698486328125, 0.19766616821289062, 0.2037353515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 7.0, 8.0, 9.0, 15.0, 10.0, 18.0, 19.0, 24.0, 24.0, 18.0, 36.0, 29.0, 33.0, 50.0, 52.0, 40.0, 51.0, 37.0, 31.0, 41.0, 44.0, 33.0, 40.0, 41.0, 50.0, 38.0, 31.0, 22.0, 27.0, 21.0, 18.0, 22.0, 9.0, 9.0, 11.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0819091796875, -0.07945442199707031, -0.07699966430664062, -0.07454490661621094, -0.07209014892578125, -0.06963539123535156, -0.06718063354492188, -0.06472587585449219, -0.0622711181640625, -0.05981636047363281, -0.057361602783203125, -0.05490684509277344, -0.05245208740234375, -0.04999732971191406, -0.047542572021484375, -0.04508781433105469, -0.042633056640625, -0.04017829895019531, -0.037723541259765625, -0.03526878356933594, -0.03281402587890625, -0.030359268188476562, -0.027904510498046875, -0.025449752807617188, -0.0229949951171875, -0.020540237426757812, -0.018085479736328125, -0.015630722045898438, -0.01317596435546875, -0.010721206665039062, -0.008266448974609375, -0.0058116912841796875, -0.00335693359375, -0.0009021759033203125, 0.001552581787109375, 0.0040073394775390625, 0.00646209716796875, 0.008916854858398438, 0.011371612548828125, 0.013826370239257812, 0.0162811279296875, 0.018735885620117188, 0.021190643310546875, 0.023645401000976562, 0.02610015869140625, 0.028554916381835938, 0.031009674072265625, 0.03346443176269531, 0.035919189453125, 0.03837394714355469, 0.040828704833984375, 0.04328346252441406, 0.04573822021484375, 0.04819297790527344, 0.050647735595703125, 0.05310249328613281, 0.0555572509765625, 0.05801200866699219, 0.060466766357421875, 0.06292152404785156, 0.06537628173828125, 0.06783103942871094, 0.07028579711914062, 0.07274055480957031, 0.0751953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 3.0, 9.0, 23.0, 16.0, 29.0, 28.0, 39.0, 59.0, 97.0, 161.0, 215.0, 307.0, 489.0, 837.0, 1556.0, 3521.0, 8939.0, 26640.0, 89165.0, 437279.0, 361724.0, 78566.0, 23545.0, 8218.0, 3346.0, 1545.0, 766.0, 471.0, 291.0, 181.0, 138.0, 94.0, 86.0, 36.0, 32.0, 28.0, 17.0, 15.0, 10.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.455322265625, -0.442657470703125, -0.42999267578125, -0.417327880859375, -0.4046630859375, -0.391998291015625, -0.37933349609375, -0.366668701171875, -0.35400390625, -0.341339111328125, -0.32867431640625, -0.316009521484375, -0.3033447265625, -0.290679931640625, -0.27801513671875, -0.265350341796875, -0.252685546875, -0.240020751953125, -0.22735595703125, -0.214691162109375, -0.2020263671875, -0.189361572265625, -0.17669677734375, -0.164031982421875, -0.1513671875, -0.138702392578125, -0.12603759765625, -0.113372802734375, -0.1007080078125, -0.088043212890625, -0.07537841796875, -0.062713623046875, -0.050048828125, -0.037384033203125, -0.02471923828125, -0.012054443359375, 0.0006103515625, 0.013275146484375, 0.02593994140625, 0.038604736328125, 0.05126953125, 0.063934326171875, 0.07659912109375, 0.089263916015625, 0.1019287109375, 0.114593505859375, 0.12725830078125, 0.139923095703125, 0.152587890625, 0.165252685546875, 0.17791748046875, 0.190582275390625, 0.2032470703125, 0.215911865234375, 0.22857666015625, 0.241241455078125, 0.25390625, 0.266571044921875, 0.27923583984375, 0.291900634765625, 0.3045654296875, 0.317230224609375, 0.32989501953125, 0.342559814453125, 0.355224609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 5.0, 18.0, 10.0, 16.0, 20.0, 22.0, 31.0, 27.0, 39.0, 44.0, 34.0, 49.0, 55.0, 50.0, 58.0, 49.0, 41.0, 45.0, 41.0, 48.0, 39.0, 37.0, 31.0, 25.0, 24.0, 26.0, 24.0, 16.0, 10.0, 11.0, 4.0, 9.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3658714294433594, -0.35210418701171875, -0.3383369445800781, -0.3245697021484375, -0.3108024597167969, -0.29703521728515625, -0.2832679748535156, -0.269500732421875, -0.2557334899902344, -0.24196624755859375, -0.22819900512695312, -0.2144317626953125, -0.20066452026367188, -0.18689727783203125, -0.17313003540039062, -0.15936279296875, -0.14559555053710938, -0.13182830810546875, -0.11806106567382812, -0.1042938232421875, -0.09052658081054688, -0.07675933837890625, -0.06299209594726562, -0.049224853515625, -0.035457611083984375, -0.02169036865234375, -0.007923126220703125, 0.0058441162109375, 0.019611358642578125, 0.03337860107421875, 0.047145843505859375, 0.0609130859375, 0.07468032836914062, 0.08844757080078125, 0.10221481323242188, 0.1159820556640625, 0.12974929809570312, 0.14351654052734375, 0.15728378295898438, 0.171051025390625, 0.18481826782226562, 0.19858551025390625, 0.21235275268554688, 0.2261199951171875, 0.23988723754882812, 0.25365447998046875, 0.2674217224121094, 0.28118896484375, 0.2949562072753906, 0.30872344970703125, 0.3224906921386719, 0.3362579345703125, 0.3500251770019531, 0.36379241943359375, 0.3775596618652344, 0.391326904296875, 0.4050941467285156, 0.41886138916015625, 0.4326286315917969, 0.4463958740234375, 0.4601631164550781, 0.47393035888671875, 0.4876976013183594, 0.50146484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 11.0, 9.0, 16.0, 21.0, 27.0, 48.0, 61.0, 80.0, 147.0, 221.0, 275.0, 453.0, 858.0, 1643.0, 3606.0, 10581.0, 43776.0, 343158.0, 564245.0, 57702.0, 13039.0, 4306.0, 1844.0, 878.0, 561.0, 340.0, 199.0, 138.0, 111.0, 66.0, 45.0, 22.0, 25.0, 17.0, 7.0, 12.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.29132080078125, -0.2801513671875, -0.26898193359375, -0.2578125, -0.24664306640625, -0.2354736328125, -0.22430419921875, -0.213134765625, -0.20196533203125, -0.1907958984375, -0.17962646484375, -0.16845703125, -0.15728759765625, -0.1461181640625, -0.13494873046875, -0.123779296875, -0.11260986328125, -0.1014404296875, -0.09027099609375, -0.0791015625, -0.06793212890625, -0.0567626953125, -0.04559326171875, -0.034423828125, -0.02325439453125, -0.0120849609375, -0.00091552734375, 0.01025390625, 0.02142333984375, 0.0325927734375, 0.04376220703125, 0.054931640625, 0.06610107421875, 0.0772705078125, 0.08843994140625, 0.099609375, 0.11077880859375, 0.1219482421875, 0.13311767578125, 0.144287109375, 0.15545654296875, 0.1666259765625, 0.17779541015625, 0.18896484375, 0.20013427734375, 0.2113037109375, 0.22247314453125, 0.233642578125, 0.24481201171875, 0.2559814453125, 0.26715087890625, 0.2783203125, 0.28948974609375, 0.3006591796875, 0.31182861328125, 0.322998046875, 0.33416748046875, 0.3453369140625, 0.35650634765625, 0.36767578125, 0.37884521484375, 0.3900146484375, 0.40118408203125, 0.412353515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 8.0, 13.0, 27.0, 41.0, 55.0, 98.0, 150.0, 243.0, 150.0, 89.0, 49.0, 31.0, 17.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014066696166992188, -0.00013689789921045303, -0.0001331288367509842, -0.00012935977429151535, -0.0001255907118320465, -0.00012182164937257767, -0.00011805258691310883, -0.00011428352445363998, -0.00011051446199417114, -0.0001067453995347023, -0.00010297633707523346, -9.920727461576462e-05, -9.543821215629578e-05, -9.166914969682693e-05, -8.79000872373581e-05, -8.413102477788925e-05, -8.036196231842041e-05, -7.659289985895157e-05, -7.282383739948273e-05, -6.905477494001389e-05, -6.528571248054504e-05, -6.15166500210762e-05, -5.774758756160736e-05, -5.397852510213852e-05, -5.020946264266968e-05, -4.6440400183200836e-05, -4.2671337723731995e-05, -3.890227526426315e-05, -3.513321280479431e-05, -3.136415034532547e-05, -2.759508788585663e-05, -2.3826025426387787e-05, -2.0056962966918945e-05, -1.6287900507450104e-05, -1.2518838047981262e-05, -8.74977558851242e-06, -4.980713129043579e-06, -1.2116506695747375e-06, 2.557411789894104e-06, 6.3264742493629456e-06, 1.0095536708831787e-05, 1.3864599168300629e-05, 1.763366162776947e-05, 2.1402724087238312e-05, 2.5171786546707153e-05, 2.8940849006175995e-05, 3.2709911465644836e-05, 3.647897392511368e-05, 4.024803638458252e-05, 4.401709884405136e-05, 4.77861613035202e-05, 5.1555223762989044e-05, 5.5324286222457886e-05, 5.909334868192673e-05, 6.286241114139557e-05, 6.663147360086441e-05, 7.040053606033325e-05, 7.41695985198021e-05, 7.793866097927094e-05, 8.170772343873978e-05, 8.547678589820862e-05, 8.924584835767746e-05, 9.30149108171463e-05, 9.678397327661514e-05, 0.00010055303573608398]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 8.0, 4.0, 4.0, 8.0, 8.0, 10.0, 15.0, 29.0, 46.0, 63.0, 117.0, 209.0, 349.0, 626.0, 1273.0, 2605.0, 6917.0, 23644.0, 130796.0, 714788.0, 130835.0, 23705.0, 7060.0, 2647.0, 1220.0, 664.0, 378.0, 190.0, 129.0, 77.0, 45.0, 25.0, 15.0, 14.0, 11.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.36483001708984375, -0.3524627685546875, -0.34009552001953125, -0.327728271484375, -0.31536102294921875, -0.3029937744140625, -0.29062652587890625, -0.27825927734375, -0.26589202880859375, -0.2535247802734375, -0.24115753173828125, -0.228790283203125, -0.21642303466796875, -0.2040557861328125, -0.19168853759765625, -0.1793212890625, -0.16695404052734375, -0.1545867919921875, -0.14221954345703125, -0.129852294921875, -0.11748504638671875, -0.1051177978515625, -0.09275054931640625, -0.08038330078125, -0.06801605224609375, -0.0556488037109375, -0.04328155517578125, -0.030914306640625, -0.01854705810546875, -0.0061798095703125, 0.00618743896484375, 0.0185546875, 0.03092193603515625, 0.0432891845703125, 0.05565643310546875, 0.068023681640625, 0.08039093017578125, 0.0927581787109375, 0.10512542724609375, 0.11749267578125, 0.12985992431640625, 0.1422271728515625, 0.15459442138671875, 0.166961669921875, 0.17932891845703125, 0.1916961669921875, 0.20406341552734375, 0.2164306640625, 0.22879791259765625, 0.2411651611328125, 0.25353240966796875, 0.265899658203125, 0.27826690673828125, 0.2906341552734375, 0.30300140380859375, 0.31536865234375, 0.32773590087890625, 0.3401031494140625, 0.35247039794921875, 0.364837646484375, 0.37720489501953125, 0.3895721435546875, 0.40193939208984375, 0.414306640625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 11.0, 4.0, 20.0, 10.0, 25.0, 32.0, 44.0, 61.0, 88.0, 131.0, 137.0, 122.0, 77.0, 59.0, 43.0, 37.0, 25.0, 12.0, 14.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25390625, -0.24465560913085938, -0.23540496826171875, -0.22615432739257812, -0.2169036865234375, -0.20765304565429688, -0.19840240478515625, -0.18915176391601562, -0.179901123046875, -0.17065048217773438, -0.16139984130859375, -0.15214920043945312, -0.1428985595703125, -0.13364791870117188, -0.12439727783203125, -0.11514663696289062, -0.10589599609375, -0.09664535522460938, -0.08739471435546875, -0.07814407348632812, -0.0688934326171875, -0.059642791748046875, -0.05039215087890625, -0.041141510009765625, -0.031890869140625, -0.022640228271484375, -0.01338958740234375, -0.004138946533203125, 0.0051116943359375, 0.014362335205078125, 0.02361297607421875, 0.032863616943359375, 0.0421142578125, 0.051364898681640625, 0.06061553955078125, 0.06986618041992188, 0.0791168212890625, 0.08836746215820312, 0.09761810302734375, 0.10686874389648438, 0.116119384765625, 0.12537002563476562, 0.13462066650390625, 0.14387130737304688, 0.1531219482421875, 0.16237258911132812, 0.17162322998046875, 0.18087387084960938, 0.19012451171875, 0.19937515258789062, 0.20862579345703125, 0.21787643432617188, 0.2271270751953125, 0.23637771606445312, 0.24562835693359375, 0.2548789978027344, 0.264129638671875, 0.2733802795410156, 0.28263092041015625, 0.2918815612792969, 0.3011322021484375, 0.3103828430175781, 0.31963348388671875, 0.3288841247558594, 0.338134765625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 13.0, 84.0, 165.0, 313.0, 268.0, 105.0, 37.0, 8.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7446107864379883, -3.470951795578003, -3.1972928047180176, -2.9236338138580322, -2.649974822998047, -2.3763158321380615, -2.102656841278076, -1.8289978504180908, -1.5553388595581055, -1.2816798686981201, -1.0080208778381348, -0.7343618869781494, -0.46070289611816406, -0.1870439052581787, 0.08661508560180664, 0.360274076461792, 0.6339330673217773, 0.9075920581817627, 1.181251049041748, 1.4549100399017334, 1.7285690307617188, 2.002228021621704, 2.2758870124816895, 2.549546003341675, 2.82320499420166, 3.0968639850616455, 3.370522975921631, 3.644181966781616, 3.9178409576416016, 4.191499710083008, 4.465158939361572, 4.738818168640137, 5.012475967407227, 5.286134719848633, 5.559793949127197, 5.833453178405762, 6.107111930847168, 6.380770683288574, 6.654429912567139, 6.928089141845703, 7.201747894287109, 7.475406646728516, 7.74906587600708, 8.022725105285645, 8.29638385772705, 8.570042610168457, 8.84370231628418, 9.117361068725586, 9.391019821166992, 9.664678573608398, 9.938337326049805, 10.211997032165527, 10.485655784606934, 10.75931453704834, 11.032974243164062, 11.306632995605469, 11.580291748046875, 11.853950500488281, 12.127609252929688, 12.40126895904541, 12.674927711486816, 12.948586463928223, 13.222246170043945, 13.495904922485352, 13.769563674926758]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 12.0, 9.0, 9.0, 20.0, 15.0, 16.0, 17.0, 27.0, 32.0, 31.0, 36.0, 50.0, 47.0, 50.0, 49.0, 40.0, 51.0, 35.0, 39.0, 31.0, 45.0, 33.0, 37.0, 40.0, 29.0, 37.0, 26.0, 22.0, 21.0, 18.0, 20.0, 9.0, 5.0, 7.0, 4.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.277494430541992, -2.2030272483825684, -2.1285598278045654, -2.0540926456451416, -1.9796253442764282, -1.9051580429077148, -1.830690860748291, -1.7562235593795776, -1.6817562580108643, -1.6072889566421509, -1.532821774482727, -1.4583544731140137, -1.3838871717453003, -1.309419870376587, -1.234952688217163, -1.1604853868484497, -1.0860182046890259, -1.0115509033203125, -0.9370836615562439, -0.8626164197921753, -0.7881491184234619, -0.7136818766593933, -0.6392146348953247, -0.5647473335266113, -0.4902800917625427, -0.41581282019615173, -0.34134554862976074, -0.26687830686569214, -0.19241103529930115, -0.11794376373291016, -0.04347652196884155, 0.030990779399871826, 0.10545802116394043, 0.17992529273033142, 0.2543925642967224, 0.328859806060791, 0.403327077627182, 0.477794349193573, 0.5522615909576416, 0.626728892326355, 0.7011961340904236, 0.7756633758544922, 0.8501306772232056, 0.9245979189872742, 0.9990651607513428, 1.0735324621200562, 1.1479997634887695, 1.2224669456481934, 1.2969342470169067, 1.3714015483856201, 1.445868730545044, 1.5203360319137573, 1.5948033332824707, 1.6692705154418945, 1.743737816810608, 1.8182051181793213, 1.8926723003387451, 1.9671396017074585, 2.041606903076172, 2.1160740852355957, 2.1905412673950195, 2.2650086879730225, 2.3394758701324463, 2.413943290710449, 2.488410472869873]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 6.0, 14.0, 14.0, 20.0, 29.0, 38.0, 52.0, 92.0, 106.0, 181.0, 213.0, 310.0, 424.0, 680.0, 1043.0, 1646.0, 2768.0, 4803.0, 9031.0, 19490.0, 52281.0, 239593.0, 3558583.0, 212822.0, 50300.0, 19098.0, 8816.0, 4683.0, 2631.0, 1512.0, 983.0, 686.0, 442.0, 285.0, 172.0, 132.0, 77.0, 59.0, 50.0, 34.0, 25.0, 13.0, 12.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.40283203125, -0.3914756774902344, -0.38011932373046875, -0.3687629699707031, -0.3574066162109375, -0.3460502624511719, -0.33469390869140625, -0.3233375549316406, -0.311981201171875, -0.3006248474121094, -0.28926849365234375, -0.2779121398925781, -0.2665557861328125, -0.2551994323730469, -0.24384307861328125, -0.23248672485351562, -0.22113037109375, -0.20977401733398438, -0.19841766357421875, -0.18706130981445312, -0.1757049560546875, -0.16434860229492188, -0.15299224853515625, -0.14163589477539062, -0.130279541015625, -0.11892318725585938, -0.10756683349609375, -0.09621047973632812, -0.0848541259765625, -0.07349777221679688, -0.06214141845703125, -0.050785064697265625, -0.0394287109375, -0.028072357177734375, -0.01671600341796875, -0.005359649658203125, 0.0059967041015625, 0.017353057861328125, 0.02870941162109375, 0.040065765380859375, 0.051422119140625, 0.06277847290039062, 0.07413482666015625, 0.08549118041992188, 0.0968475341796875, 0.10820388793945312, 0.11956024169921875, 0.13091659545898438, 0.14227294921875, 0.15362930297851562, 0.16498565673828125, 0.17634201049804688, 0.1876983642578125, 0.19905471801757812, 0.21041107177734375, 0.22176742553710938, 0.233123779296875, 0.24448013305664062, 0.25583648681640625, 0.2671928405761719, 0.2785491943359375, 0.2899055480957031, 0.30126190185546875, 0.3126182556152344, 0.323974609375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 9.0, 8.0, 7.0, 19.0, 19.0, 13.0, 28.0, 19.0, 24.0, 29.0, 44.0, 32.0, 37.0, 39.0, 39.0, 46.0, 35.0, 39.0, 48.0, 30.0, 30.0, 40.0, 35.0, 41.0, 38.0, 41.0, 26.0, 18.0, 24.0, 15.0, 25.0, 14.0, 7.0, 13.0, 8.0, 10.0, 10.0, 3.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.08551025390625, -0.08304214477539062, -0.08057403564453125, -0.07810592651367188, -0.0756378173828125, -0.07316970825195312, -0.07070159912109375, -0.06823348999023438, -0.065765380859375, -0.06329727172851562, -0.06082916259765625, -0.058361053466796875, -0.0558929443359375, -0.053424835205078125, -0.05095672607421875, -0.048488616943359375, -0.0460205078125, -0.043552398681640625, -0.04108428955078125, -0.038616180419921875, -0.0361480712890625, -0.033679962158203125, -0.03121185302734375, -0.028743743896484375, -0.026275634765625, -0.023807525634765625, -0.02133941650390625, -0.018871307373046875, -0.0164031982421875, -0.013935089111328125, -0.01146697998046875, -0.008998870849609375, -0.00653076171875, -0.004062652587890625, -0.00159454345703125, 0.000873565673828125, 0.0033416748046875, 0.005809783935546875, 0.00827789306640625, 0.010746002197265625, 0.013214111328125, 0.015682220458984375, 0.01815032958984375, 0.020618438720703125, 0.0230865478515625, 0.025554656982421875, 0.02802276611328125, 0.030490875244140625, 0.032958984375, 0.035427093505859375, 0.03789520263671875, 0.040363311767578125, 0.0428314208984375, 0.045299530029296875, 0.04776763916015625, 0.050235748291015625, 0.052703857421875, 0.055171966552734375, 0.05764007568359375, 0.060108184814453125, 0.0625762939453125, 0.06504440307617188, 0.06751251220703125, 0.06998062133789062, 0.07244873046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 1.0, 8.0, 2.0, 8.0, 11.0, 12.0, 20.0, 21.0, 37.0, 33.0, 47.0, 74.0, 120.0, 168.0, 267.0, 465.0, 622.0, 1116.0, 2008.0, 3811.0, 8433.0, 22410.0, 86781.0, 2497476.0, 1450241.0, 81340.0, 21879.0, 8166.0, 3832.0, 1854.0, 1089.0, 719.0, 412.0, 261.0, 156.0, 110.0, 80.0, 54.0, 42.0, 17.0, 17.0, 17.0, 14.0, 10.0, 6.0, 2.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.677734375, -0.6551284790039062, -0.6325225830078125, -0.6099166870117188, -0.587310791015625, -0.5647048950195312, -0.5420989990234375, -0.5194931030273438, -0.49688720703125, -0.47428131103515625, -0.4516754150390625, -0.42906951904296875, -0.406463623046875, -0.38385772705078125, -0.3612518310546875, -0.33864593505859375, -0.3160400390625, -0.29343414306640625, -0.2708282470703125, -0.24822235107421875, -0.225616455078125, -0.20301055908203125, -0.1804046630859375, -0.15779876708984375, -0.13519287109375, -0.11258697509765625, -0.0899810791015625, -0.06737518310546875, -0.044769287109375, -0.02216339111328125, 0.0004425048828125, 0.02304840087890625, 0.045654296875, 0.06826019287109375, 0.0908660888671875, 0.11347198486328125, 0.136077880859375, 0.15868377685546875, 0.1812896728515625, 0.20389556884765625, 0.22650146484375, 0.24910736083984375, 0.2717132568359375, 0.29431915283203125, 0.316925048828125, 0.33953094482421875, 0.3621368408203125, 0.38474273681640625, 0.4073486328125, 0.42995452880859375, 0.4525604248046875, 0.47516632080078125, 0.497772216796875, 0.5203781127929688, 0.5429840087890625, 0.5655899047851562, 0.58819580078125, 0.6108016967773438, 0.6334075927734375, 0.6560134887695312, 0.678619384765625, 0.7012252807617188, 0.7238311767578125, 0.7464370727539062, 0.76904296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 21.0, 27.0, 43.0, 73.0, 134.0, 356.0, 2337.0, 658.0, 168.0, 98.0, 47.0, 23.0, 23.0, 10.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4443359375, -0.4303131103515625, -0.416290283203125, -0.4022674560546875, -0.38824462890625, -0.3742218017578125, -0.360198974609375, -0.3461761474609375, -0.3321533203125, -0.3181304931640625, -0.304107666015625, -0.2900848388671875, -0.27606201171875, -0.2620391845703125, -0.248016357421875, -0.2339935302734375, -0.219970703125, -0.2059478759765625, -0.191925048828125, -0.1779022216796875, -0.16387939453125, -0.1498565673828125, -0.135833740234375, -0.1218109130859375, -0.1077880859375, -0.0937652587890625, -0.079742431640625, -0.0657196044921875, -0.05169677734375, -0.0376739501953125, -0.023651123046875, -0.0096282958984375, 0.00439453125, 0.0184173583984375, 0.032440185546875, 0.0464630126953125, 0.06048583984375, 0.0745086669921875, 0.088531494140625, 0.1025543212890625, 0.1165771484375, 0.1305999755859375, 0.144622802734375, 0.1586456298828125, 0.17266845703125, 0.1866912841796875, 0.200714111328125, 0.2147369384765625, 0.228759765625, 0.2427825927734375, 0.256805419921875, 0.2708282470703125, 0.28485107421875, 0.2988739013671875, 0.312896728515625, 0.3269195556640625, 0.3409423828125, 0.3549652099609375, 0.368988037109375, 0.3830108642578125, 0.39703369140625, 0.4110565185546875, 0.425079345703125, 0.4391021728515625, 0.453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 11.0, 33.0, 45.0, 64.0, 121.0, 162.0, 165.0, 154.0, 107.0, 49.0, 33.0, 21.0, 13.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4327988624572754, -3.3454413414001465, -3.2580835819244385, -3.1707260608673096, -3.0833685398101807, -2.9960107803344727, -2.9086532592773438, -2.821295738220215, -2.733938217163086, -2.646580696105957, -2.559222936630249, -2.47186541557312, -2.384507894515991, -2.297150135040283, -2.2097926139831543, -2.1224350929260254, -2.0350773334503174, -1.947719693183899, -1.86036217212677, -1.7730045318603516, -1.6856470108032227, -1.5982893705368042, -1.5109317302703857, -1.4235742092132568, -1.3362165689468384, -1.24885892868042, -1.161501407623291, -1.0741437673568726, -0.9867861866950989, -0.8994286060333252, -0.8120709657669067, -0.7247133851051331, -0.6373560428619385, -0.5499984622001648, -0.4626408517360687, -0.37528324127197266, -0.287925660610199, -0.2005680799484253, -0.11321043968200684, -0.025852859020233154, 0.06150472164154053, 0.1488623172044754, 0.23621991276741028, 0.32357752323150635, 0.41093510389328003, 0.4982926845550537, 0.5856503248214722, 0.6730079054832458, 0.7603654861450195, 0.8477230668067932, 0.9350806474685669, 1.0224382877349854, 1.1097958087921143, 1.1971534490585327, 1.2845110893249512, 1.37186861038208, 1.4592262506484985, 1.546583890914917, 1.633941411972046, 1.7212990522384644, 1.8086566925048828, 1.8960142135620117, 1.9833718538284302, 2.0707294940948486, 2.1580870151519775]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 5.0, 9.0, 8.0, 9.0, 14.0, 15.0, 9.0, 23.0, 23.0, 26.0, 29.0, 35.0, 33.0, 43.0, 40.0, 54.0, 47.0, 34.0, 37.0, 44.0, 45.0, 38.0, 26.0, 46.0, 45.0, 45.0, 25.0, 26.0, 30.0, 26.0, 16.0, 20.0, 7.0, 8.0, 14.0, 11.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.1031018495559692, -1.0700597763061523, -1.037017822265625, -1.0039758682250977, -0.9709337949752808, -0.9378917813301086, -0.9048497676849365, -0.8718077540397644, -0.8387657403945923, -0.8057237267494202, -0.772681713104248, -0.7396396994590759, -0.7065976858139038, -0.6735556721687317, -0.6405136585235596, -0.6074716448783875, -0.5744296312332153, -0.5413876175880432, -0.5083456039428711, -0.475303590297699, -0.44226157665252686, -0.40921956300735474, -0.3761775493621826, -0.3431355357170105, -0.3100935220718384, -0.27705150842666626, -0.24400949478149414, -0.21096748113632202, -0.1779254674911499, -0.14488345384597778, -0.11184144020080566, -0.07879942655563354, -0.045757293701171875, -0.012715280055999756, 0.020326733589172363, 0.05336874723434448, 0.0864107608795166, 0.11945277452468872, 0.15249478816986084, 0.18553680181503296, 0.21857881546020508, 0.2516208291053772, 0.2846628427505493, 0.31770485639572144, 0.35074687004089355, 0.3837888836860657, 0.4168308973312378, 0.4498729109764099, 0.48291492462158203, 0.5159569382667542, 0.5489989519119263, 0.5820409655570984, 0.6150829792022705, 0.6481249928474426, 0.6811670064926147, 0.7142090201377869, 0.747251033782959, 0.7802930474281311, 0.8133350610733032, 0.8463770747184753, 0.8794190883636475, 0.9124611020088196, 0.9455031156539917, 0.9785451292991638, 1.011587142944336]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 8.0, 17.0, 18.0, 29.0, 35.0, 55.0, 108.0, 134.0, 190.0, 332.0, 501.0, 793.0, 1214.0, 2054.0, 3435.0, 5803.0, 10425.0, 20567.0, 42894.0, 104386.0, 258389.0, 325445.0, 152079.0, 60587.0, 27226.0, 13575.0, 7475.0, 4185.0, 2441.0, 1474.0, 974.0, 559.0, 386.0, 254.0, 153.0, 94.0, 75.0, 54.0, 38.0, 33.0, 16.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28594207763671875, -0.2764739990234375, -0.26700592041015625, -0.257537841796875, -0.24806976318359375, -0.2386016845703125, -0.22913360595703125, -0.21966552734375, -0.21019744873046875, -0.2007293701171875, -0.19126129150390625, -0.181793212890625, -0.17232513427734375, -0.1628570556640625, -0.15338897705078125, -0.1439208984375, -0.13445281982421875, -0.1249847412109375, -0.11551666259765625, -0.106048583984375, -0.09658050537109375, -0.0871124267578125, -0.07764434814453125, -0.06817626953125, -0.05870819091796875, -0.0492401123046875, -0.03977203369140625, -0.030303955078125, -0.02083587646484375, -0.0113677978515625, -0.00189971923828125, 0.007568359375, 0.01703643798828125, 0.0265045166015625, 0.03597259521484375, 0.045440673828125, 0.05490875244140625, 0.0643768310546875, 0.07384490966796875, 0.08331298828125, 0.09278106689453125, 0.1022491455078125, 0.11171722412109375, 0.121185302734375, 0.13065338134765625, 0.1401214599609375, 0.14958953857421875, 0.1590576171875, 0.16852569580078125, 0.1779937744140625, 0.18746185302734375, 0.196929931640625, 0.20639801025390625, 0.2158660888671875, 0.22533416748046875, 0.23480224609375, 0.24427032470703125, 0.2537384033203125, 0.26320648193359375, 0.272674560546875, 0.28214263916015625, 0.2916107177734375, 0.30107879638671875, 0.310546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 9.0, 14.0, 12.0, 14.0, 12.0, 23.0, 19.0, 22.0, 38.0, 27.0, 41.0, 39.0, 42.0, 47.0, 52.0, 57.0, 42.0, 53.0, 36.0, 65.0, 50.0, 46.0, 33.0, 34.0, 21.0, 25.0, 27.0, 17.0, 14.0, 14.0, 19.0, 10.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10546875, -0.10201168060302734, -0.09855461120605469, -0.09509754180908203, -0.09164047241210938, -0.08818340301513672, -0.08472633361816406, -0.0812692642211914, -0.07781219482421875, -0.0743551254272461, -0.07089805603027344, -0.06744098663330078, -0.06398391723632812, -0.06052684783935547, -0.05706977844238281, -0.053612709045410156, -0.0501556396484375, -0.046698570251464844, -0.04324150085449219, -0.03978443145751953, -0.036327362060546875, -0.03287029266357422, -0.029413223266601562, -0.025956153869628906, -0.02249908447265625, -0.019042015075683594, -0.015584945678710938, -0.012127876281738281, -0.008670806884765625, -0.005213737487792969, -0.0017566680908203125, 0.0017004013061523438, 0.005157470703125, 0.008614540100097656, 0.012071609497070312, 0.015528678894042969, 0.018985748291015625, 0.02244281768798828, 0.025899887084960938, 0.029356956481933594, 0.03281402587890625, 0.036271095275878906, 0.03972816467285156, 0.04318523406982422, 0.046642303466796875, 0.05009937286376953, 0.05355644226074219, 0.057013511657714844, 0.0604705810546875, 0.06392765045166016, 0.06738471984863281, 0.07084178924560547, 0.07429885864257812, 0.07775592803955078, 0.08121299743652344, 0.0846700668334961, 0.08812713623046875, 0.0915842056274414, 0.09504127502441406, 0.09849834442138672, 0.10195541381835938, 0.10541248321533203, 0.10886955261230469, 0.11232662200927734, 0.11578369140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 8.0, 15.0, 26.0, 29.0, 41.0, 71.0, 118.0, 204.0, 370.0, 868.0, 2330.0, 8798.0, 44156.0, 380054.0, 532958.0, 61980.0, 11372.0, 3094.0, 1011.0, 440.0, 202.0, 124.0, 72.0, 53.0, 35.0, 18.0, 24.0, 9.0, 10.0, 10.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6618194580078125, -0.639068603515625, -0.6163177490234375, -0.59356689453125, -0.5708160400390625, -0.548065185546875, -0.5253143310546875, -0.5025634765625, -0.4798126220703125, -0.457061767578125, -0.4343109130859375, -0.41156005859375, -0.3888092041015625, -0.366058349609375, -0.3433074951171875, -0.320556640625, -0.2978057861328125, -0.275054931640625, -0.2523040771484375, -0.22955322265625, -0.2068023681640625, -0.184051513671875, -0.1613006591796875, -0.1385498046875, -0.1157989501953125, -0.093048095703125, -0.0702972412109375, -0.04754638671875, -0.0247955322265625, -0.002044677734375, 0.0207061767578125, 0.04345703125, 0.0662078857421875, 0.088958740234375, 0.1117095947265625, 0.13446044921875, 0.1572113037109375, 0.179962158203125, 0.2027130126953125, 0.2254638671875, 0.2482147216796875, 0.270965576171875, 0.2937164306640625, 0.31646728515625, 0.3392181396484375, 0.361968994140625, 0.3847198486328125, 0.407470703125, 0.4302215576171875, 0.452972412109375, 0.4757232666015625, 0.49847412109375, 0.5212249755859375, 0.543975830078125, 0.5667266845703125, 0.5894775390625, 0.6122283935546875, 0.634979248046875, 0.6577301025390625, 0.68048095703125, 0.7032318115234375, 0.725982666015625, 0.7487335205078125, 0.771484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 8.0, 7.0, 15.0, 14.0, 12.0, 23.0, 31.0, 25.0, 23.0, 22.0, 28.0, 43.0, 36.0, 35.0, 47.0, 40.0, 44.0, 55.0, 46.0, 47.0, 33.0, 32.0, 38.0, 40.0, 33.0, 21.0, 34.0, 20.0, 25.0, 26.0, 10.0, 18.0, 9.0, 9.0, 10.0, 5.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5248336791992188, -0.5076751708984375, -0.49051666259765625, -0.473358154296875, -0.45619964599609375, -0.4390411376953125, -0.42188262939453125, -0.40472412109375, -0.38756561279296875, -0.3704071044921875, -0.35324859619140625, -0.336090087890625, -0.31893157958984375, -0.3017730712890625, -0.28461456298828125, -0.2674560546875, -0.25029754638671875, -0.2331390380859375, -0.21598052978515625, -0.198822021484375, -0.18166351318359375, -0.1645050048828125, -0.14734649658203125, -0.13018798828125, -0.11302947998046875, -0.0958709716796875, -0.07871246337890625, -0.061553955078125, -0.04439544677734375, -0.0272369384765625, -0.01007843017578125, 0.007080078125, 0.02423858642578125, 0.0413970947265625, 0.05855560302734375, 0.075714111328125, 0.09287261962890625, 0.1100311279296875, 0.12718963623046875, 0.14434814453125, 0.16150665283203125, 0.1786651611328125, 0.19582366943359375, 0.212982177734375, 0.23014068603515625, 0.2472991943359375, 0.26445770263671875, 0.2816162109375, 0.29877471923828125, 0.3159332275390625, 0.33309173583984375, 0.350250244140625, 0.36740875244140625, 0.3845672607421875, 0.40172576904296875, 0.41888427734375, 0.43604278564453125, 0.4532012939453125, 0.47035980224609375, 0.487518310546875, 0.5046768188476562, 0.5218353271484375, 0.5389938354492188, 0.55615234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 6.0, 6.0, 14.0, 21.0, 31.0, 66.0, 129.0, 222.0, 543.0, 1503.0, 5319.0, 24280.0, 234395.0, 693604.0, 72556.0, 11369.0, 2818.0, 923.0, 376.0, 168.0, 74.0, 42.0, 24.0, 21.0, 16.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36572265625, -0.35124969482421875, -0.3367767333984375, -0.32230377197265625, -0.307830810546875, -0.29335784912109375, -0.2788848876953125, -0.26441192626953125, -0.24993896484375, -0.23546600341796875, -0.2209930419921875, -0.20652008056640625, -0.192047119140625, -0.17757415771484375, -0.1631011962890625, -0.14862823486328125, -0.1341552734375, -0.11968231201171875, -0.1052093505859375, -0.09073638916015625, -0.076263427734375, -0.06179046630859375, -0.0473175048828125, -0.03284454345703125, -0.01837158203125, -0.00389862060546875, 0.0105743408203125, 0.02504730224609375, 0.039520263671875, 0.05399322509765625, 0.0684661865234375, 0.08293914794921875, 0.097412109375, 0.11188507080078125, 0.1263580322265625, 0.14083099365234375, 0.155303955078125, 0.16977691650390625, 0.1842498779296875, 0.19872283935546875, 0.21319580078125, 0.22766876220703125, 0.2421417236328125, 0.25661468505859375, 0.271087646484375, 0.28556060791015625, 0.3000335693359375, 0.31450653076171875, 0.3289794921875, 0.34345245361328125, 0.3579254150390625, 0.37239837646484375, 0.386871337890625, 0.40134429931640625, 0.4158172607421875, 0.43029022216796875, 0.44476318359375, 0.45923614501953125, 0.4737091064453125, 0.48818206787109375, 0.502655029296875, 0.5171279907226562, 0.5316009521484375, 0.5460739135742188, 0.560546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 4.0, 5.0, 9.0, 13.0, 23.0, 27.0, 49.0, 57.0, 74.0, 109.0, 138.0, 146.0, 94.0, 87.0, 53.0, 38.0, 14.0, 19.0, 9.0, 9.0, 10.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.328126907348633e-05, -9.015202522277832e-05, -8.702278137207031e-05, -8.38935375213623e-05, -8.07642936706543e-05, -7.763504981994629e-05, -7.450580596923828e-05, -7.137656211853027e-05, -6.824731826782227e-05, -6.511807441711426e-05, -6.198883056640625e-05, -5.885958671569824e-05, -5.5730342864990234e-05, -5.2601099014282227e-05, -4.947185516357422e-05, -4.634261131286621e-05, -4.32133674621582e-05, -4.0084123611450195e-05, -3.695487976074219e-05, -3.382563591003418e-05, -3.069639205932617e-05, -2.7567148208618164e-05, -2.4437904357910156e-05, -2.130866050720215e-05, -1.817941665649414e-05, -1.5050172805786133e-05, -1.1920928955078125e-05, -8.791685104370117e-06, -5.662441253662109e-06, -2.5331974029541016e-06, 5.960464477539062e-07, 3.725290298461914e-06, 6.854534149169922e-06, 9.98377799987793e-06, 1.3113021850585938e-05, 1.6242265701293945e-05, 1.9371509552001953e-05, 2.250075340270996e-05, 2.562999725341797e-05, 2.8759241104125977e-05, 3.1888484954833984e-05, 3.501772880554199e-05, 3.814697265625e-05, 4.127621650695801e-05, 4.4405460357666016e-05, 4.7534704208374023e-05, 5.066394805908203e-05, 5.379319190979004e-05, 5.692243576049805e-05, 6.0051679611206055e-05, 6.318092346191406e-05, 6.631016731262207e-05, 6.943941116333008e-05, 7.256865501403809e-05, 7.56978988647461e-05, 7.88271427154541e-05, 8.195638656616211e-05, 8.508563041687012e-05, 8.821487426757812e-05, 9.134411811828613e-05, 9.447336196899414e-05, 9.760260581970215e-05, 0.00010073184967041016, 0.00010386109352111816, 0.00010699033737182617]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 8.0, 5.0, 5.0, 6.0, 16.0, 31.0, 45.0, 53.0, 78.0, 103.0, 164.0, 303.0, 426.0, 825.0, 1509.0, 3065.0, 6448.0, 16102.0, 46941.0, 174048.0, 485243.0, 221205.0, 57728.0, 19089.0, 7536.0, 3400.0, 1773.0, 960.0, 516.0, 339.0, 198.0, 124.0, 81.0, 41.0, 34.0, 39.0, 15.0, 18.0, 7.0, 4.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.264404296875, -0.2562904357910156, -0.24817657470703125, -0.24006271362304688, -0.2319488525390625, -0.22383499145507812, -0.21572113037109375, -0.20760726928710938, -0.199493408203125, -0.19137954711914062, -0.18326568603515625, -0.17515182495117188, -0.1670379638671875, -0.15892410278320312, -0.15081024169921875, -0.14269638061523438, -0.13458251953125, -0.12646865844726562, -0.11835479736328125, -0.11024093627929688, -0.1021270751953125, -0.09401321411132812, -0.08589935302734375, -0.07778549194335938, -0.069671630859375, -0.061557769775390625, -0.05344390869140625, -0.045330047607421875, -0.0372161865234375, -0.029102325439453125, -0.02098846435546875, -0.012874603271484375, -0.0047607421875, 0.003353118896484375, 0.01146697998046875, 0.019580841064453125, 0.0276947021484375, 0.035808563232421875, 0.04392242431640625, 0.052036285400390625, 0.060150146484375, 0.06826400756835938, 0.07637786865234375, 0.08449172973632812, 0.0926055908203125, 0.10071945190429688, 0.10883331298828125, 0.11694717407226562, 0.12506103515625, 0.13317489624023438, 0.14128875732421875, 0.14940261840820312, 0.1575164794921875, 0.16563034057617188, 0.17374420166015625, 0.18185806274414062, 0.189971923828125, 0.19808578491210938, 0.20619964599609375, 0.21431350708007812, 0.2224273681640625, 0.23054122924804688, 0.23865509033203125, 0.24676895141601562, 0.2548828125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 20.0, 26.0, 26.0, 41.0, 73.0, 68.0, 105.0, 139.0, 125.0, 113.0, 94.0, 54.0, 33.0, 23.0, 11.0, 14.0, 7.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273193359375, -0.26171875, -0.250244140625, -0.23876953125, -0.227294921875, -0.2158203125, -0.204345703125, -0.19287109375, -0.181396484375, -0.169921875, -0.158447265625, -0.14697265625, -0.135498046875, -0.1240234375, -0.112548828125, -0.10107421875, -0.089599609375, -0.078125, -0.066650390625, -0.05517578125, -0.043701171875, -0.0322265625, -0.020751953125, -0.00927734375, 0.002197265625, 0.013671875, 0.025146484375, 0.03662109375, 0.048095703125, 0.0595703125, 0.071044921875, 0.08251953125, 0.093994140625, 0.10546875, 0.116943359375, 0.12841796875, 0.139892578125, 0.1513671875, 0.162841796875, 0.17431640625, 0.185791015625, 0.197265625, 0.208740234375, 0.22021484375, 0.231689453125, 0.2431640625, 0.254638671875, 0.26611328125, 0.277587890625, 0.2890625, 0.300537109375, 0.31201171875, 0.323486328125, 0.3349609375, 0.346435546875, 0.35791015625, 0.369384765625, 0.380859375, 0.392333984375, 0.40380859375, 0.415283203125, 0.4267578125, 0.438232421875, 0.44970703125, 0.461181640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 15.0, 33.0, 68.0, 120.0, 216.0, 215.0, 155.0, 109.0, 38.0, 22.0, 11.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.987802028656006, -2.7788026332855225, -2.569803237915039, -2.3608040809631348, -2.1518044471740723, -1.9428051710128784, -1.7338058948516846, -1.5248064994812012, -1.3158071041107178, -1.1068077087402344, -0.8978083729743958, -0.6888090372085571, -0.47980964183807373, -0.27081024646759033, -0.061810970306396484, 0.14718842506408691, 0.3561878204345703, 0.5651872158050537, 0.7741865515708923, 0.983185887336731, 1.1921852827072144, 1.4011846780776978, 1.6101839542388916, 1.819183349609375, 2.0281827449798584, 2.237182140350342, 2.446181535720825, 2.6551809310913086, 2.864180088043213, 3.0731797218322754, 3.2821788787841797, 3.491178274154663, 3.7001771926879883, 3.9091765880584717, 4.118175983428955, 4.327175140380859, 4.536174774169922, 4.745173931121826, 4.9541730880737305, 5.163172721862793, 5.3721723556518555, 5.58117151260376, 5.790171146392822, 5.999170303344727, 6.208169937133789, 6.417169094085693, 6.626168251037598, 6.83516788482666, 7.0441670417785645, 7.253166198730469, 7.462165832519531, 7.6711649894714355, 7.880164623260498, 8.089163780212402, 8.298163414001465, 8.507162094116211, 8.716161727905273, 8.925161361694336, 9.134160041809082, 9.343159675598145, 9.552159309387207, 9.76115894317627, 9.970157623291016, 10.179157257080078, 10.38815689086914]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 11.0, 10.0, 13.0, 17.0, 14.0, 18.0, 21.0, 23.0, 14.0, 25.0, 41.0, 37.0, 40.0, 33.0, 33.0, 41.0, 44.0, 42.0, 52.0, 31.0, 43.0, 35.0, 39.0, 43.0, 38.0, 32.0, 27.0, 36.0, 20.0, 19.0, 23.0, 19.0, 7.0, 9.0, 8.0, 5.0, 3.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3804855346679688, -2.2952613830566406, -2.2100374698638916, -2.1248135566711426, -2.0395894050598145, -1.9543653726577759, -1.8691413402557373, -1.7839173078536987, -1.6986932754516602, -1.6134692430496216, -1.528245210647583, -1.4430211782455444, -1.3577971458435059, -1.2725731134414673, -1.1873490810394287, -1.1021250486373901, -1.0169010162353516, -0.931676983833313, -0.8464529514312744, -0.7612289190292358, -0.6760048866271973, -0.5907808542251587, -0.5055568218231201, -0.42033278942108154, -0.33510875701904297, -0.2498847246170044, -0.16466069221496582, -0.07943665981292725, 0.005787372589111328, 0.0910114049911499, 0.17623543739318848, 0.26145946979522705, 0.3466835021972656, 0.4319075345993042, 0.5171315670013428, 0.6023555994033813, 0.6875796318054199, 0.7728036642074585, 0.8580276966094971, 0.9432517290115356, 1.0284757614135742, 1.1136997938156128, 1.1989238262176514, 1.28414785861969, 1.3693718910217285, 1.454595923423767, 1.5398199558258057, 1.6250439882278442, 1.7102680206298828, 1.7954920530319214, 1.88071608543396, 1.9659401178359985, 2.051164150238037, 2.1363883018493652, 2.2216122150421143, 2.3068361282348633, 2.3920602798461914, 2.4772844314575195, 2.5625083446502686, 2.6477322578430176, 2.7329564094543457, 2.818180561065674, 2.903404474258423, 2.988628387451172, 3.0738525390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 4.0, 8.0, 5.0, 12.0, 17.0, 9.0, 22.0, 35.0, 43.0, 50.0, 70.0, 86.0, 133.0, 188.0, 274.0, 468.0, 751.0, 1324.0, 2525.0, 6502.0, 34900.0, 4116277.0, 20235.0, 5024.0, 2191.0, 1123.0, 719.0, 411.0, 229.0, 169.0, 116.0, 93.0, 60.0, 53.0, 34.0, 35.0, 27.0, 14.0, 16.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.244140625, -1.208984375, -1.173828125, -1.138671875, -1.103515625, -1.068359375, -1.033203125, -0.998046875, -0.962890625, -0.927734375, -0.892578125, -0.857421875, -0.822265625, -0.787109375, -0.751953125, -0.716796875, -0.681640625, -0.646484375, -0.611328125, -0.576171875, -0.541015625, -0.505859375, -0.470703125, -0.435546875, -0.400390625, -0.365234375, -0.330078125, -0.294921875, -0.259765625, -0.224609375, -0.189453125, -0.154296875, -0.119140625, -0.083984375, -0.048828125, -0.013671875, 0.021484375, 0.056640625, 0.091796875, 0.126953125, 0.162109375, 0.197265625, 0.232421875, 0.267578125, 0.302734375, 0.337890625, 0.373046875, 0.408203125, 0.443359375, 0.478515625, 0.513671875, 0.548828125, 0.583984375, 0.619140625, 0.654296875, 0.689453125, 0.724609375, 0.759765625, 0.794921875, 0.830078125, 0.865234375, 0.900390625, 0.935546875, 0.970703125, 1.005859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 11.0, 11.0, 13.0, 15.0, 21.0, 20.0, 26.0, 19.0, 32.0, 44.0, 47.0, 49.0, 47.0, 50.0, 40.0, 60.0, 51.0, 55.0, 56.0, 41.0, 35.0, 43.0, 34.0, 29.0, 24.0, 19.0, 29.0, 12.0, 13.0, 9.0, 8.0, 3.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11187744140625, -0.10806751251220703, -0.10425758361816406, -0.1004476547241211, -0.09663772583007812, -0.09282779693603516, -0.08901786804199219, -0.08520793914794922, -0.08139801025390625, -0.07758808135986328, -0.07377815246582031, -0.06996822357177734, -0.06615829467773438, -0.062348365783691406, -0.05853843688964844, -0.05472850799560547, -0.0509185791015625, -0.04710865020751953, -0.04329872131347656, -0.039488792419433594, -0.035678863525390625, -0.031868934631347656, -0.028059005737304688, -0.02424907684326172, -0.02043914794921875, -0.01662921905517578, -0.012819290161132812, -0.009009361267089844, -0.005199432373046875, -0.0013895034790039062, 0.0024204254150390625, 0.006230354309082031, 0.010040283203125, 0.013850212097167969, 0.017660140991210938, 0.021470069885253906, 0.025279998779296875, 0.029089927673339844, 0.03289985656738281, 0.03670978546142578, 0.04051971435546875, 0.04432964324951172, 0.04813957214355469, 0.051949501037597656, 0.055759429931640625, 0.059569358825683594, 0.06337928771972656, 0.06718921661376953, 0.0709991455078125, 0.07480907440185547, 0.07861900329589844, 0.0824289321899414, 0.08623886108398438, 0.09004878997802734, 0.09385871887207031, 0.09766864776611328, 0.10147857666015625, 0.10528850555419922, 0.10909843444824219, 0.11290836334228516, 0.11671829223632812, 0.1205282211303711, 0.12433815002441406, 0.12814807891845703, 0.1319580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 8.0, 11.0, 16.0, 19.0, 19.0, 29.0, 45.0, 53.0, 53.0, 61.0, 89.0, 109.0, 163.0, 228.0, 351.0, 613.0, 1298.0, 2966.0, 8976.0, 77439.0, 4074369.0, 18222.0, 4843.0, 1885.0, 892.0, 435.0, 272.0, 208.0, 137.0, 99.0, 82.0, 61.0, 41.0, 48.0, 29.0, 26.0, 20.0, 14.0, 8.0, 12.0, 6.0, 1.0, 5.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0], "bins": [-1.6728515625, -1.6253662109375, -1.577880859375, -1.5303955078125, -1.48291015625, -1.4354248046875, -1.387939453125, -1.3404541015625, -1.29296875, -1.2454833984375, -1.197998046875, -1.1505126953125, -1.10302734375, -1.0555419921875, -1.008056640625, -0.9605712890625, -0.9130859375, -0.8656005859375, -0.818115234375, -0.7706298828125, -0.72314453125, -0.6756591796875, -0.628173828125, -0.5806884765625, -0.533203125, -0.4857177734375, -0.438232421875, -0.3907470703125, -0.34326171875, -0.2957763671875, -0.248291015625, -0.2008056640625, -0.1533203125, -0.1058349609375, -0.058349609375, -0.0108642578125, 0.03662109375, 0.0841064453125, 0.131591796875, 0.1790771484375, 0.2265625, 0.2740478515625, 0.321533203125, 0.3690185546875, 0.41650390625, 0.4639892578125, 0.511474609375, 0.5589599609375, 0.6064453125, 0.6539306640625, 0.701416015625, 0.7489013671875, 0.79638671875, 0.8438720703125, 0.891357421875, 0.9388427734375, 0.986328125, 1.0338134765625, 1.081298828125, 1.1287841796875, 1.17626953125, 1.2237548828125, 1.271240234375, 1.3187255859375, 1.3662109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 21.0, 26.0, 266.0, 3634.0, 55.0, 35.0, 10.0, 6.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.421875, -0.41082000732421875, -0.3997650146484375, -0.38871002197265625, -0.377655029296875, -0.36660003662109375, -0.3555450439453125, -0.34449005126953125, -0.33343505859375, -0.32238006591796875, -0.3113250732421875, -0.30027008056640625, -0.289215087890625, -0.27816009521484375, -0.2671051025390625, -0.25605010986328125, -0.2449951171875, -0.23394012451171875, -0.2228851318359375, -0.21183013916015625, -0.200775146484375, -0.18972015380859375, -0.1786651611328125, -0.16761016845703125, -0.15655517578125, -0.14550018310546875, -0.1344451904296875, -0.12339019775390625, -0.112335205078125, -0.10128021240234375, -0.0902252197265625, -0.07917022705078125, -0.068115234375, -0.05706024169921875, -0.0460052490234375, -0.03495025634765625, -0.023895263671875, -0.01284027099609375, -0.0017852783203125, 0.00926971435546875, 0.02032470703125, 0.03137969970703125, 0.0424346923828125, 0.05348968505859375, 0.064544677734375, 0.07559967041015625, 0.0866546630859375, 0.09770965576171875, 0.1087646484375, 0.11981964111328125, 0.1308746337890625, 0.14192962646484375, 0.152984619140625, 0.16403961181640625, 0.1750946044921875, 0.18614959716796875, 0.19720458984375, 0.20825958251953125, 0.2193145751953125, 0.23036956787109375, 0.241424560546875, 0.25247955322265625, 0.2635345458984375, 0.27458953857421875, 0.28564453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 15.0, 21.0, 40.0, 50.0, 101.0, 126.0, 126.0, 155.0, 102.0, 55.0, 63.0, 40.0, 34.0, 23.0, 17.0, 7.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.322012186050415, -1.2915350198745728, -1.26105797290802, -1.2305808067321777, -1.200103759765625, -1.1696265935897827, -1.1391494274139404, -1.1086723804473877, -1.0781952142715454, -1.0477180480957031, -1.0172410011291504, -0.9867638349533081, -0.9562867283821106, -0.9258096218109131, -0.8953325152397156, -0.8648554086685181, -0.8343782424926758, -0.8039011359214783, -0.7734240293502808, -0.7429468631744385, -0.712469756603241, -0.6819926500320435, -0.651515543460846, -0.6210384368896484, -0.5905613303184509, -0.5600842237472534, -0.5296071171760559, -0.499129980802536, -0.4686528444290161, -0.4381757378578186, -0.4076986312866211, -0.3772214949131012, -0.3467443585395813, -0.3162672519683838, -0.2857901155948639, -0.2553130090236664, -0.22483587265014648, -0.19435876607894897, -0.16388164460659027, -0.13340452313423157, -0.10292740166187286, -0.07245028018951416, -0.041973162442445755, -0.01149604469537735, 0.018981076776981354, 0.04945819079875946, 0.07993531227111816, 0.11041243374347687, 0.14088955521583557, 0.17136667668819427, 0.20184379816055298, 0.2323209047317505, 0.2627980411052704, 0.2932751476764679, 0.3237522840499878, 0.3542293906211853, 0.3847064971923828, 0.4151836037635803, 0.4456607401371002, 0.47613784670829773, 0.5066149830818176, 0.5370920896530151, 0.5675691962242126, 0.5980463027954102, 0.6285234689712524]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 9.0, 15.0, 16.0, 17.0, 20.0, 26.0, 19.0, 39.0, 39.0, 39.0, 24.0, 36.0, 44.0, 39.0, 43.0, 30.0, 38.0, 29.0, 37.0, 32.0, 41.0, 37.0, 38.0, 34.0, 36.0, 29.0, 32.0, 27.0, 26.0, 25.0, 13.0, 17.0, 8.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5178878903388977, -0.5019795298576355, -0.4860711693763733, -0.47016283869743347, -0.45425447821617126, -0.43834611773490906, -0.42243778705596924, -0.40652942657470703, -0.3906210660934448, -0.3747127056121826, -0.3588043451309204, -0.3428960144519806, -0.3269876539707184, -0.3110792934894562, -0.29517096281051636, -0.27926260232925415, -0.26335424184799194, -0.24744588136672974, -0.23153753578662872, -0.2156291902065277, -0.1997208297252655, -0.1838124692440033, -0.16790412366390228, -0.15199577808380127, -0.13608741760253906, -0.12017906457185745, -0.10427071154117584, -0.08836235851049423, -0.07245400547981262, -0.05654565244913101, -0.0406372994184494, -0.024728946387767792, -0.008820533752441406, 0.007087819278240204, 0.022996172308921814, 0.038904525339603424, 0.054812878370285034, 0.07072123140096664, 0.08662958443164825, 0.10253793746232986, 0.11844629049301147, 0.13435465097427368, 0.1502629965543747, 0.1661713421344757, 0.18207970261573792, 0.19798806309700012, 0.21389640867710114, 0.22980475425720215, 0.24571311473846436, 0.26162147521972656, 0.27752983570098877, 0.2934381663799286, 0.3093465268611908, 0.325254887342453, 0.3411632180213928, 0.35707157850265503, 0.37297993898391724, 0.38888829946517944, 0.40479665994644165, 0.42070499062538147, 0.4366133511066437, 0.4525217115879059, 0.4684300422668457, 0.4843384027481079, 0.5002467632293701]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 16.0, 19.0, 16.0, 33.0, 63.0, 75.0, 120.0, 191.0, 289.0, 495.0, 830.0, 1393.0, 2509.0, 4797.0, 9345.0, 19601.0, 47541.0, 133874.0, 362436.0, 295145.0, 99701.0, 37069.0, 15934.0, 7808.0, 4028.0, 2152.0, 1209.0, 723.0, 405.0, 245.0, 162.0, 112.0, 59.0, 47.0, 30.0, 20.0, 16.0, 12.0, 17.0, 4.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5140647888183594, -0.49932098388671875, -0.4845771789550781, -0.4698333740234375, -0.4550895690917969, -0.44034576416015625, -0.4256019592285156, -0.410858154296875, -0.3961143493652344, -0.38137054443359375, -0.3666267395019531, -0.3518829345703125, -0.3371391296386719, -0.32239532470703125, -0.3076515197753906, -0.29290771484375, -0.2781639099121094, -0.26342010498046875, -0.24867630004882812, -0.2339324951171875, -0.21918869018554688, -0.20444488525390625, -0.18970108032226562, -0.174957275390625, -0.16021347045898438, -0.14546966552734375, -0.13072586059570312, -0.1159820556640625, -0.10123825073242188, -0.08649444580078125, -0.07175064086914062, -0.0570068359375, -0.042263031005859375, -0.02751922607421875, -0.012775421142578125, 0.0019683837890625, 0.016712188720703125, 0.03145599365234375, 0.046199798583984375, 0.060943603515625, 0.07568740844726562, 0.09043121337890625, 0.10517501831054688, 0.1199188232421875, 0.13466262817382812, 0.14940643310546875, 0.16415023803710938, 0.17889404296875, 0.19363784790039062, 0.20838165283203125, 0.22312545776367188, 0.2378692626953125, 0.2526130676269531, 0.26735687255859375, 0.2821006774902344, 0.296844482421875, 0.3115882873535156, 0.32633209228515625, 0.3410758972167969, 0.3558197021484375, 0.3705635070800781, 0.38530731201171875, 0.4000511169433594, 0.414794921875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 2.0, 9.0, 12.0, 9.0, 14.0, 14.0, 16.0, 19.0, 24.0, 16.0, 27.0, 37.0, 36.0, 35.0, 38.0, 38.0, 46.0, 43.0, 37.0, 50.0, 45.0, 46.0, 43.0, 44.0, 38.0, 43.0, 34.0, 24.0, 27.0, 27.0, 27.0, 15.0, 14.0, 9.0, 3.0, 9.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1260986328125, -0.12201881408691406, -0.11793899536132812, -0.11385917663574219, -0.10977935791015625, -0.10569953918457031, -0.10161972045898438, -0.09753990173339844, -0.0934600830078125, -0.08938026428222656, -0.08530044555664062, -0.08122062683105469, -0.07714080810546875, -0.07306098937988281, -0.06898117065429688, -0.06490135192871094, -0.060821533203125, -0.05674171447753906, -0.052661895751953125, -0.04858207702636719, -0.04450225830078125, -0.04042243957519531, -0.036342620849609375, -0.03226280212402344, -0.0281829833984375, -0.024103164672851562, -0.020023345947265625, -0.015943527221679688, -0.01186370849609375, -0.0077838897705078125, -0.003704071044921875, 0.0003757476806640625, 0.00445556640625, 0.008535385131835938, 0.012615203857421875, 0.016695022583007812, 0.02077484130859375, 0.024854660034179688, 0.028934478759765625, 0.03301429748535156, 0.0370941162109375, 0.04117393493652344, 0.045253753662109375, 0.04933357238769531, 0.05341339111328125, 0.05749320983886719, 0.061573028564453125, 0.06565284729003906, 0.069732666015625, 0.07381248474121094, 0.07789230346679688, 0.08197212219238281, 0.08605194091796875, 0.09013175964355469, 0.09421157836914062, 0.09829139709472656, 0.1023712158203125, 0.10645103454589844, 0.11053085327148438, 0.11461067199707031, 0.11869049072265625, 0.12277030944824219, 0.12685012817382812, 0.13092994689941406, 0.135009765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 10.0, 13.0, 17.0, 24.0, 42.0, 50.0, 61.0, 102.0, 149.0, 227.0, 339.0, 511.0, 864.0, 1501.0, 2480.0, 5107.0, 11059.0, 28469.0, 89941.0, 332654.0, 404642.0, 110637.0, 33801.0, 13031.0, 5753.0, 2872.0, 1511.0, 899.0, 542.0, 401.0, 247.0, 180.0, 98.0, 76.0, 66.0, 37.0, 27.0, 22.0, 15.0, 17.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.433837890625, -0.4198799133300781, -0.40592193603515625, -0.3919639587402344, -0.3780059814453125, -0.3640480041503906, -0.35009002685546875, -0.3361320495605469, -0.322174072265625, -0.3082160949707031, -0.29425811767578125, -0.2803001403808594, -0.2663421630859375, -0.2523841857910156, -0.23842620849609375, -0.22446823120117188, -0.21051025390625, -0.19655227661132812, -0.18259429931640625, -0.16863632202148438, -0.1546783447265625, -0.14072036743164062, -0.12676239013671875, -0.11280441284179688, -0.098846435546875, -0.08488845825195312, -0.07093048095703125, -0.056972503662109375, -0.0430145263671875, -0.029056549072265625, -0.01509857177734375, -0.001140594482421875, 0.0128173828125, 0.026775360107421875, 0.04073333740234375, 0.054691314697265625, 0.0686492919921875, 0.08260726928710938, 0.09656524658203125, 0.11052322387695312, 0.124481201171875, 0.13843917846679688, 0.15239715576171875, 0.16635513305664062, 0.1803131103515625, 0.19427108764648438, 0.20822906494140625, 0.22218704223632812, 0.23614501953125, 0.2501029968261719, 0.26406097412109375, 0.2780189514160156, 0.2919769287109375, 0.3059349060058594, 0.31989288330078125, 0.3338508605957031, 0.347808837890625, 0.3617668151855469, 0.37572479248046875, 0.3896827697753906, 0.4036407470703125, 0.4175987243652344, 0.43155670166015625, 0.4455146789550781, 0.45947265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 19.0, 18.0, 35.0, 15.0, 44.0, 37.0, 50.0, 48.0, 41.0, 51.0, 61.0, 50.0, 51.0, 50.0, 52.0, 42.0, 42.0, 57.0, 31.0, 36.0, 30.0, 24.0, 18.0, 22.0, 10.0, 12.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.617431640625, -0.59228515625, -0.567138671875, -0.5419921875, -0.516845703125, -0.49169921875, -0.466552734375, -0.44140625, -0.416259765625, -0.39111328125, -0.365966796875, -0.3408203125, -0.315673828125, -0.29052734375, -0.265380859375, -0.240234375, -0.215087890625, -0.18994140625, -0.164794921875, -0.1396484375, -0.114501953125, -0.08935546875, -0.064208984375, -0.0390625, -0.013916015625, 0.01123046875, 0.036376953125, 0.0615234375, 0.086669921875, 0.11181640625, 0.136962890625, 0.162109375, 0.187255859375, 0.21240234375, 0.237548828125, 0.2626953125, 0.287841796875, 0.31298828125, 0.338134765625, 0.36328125, 0.388427734375, 0.41357421875, 0.438720703125, 0.4638671875, 0.489013671875, 0.51416015625, 0.539306640625, 0.564453125, 0.589599609375, 0.61474609375, 0.639892578125, 0.6650390625, 0.690185546875, 0.71533203125, 0.740478515625, 0.765625, 0.790771484375, 0.81591796875, 0.841064453125, 0.8662109375, 0.891357421875, 0.91650390625, 0.941650390625, 0.966796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 6.0, 4.0, 11.0, 18.0, 20.0, 29.0, 35.0, 58.0, 86.0, 120.0, 172.0, 282.0, 478.0, 851.0, 1786.0, 3753.0, 9491.0, 31748.0, 179988.0, 644234.0, 133647.0, 26105.0, 8497.0, 3401.0, 1633.0, 848.0, 465.0, 272.0, 155.0, 102.0, 65.0, 50.0, 31.0, 27.0, 23.0, 10.0, 14.0, 5.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.43603515625, -0.42438507080078125, -0.4127349853515625, -0.40108489990234375, -0.389434814453125, -0.37778472900390625, -0.3661346435546875, -0.35448455810546875, -0.34283447265625, -0.33118438720703125, -0.3195343017578125, -0.30788421630859375, -0.296234130859375, -0.28458404541015625, -0.2729339599609375, -0.26128387451171875, -0.2496337890625, -0.23798370361328125, -0.2263336181640625, -0.21468353271484375, -0.203033447265625, -0.19138336181640625, -0.1797332763671875, -0.16808319091796875, -0.15643310546875, -0.14478302001953125, -0.1331329345703125, -0.12148284912109375, -0.109832763671875, -0.09818267822265625, -0.0865325927734375, -0.07488250732421875, -0.063232421875, -0.05158233642578125, -0.0399322509765625, -0.02828216552734375, -0.016632080078125, -0.00498199462890625, 0.0066680908203125, 0.01831817626953125, 0.02996826171875, 0.04161834716796875, 0.0532684326171875, 0.06491851806640625, 0.076568603515625, 0.08821868896484375, 0.0998687744140625, 0.11151885986328125, 0.1231689453125, 0.13481903076171875, 0.1464691162109375, 0.15811920166015625, 0.169769287109375, 0.18141937255859375, 0.1930694580078125, 0.20471954345703125, 0.21636962890625, 0.22801971435546875, 0.2396697998046875, 0.25131988525390625, 0.262969970703125, 0.27462005615234375, 0.2862701416015625, 0.29792022705078125, 0.3095703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 2.0, 14.0, 17.0, 26.0, 35.0, 36.0, 46.0, 72.0, 95.0, 96.0, 110.0, 105.0, 86.0, 65.0, 56.0, 34.0, 30.0, 17.0, 14.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.343292236328125e-05, -7.093511521816254e-05, -6.843730807304382e-05, -6.593950092792511e-05, -6.34416937828064e-05, -6.094388663768768e-05, -5.844607949256897e-05, -5.5948272347450256e-05, -5.345046520233154e-05, -5.095265805721283e-05, -4.8454850912094116e-05, -4.59570437669754e-05, -4.345923662185669e-05, -4.0961429476737976e-05, -3.846362233161926e-05, -3.596581518650055e-05, -3.3468008041381836e-05, -3.097020089626312e-05, -2.847239375114441e-05, -2.5974586606025696e-05, -2.3476779460906982e-05, -2.097897231578827e-05, -1.8481165170669556e-05, -1.5983358025550842e-05, -1.3485550880432129e-05, -1.0987743735313416e-05, -8.489936590194702e-06, -5.992129445075989e-06, -3.4943222999572754e-06, -9.96515154838562e-07, 1.5012919902801514e-06, 3.999099135398865e-06, 6.496906280517578e-06, 8.994713425636292e-06, 1.1492520570755005e-05, 1.3990327715873718e-05, 1.648813486099243e-05, 1.8985942006111145e-05, 2.148374915122986e-05, 2.3981556296348572e-05, 2.6479363441467285e-05, 2.8977170586586e-05, 3.147497773170471e-05, 3.3972784876823425e-05, 3.647059202194214e-05, 3.896839916706085e-05, 4.1466206312179565e-05, 4.396401345729828e-05, 4.646182060241699e-05, 4.8959627747535706e-05, 5.145743489265442e-05, 5.395524203777313e-05, 5.6453049182891846e-05, 5.895085632801056e-05, 6.144866347312927e-05, 6.394647061824799e-05, 6.64442777633667e-05, 6.894208490848541e-05, 7.143989205360413e-05, 7.393769919872284e-05, 7.643550634384155e-05, 7.893331348896027e-05, 8.143112063407898e-05, 8.392892777919769e-05, 8.64267349243164e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 8.0, 10.0, 24.0, 28.0, 51.0, 73.0, 106.0, 210.0, 322.0, 753.0, 1645.0, 4920.0, 19530.0, 171505.0, 749913.0, 81004.0, 12441.0, 3440.0, 1294.0, 510.0, 331.0, 183.0, 91.0, 55.0, 36.0, 26.0, 15.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.625, -0.6073226928710938, -0.5896453857421875, -0.5719680786132812, -0.554290771484375, -0.5366134643554688, -0.5189361572265625, -0.5012588500976562, -0.48358154296875, -0.46590423583984375, -0.4482269287109375, -0.43054962158203125, -0.412872314453125, -0.39519500732421875, -0.3775177001953125, -0.35984039306640625, -0.3421630859375, -0.32448577880859375, -0.3068084716796875, -0.28913116455078125, -0.271453857421875, -0.25377655029296875, -0.2360992431640625, -0.21842193603515625, -0.20074462890625, -0.18306732177734375, -0.1653900146484375, -0.14771270751953125, -0.130035400390625, -0.11235809326171875, -0.0946807861328125, -0.07700347900390625, -0.059326171875, -0.04164886474609375, -0.0239715576171875, -0.00629425048828125, 0.011383056640625, 0.02906036376953125, 0.0467376708984375, 0.06441497802734375, 0.08209228515625, 0.09976959228515625, 0.1174468994140625, 0.13512420654296875, 0.152801513671875, 0.17047882080078125, 0.1881561279296875, 0.20583343505859375, 0.2235107421875, 0.24118804931640625, 0.2588653564453125, 0.27654266357421875, 0.294219970703125, 0.31189727783203125, 0.3295745849609375, 0.34725189208984375, 0.36492919921875, 0.38260650634765625, 0.4002838134765625, 0.41796112060546875, 0.435638427734375, 0.45331573486328125, 0.4709930419921875, 0.48867034912109375, 0.50634765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 14.0, 28.0, 30.0, 53.0, 96.0, 141.0, 159.0, 154.0, 131.0, 82.0, 41.0, 28.0, 14.0, 12.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8369140625, -0.8194084167480469, -0.8019027709960938, -0.7843971252441406, -0.7668914794921875, -0.7493858337402344, -0.7318801879882812, -0.7143745422363281, -0.696868896484375, -0.6793632507324219, -0.6618576049804688, -0.6443519592285156, -0.6268463134765625, -0.6093406677246094, -0.5918350219726562, -0.5743293762207031, -0.55682373046875, -0.5393180847167969, -0.5218124389648438, -0.5043067932128906, -0.4868011474609375, -0.4692955017089844, -0.45178985595703125, -0.4342842102050781, -0.416778564453125, -0.3992729187011719, -0.38176727294921875, -0.3642616271972656, -0.3467559814453125, -0.3292503356933594, -0.31174468994140625, -0.2942390441894531, -0.2767333984375, -0.2592277526855469, -0.24172210693359375, -0.22421646118164062, -0.2067108154296875, -0.18920516967773438, -0.17169952392578125, -0.15419387817382812, -0.136688232421875, -0.11918258666992188, -0.10167694091796875, -0.08417129516601562, -0.0666656494140625, -0.049160003662109375, -0.03165435791015625, -0.014148712158203125, 0.00335693359375, 0.020862579345703125, 0.03836822509765625, 0.055873870849609375, 0.0733795166015625, 0.09088516235351562, 0.10839080810546875, 0.12589645385742188, 0.143402099609375, 0.16090774536132812, 0.17841339111328125, 0.19591903686523438, 0.2134246826171875, 0.23093032836914062, 0.24843597412109375, 0.2659416198730469, 0.283447265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 15.0, 13.0, 25.0, 53.0, 75.0, 98.0, 143.0, 132.0, 118.0, 90.0, 86.0, 61.0, 30.0, 10.0, 17.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910872220993042, -3.7437593936920166, -3.576646566390991, -3.409533739089966, -3.2424209117889404, -3.075308084487915, -2.9081954956054688, -2.7410826683044434, -2.573969841003418, -2.4068570137023926, -2.239744186401367, -2.072631359100342, -1.9055185317993164, -1.738405704498291, -1.5712929964065552, -1.4041801691055298, -1.2370672225952148, -1.0699543952941895, -0.9028415679931641, -0.7357288002967834, -0.5686159729957581, -0.40150314569473267, -0.23439037799835205, -0.06727755069732666, 0.09983527660369873, 0.2669481039047241, 0.4340609014034271, 0.6011736989021301, 0.7682865262031555, 0.9353993535041809, 1.1025121212005615, 1.269624948501587, 1.4367375373840332, 1.6038503646850586, 1.770963191986084, 1.9380760192871094, 2.1051888465881348, 2.27230167388916, 2.4394145011901855, 2.606527328491211, 2.7736401557922363, 2.9407529830932617, 3.107865810394287, 3.2749786376953125, 3.442091464996338, 3.6092042922973633, 3.7763171195983887, 3.943429946899414, 4.110542297363281, 4.277655124664307, 4.444767951965332, 4.611880779266357, 4.778993606567383, 4.946106433868408, 5.113219261169434, 5.280332088470459, 5.447444915771484, 5.61455774307251, 5.781670570373535, 5.9487833976745605, 6.115896224975586, 6.283009052276611, 6.450121879577637, 6.617234706878662, 6.7843475341796875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 6.0, 6.0, 4.0, 7.0, 11.0, 8.0, 19.0, 13.0, 17.0, 26.0, 26.0, 31.0, 31.0, 32.0, 36.0, 33.0, 47.0, 41.0, 34.0, 50.0, 53.0, 50.0, 43.0, 53.0, 37.0, 36.0, 34.0, 26.0, 31.0, 18.0, 20.0, 23.0, 11.0, 11.0, 8.0, 11.0, 13.0, 8.0, 11.0, 3.0, 9.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.3878402709960938, -3.2825968265533447, -3.1773533821105957, -3.072110176086426, -2.9668667316436768, -2.8616232872009277, -2.7563798427581787, -2.6511363983154297, -2.5458931922912598, -2.4406497478485107, -2.3354063034057617, -2.230163097381592, -2.1249196529388428, -2.0196762084960938, -1.9144327640533447, -1.8091894388198853, -1.7039459943771362, -1.5987025499343872, -1.4934592247009277, -1.3882157802581787, -1.2829724550247192, -1.1777290105819702, -1.0724856853485107, -0.9672422409057617, -0.8619988560676575, -0.7567554712295532, -0.651512086391449, -0.5462687015533447, -0.4410252869129181, -0.33578187227249146, -0.2305384874343872, -0.12529510259628296, -0.02005171775817871, 0.08519167453050613, 0.19043506681919098, 0.2956784665584564, 0.40092185139656067, 0.5061652660369873, 0.6114086508750916, 0.7166520357131958, 0.8218954205513, 0.9271388053894043, 1.0323822498321533, 1.1376255750656128, 1.2428690195083618, 1.3481123447418213, 1.4533557891845703, 1.5585992336273193, 1.6638425588607788, 1.7690860033035278, 1.8743293285369873, 1.9795727729797363, 2.0848162174224854, 2.1900596618652344, 2.2953028678894043, 2.4005463123321533, 2.5057897567749023, 2.6110332012176514, 2.7162766456604004, 2.8215198516845703, 2.9267632961273193, 3.0320067405700684, 3.1372501850128174, 3.2424936294555664, 3.3477368354797363]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 9.0, 9.0, 6.0, 12.0, 11.0, 12.0, 31.0, 25.0, 39.0, 46.0, 57.0, 78.0, 109.0, 141.0, 255.0, 375.0, 590.0, 963.0, 1684.0, 3071.0, 6573.0, 20916.0, 3949820.0, 180957.0, 16214.0, 5651.0, 2691.0, 1400.0, 901.0, 486.0, 361.0, 252.0, 123.0, 103.0, 78.0, 62.0, 48.0, 29.0, 25.0, 29.0, 10.0, 8.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.87451171875, -0.8487167358398438, -0.8229217529296875, -0.7971267700195312, -0.771331787109375, -0.7455368041992188, -0.7197418212890625, -0.6939468383789062, -0.66815185546875, -0.6423568725585938, -0.6165618896484375, -0.5907669067382812, -0.564971923828125, -0.5391769409179688, -0.5133819580078125, -0.48758697509765625, -0.4617919921875, -0.43599700927734375, -0.4102020263671875, -0.38440704345703125, -0.358612060546875, -0.33281707763671875, -0.3070220947265625, -0.28122711181640625, -0.25543212890625, -0.22963714599609375, -0.2038421630859375, -0.17804718017578125, -0.152252197265625, -0.12645721435546875, -0.1006622314453125, -0.07486724853515625, -0.049072265625, -0.02327728271484375, 0.0025177001953125, 0.02831268310546875, 0.054107666015625, 0.07990264892578125, 0.1056976318359375, 0.13149261474609375, 0.15728759765625, 0.18308258056640625, 0.2088775634765625, 0.23467254638671875, 0.260467529296875, 0.28626251220703125, 0.3120574951171875, 0.33785247802734375, 0.3636474609375, 0.38944244384765625, 0.4152374267578125, 0.44103240966796875, 0.466827392578125, 0.49262237548828125, 0.5184173583984375, 0.5442123413085938, 0.57000732421875, 0.5958023071289062, 0.6215972900390625, 0.6473922729492188, 0.673187255859375, 0.6989822387695312, 0.7247772216796875, 0.7505722045898438, 0.7763671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 9.0, 17.0, 15.0, 11.0, 24.0, 24.0, 35.0, 34.0, 38.0, 43.0, 43.0, 52.0, 55.0, 42.0, 57.0, 57.0, 51.0, 52.0, 59.0, 42.0, 45.0, 26.0, 26.0, 21.0, 23.0, 15.0, 19.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14480018615722656, -0.14030838012695312, -0.1358165740966797, -0.13132476806640625, -0.1268329620361328, -0.12234115600585938, -0.11784934997558594, -0.1133575439453125, -0.10886573791503906, -0.10437393188476562, -0.09988212585449219, -0.09539031982421875, -0.09089851379394531, -0.08640670776367188, -0.08191490173339844, -0.077423095703125, -0.07293128967285156, -0.06843948364257812, -0.06394767761230469, -0.05945587158203125, -0.05496406555175781, -0.050472259521484375, -0.04598045349121094, -0.0414886474609375, -0.03699684143066406, -0.032505035400390625, -0.028013229370117188, -0.02352142333984375, -0.019029617309570312, -0.014537811279296875, -0.010046005249023438, -0.00555419921875, -0.0010623931884765625, 0.003429412841796875, 0.007921218872070312, 0.01241302490234375, 0.016904830932617188, 0.021396636962890625, 0.025888442993164062, 0.0303802490234375, 0.03487205505371094, 0.039363861083984375, 0.04385566711425781, 0.04834747314453125, 0.05283927917480469, 0.057331085205078125, 0.06182289123535156, 0.066314697265625, 0.07080650329589844, 0.07529830932617188, 0.07979011535644531, 0.08428192138671875, 0.08877372741699219, 0.09326553344726562, 0.09775733947753906, 0.1022491455078125, 0.10674095153808594, 0.11123275756835938, 0.11572456359863281, 0.12021636962890625, 0.12470817565917969, 0.12919998168945312, 0.13369178771972656, 0.13818359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 10.0, 12.0, 22.0, 34.0, 29.0, 46.0, 54.0, 75.0, 134.0, 171.0, 343.0, 701.0, 1316.0, 2972.0, 8733.0, 44805.0, 4093357.0, 29494.0, 6811.0, 2550.0, 1142.0, 561.0, 320.0, 155.0, 106.0, 79.0, 53.0, 45.0, 29.0, 26.0, 15.0, 14.0, 9.0, 10.0, 13.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.90234375, -1.8486175537109375, -1.794891357421875, -1.7411651611328125, -1.68743896484375, -1.6337127685546875, -1.579986572265625, -1.5262603759765625, -1.4725341796875, -1.4188079833984375, -1.365081787109375, -1.3113555908203125, -1.25762939453125, -1.2039031982421875, -1.150177001953125, -1.0964508056640625, -1.042724609375, -0.9889984130859375, -0.935272216796875, -0.8815460205078125, -0.82781982421875, -0.7740936279296875, -0.720367431640625, -0.6666412353515625, -0.6129150390625, -0.5591888427734375, -0.505462646484375, -0.4517364501953125, -0.39801025390625, -0.3442840576171875, -0.290557861328125, -0.2368316650390625, -0.18310546875, -0.1293792724609375, -0.075653076171875, -0.0219268798828125, 0.03179931640625, 0.0855255126953125, 0.139251708984375, 0.1929779052734375, 0.2467041015625, 0.3004302978515625, 0.354156494140625, 0.4078826904296875, 0.46160888671875, 0.5153350830078125, 0.569061279296875, 0.6227874755859375, 0.676513671875, 0.7302398681640625, 0.783966064453125, 0.8376922607421875, 0.89141845703125, 0.9451446533203125, 0.998870849609375, 1.0525970458984375, 1.1063232421875, 1.1600494384765625, 1.213775634765625, 1.2675018310546875, 1.32122802734375, 1.3749542236328125, 1.428680419921875, 1.4824066162109375, 1.5361328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 7.0, 9.0, 18.0, 20.0, 85.0, 3673.0, 189.0, 30.0, 18.0, 7.0, 8.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.517791748046875, -0.50286865234375, -0.487945556640625, -0.4730224609375, -0.458099365234375, -0.44317626953125, -0.428253173828125, -0.413330078125, -0.398406982421875, -0.38348388671875, -0.368560791015625, -0.3536376953125, -0.338714599609375, -0.32379150390625, -0.308868408203125, -0.2939453125, -0.279022216796875, -0.26409912109375, -0.249176025390625, -0.2342529296875, -0.219329833984375, -0.20440673828125, -0.189483642578125, -0.174560546875, -0.159637451171875, -0.14471435546875, -0.129791259765625, -0.1148681640625, -0.099945068359375, -0.08502197265625, -0.070098876953125, -0.05517578125, -0.040252685546875, -0.02532958984375, -0.010406494140625, 0.0045166015625, 0.019439697265625, 0.03436279296875, 0.049285888671875, 0.064208984375, 0.079132080078125, 0.09405517578125, 0.108978271484375, 0.1239013671875, 0.138824462890625, 0.15374755859375, 0.168670654296875, 0.18359375, 0.198516845703125, 0.21343994140625, 0.228363037109375, 0.2432861328125, 0.258209228515625, 0.27313232421875, 0.288055419921875, 0.302978515625, 0.317901611328125, 0.33282470703125, 0.347747802734375, 0.3626708984375, 0.377593994140625, 0.39251708984375, 0.407440185546875, 0.42236328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 5.0, 10.0, 8.0, 18.0, 27.0, 24.0, 44.0, 73.0, 90.0, 93.0, 109.0, 131.0, 84.0, 87.0, 50.0, 36.0, 32.0, 24.0, 16.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0571504831314087, -1.0264272689819336, -0.9957041144371033, -0.964980959892273, -0.9342578053474426, -0.9035346508026123, -0.8728114366531372, -0.8420882821083069, -0.8113651275634766, -0.7806419730186462, -0.7499187588691711, -0.7191956043243408, -0.6884724497795105, -0.6577492952346802, -0.6270260810852051, -0.5963029265403748, -0.5655797719955444, -0.5348566174507141, -0.504133403301239, -0.4734102487564087, -0.44268709421157837, -0.41196390986442566, -0.38124072551727295, -0.3505175709724426, -0.31979435682296753, -0.2890711724758148, -0.2583480179309845, -0.2276248335838318, -0.19690167903900146, -0.16617849469184875, -0.13545532524585724, -0.10473215579986572, -0.0740090012550354, -0.043285831809043884, -0.01256265863776207, 0.018160514533519745, 0.04888368397951126, 0.07960686087608337, 0.11033003032207489, 0.1410531997680664, 0.17177636921405792, 0.20249953866004944, 0.23322270810604095, 0.26394587755203247, 0.2946690618991852, 0.3253922462463379, 0.3561154007911682, 0.38683855533599854, 0.41756173968315125, 0.44828492403030396, 0.4790080785751343, 0.5097312331199646, 0.5404544472694397, 0.57117760181427, 0.6019007563591003, 0.6326239109039307, 0.6633471250534058, 0.6940702795982361, 0.7247934937477112, 0.7555166482925415, 0.7862398028373718, 0.8169629573822021, 0.8476861715316772, 0.8784093260765076, 0.9091324806213379]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 5.0, 12.0, 10.0, 9.0, 14.0, 12.0, 14.0, 28.0, 29.0, 16.0, 27.0, 32.0, 29.0, 43.0, 27.0, 38.0, 40.0, 40.0, 34.0, 48.0, 52.0, 35.0, 43.0, 40.0, 33.0, 43.0, 39.0, 24.0, 30.0, 23.0, 22.0, 13.0, 20.0, 19.0, 11.0, 8.0, 11.0, 3.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5670897960662842, -0.5485234260559082, -0.5299570560455322, -0.5113906860351562, -0.4928243160247803, -0.4742579460144043, -0.45569154620170593, -0.43712517619132996, -0.418558806180954, -0.399992436170578, -0.381426066160202, -0.36285969614982605, -0.3442932963371277, -0.3257269263267517, -0.30716055631637573, -0.28859418630599976, -0.2700278162956238, -0.2514614462852478, -0.23289507627487183, -0.21432869136333466, -0.19576232135295868, -0.1771959513425827, -0.15862956643104553, -0.14006319642066956, -0.12149682641029358, -0.1029304563999176, -0.08436407893896103, -0.06579770147800446, -0.04723133146762848, -0.028664961457252502, -0.010098583996295929, 0.008467793464660645, 0.027034103870391846, 0.04560047760605812, 0.0641668513417244, 0.08273322880268097, 0.10129959881305695, 0.11986596882343292, 0.1384323537349701, 0.15699872374534607, 0.17556509375572205, 0.19413146376609802, 0.212697833776474, 0.23126421868801117, 0.24983058869838715, 0.2683969736099243, 0.2869633436203003, 0.30552971363067627, 0.32409608364105225, 0.3426624536514282, 0.3612288236618042, 0.3797951936721802, 0.39836156368255615, 0.41692793369293213, 0.4354943335056305, 0.45406070351600647, 0.47262707352638245, 0.4911934435367584, 0.5097598433494568, 0.5283262133598328, 0.5468925833702087, 0.5654589533805847, 0.5840253233909607, 0.6025916934013367, 0.6211580634117126]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 15.0, 30.0, 34.0, 58.0, 89.0, 181.0, 347.0, 560.0, 1013.0, 1973.0, 4013.0, 8240.0, 18621.0, 47117.0, 144742.0, 395093.0, 282105.0, 88009.0, 31174.0, 12979.0, 5871.0, 2983.0, 1486.0, 800.0, 451.0, 219.0, 138.0, 73.0, 41.0, 38.0, 16.0, 10.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.4110069274902344, -0.39720916748046875, -0.3834114074707031, -0.3696136474609375, -0.3558158874511719, -0.34201812744140625, -0.3282203674316406, -0.314422607421875, -0.3006248474121094, -0.28682708740234375, -0.2730293273925781, -0.2592315673828125, -0.24543380737304688, -0.23163604736328125, -0.21783828735351562, -0.20404052734375, -0.19024276733398438, -0.17644500732421875, -0.16264724731445312, -0.1488494873046875, -0.13505172729492188, -0.12125396728515625, -0.10745620727539062, -0.093658447265625, -0.07986068725585938, -0.06606292724609375, -0.052265167236328125, -0.0384674072265625, -0.024669647216796875, -0.01087188720703125, 0.002925872802734375, 0.0167236328125, 0.030521392822265625, 0.04431915283203125, 0.058116912841796875, 0.0719146728515625, 0.08571243286132812, 0.09951019287109375, 0.11330795288085938, 0.127105712890625, 0.14090347290039062, 0.15470123291015625, 0.16849899291992188, 0.1822967529296875, 0.19609451293945312, 0.20989227294921875, 0.22369003295898438, 0.23748779296875, 0.2512855529785156, 0.26508331298828125, 0.2788810729980469, 0.2926788330078125, 0.3064765930175781, 0.32027435302734375, 0.3340721130371094, 0.347869873046875, 0.3616676330566406, 0.37546539306640625, 0.3892631530761719, 0.4030609130859375, 0.4168586730957031, 0.43065643310546875, 0.4444541931152344, 0.458251953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 10.0, 8.0, 7.0, 17.0, 13.0, 22.0, 32.0, 13.0, 31.0, 42.0, 48.0, 43.0, 45.0, 44.0, 57.0, 55.0, 58.0, 52.0, 52.0, 67.0, 47.0, 62.0, 33.0, 26.0, 21.0, 21.0, 14.0, 17.0, 13.0, 9.0, 1.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.2374267578125, -0.23132705688476562, -0.22522735595703125, -0.21912765502929688, -0.2130279541015625, -0.20692825317382812, -0.20082855224609375, -0.19472885131835938, -0.188629150390625, -0.18252944946289062, -0.17642974853515625, -0.17033004760742188, -0.1642303466796875, -0.15813064575195312, -0.15203094482421875, -0.14593124389648438, -0.13983154296875, -0.13373184204101562, -0.12763214111328125, -0.12153244018554688, -0.1154327392578125, -0.10933303833007812, -0.10323333740234375, -0.09713363647460938, -0.091033935546875, -0.08493423461914062, -0.07883453369140625, -0.07273483276367188, -0.0666351318359375, -0.060535430908203125, -0.05443572998046875, -0.048336029052734375, -0.042236328125, -0.036136627197265625, -0.03003692626953125, -0.023937225341796875, -0.0178375244140625, -0.011737823486328125, -0.00563812255859375, 0.000461578369140625, 0.006561279296875, 0.012660980224609375, 0.01876068115234375, 0.024860382080078125, 0.0309600830078125, 0.037059783935546875, 0.04315948486328125, 0.049259185791015625, 0.05535888671875, 0.061458587646484375, 0.06755828857421875, 0.07365798950195312, 0.0797576904296875, 0.08585739135742188, 0.09195709228515625, 0.09805679321289062, 0.104156494140625, 0.11025619506835938, 0.11635589599609375, 0.12245559692382812, 0.1285552978515625, 0.13465499877929688, 0.14075469970703125, 0.14685440063476562, 0.1529541015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 7.0, 3.0, 11.0, 14.0, 14.0, 20.0, 34.0, 60.0, 101.0, 116.0, 241.0, 370.0, 662.0, 1615.0, 4415.0, 17222.0, 130962.0, 765196.0, 105614.0, 14859.0, 3981.0, 1505.0, 644.0, 337.0, 193.0, 119.0, 60.0, 54.0, 35.0, 20.0, 19.0, 12.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.748046875, -0.7208023071289062, -0.6935577392578125, -0.6663131713867188, -0.639068603515625, -0.6118240356445312, -0.5845794677734375, -0.5573348999023438, -0.53009033203125, -0.5028457641601562, -0.4756011962890625, -0.44835662841796875, -0.421112060546875, -0.39386749267578125, -0.3666229248046875, -0.33937835693359375, -0.3121337890625, -0.28488922119140625, -0.2576446533203125, -0.23040008544921875, -0.203155517578125, -0.17591094970703125, -0.1486663818359375, -0.12142181396484375, -0.09417724609375, -0.06693267822265625, -0.0396881103515625, -0.01244354248046875, 0.014801025390625, 0.04204559326171875, 0.0692901611328125, 0.09653472900390625, 0.123779296875, 0.15102386474609375, 0.1782684326171875, 0.20551300048828125, 0.232757568359375, 0.26000213623046875, 0.2872467041015625, 0.31449127197265625, 0.34173583984375, 0.36898040771484375, 0.3962249755859375, 0.42346954345703125, 0.450714111328125, 0.47795867919921875, 0.5052032470703125, 0.5324478149414062, 0.5596923828125, 0.5869369506835938, 0.6141815185546875, 0.6414260864257812, 0.668670654296875, 0.6959152221679688, 0.7231597900390625, 0.7504043579101562, 0.77764892578125, 0.8048934936523438, 0.8321380615234375, 0.8593826293945312, 0.886627197265625, 0.9138717651367188, 0.9411163330078125, 0.9683609008789062, 0.99560546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 6.0, 11.0, 12.0, 15.0, 16.0, 13.0, 31.0, 25.0, 24.0, 41.0, 36.0, 45.0, 47.0, 49.0, 71.0, 57.0, 52.0, 59.0, 61.0, 45.0, 45.0, 54.0, 27.0, 25.0, 27.0, 28.0, 17.0, 19.0, 10.0, 8.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1357421875, -1.1058578491210938, -1.0759735107421875, -1.0460891723632812, -1.016204833984375, -0.9863204956054688, -0.9564361572265625, -0.9265518188476562, -0.89666748046875, -0.8667831420898438, -0.8368988037109375, -0.8070144653320312, -0.777130126953125, -0.7472457885742188, -0.7173614501953125, -0.6874771118164062, -0.6575927734375, -0.6277084350585938, -0.5978240966796875, -0.5679397583007812, -0.538055419921875, -0.5081710815429688, -0.4782867431640625, -0.44840240478515625, -0.41851806640625, -0.38863372802734375, -0.3587493896484375, -0.32886505126953125, -0.298980712890625, -0.26909637451171875, -0.2392120361328125, -0.20932769775390625, -0.179443359375, -0.14955902099609375, -0.1196746826171875, -0.08979034423828125, -0.059906005859375, -0.03002166748046875, -0.0001373291015625, 0.02974700927734375, 0.05963134765625, 0.08951568603515625, 0.1194000244140625, 0.14928436279296875, 0.179168701171875, 0.20905303955078125, 0.2389373779296875, 0.26882171630859375, 0.2987060546875, 0.32859039306640625, 0.3584747314453125, 0.38835906982421875, 0.418243408203125, 0.44812774658203125, 0.4780120849609375, 0.5078964233398438, 0.53778076171875, 0.5676651000976562, 0.5975494384765625, 0.6274337768554688, 0.657318115234375, 0.6872024536132812, 0.7170867919921875, 0.7469711303710938, 0.77685546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 11.0, 10.0, 17.0, 26.0, 51.0, 67.0, 109.0, 169.0, 247.0, 406.0, 814.0, 1728.0, 4718.0, 18604.0, 134708.0, 730058.0, 130443.0, 17943.0, 4717.0, 1695.0, 823.0, 437.0, 251.0, 166.0, 121.0, 65.0, 29.0, 14.0, 29.0, 29.0, 12.0, 15.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.394775390625, -0.3813896179199219, -0.36800384521484375, -0.3546180725097656, -0.3412322998046875, -0.3278465270996094, -0.31446075439453125, -0.3010749816894531, -0.287689208984375, -0.2743034362792969, -0.26091766357421875, -0.24753189086914062, -0.2341461181640625, -0.22076034545898438, -0.20737457275390625, -0.19398880004882812, -0.18060302734375, -0.16721725463867188, -0.15383148193359375, -0.14044570922851562, -0.1270599365234375, -0.11367416381835938, -0.10028839111328125, -0.08690261840820312, -0.073516845703125, -0.060131072998046875, -0.04674530029296875, -0.033359527587890625, -0.0199737548828125, -0.006587982177734375, 0.00679779052734375, 0.020183563232421875, 0.0335693359375, 0.046955108642578125, 0.06034088134765625, 0.07372665405273438, 0.0871124267578125, 0.10049819946289062, 0.11388397216796875, 0.12726974487304688, 0.140655517578125, 0.15404129028320312, 0.16742706298828125, 0.18081283569335938, 0.1941986083984375, 0.20758438110351562, 0.22097015380859375, 0.23435592651367188, 0.24774169921875, 0.2611274719238281, 0.27451324462890625, 0.2878990173339844, 0.3012847900390625, 0.3146705627441406, 0.32805633544921875, 0.3414421081542969, 0.354827880859375, 0.3682136535644531, 0.38159942626953125, 0.3949851989746094, 0.4083709716796875, 0.4217567443847656, 0.43514251708984375, 0.4485282897949219, 0.4619140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 2.0, 9.0, 10.0, 16.0, 39.0, 45.0, 72.0, 96.0, 119.0, 150.0, 103.0, 102.0, 70.0, 45.0, 32.0, 35.0, 17.0, 9.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010126829147338867, -9.826663881540298e-05, -9.52649861574173e-05, -9.226333349943161e-05, -8.926168084144592e-05, -8.626002818346024e-05, -8.325837552547455e-05, -8.025672286748886e-05, -7.725507020950317e-05, -7.425341755151749e-05, -7.12517648935318e-05, -6.825011223554611e-05, -6.524845957756042e-05, -6.224680691957474e-05, -5.924515426158905e-05, -5.624350160360336e-05, -5.3241848945617676e-05, -5.024019628763199e-05, -4.72385436296463e-05, -4.4236890971660614e-05, -4.123523831367493e-05, -3.823358565568924e-05, -3.523193299770355e-05, -3.2230280339717865e-05, -2.9228627681732178e-05, -2.622697502374649e-05, -2.3225322365760803e-05, -2.0223669707775116e-05, -1.722201704978943e-05, -1.4220364391803741e-05, -1.1218711733818054e-05, -8.217059075832367e-06, -5.21540641784668e-06, -2.2137537598609924e-06, 7.878988981246948e-07, 3.789551556110382e-06, 6.791204214096069e-06, 9.792856872081757e-06, 1.2794509530067444e-05, 1.579616218805313e-05, 1.879781484603882e-05, 2.1799467504024506e-05, 2.4801120162010193e-05, 2.780277281999588e-05, 3.080442547798157e-05, 3.3806078135967255e-05, 3.680773079395294e-05, 3.980938345193863e-05, 4.2811036109924316e-05, 4.5812688767910004e-05, 4.881434142589569e-05, 5.181599408388138e-05, 5.4817646741867065e-05, 5.781929939985275e-05, 6.082095205783844e-05, 6.382260471582413e-05, 6.682425737380981e-05, 6.98259100317955e-05, 7.282756268978119e-05, 7.582921534776688e-05, 7.883086800575256e-05, 8.183252066373825e-05, 8.483417332172394e-05, 8.783582597970963e-05, 9.083747863769531e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 13.0, 15.0, 25.0, 31.0, 39.0, 94.0, 103.0, 214.0, 372.0, 693.0, 1408.0, 3473.0, 12579.0, 80242.0, 712014.0, 205298.0, 22494.0, 5440.0, 1934.0, 938.0, 444.0, 268.0, 143.0, 87.0, 54.0, 38.0, 36.0, 16.0, 13.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.455078125, -0.44024658203125, -0.4254150390625, -0.41058349609375, -0.395751953125, -0.38092041015625, -0.3660888671875, -0.35125732421875, -0.33642578125, -0.32159423828125, -0.3067626953125, -0.29193115234375, -0.277099609375, -0.26226806640625, -0.2474365234375, -0.23260498046875, -0.2177734375, -0.20294189453125, -0.1881103515625, -0.17327880859375, -0.158447265625, -0.14361572265625, -0.1287841796875, -0.11395263671875, -0.09912109375, -0.08428955078125, -0.0694580078125, -0.05462646484375, -0.039794921875, -0.02496337890625, -0.0101318359375, 0.00469970703125, 0.01953125, 0.03436279296875, 0.0491943359375, 0.06402587890625, 0.078857421875, 0.09368896484375, 0.1085205078125, 0.12335205078125, 0.13818359375, 0.15301513671875, 0.1678466796875, 0.18267822265625, 0.197509765625, 0.21234130859375, 0.2271728515625, 0.24200439453125, 0.2568359375, 0.27166748046875, 0.2864990234375, 0.30133056640625, 0.316162109375, 0.33099365234375, 0.3458251953125, 0.36065673828125, 0.37548828125, 0.39031982421875, 0.4051513671875, 0.41998291015625, 0.434814453125, 0.44964599609375, 0.4644775390625, 0.47930908203125, 0.494140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 11.0, 19.0, 25.0, 25.0, 61.0, 82.0, 103.0, 128.0, 132.0, 118.0, 92.0, 67.0, 45.0, 36.0, 17.0, 12.0, 11.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4444541931152344, -0.42821502685546875, -0.4119758605957031, -0.3957366943359375, -0.3794975280761719, -0.36325836181640625, -0.3470191955566406, -0.330780029296875, -0.3145408630371094, -0.29830169677734375, -0.2820625305175781, -0.2658233642578125, -0.24958419799804688, -0.23334503173828125, -0.21710586547851562, -0.20086669921875, -0.18462753295898438, -0.16838836669921875, -0.15214920043945312, -0.1359100341796875, -0.11967086791992188, -0.10343170166015625, -0.08719253540039062, -0.070953369140625, -0.054714202880859375, -0.03847503662109375, -0.022235870361328125, -0.0059967041015625, 0.010242462158203125, 0.02648162841796875, 0.042720794677734375, 0.0589599609375, 0.07519912719726562, 0.09143829345703125, 0.10767745971679688, 0.1239166259765625, 0.14015579223632812, 0.15639495849609375, 0.17263412475585938, 0.188873291015625, 0.20511245727539062, 0.22135162353515625, 0.23759078979492188, 0.2538299560546875, 0.2700691223144531, 0.28630828857421875, 0.3025474548339844, 0.31878662109375, 0.3350257873535156, 0.35126495361328125, 0.3675041198730469, 0.3837432861328125, 0.3999824523925781, 0.41622161865234375, 0.4324607849121094, 0.448699951171875, 0.4649391174316406, 0.48117828369140625, 0.4974174499511719, 0.5136566162109375, 0.5298957824707031, 0.5461349487304688, 0.5623741149902344, 0.57861328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 8.0, 20.0, 87.0, 272.0, 361.0, 193.0, 51.0, 14.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31913423538208, -3.7977378368377686, -3.276341438293457, -2.7549452781677246, -2.233548879623413, -1.7121524810791016, -1.1907563209533691, -0.6693599224090576, -0.1479635238647461, 0.37343281507492065, 0.8948291540145874, 1.4162254333496094, 1.937621831893921, 2.4590182304382324, 2.980414390563965, 3.5018107891082764, 4.023207187652588, 4.54460334777832, 5.065999984741211, 5.587396144866943, 6.108792304992676, 6.630188941955566, 7.151585102081299, 7.672981262207031, 8.194377899169922, 8.715774536132812, 9.237170219421387, 9.758566856384277, 10.279963493347168, 10.801359176635742, 11.322755813598633, 11.844152450561523, 12.365547180175781, 12.886943817138672, 13.408339500427246, 13.929736137390137, 14.451132774353027, 14.972528457641602, 15.493925094604492, 16.015321731567383, 16.536718368530273, 17.058115005493164, 17.579511642456055, 18.100906372070312, 18.622303009033203, 19.143699645996094, 19.665096282958984, 20.186492919921875, 20.707889556884766, 21.229286193847656, 21.750682830810547, 22.272079467773438, 22.793474197387695, 23.314870834350586, 23.836267471313477, 24.357664108276367, 24.879058837890625, 25.400455474853516, 25.921852111816406, 26.443248748779297, 26.964643478393555, 27.486040115356445, 28.007436752319336, 28.528833389282227, 29.050230026245117]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 4.0, 8.0, 8.0, 17.0, 17.0, 26.0, 18.0, 30.0, 27.0, 28.0, 45.0, 39.0, 70.0, 54.0, 52.0, 60.0, 60.0, 44.0, 55.0, 48.0, 40.0, 38.0, 31.0, 32.0, 27.0, 20.0, 19.0, 16.0, 12.0, 14.0, 8.0, 5.0, 3.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.067383766174316, -4.918712615966797, -4.770041465759277, -4.621370315551758, -4.472699165344238, -4.3240275382995605, -4.175356388092041, -4.0266852378845215, -3.878014087677002, -3.7293429374694824, -3.580671787261963, -3.4320003986358643, -3.2833292484283447, -3.134658098220825, -2.9859867095947266, -2.837315559387207, -2.6886444091796875, -2.539973258972168, -2.3913021087646484, -2.24263072013855, -2.0939595699310303, -1.9452884197235107, -1.7966171503067017, -1.6479458808898926, -1.499274730682373, -1.3506035804748535, -1.2019323110580444, -1.0532610416412354, -0.9045898914337158, -0.7559186816215515, -0.6072474718093872, -0.4585762023925781, -0.3099050521850586, -0.1612338423728943, -0.01256263256072998, 0.13610857725143433, 0.28477978706359863, 0.43345099687576294, 0.5821222066879272, 0.7307934761047363, 0.8794646263122559, 1.0281357765197754, 1.1768070459365845, 1.3254783153533936, 1.474149465560913, 1.6228206157684326, 1.7714918851852417, 1.9201631546020508, 2.0688343048095703, 2.21750545501709, 2.3661766052246094, 2.514847993850708, 2.6635191440582275, 2.812190294265747, 2.9608616828918457, 3.1095328330993652, 3.2582039833068848, 3.4068751335144043, 3.555546283721924, 3.7042176723480225, 3.852888822555542, 4.001560211181641, 4.15023136138916, 4.29890251159668, 4.447573661804199]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 7.0, 19.0, 23.0, 37.0, 36.0, 64.0, 123.0, 151.0, 245.0, 433.0, 739.0, 1639.0, 4853.0, 44110.0, 4126263.0, 10418.0, 2590.0, 1060.0, 527.0, 310.0, 194.0, 115.0, 88.0, 64.0, 50.0, 31.0, 25.0, 17.0, 14.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1907196044921875, -1.149993896484375, -1.1092681884765625, -1.06854248046875, -1.0278167724609375, -0.987091064453125, -0.9463653564453125, -0.9056396484375, -0.8649139404296875, -0.824188232421875, -0.7834625244140625, -0.74273681640625, -0.7020111083984375, -0.661285400390625, -0.6205596923828125, -0.579833984375, -0.5391082763671875, -0.498382568359375, -0.4576568603515625, -0.41693115234375, -0.3762054443359375, -0.335479736328125, -0.2947540283203125, -0.2540283203125, -0.2133026123046875, -0.172576904296875, -0.1318511962890625, -0.09112548828125, -0.0503997802734375, -0.009674072265625, 0.0310516357421875, 0.07177734375, 0.1125030517578125, 0.153228759765625, 0.1939544677734375, 0.23468017578125, 0.2754058837890625, 0.316131591796875, 0.3568572998046875, 0.3975830078125, 0.4383087158203125, 0.479034423828125, 0.5197601318359375, 0.56048583984375, 0.6012115478515625, 0.641937255859375, 0.6826629638671875, 0.723388671875, 0.7641143798828125, 0.804840087890625, 0.8455657958984375, 0.88629150390625, 0.9270172119140625, 0.967742919921875, 1.0084686279296875, 1.0491943359375, 1.0899200439453125, 1.130645751953125, 1.1713714599609375, 1.21209716796875, 1.2528228759765625, 1.293548583984375, 1.3342742919921875, 1.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 5.0, 2.0, 7.0, 1.0, 5.0, 6.0, 8.0, 20.0, 14.0, 18.0, 17.0, 33.0, 28.0, 40.0, 32.0, 53.0, 43.0, 62.0, 61.0, 64.0, 48.0, 45.0, 61.0, 52.0, 48.0, 51.0, 36.0, 27.0, 25.0, 22.0, 14.0, 12.0, 10.0, 6.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20703125, -0.2007007598876953, -0.19437026977539062, -0.18803977966308594, -0.18170928955078125, -0.17537879943847656, -0.16904830932617188, -0.1627178192138672, -0.1563873291015625, -0.1500568389892578, -0.14372634887695312, -0.13739585876464844, -0.13106536865234375, -0.12473487854003906, -0.11840438842773438, -0.11207389831542969, -0.105743408203125, -0.09941291809082031, -0.09308242797851562, -0.08675193786621094, -0.08042144775390625, -0.07409095764160156, -0.06776046752929688, -0.06142997741699219, -0.0550994873046875, -0.04876899719238281, -0.042438507080078125, -0.03610801696777344, -0.02977752685546875, -0.023447036743164062, -0.017116546630859375, -0.010786056518554688, -0.00445556640625, 0.0018749237060546875, 0.008205413818359375, 0.014535903930664062, 0.02086639404296875, 0.027196884155273438, 0.033527374267578125, 0.03985786437988281, 0.0461883544921875, 0.05251884460449219, 0.058849334716796875, 0.06517982482910156, 0.07151031494140625, 0.07784080505371094, 0.08417129516601562, 0.09050178527832031, 0.096832275390625, 0.10316276550292969, 0.10949325561523438, 0.11582374572753906, 0.12215423583984375, 0.12848472595214844, 0.13481521606445312, 0.1411457061767578, 0.1474761962890625, 0.1538066864013672, 0.16013717651367188, 0.16646766662597656, 0.17279815673828125, 0.17912864685058594, 0.18545913696289062, 0.1917896270751953, 0.1981201171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 13.0, 24.0, 13.0, 39.0, 44.0, 68.0, 132.0, 154.0, 257.0, 360.0, 552.0, 869.0, 1260.0, 2133.0, 3649.0, 7864.0, 30385.0, 4072336.0, 53173.0, 10068.0, 4238.0, 2381.0, 1428.0, 942.0, 610.0, 452.0, 279.0, 173.0, 116.0, 101.0, 60.0, 30.0, 29.0, 13.0, 14.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0625, -1.0326690673828125, -1.002838134765625, -0.9730072021484375, -0.94317626953125, -0.9133453369140625, -0.883514404296875, -0.8536834716796875, -0.8238525390625, -0.7940216064453125, -0.764190673828125, -0.7343597412109375, -0.70452880859375, -0.6746978759765625, -0.644866943359375, -0.6150360107421875, -0.585205078125, -0.5553741455078125, -0.525543212890625, -0.4957122802734375, -0.46588134765625, -0.4360504150390625, -0.406219482421875, -0.3763885498046875, -0.3465576171875, -0.3167266845703125, -0.286895751953125, -0.2570648193359375, -0.22723388671875, -0.1974029541015625, -0.167572021484375, -0.1377410888671875, -0.10791015625, -0.0780792236328125, -0.048248291015625, -0.0184173583984375, 0.01141357421875, 0.0412445068359375, 0.071075439453125, 0.1009063720703125, 0.1307373046875, 0.1605682373046875, 0.190399169921875, 0.2202301025390625, 0.25006103515625, 0.2798919677734375, 0.309722900390625, 0.3395538330078125, 0.369384765625, 0.3992156982421875, 0.429046630859375, 0.4588775634765625, 0.48870849609375, 0.5185394287109375, 0.548370361328125, 0.5782012939453125, 0.6080322265625, 0.6378631591796875, 0.667694091796875, 0.6975250244140625, 0.72735595703125, 0.7571868896484375, 0.787017822265625, 0.8168487548828125, 0.8466796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 25.0, 29.0, 222.0, 3597.0, 79.0, 32.0, 15.0, 16.0, 4.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.248779296875, -0.24190711975097656, -0.23503494262695312, -0.2281627655029297, -0.22129058837890625, -0.2144184112548828, -0.20754623413085938, -0.20067405700683594, -0.1938018798828125, -0.18692970275878906, -0.18005752563476562, -0.1731853485107422, -0.16631317138671875, -0.1594409942626953, -0.15256881713867188, -0.14569664001464844, -0.138824462890625, -0.13195228576660156, -0.12508010864257812, -0.11820793151855469, -0.11133575439453125, -0.10446357727050781, -0.09759140014648438, -0.09071922302246094, -0.0838470458984375, -0.07697486877441406, -0.07010269165039062, -0.06323051452636719, -0.05635833740234375, -0.04948616027832031, -0.042613983154296875, -0.03574180603027344, -0.02886962890625, -0.021997451782226562, -0.015125274658203125, -0.008253097534179688, -0.00138092041015625, 0.0054912567138671875, 0.012363433837890625, 0.019235610961914062, 0.0261077880859375, 0.03297996520996094, 0.039852142333984375, 0.04672431945800781, 0.05359649658203125, 0.06046867370605469, 0.06734085083007812, 0.07421302795410156, 0.081085205078125, 0.08795738220214844, 0.09482955932617188, 0.10170173645019531, 0.10857391357421875, 0.11544609069824219, 0.12231826782226562, 0.12919044494628906, 0.1360626220703125, 0.14293479919433594, 0.14980697631835938, 0.1566791534423828, 0.16355133056640625, 0.1704235076904297, 0.17729568481445312, 0.18416786193847656, 0.1910400390625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 12.0, 25.0, 23.0, 33.0, 53.0, 70.0, 71.0, 96.0, 114.0, 121.0, 84.0, 80.0, 68.0, 47.0, 34.0, 27.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6498937010765076, -0.624650239944458, -0.5994067788124084, -0.5741633176803589, -0.5489199161529541, -0.5236764550209045, -0.498432993888855, -0.4731895327568054, -0.44794610142707825, -0.4227026402950287, -0.3974592089653015, -0.37221574783325195, -0.3469722867012024, -0.3217288553714752, -0.29648539423942566, -0.2712419629096985, -0.24599850177764893, -0.22075505554676056, -0.1955116093158722, -0.17026814818382263, -0.14502470195293427, -0.1197812557220459, -0.09453779458999634, -0.06929434835910797, -0.044050902128219604, -0.01880745217204094, 0.006435997784137726, 0.03167945146560669, 0.056922897696495056, 0.08216634392738342, 0.10740980505943298, 0.13265325129032135, 0.15789663791656494, 0.1831400841474533, 0.20838353037834167, 0.23362699151039124, 0.2588704228401184, 0.28411388397216797, 0.30935734510421753, 0.3346008062362671, 0.35984423756599426, 0.3850876986980438, 0.410331130027771, 0.43557459115982056, 0.4608180522918701, 0.4860614836215973, 0.5113049745559692, 0.536548376083374, 0.5617918372154236, 0.5870352983474731, 0.6122787594795227, 0.6375222206115723, 0.662765622138977, 0.6880090832710266, 0.7132525444030762, 0.7384960055351257, 0.7637394666671753, 0.7889829277992249, 0.8142263889312744, 0.8394697904586792, 0.8647132515907288, 0.8899567127227783, 0.9152001738548279, 0.9404436349868774, 0.9656870365142822]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 16.0, 19.0, 13.0, 9.0, 13.0, 13.0, 24.0, 23.0, 23.0, 17.0, 33.0, 43.0, 33.0, 36.0, 34.0, 40.0, 37.0, 49.0, 41.0, 39.0, 38.0, 27.0, 33.0, 33.0, 38.0, 33.0, 34.0, 25.0, 19.0, 22.0, 15.0, 20.0, 13.0, 11.0, 12.0, 13.0, 7.0, 8.0, 5.0, 7.0, 1.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.3959835171699524, -0.38427460193634033, -0.37256571650505066, -0.360856831073761, -0.3491479158401489, -0.33743900060653687, -0.3257301151752472, -0.3140212297439575, -0.30231231451034546, -0.2906033992767334, -0.2788945138454437, -0.26718562841415405, -0.255476713180542, -0.24376781284809113, -0.23205891251564026, -0.2203500121831894, -0.20864111185073853, -0.19693221151828766, -0.1852233111858368, -0.17351441085338593, -0.16180551052093506, -0.1500966101884842, -0.13838770985603333, -0.12667880952358246, -0.11496990919113159, -0.10326100885868073, -0.09155210852622986, -0.07984320819377899, -0.06813430786132812, -0.05642540752887726, -0.04471650719642639, -0.033007606863975525, -0.021298706531524658, -0.009589806199073792, 0.002119094133377075, 0.013827994465827942, 0.02553689479827881, 0.037245795130729675, 0.04895469546318054, 0.06066359579563141, 0.07237249612808228, 0.08408139646053314, 0.09579029679298401, 0.10749919712543488, 0.11920809745788574, 0.1309169977903366, 0.14262589812278748, 0.15433479845523834, 0.1660436987876892, 0.17775259912014008, 0.18946149945259094, 0.2011703997850418, 0.21287930011749268, 0.22458820044994354, 0.2362971007823944, 0.24800600111484528, 0.25971490144729614, 0.2714238166809082, 0.2831327021121979, 0.29484158754348755, 0.3065505027770996, 0.31825941801071167, 0.32996830344200134, 0.341677188873291, 0.3533861041069031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 12.0, 6.0, 13.0, 18.0, 22.0, 24.0, 35.0, 51.0, 73.0, 95.0, 160.0, 235.0, 354.0, 612.0, 1013.0, 1840.0, 3624.0, 7221.0, 16232.0, 39815.0, 103427.0, 267419.0, 350156.0, 153904.0, 58530.0, 23257.0, 9990.0, 4711.0, 2399.0, 1292.0, 730.0, 441.0, 273.0, 183.0, 107.0, 76.0, 56.0, 40.0, 30.0, 22.0, 15.0, 10.0, 7.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.35257720947265625, -0.3416290283203125, -0.33068084716796875, -0.319732666015625, -0.30878448486328125, -0.2978363037109375, -0.28688812255859375, -0.27593994140625, -0.26499176025390625, -0.2540435791015625, -0.24309539794921875, -0.232147216796875, -0.22119903564453125, -0.2102508544921875, -0.19930267333984375, -0.1883544921875, -0.17740631103515625, -0.1664581298828125, -0.15550994873046875, -0.144561767578125, -0.13361358642578125, -0.1226654052734375, -0.11171722412109375, -0.10076904296875, -0.08982086181640625, -0.0788726806640625, -0.06792449951171875, -0.056976318359375, -0.04602813720703125, -0.0350799560546875, -0.02413177490234375, -0.01318359375, -0.00223541259765625, 0.0087127685546875, 0.01966094970703125, 0.030609130859375, 0.04155731201171875, 0.0525054931640625, 0.06345367431640625, 0.07440185546875, 0.08535003662109375, 0.0962982177734375, 0.10724639892578125, 0.118194580078125, 0.12914276123046875, 0.1400909423828125, 0.15103912353515625, 0.1619873046875, 0.17293548583984375, 0.1838836669921875, 0.19483184814453125, 0.205780029296875, 0.21672821044921875, 0.2276763916015625, 0.23862457275390625, 0.24957275390625, 0.26052093505859375, 0.2714691162109375, 0.28241729736328125, 0.293365478515625, 0.30431365966796875, 0.3152618408203125, 0.32621002197265625, 0.337158203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 5.0, 6.0, 10.0, 12.0, 11.0, 12.0, 12.0, 15.0, 21.0, 23.0, 27.0, 33.0, 28.0, 31.0, 32.0, 54.0, 58.0, 46.0, 45.0, 38.0, 58.0, 46.0, 42.0, 47.0, 41.0, 32.0, 29.0, 29.0, 20.0, 21.0, 16.0, 13.0, 13.0, 12.0, 14.0, 5.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17815017700195312, -0.17258453369140625, -0.16701889038085938, -0.1614532470703125, -0.15588760375976562, -0.15032196044921875, -0.14475631713867188, -0.139190673828125, -0.13362503051757812, -0.12805938720703125, -0.12249374389648438, -0.1169281005859375, -0.11136245727539062, -0.10579681396484375, -0.10023117065429688, -0.09466552734375, -0.08909988403320312, -0.08353424072265625, -0.07796859741210938, -0.0724029541015625, -0.06683731079101562, -0.06127166748046875, -0.055706024169921875, -0.050140380859375, -0.044574737548828125, -0.03900909423828125, -0.033443450927734375, -0.0278778076171875, -0.022312164306640625, -0.01674652099609375, -0.011180877685546875, -0.005615234375, -4.9591064453125e-05, 0.00551605224609375, 0.011081695556640625, 0.0166473388671875, 0.022212982177734375, 0.02777862548828125, 0.033344268798828125, 0.038909912109375, 0.044475555419921875, 0.05004119873046875, 0.055606842041015625, 0.0611724853515625, 0.06673812866210938, 0.07230377197265625, 0.07786941528320312, 0.08343505859375, 0.08900070190429688, 0.09456634521484375, 0.10013198852539062, 0.1056976318359375, 0.11126327514648438, 0.11682891845703125, 0.12239456176757812, 0.127960205078125, 0.13352584838867188, 0.13909149169921875, 0.14465713500976562, 0.1502227783203125, 0.15578842163085938, 0.16135406494140625, 0.16691970825195312, 0.1724853515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 7.0, 8.0, 9.0, 22.0, 25.0, 29.0, 39.0, 49.0, 96.0, 102.0, 194.0, 288.0, 450.0, 731.0, 1457.0, 3450.0, 10922.0, 56817.0, 546957.0, 371302.0, 40953.0, 8539.0, 2812.0, 1307.0, 662.0, 457.0, 267.0, 163.0, 117.0, 74.0, 68.0, 37.0, 24.0, 23.0, 11.0, 11.0, 17.0, 10.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.5830078125, -0.56414794921875, -0.5452880859375, -0.52642822265625, -0.507568359375, -0.48870849609375, -0.4698486328125, -0.45098876953125, -0.43212890625, -0.41326904296875, -0.3944091796875, -0.37554931640625, -0.356689453125, -0.33782958984375, -0.3189697265625, -0.30010986328125, -0.28125, -0.26239013671875, -0.2435302734375, -0.22467041015625, -0.205810546875, -0.18695068359375, -0.1680908203125, -0.14923095703125, -0.13037109375, -0.11151123046875, -0.0926513671875, -0.07379150390625, -0.054931640625, -0.03607177734375, -0.0172119140625, 0.00164794921875, 0.0205078125, 0.03936767578125, 0.0582275390625, 0.07708740234375, 0.095947265625, 0.11480712890625, 0.1336669921875, 0.15252685546875, 0.17138671875, 0.19024658203125, 0.2091064453125, 0.22796630859375, 0.246826171875, 0.26568603515625, 0.2845458984375, 0.30340576171875, 0.322265625, 0.34112548828125, 0.3599853515625, 0.37884521484375, 0.397705078125, 0.41656494140625, 0.4354248046875, 0.45428466796875, 0.47314453125, 0.49200439453125, 0.5108642578125, 0.52972412109375, 0.548583984375, 0.56744384765625, 0.5863037109375, 0.60516357421875, 0.6240234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 13.0, 14.0, 10.0, 18.0, 21.0, 24.0, 24.0, 42.0, 40.0, 42.0, 36.0, 49.0, 38.0, 49.0, 42.0, 51.0, 53.0, 53.0, 42.0, 32.0, 38.0, 32.0, 42.0, 31.0, 24.0, 25.0, 13.0, 18.0, 14.0, 11.0, 6.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.837890625, -0.8110275268554688, -0.7841644287109375, -0.7573013305664062, -0.730438232421875, -0.7035751342773438, -0.6767120361328125, -0.6498489379882812, -0.62298583984375, -0.5961227416992188, -0.5692596435546875, -0.5423965454101562, -0.515533447265625, -0.48867034912109375, -0.4618072509765625, -0.43494415283203125, -0.4080810546875, -0.38121795654296875, -0.3543548583984375, -0.32749176025390625, -0.300628662109375, -0.27376556396484375, -0.2469024658203125, -0.22003936767578125, -0.19317626953125, -0.16631317138671875, -0.1394500732421875, -0.11258697509765625, -0.085723876953125, -0.05886077880859375, -0.0319976806640625, -0.00513458251953125, 0.021728515625, 0.04859161376953125, 0.0754547119140625, 0.10231781005859375, 0.129180908203125, 0.15604400634765625, 0.1829071044921875, 0.20977020263671875, 0.23663330078125, 0.26349639892578125, 0.2903594970703125, 0.31722259521484375, 0.344085693359375, 0.37094879150390625, 0.3978118896484375, 0.42467498779296875, 0.4515380859375, 0.47840118408203125, 0.5052642822265625, 0.5321273803710938, 0.558990478515625, 0.5858535766601562, 0.6127166748046875, 0.6395797729492188, 0.66644287109375, 0.6933059692382812, 0.7201690673828125, 0.7470321655273438, 0.773895263671875, 0.8007583618164062, 0.8276214599609375, 0.8544845581054688, 0.88134765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 9.0, 10.0, 13.0, 26.0, 41.0, 93.0, 134.0, 316.0, 889.0, 3959.0, 48595.0, 967921.0, 22551.0, 2726.0, 673.0, 273.0, 126.0, 75.0, 39.0, 26.0, 10.0, 15.0, 9.0, 4.0, 6.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4180984497070312, -1.3820953369140625, -1.3460922241210938, -1.310089111328125, -1.2740859985351562, -1.2380828857421875, -1.2020797729492188, -1.16607666015625, -1.1300735473632812, -1.0940704345703125, -1.0580673217773438, -1.022064208984375, -0.9860610961914062, -0.9500579833984375, -0.9140548706054688, -0.8780517578125, -0.8420486450195312, -0.8060455322265625, -0.7700424194335938, -0.734039306640625, -0.6980361938476562, -0.6620330810546875, -0.6260299682617188, -0.59002685546875, -0.5540237426757812, -0.5180206298828125, -0.48201751708984375, -0.446014404296875, -0.41001129150390625, -0.3740081787109375, -0.33800506591796875, -0.302001953125, -0.26599884033203125, -0.2299957275390625, -0.19399261474609375, -0.157989501953125, -0.12198638916015625, -0.0859832763671875, -0.04998016357421875, -0.01397705078125, 0.02202606201171875, 0.0580291748046875, 0.09403228759765625, 0.130035400390625, 0.16603851318359375, 0.2020416259765625, 0.23804473876953125, 0.2740478515625, 0.31005096435546875, 0.3460540771484375, 0.38205718994140625, 0.418060302734375, 0.45406341552734375, 0.4900665283203125, 0.5260696411132812, 0.56207275390625, 0.5980758666992188, 0.6340789794921875, 0.6700820922851562, 0.706085205078125, 0.7420883178710938, 0.7780914306640625, 0.8140945434570312, 0.85009765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 15.0, 27.0, 45.0, 68.0, 132.0, 161.0, 192.0, 138.0, 86.0, 51.0, 32.0, 24.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014579296112060547, -0.00014187581837177277, -0.00013795867562294006, -0.00013404153287410736, -0.00013012439012527466, -0.00012620724737644196, -0.00012229010462760925, -0.00011837296187877655, -0.00011445581912994385, -0.00011053867638111115, -0.00010662153363227844, -0.00010270439088344574, -9.878724813461304e-05, -9.487010538578033e-05, -9.095296263694763e-05, -8.703581988811493e-05, -8.311867713928223e-05, -7.920153439044952e-05, -7.528439164161682e-05, -7.136724889278412e-05, -6.745010614395142e-05, -6.353296339511871e-05, -5.961582064628601e-05, -5.569867789745331e-05, -5.1781535148620605e-05, -4.78643923997879e-05, -4.39472496509552e-05, -4.00301069021225e-05, -3.6112964153289795e-05, -3.219582140445709e-05, -2.827867865562439e-05, -2.4361535906791687e-05, -2.0444393157958984e-05, -1.6527250409126282e-05, -1.2610107660293579e-05, -8.692964911460876e-06, -4.775822162628174e-06, -8.586794137954712e-07, 3.0584633350372314e-06, 6.975606083869934e-06, 1.0892748832702637e-05, 1.480989158153534e-05, 1.8727034330368042e-05, 2.2644177079200745e-05, 2.6561319828033447e-05, 3.047846257686615e-05, 3.439560532569885e-05, 3.8312748074531555e-05, 4.222989082336426e-05, 4.614703357219696e-05, 5.006417632102966e-05, 5.3981319069862366e-05, 5.789846181869507e-05, 6.181560456752777e-05, 6.573274731636047e-05, 6.964989006519318e-05, 7.356703281402588e-05, 7.748417556285858e-05, 8.140131831169128e-05, 8.531846106052399e-05, 8.923560380935669e-05, 9.315274655818939e-05, 9.70698893070221e-05, 0.0001009870320558548, 0.0001049041748046875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 27.0, 36.0, 59.0, 113.0, 185.0, 384.0, 1074.0, 4561.0, 54405.0, 946373.0, 35794.0, 3795.0, 946.0, 370.0, 165.0, 101.0, 47.0, 32.0, 17.0, 17.0, 10.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1748046875, -1.1416549682617188, -1.1085052490234375, -1.0753555297851562, -1.042205810546875, -1.0090560913085938, -0.9759063720703125, -0.9427566528320312, -0.90960693359375, -0.8764572143554688, -0.8433074951171875, -0.8101577758789062, -0.777008056640625, -0.7438583374023438, -0.7107086181640625, -0.6775588989257812, -0.6444091796875, -0.6112594604492188, -0.5781097412109375, -0.5449600219726562, -0.511810302734375, -0.47866058349609375, -0.4455108642578125, -0.41236114501953125, -0.37921142578125, -0.34606170654296875, -0.3129119873046875, -0.27976226806640625, -0.246612548828125, -0.21346282958984375, -0.1803131103515625, -0.14716339111328125, -0.114013671875, -0.08086395263671875, -0.0477142333984375, -0.01456451416015625, 0.018585205078125, 0.05173492431640625, 0.0848846435546875, 0.11803436279296875, 0.15118408203125, 0.18433380126953125, 0.2174835205078125, 0.25063323974609375, 0.283782958984375, 0.31693267822265625, 0.3500823974609375, 0.38323211669921875, 0.4163818359375, 0.44953155517578125, 0.4826812744140625, 0.5158309936523438, 0.548980712890625, 0.5821304321289062, 0.6152801513671875, 0.6484298706054688, 0.68157958984375, 0.7147293090820312, 0.7478790283203125, 0.7810287475585938, 0.814178466796875, 0.8473281860351562, 0.8804779052734375, 0.9136276245117188, 0.94677734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 5.0, 17.0, 12.0, 32.0, 50.0, 96.0, 174.0, 210.0, 175.0, 90.0, 59.0, 19.0, 17.0, 9.0, 3.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5792770385742188, -0.5535736083984375, -0.5278701782226562, -0.502166748046875, -0.47646331787109375, -0.4507598876953125, -0.42505645751953125, -0.39935302734375, -0.37364959716796875, -0.3479461669921875, -0.32224273681640625, -0.296539306640625, -0.27083587646484375, -0.2451324462890625, -0.21942901611328125, -0.1937255859375, -0.16802215576171875, -0.1423187255859375, -0.11661529541015625, -0.090911865234375, -0.06520843505859375, -0.0395050048828125, -0.01380157470703125, 0.01190185546875, 0.03760528564453125, 0.0633087158203125, 0.08901214599609375, 0.114715576171875, 0.14041900634765625, 0.1661224365234375, 0.19182586669921875, 0.217529296875, 0.24323272705078125, 0.2689361572265625, 0.29463958740234375, 0.320343017578125, 0.34604644775390625, 0.3717498779296875, 0.39745330810546875, 0.42315673828125, 0.44886016845703125, 0.4745635986328125, 0.5002670288085938, 0.525970458984375, 0.5516738891601562, 0.5773773193359375, 0.6030807495117188, 0.6287841796875, 0.6544876098632812, 0.6801910400390625, 0.7058944702148438, 0.731597900390625, 0.7573013305664062, 0.7830047607421875, 0.8087081909179688, 0.83441162109375, 0.8601150512695312, 0.8858184814453125, 0.9115219116210938, 0.937225341796875, 0.9629287719726562, 0.9886322021484375, 1.0143356323242188, 1.0400390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 16.0, 30.0, 59.0, 96.0, 188.0, 247.0, 160.0, 92.0, 51.0, 23.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.260588645935059, -11.970691680908203, -11.680793762207031, -11.390896797180176, -11.10099983215332, -10.811101913452148, -10.521204948425293, -10.231307983398438, -9.941410064697266, -9.65151309967041, -9.361615180969238, -9.071718215942383, -8.781820297241211, -8.491923332214355, -8.2020263671875, -7.912128925323486, -7.622231483459473, -7.332334041595459, -7.042436599731445, -6.75253963470459, -6.462642192840576, -6.1727447509765625, -5.882847785949707, -5.592950344085693, -5.30305290222168, -5.013155460357666, -4.723258018493652, -4.433361053466797, -4.143463611602783, -3.8535661697387695, -3.563668966293335, -3.2737717628479004, -2.9838733673095703, -2.6939759254455566, -2.404078722000122, -2.1141815185546875, -1.8242840766906738, -1.5343867540359497, -1.2444894313812256, -0.954592227935791, -0.6646947860717773, -0.3747974634170532, -0.0849001407623291, 0.20499718189239502, 0.49489450454711914, 0.7847918272018433, 1.0746891498565674, 1.364586353302002, 1.6544837951660156, 1.9443811178207397, 2.234278440475464, 2.5241756439208984, 2.814073085784912, 3.103970527648926, 3.3938677310943604, 3.683764934539795, 3.9736623764038086, 4.263559818267822, 4.553457260131836, 4.843354225158691, 5.133251667022705, 5.423149108886719, 5.713046073913574, 6.002943515777588, 6.292840957641602]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 5.0, 7.0, 10.0, 5.0, 12.0, 11.0, 14.0, 22.0, 22.0, 25.0, 28.0, 24.0, 38.0, 37.0, 36.0, 49.0, 44.0, 44.0, 50.0, 43.0, 54.0, 47.0, 49.0, 36.0, 37.0, 44.0, 24.0, 28.0, 21.0, 24.0, 20.0, 19.0, 16.0, 16.0, 6.0, 7.0, 10.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.166521072387695, -4.029800891876221, -3.893080949783325, -3.7563610076904297, -3.619640827178955, -3.4829208850860596, -3.346200942993164, -3.2094807624816895, -3.072760581970215, -2.9360406398773193, -2.7993204593658447, -2.662600517272949, -2.5258803367614746, -2.389160394668579, -2.2524404525756836, -2.115720272064209, -1.9790003299713135, -1.8422802686691284, -1.7055602073669434, -1.5688402652740479, -1.4321200847625732, -1.2954001426696777, -1.1586800813674927, -1.0219600200653076, -0.8852399587631226, -0.7485198974609375, -0.6117998361587524, -0.47507983446121216, -0.3383597731590271, -0.20163971185684204, -0.06491971015930176, 0.0718003511428833, 0.20852041244506836, 0.3452404737472534, 0.4819605052471161, 0.6186805367469788, 0.7554005980491638, 0.8921206593513489, 1.0288406610488892, 1.1655607223510742, 1.3022807836532593, 1.4390008449554443, 1.5757209062576294, 1.7124409675598145, 1.84916090965271, 1.9858810901641846, 2.12260103225708, 2.2593212127685547, 2.39604115486145, 2.5327610969543457, 2.6694812774658203, 2.806201219558716, 2.9429214000701904, 3.079641342163086, 3.2163615226745605, 3.353081464767456, 3.4898014068603516, 3.626521348953247, 3.7632415294647217, 3.899961471557617, 4.036681652069092, 4.173401832580566, 4.310121536254883, 4.446841716766357, 4.583561897277832]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 16.0, 16.0, 29.0, 65.0, 72.0, 102.0, 169.0, 297.0, 475.0, 850.0, 1513.0, 3107.0, 6960.0, 22890.0, 3744290.0, 380744.0, 19848.0, 6531.0, 2931.0, 1427.0, 781.0, 455.0, 269.0, 157.0, 107.0, 46.0, 36.0, 21.0, 18.0, 18.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.71728515625, -0.691619873046875, -0.66595458984375, -0.640289306640625, -0.6146240234375, -0.588958740234375, -0.56329345703125, -0.537628173828125, -0.511962890625, -0.486297607421875, -0.46063232421875, -0.434967041015625, -0.4093017578125, -0.383636474609375, -0.35797119140625, -0.332305908203125, -0.306640625, -0.280975341796875, -0.25531005859375, -0.229644775390625, -0.2039794921875, -0.178314208984375, -0.15264892578125, -0.126983642578125, -0.101318359375, -0.075653076171875, -0.04998779296875, -0.024322509765625, 0.0013427734375, 0.027008056640625, 0.05267333984375, 0.078338623046875, 0.10400390625, 0.129669189453125, 0.15533447265625, 0.180999755859375, 0.2066650390625, 0.232330322265625, 0.25799560546875, 0.283660888671875, 0.309326171875, 0.334991455078125, 0.36065673828125, 0.386322021484375, 0.4119873046875, 0.437652587890625, 0.46331787109375, 0.488983154296875, 0.5146484375, 0.540313720703125, 0.56597900390625, 0.591644287109375, 0.6173095703125, 0.642974853515625, 0.66864013671875, 0.694305419921875, 0.719970703125, 0.745635986328125, 0.77130126953125, 0.796966552734375, 0.8226318359375, 0.848297119140625, 0.87396240234375, 0.899627685546875, 0.92529296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 7.0, 10.0, 8.0, 18.0, 16.0, 23.0, 30.0, 32.0, 36.0, 31.0, 48.0, 48.0, 55.0, 52.0, 57.0, 69.0, 59.0, 66.0, 65.0, 40.0, 50.0, 46.0, 24.0, 22.0, 22.0, 13.0, 7.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21484375, -0.20786666870117188, -0.20088958740234375, -0.19391250610351562, -0.1869354248046875, -0.17995834350585938, -0.17298126220703125, -0.16600418090820312, -0.159027099609375, -0.15205001831054688, -0.14507293701171875, -0.13809585571289062, -0.1311187744140625, -0.12414169311523438, -0.11716461181640625, -0.11018753051757812, -0.10321044921875, -0.09623336791992188, -0.08925628662109375, -0.08227920532226562, -0.0753021240234375, -0.06832504272460938, -0.06134796142578125, -0.054370880126953125, -0.047393798828125, -0.040416717529296875, -0.03343963623046875, -0.026462554931640625, -0.0194854736328125, -0.012508392333984375, -0.00553131103515625, 0.001445770263671875, 0.0084228515625, 0.015399932861328125, 0.02237701416015625, 0.029354095458984375, 0.0363311767578125, 0.043308258056640625, 0.05028533935546875, 0.057262420654296875, 0.064239501953125, 0.07121658325195312, 0.07819366455078125, 0.08517074584960938, 0.0921478271484375, 0.09912490844726562, 0.10610198974609375, 0.11307907104492188, 0.12005615234375, 0.12703323364257812, 0.13401031494140625, 0.14098739624023438, 0.1479644775390625, 0.15494155883789062, 0.16191864013671875, 0.16889572143554688, 0.175872802734375, 0.18284988403320312, 0.18982696533203125, 0.19680404663085938, 0.2037811279296875, 0.21075820922851562, 0.21773529052734375, 0.22471237182617188, 0.231689453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 17.0, 18.0, 48.0, 62.0, 120.0, 185.0, 324.0, 617.0, 1297.0, 2959.0, 8225.0, 32494.0, 3843624.0, 272007.0, 21347.0, 6236.0, 2390.0, 1112.0, 506.0, 255.0, 149.0, 98.0, 63.0, 35.0, 22.0, 18.0, 10.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.02734375, -0.992950439453125, -0.95855712890625, -0.924163818359375, -0.8897705078125, -0.855377197265625, -0.82098388671875, -0.786590576171875, -0.752197265625, -0.717803955078125, -0.68341064453125, -0.649017333984375, -0.6146240234375, -0.580230712890625, -0.54583740234375, -0.511444091796875, -0.47705078125, -0.442657470703125, -0.40826416015625, -0.373870849609375, -0.3394775390625, -0.305084228515625, -0.27069091796875, -0.236297607421875, -0.201904296875, -0.167510986328125, -0.13311767578125, -0.098724365234375, -0.0643310546875, -0.029937744140625, 0.00445556640625, 0.038848876953125, 0.0732421875, 0.107635498046875, 0.14202880859375, 0.176422119140625, 0.2108154296875, 0.245208740234375, 0.27960205078125, 0.313995361328125, 0.348388671875, 0.382781982421875, 0.41717529296875, 0.451568603515625, 0.4859619140625, 0.520355224609375, 0.55474853515625, 0.589141845703125, 0.62353515625, 0.657928466796875, 0.69232177734375, 0.726715087890625, 0.7611083984375, 0.795501708984375, 0.82989501953125, 0.864288330078125, 0.898681640625, 0.933074951171875, 0.96746826171875, 1.001861572265625, 1.0362548828125, 1.070648193359375, 1.10504150390625, 1.139434814453125, 1.173828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 18.0, 22.0, 30.0, 86.0, 252.0, 3271.0, 213.0, 53.0, 43.0, 18.0, 14.0, 6.0, 8.0, 5.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39306640625, -0.3781890869140625, -0.363311767578125, -0.3484344482421875, -0.33355712890625, -0.3186798095703125, -0.303802490234375, -0.2889251708984375, -0.2740478515625, -0.2591705322265625, -0.244293212890625, -0.2294158935546875, -0.21453857421875, -0.1996612548828125, -0.184783935546875, -0.1699066162109375, -0.155029296875, -0.1401519775390625, -0.125274658203125, -0.1103973388671875, -0.09552001953125, -0.0806427001953125, -0.065765380859375, -0.0508880615234375, -0.0360107421875, -0.0211334228515625, -0.006256103515625, 0.0086212158203125, 0.02349853515625, 0.0383758544921875, 0.053253173828125, 0.0681304931640625, 0.0830078125, 0.0978851318359375, 0.112762451171875, 0.1276397705078125, 0.14251708984375, 0.1573944091796875, 0.172271728515625, 0.1871490478515625, 0.2020263671875, 0.2169036865234375, 0.231781005859375, 0.2466583251953125, 0.26153564453125, 0.2764129638671875, 0.291290283203125, 0.3061676025390625, 0.321044921875, 0.3359222412109375, 0.350799560546875, 0.3656768798828125, 0.38055419921875, 0.3954315185546875, 0.410308837890625, 0.4251861572265625, 0.4400634765625, 0.4549407958984375, 0.469818115234375, 0.4846954345703125, 0.49957275390625, 0.5144500732421875, 0.529327392578125, 0.5442047119140625, 0.55908203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 7.0, 17.0, 22.0, 52.0, 71.0, 103.0, 142.0, 137.0, 114.0, 86.0, 73.0, 48.0, 31.0, 32.0, 14.0, 9.0, 9.0, 5.0, 5.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.506753921508789, -1.4527078866958618, -1.3986618518829346, -1.3446158170700073, -1.29056978225708, -1.2365237474441528, -1.1824777126312256, -1.1284316778182983, -1.074385643005371, -1.0203396081924438, -0.9662935733795166, -0.9122475385665894, -0.8582015037536621, -0.8041554689407349, -0.7501094341278076, -0.6960633993148804, -0.6420173048973083, -0.5879712700843811, -0.5339252352714539, -0.4798792004585266, -0.42583316564559937, -0.37178710103034973, -0.3177410662174225, -0.26369503140449524, -0.209648996591568, -0.15560296177864075, -0.1015569195151329, -0.04751087725162506, 0.006535157561302185, 0.060581207275390625, 0.11462724208831787, 0.16867327690124512, 0.22271931171417236, 0.2767653465270996, 0.33081138134002686, 0.3848574161529541, 0.43890345096588135, 0.492949515581131, 0.5469955205917358, 0.6010415554046631, 0.6550875902175903, 0.7091336250305176, 0.7631796598434448, 0.8172256946563721, 0.8712717294692993, 0.9253177642822266, 0.9793637990951538, 1.033409833908081, 1.0874559879302979, 1.141502022743225, 1.1955480575561523, 1.2495940923690796, 1.3036401271820068, 1.357686161994934, 1.4117321968078613, 1.4657782316207886, 1.5198242664337158, 1.573870301246643, 1.6279163360595703, 1.6819623708724976, 1.7360084056854248, 1.790054440498352, 1.8441004753112793, 1.8981465101242065, 1.9521925449371338]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 9.0, 9.0, 10.0, 12.0, 21.0, 29.0, 19.0, 20.0, 32.0, 29.0, 27.0, 40.0, 46.0, 34.0, 46.0, 44.0, 40.0, 41.0, 41.0, 43.0, 48.0, 45.0, 38.0, 33.0, 41.0, 34.0, 27.0, 29.0, 16.0, 20.0, 16.0, 12.0, 7.0, 11.0, 8.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1297924518585205, -1.098103404045105, -1.0664143562316895, -1.0347254276275635, -1.003036379814148, -0.9713473320007324, -0.9396582841873169, -0.9079692363739014, -0.8762801885604858, -0.8445911407470703, -0.8129021525382996, -0.781213104724884, -0.7495240569114685, -0.7178350687026978, -0.6861460208892822, -0.6544569730758667, -0.622767984867096, -0.5910789370536804, -0.5593899488449097, -0.5277009010314941, -0.4960118532180786, -0.4643228352069855, -0.43263381719589233, -0.4009447693824768, -0.36925575137138367, -0.3375667333602905, -0.305877685546875, -0.27418866753578186, -0.24249963462352753, -0.2108106017112732, -0.17912158370018005, -0.14743255078792572, -0.11574351787567139, -0.08405448496341705, -0.05236545950174332, -0.02067643404006958, 0.011012598872184753, 0.04270163178443909, 0.07439064979553223, 0.10607968270778656, 0.1377687156200409, 0.16945774853229523, 0.20114678144454956, 0.2328357994556427, 0.26452481746673584, 0.29621386528015137, 0.3279028832912445, 0.35959190130233765, 0.3912809491157532, 0.4229699671268463, 0.45465901494026184, 0.486348032951355, 0.5180370807647705, 0.549726128578186, 0.5814151167869568, 0.6131041646003723, 0.6447931528091431, 0.6764822006225586, 0.7081711888313293, 0.7398602366447449, 0.7715492844581604, 0.8032382726669312, 0.8349273204803467, 0.8666163682937622, 0.8983054161071777]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 6.0, 3.0, 8.0, 12.0, 9.0, 23.0, 27.0, 40.0, 50.0, 82.0, 109.0, 172.0, 230.0, 374.0, 564.0, 893.0, 1474.0, 2404.0, 4112.0, 7825.0, 15552.0, 33230.0, 73323.0, 173120.0, 361926.0, 209085.0, 86504.0, 38444.0, 18116.0, 8926.0, 4817.0, 2691.0, 1546.0, 1014.0, 592.0, 426.0, 258.0, 176.0, 139.0, 75.0, 53.0, 36.0, 29.0, 18.0, 11.0, 18.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0], "bins": [-0.488525390625, -0.4751777648925781, -0.46183013916015625, -0.4484825134277344, -0.4351348876953125, -0.4217872619628906, -0.40843963623046875, -0.3950920104980469, -0.381744384765625, -0.3683967590332031, -0.35504913330078125, -0.3417015075683594, -0.3283538818359375, -0.3150062561035156, -0.30165863037109375, -0.2883110046386719, -0.27496337890625, -0.2616157531738281, -0.24826812744140625, -0.23492050170898438, -0.2215728759765625, -0.20822525024414062, -0.19487762451171875, -0.18152999877929688, -0.168182373046875, -0.15483474731445312, -0.14148712158203125, -0.12813949584960938, -0.1147918701171875, -0.10144424438476562, -0.08809661865234375, -0.07474899291992188, -0.0614013671875, -0.048053741455078125, -0.03470611572265625, -0.021358489990234375, -0.0080108642578125, 0.005336761474609375, 0.01868438720703125, 0.032032012939453125, 0.045379638671875, 0.058727264404296875, 0.07207489013671875, 0.08542251586914062, 0.0987701416015625, 0.11211776733398438, 0.12546539306640625, 0.13881301879882812, 0.15216064453125, 0.16550827026367188, 0.17885589599609375, 0.19220352172851562, 0.2055511474609375, 0.21889877319335938, 0.23224639892578125, 0.24559402465820312, 0.258941650390625, 0.2722892761230469, 0.28563690185546875, 0.2989845275878906, 0.3123321533203125, 0.3256797790527344, 0.33902740478515625, 0.3523750305175781, 0.36572265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 6.0, 8.0, 14.0, 17.0, 23.0, 21.0, 29.0, 42.0, 42.0, 44.0, 46.0, 46.0, 62.0, 66.0, 57.0, 51.0, 48.0, 60.0, 45.0, 45.0, 40.0, 38.0, 25.0, 24.0, 18.0, 20.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.23929405212402344, -0.23163986206054688, -0.2239856719970703, -0.21633148193359375, -0.2086772918701172, -0.20102310180664062, -0.19336891174316406, -0.1857147216796875, -0.17806053161621094, -0.17040634155273438, -0.1627521514892578, -0.15509796142578125, -0.1474437713623047, -0.13978958129882812, -0.13213539123535156, -0.124481201171875, -0.11682701110839844, -0.10917282104492188, -0.10151863098144531, -0.09386444091796875, -0.08621025085449219, -0.07855606079101562, -0.07090187072753906, -0.0632476806640625, -0.05559349060058594, -0.047939300537109375, -0.04028511047363281, -0.03263092041015625, -0.024976730346679688, -0.017322540283203125, -0.009668350219726562, -0.00201416015625, 0.0056400299072265625, 0.013294219970703125, 0.020948410034179688, 0.02860260009765625, 0.03625679016113281, 0.043910980224609375, 0.05156517028808594, 0.0592193603515625, 0.06687355041503906, 0.07452774047851562, 0.08218193054199219, 0.08983612060546875, 0.09749031066894531, 0.10514450073242188, 0.11279869079589844, 0.120452880859375, 0.12810707092285156, 0.13576126098632812, 0.1434154510498047, 0.15106964111328125, 0.1587238311767578, 0.16637802124023438, 0.17403221130371094, 0.1816864013671875, 0.18934059143066406, 0.19699478149414062, 0.2046489715576172, 0.21230316162109375, 0.2199573516845703, 0.22761154174804688, 0.23526573181152344, 0.242919921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 5.0, 14.0, 22.0, 42.0, 61.0, 81.0, 117.0, 190.0, 250.0, 435.0, 703.0, 1128.0, 2485.0, 7198.0, 35315.0, 377298.0, 560090.0, 48357.0, 8575.0, 2820.0, 1367.0, 674.0, 420.0, 264.0, 191.0, 132.0, 87.0, 62.0, 49.0, 38.0, 18.0, 20.0, 7.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0380859375, -1.0066986083984375, -0.975311279296875, -0.9439239501953125, -0.91253662109375, -0.8811492919921875, -0.849761962890625, -0.8183746337890625, -0.7869873046875, -0.7555999755859375, -0.724212646484375, -0.6928253173828125, -0.66143798828125, -0.6300506591796875, -0.598663330078125, -0.5672760009765625, -0.535888671875, -0.5045013427734375, -0.473114013671875, -0.4417266845703125, -0.41033935546875, -0.3789520263671875, -0.347564697265625, -0.3161773681640625, -0.2847900390625, -0.2534027099609375, -0.222015380859375, -0.1906280517578125, -0.15924072265625, -0.1278533935546875, -0.096466064453125, -0.0650787353515625, -0.03369140625, -0.0023040771484375, 0.029083251953125, 0.0604705810546875, 0.09185791015625, 0.1232452392578125, 0.154632568359375, 0.1860198974609375, 0.2174072265625, 0.2487945556640625, 0.280181884765625, 0.3115692138671875, 0.34295654296875, 0.3743438720703125, 0.405731201171875, 0.4371185302734375, 0.468505859375, 0.4998931884765625, 0.531280517578125, 0.5626678466796875, 0.59405517578125, 0.6254425048828125, 0.656829833984375, 0.6882171630859375, 0.7196044921875, 0.7509918212890625, 0.782379150390625, 0.8137664794921875, 0.84515380859375, 0.8765411376953125, 0.907928466796875, 0.9393157958984375, 0.970703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 10.0, 15.0, 11.0, 15.0, 19.0, 25.0, 16.0, 27.0, 26.0, 40.0, 44.0, 39.0, 54.0, 50.0, 44.0, 49.0, 53.0, 31.0, 53.0, 44.0, 47.0, 39.0, 41.0, 28.0, 27.0, 23.0, 19.0, 16.0, 21.0, 15.0, 13.0, 8.0, 6.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.974609375, -0.94317626953125, -0.9117431640625, -0.88031005859375, -0.848876953125, -0.81744384765625, -0.7860107421875, -0.75457763671875, -0.72314453125, -0.69171142578125, -0.6602783203125, -0.62884521484375, -0.597412109375, -0.56597900390625, -0.5345458984375, -0.50311279296875, -0.4716796875, -0.44024658203125, -0.4088134765625, -0.37738037109375, -0.345947265625, -0.31451416015625, -0.2830810546875, -0.25164794921875, -0.22021484375, -0.18878173828125, -0.1573486328125, -0.12591552734375, -0.094482421875, -0.06304931640625, -0.0316162109375, -0.00018310546875, 0.03125, 0.06268310546875, 0.0941162109375, 0.12554931640625, 0.156982421875, 0.18841552734375, 0.2198486328125, 0.25128173828125, 0.28271484375, 0.31414794921875, 0.3455810546875, 0.37701416015625, 0.408447265625, 0.43988037109375, 0.4713134765625, 0.50274658203125, 0.5341796875, 0.56561279296875, 0.5970458984375, 0.62847900390625, 0.659912109375, 0.69134521484375, 0.7227783203125, 0.75421142578125, 0.78564453125, 0.81707763671875, 0.8485107421875, 0.87994384765625, 0.911376953125, 0.94281005859375, 0.9742431640625, 1.00567626953125, 1.037109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 5.0, 9.0, 9.0, 9.0, 18.0, 17.0, 41.0, 37.0, 59.0, 87.0, 110.0, 210.0, 337.0, 775.0, 1659.0, 4715.0, 20415.0, 231242.0, 724721.0, 50774.0, 8440.0, 2530.0, 999.0, 502.0, 286.0, 180.0, 116.0, 79.0, 41.0, 32.0, 22.0, 18.0, 15.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.449951171875, -0.4350624084472656, -0.42017364501953125, -0.4052848815917969, -0.3903961181640625, -0.3755073547363281, -0.36061859130859375, -0.3457298278808594, -0.330841064453125, -0.3159523010253906, -0.30106353759765625, -0.2861747741699219, -0.2712860107421875, -0.2563972473144531, -0.24150848388671875, -0.22661972045898438, -0.21173095703125, -0.19684219360351562, -0.18195343017578125, -0.16706466674804688, -0.1521759033203125, -0.13728713989257812, -0.12239837646484375, -0.10750961303710938, -0.092620849609375, -0.07773208618164062, -0.06284332275390625, -0.047954559326171875, -0.0330657958984375, -0.018177032470703125, -0.00328826904296875, 0.011600494384765625, 0.0264892578125, 0.041378021240234375, 0.05626678466796875, 0.07115554809570312, 0.0860443115234375, 0.10093307495117188, 0.11582183837890625, 0.13071060180664062, 0.145599365234375, 0.16048812866210938, 0.17537689208984375, 0.19026565551757812, 0.2051544189453125, 0.22004318237304688, 0.23493194580078125, 0.24982070922851562, 0.26470947265625, 0.2795982360839844, 0.29448699951171875, 0.3093757629394531, 0.3242645263671875, 0.3391532897949219, 0.35404205322265625, 0.3689308166503906, 0.383819580078125, 0.3987083435058594, 0.41359710693359375, 0.4284858703613281, 0.4433746337890625, 0.4582633972167969, 0.47315216064453125, 0.4880409240722656, 0.5029296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 14.0, 14.0, 21.0, 33.0, 46.0, 68.0, 90.0, 134.0, 176.0, 127.0, 73.0, 44.0, 44.0, 27.0, 13.0, 12.0, 18.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.423494338989258e-05, -9.020697325468063e-05, -8.617900311946869e-05, -8.215103298425674e-05, -7.81230628490448e-05, -7.409509271383286e-05, -7.006712257862091e-05, -6.603915244340897e-05, -6.201118230819702e-05, -5.798321217298508e-05, -5.395524203777313e-05, -4.992727190256119e-05, -4.589930176734924e-05, -4.18713316321373e-05, -3.7843361496925354e-05, -3.381539136171341e-05, -2.9787421226501465e-05, -2.575945109128952e-05, -2.1731480956077576e-05, -1.770351082086563e-05, -1.3675540685653687e-05, -9.647570550441742e-06, -5.619600415229797e-06, -1.5916302800178528e-06, 2.436339855194092e-06, 6.464309990406036e-06, 1.0492280125617981e-05, 1.4520250260829926e-05, 1.854822039604187e-05, 2.2576190531253815e-05, 2.660416066646576e-05, 3.0632130801677704e-05, 3.466010093688965e-05, 3.868807107210159e-05, 4.271604120731354e-05, 4.674401134252548e-05, 5.077198147773743e-05, 5.479995161294937e-05, 5.8827921748161316e-05, 6.285589188337326e-05, 6.68838620185852e-05, 7.091183215379715e-05, 7.49398022890091e-05, 7.896777242422104e-05, 8.299574255943298e-05, 8.702371269464493e-05, 9.105168282985687e-05, 9.507965296506882e-05, 9.910762310028076e-05, 0.0001031355932354927, 0.00010716356337070465, 0.0001111915335059166, 0.00011521950364112854, 0.00011924747377634048, 0.00012327544391155243, 0.00012730341404676437, 0.00013133138418197632, 0.00013535935431718826, 0.0001393873244524002, 0.00014341529458761215, 0.0001474432647228241, 0.00015147123485803604, 0.00015549920499324799, 0.00015952717512845993, 0.00016355514526367188]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 11.0, 6.0, 16.0, 15.0, 27.0, 40.0, 45.0, 74.0, 102.0, 168.0, 258.0, 493.0, 976.0, 2311.0, 7116.0, 36179.0, 542531.0, 416807.0, 30599.0, 6524.0, 2120.0, 924.0, 459.0, 233.0, 174.0, 108.0, 69.0, 52.0, 37.0, 22.0, 23.0, 7.0, 10.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4136810302734375, -0.399871826171875, -0.3860626220703125, -0.37225341796875, -0.3584442138671875, -0.344635009765625, -0.3308258056640625, -0.3170166015625, -0.3032073974609375, -0.289398193359375, -0.2755889892578125, -0.26177978515625, -0.2479705810546875, -0.234161376953125, -0.2203521728515625, -0.20654296875, -0.1927337646484375, -0.178924560546875, -0.1651153564453125, -0.15130615234375, -0.1374969482421875, -0.123687744140625, -0.1098785400390625, -0.0960693359375, -0.0822601318359375, -0.068450927734375, -0.0546417236328125, -0.04083251953125, -0.0270233154296875, -0.013214111328125, 0.0005950927734375, 0.014404296875, 0.0282135009765625, 0.042022705078125, 0.0558319091796875, 0.06964111328125, 0.0834503173828125, 0.097259521484375, 0.1110687255859375, 0.1248779296875, 0.1386871337890625, 0.152496337890625, 0.1663055419921875, 0.18011474609375, 0.1939239501953125, 0.207733154296875, 0.2215423583984375, 0.2353515625, 0.2491607666015625, 0.262969970703125, 0.2767791748046875, 0.29058837890625, 0.3043975830078125, 0.318206787109375, 0.3320159912109375, 0.3458251953125, 0.3596343994140625, 0.373443603515625, 0.3872528076171875, 0.40106201171875, 0.4148712158203125, 0.428680419921875, 0.4424896240234375, 0.456298828125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 8.0, 3.0, 8.0, 14.0, 15.0, 25.0, 35.0, 53.0, 66.0, 107.0, 96.0, 116.0, 109.0, 79.0, 79.0, 47.0, 37.0, 24.0, 19.0, 12.0, 9.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48974609375, -0.475921630859375, -0.46209716796875, -0.448272705078125, -0.4344482421875, -0.420623779296875, -0.40679931640625, -0.392974853515625, -0.379150390625, -0.365325927734375, -0.35150146484375, -0.337677001953125, -0.3238525390625, -0.310028076171875, -0.29620361328125, -0.282379150390625, -0.2685546875, -0.254730224609375, -0.24090576171875, -0.227081298828125, -0.2132568359375, -0.199432373046875, -0.18560791015625, -0.171783447265625, -0.157958984375, -0.144134521484375, -0.13031005859375, -0.116485595703125, -0.1026611328125, -0.088836669921875, -0.07501220703125, -0.061187744140625, -0.04736328125, -0.033538818359375, -0.01971435546875, -0.005889892578125, 0.0079345703125, 0.021759033203125, 0.03558349609375, 0.049407958984375, 0.063232421875, 0.077056884765625, 0.09088134765625, 0.104705810546875, 0.1185302734375, 0.132354736328125, 0.14617919921875, 0.160003662109375, 0.173828125, 0.187652587890625, 0.20147705078125, 0.215301513671875, 0.2291259765625, 0.242950439453125, 0.25677490234375, 0.270599365234375, 0.284423828125, 0.298248291015625, 0.31207275390625, 0.325897216796875, 0.3397216796875, 0.353546142578125, 0.36737060546875, 0.381195068359375, 0.39501953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 13.0, 39.0, 143.0, 399.0, 300.0, 80.0, 21.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.629871368408203, -14.041703224182129, -13.453536033630371, -12.865367889404297, -12.277200698852539, -11.689032554626465, -11.10086441040039, -10.512697219848633, -9.924530029296875, -9.3363618850708, -8.748194694519043, -8.160026550292969, -7.571859359741211, -6.983691215515137, -6.395523548126221, -5.807355880737305, -5.2191877365112305, -4.6310200691223145, -4.042852401733398, -3.4546844959259033, -2.8665168285369873, -2.2783491611480713, -1.6901812553405762, -1.1020135879516602, -0.5138459205627441, 0.07432180643081665, 0.6624895334243774, 1.250657320022583, 1.838824987411499, 2.426992654800415, 3.01516056060791, 3.603328227996826, 4.191495895385742, 4.779663562774658, 5.367831230163574, 5.955999374389648, 6.544166564941406, 7.1323347091674805, 7.7205023765563965, 8.308670043945312, 8.89683723449707, 9.485005378723145, 10.073172569274902, 10.661340713500977, 11.249507904052734, 11.837676048278809, 12.425844192504883, 13.01401138305664, 13.602179527282715, 14.190347671508789, 14.778514862060547, 15.366683006286621, 15.954850196838379, 16.543018341064453, 17.13118553161621, 17.71935272216797, 18.30752182006836, 18.895689010620117, 19.483858108520508, 20.072025299072266, 20.660192489624023, 21.24835968017578, 21.836528778076172, 22.42469596862793, 23.012863159179688]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 21.0, 17.0, 13.0, 17.0, 19.0, 33.0, 29.0, 27.0, 45.0, 39.0, 50.0, 51.0, 49.0, 52.0, 50.0, 47.0, 59.0, 38.0, 47.0, 35.0, 37.0, 29.0, 19.0, 24.0, 26.0, 18.0, 12.0, 15.0, 10.0, 13.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.276425838470459, -4.143445014953613, -4.010463714599609, -3.8774826526641846, -3.7445015907287598, -3.611520528793335, -3.47853946685791, -3.3455584049224854, -3.2125773429870605, -3.0795962810516357, -2.946615219116211, -2.813634157180786, -2.6806530952453613, -2.5476720333099365, -2.4146909713745117, -2.281709909439087, -2.148728847503662, -2.0157477855682373, -1.8827667236328125, -1.7497856616973877, -1.616804599761963, -1.483823537826538, -1.3508424758911133, -1.2178614139556885, -1.0848803520202637, -0.9518992900848389, -0.8189182281494141, -0.6859371662139893, -0.5529561042785645, -0.41997504234313965, -0.28699398040771484, -0.15401291847229004, -0.02103137969970703, 0.11194968223571777, 0.24493074417114258, 0.3779118061065674, 0.5108928680419922, 0.643873929977417, 0.7768549919128418, 0.9098360538482666, 1.0428171157836914, 1.1757981777191162, 1.308779239654541, 1.4417603015899658, 1.5747413635253906, 1.7077224254608154, 1.8407034873962402, 1.973684549331665, 2.10666561126709, 2.2396466732025146, 2.3726277351379395, 2.5056087970733643, 2.638589859008789, 2.771570920944214, 2.9045519828796387, 3.0375330448150635, 3.1705141067504883, 3.303495168685913, 3.436476230621338, 3.5694572925567627, 3.7024383544921875, 3.8354194164276123, 3.968400478363037, 4.101381301879883, 4.234362602233887]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 11.0, 6.0, 9.0, 6.0, 15.0, 12.0, 12.0, 27.0, 29.0, 46.0, 61.0, 94.0, 142.0, 206.0, 311.0, 552.0, 963.0, 1695.0, 2953.0, 5955.0, 12699.0, 34459.0, 149941.0, 2067632.0, 1722704.0, 135134.0, 33464.0, 12736.0, 5604.0, 2906.0, 1544.0, 877.0, 499.0, 325.0, 228.0, 153.0, 69.0, 61.0, 43.0, 29.0, 19.0, 15.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.43505859375, -0.4226188659667969, -0.41017913818359375, -0.3977394104003906, -0.3852996826171875, -0.3728599548339844, -0.36042022705078125, -0.3479804992675781, -0.335540771484375, -0.3231010437011719, -0.31066131591796875, -0.2982215881347656, -0.2857818603515625, -0.2733421325683594, -0.26090240478515625, -0.24846267700195312, -0.23602294921875, -0.22358322143554688, -0.21114349365234375, -0.19870376586914062, -0.1862640380859375, -0.17382431030273438, -0.16138458251953125, -0.14894485473632812, -0.136505126953125, -0.12406539916992188, -0.11162567138671875, -0.09918594360351562, -0.0867462158203125, -0.07430648803710938, -0.06186676025390625, -0.049427032470703125, -0.0369873046875, -0.024547576904296875, -0.01210784912109375, 0.000331878662109375, 0.0127716064453125, 0.025211334228515625, 0.03765106201171875, 0.050090789794921875, 0.062530517578125, 0.07497024536132812, 0.08740997314453125, 0.09984970092773438, 0.1122894287109375, 0.12472915649414062, 0.13716888427734375, 0.14960861206054688, 0.16204833984375, 0.17448806762695312, 0.18692779541015625, 0.19936752319335938, 0.2118072509765625, 0.22424697875976562, 0.23668670654296875, 0.24912643432617188, 0.261566162109375, 0.2740058898925781, 0.28644561767578125, 0.2988853454589844, 0.3113250732421875, 0.3237648010253906, 0.33620452880859375, 0.3486442565917969, 0.361083984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 4.0, 7.0, 15.0, 22.0, 28.0, 55.0, 65.0, 82.0, 95.0, 77.0, 101.0, 103.0, 90.0, 57.0, 63.0, 51.0, 28.0, 25.0, 11.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.5966796875, -0.5845756530761719, -0.5724716186523438, -0.5603675842285156, -0.5482635498046875, -0.5361595153808594, -0.5240554809570312, -0.5119514465332031, -0.499847412109375, -0.4877433776855469, -0.47563934326171875, -0.4635353088378906, -0.4514312744140625, -0.4393272399902344, -0.42722320556640625, -0.4151191711425781, -0.40301513671875, -0.3909111022949219, -0.37880706787109375, -0.3667030334472656, -0.3545989990234375, -0.3424949645996094, -0.33039093017578125, -0.3182868957519531, -0.306182861328125, -0.2940788269042969, -0.28197479248046875, -0.2698707580566406, -0.2577667236328125, -0.24566268920898438, -0.23355865478515625, -0.22145462036132812, -0.2093505859375, -0.19724655151367188, -0.18514251708984375, -0.17303848266601562, -0.1609344482421875, -0.14883041381835938, -0.13672637939453125, -0.12462234497070312, -0.112518310546875, -0.10041427612304688, -0.08831024169921875, -0.07620620727539062, -0.0641021728515625, -0.051998138427734375, -0.03989410400390625, -0.027790069580078125, -0.01568603515625, -0.003582000732421875, 0.00852203369140625, 0.020626068115234375, 0.0327301025390625, 0.044834136962890625, 0.05693817138671875, 0.06904220581054688, 0.081146240234375, 0.09325027465820312, 0.10535430908203125, 0.11745834350585938, 0.1295623779296875, 0.14166641235351562, 0.15377044677734375, 0.16587448120117188, 0.177978515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 7.0, 7.0, 10.0, 12.0, 27.0, 43.0, 41.0, 75.0, 113.0, 225.0, 466.0, 876.0, 1866.0, 4726.0, 13872.0, 53293.0, 449267.0, 3443797.0, 179175.0, 31229.0, 9025.0, 3225.0, 1351.0, 703.0, 314.0, 185.0, 104.0, 82.0, 38.0, 38.0, 20.0, 24.0, 17.0, 4.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6728591918945312, -0.6513824462890625, -0.6299057006835938, -0.608428955078125, -0.5869522094726562, -0.5654754638671875, -0.5439987182617188, -0.52252197265625, -0.5010452270507812, -0.4795684814453125, -0.45809173583984375, -0.436614990234375, -0.41513824462890625, -0.3936614990234375, -0.37218475341796875, -0.3507080078125, -0.32923126220703125, -0.3077545166015625, -0.28627777099609375, -0.264801025390625, -0.24332427978515625, -0.2218475341796875, -0.20037078857421875, -0.17889404296875, -0.15741729736328125, -0.1359405517578125, -0.11446380615234375, -0.092987060546875, -0.07151031494140625, -0.0500335693359375, -0.02855682373046875, -0.007080078125, 0.01439666748046875, 0.0358734130859375, 0.05735015869140625, 0.078826904296875, 0.10030364990234375, 0.1217803955078125, 0.14325714111328125, 0.16473388671875, 0.18621063232421875, 0.2076873779296875, 0.22916412353515625, 0.250640869140625, 0.27211761474609375, 0.2935943603515625, 0.31507110595703125, 0.3365478515625, 0.35802459716796875, 0.3795013427734375, 0.40097808837890625, 0.422454833984375, 0.44393157958984375, 0.4654083251953125, 0.48688507080078125, 0.50836181640625, 0.5298385620117188, 0.5513153076171875, 0.5727920532226562, 0.594268798828125, 0.6157455444335938, 0.6372222900390625, 0.6586990356445312, 0.68017578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 9.0, 18.0, 16.0, 25.0, 24.0, 53.0, 47.0, 78.0, 113.0, 137.0, 295.0, 615.0, 1070.0, 717.0, 353.0, 164.0, 100.0, 60.0, 41.0, 26.0, 22.0, 15.0, 11.0, 16.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7373046875, -0.7152328491210938, -0.6931610107421875, -0.6710891723632812, -0.649017333984375, -0.6269454956054688, -0.6048736572265625, -0.5828018188476562, -0.56072998046875, -0.5386581420898438, -0.5165863037109375, -0.49451446533203125, -0.472442626953125, -0.45037078857421875, -0.4282989501953125, -0.40622711181640625, -0.3841552734375, -0.36208343505859375, -0.3400115966796875, -0.31793975830078125, -0.295867919921875, -0.27379608154296875, -0.2517242431640625, -0.22965240478515625, -0.20758056640625, -0.18550872802734375, -0.1634368896484375, -0.14136505126953125, -0.119293212890625, -0.09722137451171875, -0.0751495361328125, -0.05307769775390625, -0.031005859375, -0.00893402099609375, 0.0131378173828125, 0.03520965576171875, 0.057281494140625, 0.07935333251953125, 0.1014251708984375, 0.12349700927734375, 0.14556884765625, 0.16764068603515625, 0.1897125244140625, 0.21178436279296875, 0.233856201171875, 0.25592803955078125, 0.2779998779296875, 0.30007171630859375, 0.3221435546875, 0.34421539306640625, 0.3662872314453125, 0.38835906982421875, 0.410430908203125, 0.43250274658203125, 0.4545745849609375, 0.47664642333984375, 0.49871826171875, 0.5207901000976562, 0.5428619384765625, 0.5649337768554688, 0.587005615234375, 0.6090774536132812, 0.6311492919921875, 0.6532211303710938, 0.67529296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 24.0, 45.0, 119.0, 287.0, 295.0, 162.0, 46.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.010629653930664, -9.642141342163086, -9.273652076721191, -8.905163764953613, -8.536675453186035, -8.16818618774414, -7.7996978759765625, -7.431209564208984, -7.062720775604248, -6.694231986999512, -6.325743675231934, -5.957254886627197, -5.588766098022461, -5.220277786254883, -4.8517889976501465, -4.48330020904541, -4.114811897277832, -3.746323347091675, -3.3778347969055176, -3.0093460083007812, -2.640857458114624, -2.272368907928467, -1.9038801193237305, -1.5353915691375732, -1.166903018951416, -0.798414409160614, -0.429925799369812, -0.061437129974365234, 0.307051420211792, 0.6755399703979492, 1.0440287590026855, 1.4125173091888428, 1.781005859375, 2.1494944095611572, 2.5179829597473145, 2.886471748352051, 3.254960298538208, 3.6234488487243652, 3.9919376373291016, 4.36042594909668, 4.728914737701416, 5.097403526306152, 5.4658918380737305, 5.834380626678467, 6.202869415283203, 6.571357727050781, 6.939846515655518, 7.308335304260254, 7.676823616027832, 8.04531192779541, 8.413801193237305, 8.782289505004883, 9.150777816772461, 9.519266128540039, 9.887755393981934, 10.256243705749512, 10.624732971191406, 10.993221282958984, 11.361710548400879, 11.730198860168457, 12.098687171936035, 12.46717643737793, 12.835664749145508, 13.204153060913086, 13.572641372680664]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 10.0, 9.0, 12.0, 11.0, 16.0, 31.0, 35.0, 44.0, 45.0, 49.0, 58.0, 60.0, 64.0, 62.0, 67.0, 50.0, 57.0, 44.0, 40.0, 51.0, 40.0, 35.0, 26.0, 15.0, 19.0, 14.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513559341430664, -3.3802833557128906, -3.247007369995117, -3.1137313842773438, -2.9804553985595703, -2.847179412841797, -2.7139036655426025, -2.580627679824829, -2.4473516941070557, -2.3140757083892822, -2.180799722671509, -2.0475237369537354, -1.9142478704452515, -1.780971884727478, -1.6476960182189941, -1.5144200325012207, -1.3811440467834473, -1.2478680610656738, -1.1145920753479004, -0.9813162088394165, -0.8480402231216431, -0.7147642374038696, -0.581488311290741, -0.4482123851776123, -0.31493639945983887, -0.18166044354438782, -0.04838448762893677, 0.08489146828651428, 0.21816742420196533, 0.35144340991973877, 0.48471933603286743, 0.6179952621459961, 0.7512707710266113, 0.8845467567443848, 1.0178227424621582, 1.151098608970642, 1.2843745946884155, 1.417650580406189, 1.5509264469146729, 1.6842024326324463, 1.8174784183502197, 1.9507544040679932, 2.0840303897857666, 2.21730637550354, 2.3505821228027344, 2.483858108520508, 2.6171340942382812, 2.7504100799560547, 2.883686065673828, 3.0169620513916016, 3.150238037109375, 3.2835140228271484, 3.416790008544922, 3.5500659942626953, 3.6833417415618896, 3.816617727279663, 3.9498937129974365, 4.083169460296631, 4.216445446014404, 4.349721431732178, 4.482997417449951, 4.616273403167725, 4.749549388885498, 4.8828253746032715, 5.016101360321045]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 15.0, 21.0, 31.0, 55.0, 113.0, 163.0, 358.0, 731.0, 1732.0, 4244.0, 12245.0, 45587.0, 285128.0, 588577.0, 80181.0, 19118.0, 5972.0, 2303.0, 963.0, 463.0, 228.0, 115.0, 68.0, 35.0, 29.0, 15.0, 13.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.60693359375, -0.5818328857421875, -0.556732177734375, -0.5316314697265625, -0.50653076171875, -0.4814300537109375, -0.456329345703125, -0.4312286376953125, -0.4061279296875, -0.3810272216796875, -0.355926513671875, -0.3308258056640625, -0.30572509765625, -0.2806243896484375, -0.255523681640625, -0.2304229736328125, -0.205322265625, -0.1802215576171875, -0.155120849609375, -0.1300201416015625, -0.10491943359375, -0.0798187255859375, -0.054718017578125, -0.0296173095703125, -0.0045166015625, 0.0205841064453125, 0.045684814453125, 0.0707855224609375, 0.09588623046875, 0.1209869384765625, 0.146087646484375, 0.1711883544921875, 0.1962890625, 0.2213897705078125, 0.246490478515625, 0.2715911865234375, 0.29669189453125, 0.3217926025390625, 0.346893310546875, 0.3719940185546875, 0.3970947265625, 0.4221954345703125, 0.447296142578125, 0.4723968505859375, 0.49749755859375, 0.5225982666015625, 0.547698974609375, 0.5727996826171875, 0.597900390625, 0.6230010986328125, 0.648101806640625, 0.6732025146484375, 0.69830322265625, 0.7234039306640625, 0.748504638671875, 0.7736053466796875, 0.7987060546875, 0.8238067626953125, 0.848907470703125, 0.8740081787109375, 0.89910888671875, 0.9242095947265625, 0.949310302734375, 0.9744110107421875, 0.99951171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 3.0, 11.0, 9.0, 4.0, 28.0, 25.0, 24.0, 35.0, 38.0, 53.0, 62.0, 75.0, 62.0, 66.0, 71.0, 67.0, 56.0, 61.0, 51.0, 32.0, 40.0, 34.0, 20.0, 22.0, 18.0, 10.0, 4.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.365478515625, -0.3565330505371094, -0.34758758544921875, -0.3386421203613281, -0.3296966552734375, -0.3207511901855469, -0.31180572509765625, -0.3028602600097656, -0.293914794921875, -0.2849693298339844, -0.27602386474609375, -0.2670783996582031, -0.2581329345703125, -0.24918746948242188, -0.24024200439453125, -0.23129653930664062, -0.22235107421875, -0.21340560913085938, -0.20446014404296875, -0.19551467895507812, -0.1865692138671875, -0.17762374877929688, -0.16867828369140625, -0.15973281860351562, -0.150787353515625, -0.14184188842773438, -0.13289642333984375, -0.12395095825195312, -0.1150054931640625, -0.10606002807617188, -0.09711456298828125, -0.08816909790039062, -0.0792236328125, -0.07027816772460938, -0.06133270263671875, -0.052387237548828125, -0.0434417724609375, -0.034496307373046875, -0.02555084228515625, -0.016605377197265625, -0.007659912109375, 0.001285552978515625, 0.01023101806640625, 0.019176483154296875, 0.0281219482421875, 0.037067413330078125, 0.04601287841796875, 0.054958343505859375, 0.06390380859375, 0.07284927368164062, 0.08179473876953125, 0.09074020385742188, 0.0996856689453125, 0.10863113403320312, 0.11757659912109375, 0.12652206420898438, 0.135467529296875, 0.14441299438476562, 0.15335845947265625, 0.16230392456054688, 0.1712493896484375, 0.18019485473632812, 0.18914031982421875, 0.19808578491210938, 0.20703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 17.0, 6.0, 14.0, 22.0, 29.0, 36.0, 53.0, 67.0, 113.0, 163.0, 260.0, 410.0, 775.0, 1710.0, 4584.0, 19113.0, 258453.0, 720479.0, 31742.0, 6153.0, 2064.0, 910.0, 471.0, 288.0, 190.0, 142.0, 92.0, 65.0, 30.0, 26.0, 15.0, 16.0, 11.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.03179931640625, -0.9923095703125, -0.95281982421875, -0.913330078125, -0.87384033203125, -0.8343505859375, -0.79486083984375, -0.75537109375, -0.71588134765625, -0.6763916015625, -0.63690185546875, -0.597412109375, -0.55792236328125, -0.5184326171875, -0.47894287109375, -0.439453125, -0.39996337890625, -0.3604736328125, -0.32098388671875, -0.281494140625, -0.24200439453125, -0.2025146484375, -0.16302490234375, -0.12353515625, -0.08404541015625, -0.0445556640625, -0.00506591796875, 0.034423828125, 0.07391357421875, 0.1134033203125, 0.15289306640625, 0.1923828125, 0.23187255859375, 0.2713623046875, 0.31085205078125, 0.350341796875, 0.38983154296875, 0.4293212890625, 0.46881103515625, 0.50830078125, 0.54779052734375, 0.5872802734375, 0.62677001953125, 0.666259765625, 0.70574951171875, 0.7452392578125, 0.78472900390625, 0.82421875, 0.86370849609375, 0.9031982421875, 0.94268798828125, 0.982177734375, 1.02166748046875, 1.0611572265625, 1.10064697265625, 1.14013671875, 1.17962646484375, 1.2191162109375, 1.25860595703125, 1.298095703125, 1.33758544921875, 1.3770751953125, 1.41656494140625, 1.4560546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 7.0, 10.0, 11.0, 13.0, 20.0, 20.0, 33.0, 36.0, 31.0, 51.0, 39.0, 46.0, 53.0, 41.0, 52.0, 61.0, 48.0, 50.0, 47.0, 54.0, 39.0, 29.0, 32.0, 30.0, 21.0, 22.0, 10.0, 10.0, 14.0, 10.0, 11.0, 10.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.982421875, -0.949920654296875, -0.91741943359375, -0.884918212890625, -0.8524169921875, -0.819915771484375, -0.78741455078125, -0.754913330078125, -0.722412109375, -0.689910888671875, -0.65740966796875, -0.624908447265625, -0.5924072265625, -0.559906005859375, -0.52740478515625, -0.494903564453125, -0.46240234375, -0.429901123046875, -0.39739990234375, -0.364898681640625, -0.3323974609375, -0.299896240234375, -0.26739501953125, -0.234893798828125, -0.202392578125, -0.169891357421875, -0.13739013671875, -0.104888916015625, -0.0723876953125, -0.039886474609375, -0.00738525390625, 0.025115966796875, 0.0576171875, 0.090118408203125, 0.12261962890625, 0.155120849609375, 0.1876220703125, 0.220123291015625, 0.25262451171875, 0.285125732421875, 0.317626953125, 0.350128173828125, 0.38262939453125, 0.415130615234375, 0.4476318359375, 0.480133056640625, 0.51263427734375, 0.545135498046875, 0.57763671875, 0.610137939453125, 0.64263916015625, 0.675140380859375, 0.7076416015625, 0.740142822265625, 0.77264404296875, 0.805145263671875, 0.837646484375, 0.870147705078125, 0.90264892578125, 0.935150146484375, 0.9676513671875, 1.000152587890625, 1.03265380859375, 1.065155029296875, 1.09765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 6.0, 10.0, 18.0, 34.0, 43.0, 74.0, 73.0, 176.0, 310.0, 607.0, 1566.0, 4492.0, 19866.0, 203253.0, 755706.0, 49621.0, 8347.0, 2442.0, 876.0, 393.0, 225.0, 139.0, 91.0, 59.0, 34.0, 19.0, 19.0, 10.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.425537109375, -0.4123344421386719, -0.39913177490234375, -0.3859291076660156, -0.3727264404296875, -0.3595237731933594, -0.34632110595703125, -0.3331184387207031, -0.319915771484375, -0.3067131042480469, -0.29351043701171875, -0.2803077697753906, -0.2671051025390625, -0.2539024353027344, -0.24069976806640625, -0.22749710083007812, -0.21429443359375, -0.20109176635742188, -0.18788909912109375, -0.17468643188476562, -0.1614837646484375, -0.14828109741210938, -0.13507843017578125, -0.12187576293945312, -0.108673095703125, -0.09547042846679688, -0.08226776123046875, -0.06906509399414062, -0.0558624267578125, -0.042659759521484375, -0.02945709228515625, -0.016254425048828125, -0.0030517578125, 0.010150909423828125, 0.02335357666015625, 0.036556243896484375, 0.0497589111328125, 0.06296157836914062, 0.07616424560546875, 0.08936691284179688, 0.102569580078125, 0.11577224731445312, 0.12897491455078125, 0.14217758178710938, 0.1553802490234375, 0.16858291625976562, 0.18178558349609375, 0.19498825073242188, 0.20819091796875, 0.22139358520507812, 0.23459625244140625, 0.24779891967773438, 0.2610015869140625, 0.2742042541503906, 0.28740692138671875, 0.3006095886230469, 0.313812255859375, 0.3270149230957031, 0.34021759033203125, 0.3534202575683594, 0.3666229248046875, 0.3798255920410156, 0.39302825927734375, 0.4062309265136719, 0.41943359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 14.0, 20.0, 16.0, 29.0, 38.0, 61.0, 97.0, 149.0, 164.0, 136.0, 66.0, 60.0, 35.0, 26.0, 14.0, 12.0, 11.0, 7.0, 2.0, 7.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001131296157836914, -0.00011009536683559418, -0.00010706111788749695, -0.00010402686893939972, -0.00010099261999130249, -9.795837104320526e-05, -9.492412209510803e-05, -9.18898731470108e-05, -8.885562419891357e-05, -8.582137525081635e-05, -8.278712630271912e-05, -7.975287735462189e-05, -7.671862840652466e-05, -7.368437945842743e-05, -7.06501305103302e-05, -6.761588156223297e-05, -6.458163261413574e-05, -6.154738366603851e-05, -5.8513134717941284e-05, -5.5478885769844055e-05, -5.2444636821746826e-05, -4.94103878736496e-05, -4.637613892555237e-05, -4.334188997745514e-05, -4.030764102935791e-05, -3.727339208126068e-05, -3.423914313316345e-05, -3.120489418506622e-05, -2.8170645236968994e-05, -2.5136396288871765e-05, -2.2102147340774536e-05, -1.9067898392677307e-05, -1.6033649444580078e-05, -1.2999400496482849e-05, -9.96515154838562e-06, -6.930902600288391e-06, -3.896653652191162e-06, -8.624047040939331e-07, 2.171844244003296e-06, 5.206093192100525e-06, 8.240342140197754e-06, 1.1274591088294983e-05, 1.4308840036392212e-05, 1.734308898448944e-05, 2.037733793258667e-05, 2.34115868806839e-05, 2.6445835828781128e-05, 2.9480084776878357e-05, 3.2514333724975586e-05, 3.5548582673072815e-05, 3.8582831621170044e-05, 4.161708056926727e-05, 4.46513295173645e-05, 4.768557846546173e-05, 5.071982741355896e-05, 5.375407636165619e-05, 5.678832530975342e-05, 5.982257425785065e-05, 6.285682320594788e-05, 6.58910721540451e-05, 6.892532110214233e-05, 7.195957005023956e-05, 7.499381899833679e-05, 7.802806794643402e-05, 8.106231689453125e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 10.0, 10.0, 8.0, 11.0, 34.0, 28.0, 42.0, 73.0, 95.0, 125.0, 190.0, 330.0, 545.0, 1017.0, 2182.0, 5759.0, 24874.0, 228758.0, 704347.0, 62658.0, 10870.0, 3288.0, 1476.0, 684.0, 402.0, 238.0, 140.0, 98.0, 65.0, 54.0, 35.0, 32.0, 17.0, 11.0, 10.0, 7.0, 4.0, 10.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.31562042236328125, -0.3048248291015625, -0.29402923583984375, -0.283233642578125, -0.27243804931640625, -0.2616424560546875, -0.25084686279296875, -0.24005126953125, -0.22925567626953125, -0.2184600830078125, -0.20766448974609375, -0.196868896484375, -0.18607330322265625, -0.1752777099609375, -0.16448211669921875, -0.1536865234375, -0.14289093017578125, -0.1320953369140625, -0.12129974365234375, -0.110504150390625, -0.09970855712890625, -0.0889129638671875, -0.07811737060546875, -0.06732177734375, -0.05652618408203125, -0.0457305908203125, -0.03493499755859375, -0.024139404296875, -0.01334381103515625, -0.0025482177734375, 0.00824737548828125, 0.01904296875, 0.02983856201171875, 0.0406341552734375, 0.05142974853515625, 0.062225341796875, 0.07302093505859375, 0.0838165283203125, 0.09461212158203125, 0.10540771484375, 0.11620330810546875, 0.1269989013671875, 0.13779449462890625, 0.148590087890625, 0.15938568115234375, 0.1701812744140625, 0.18097686767578125, 0.1917724609375, 0.20256805419921875, 0.2133636474609375, 0.22415924072265625, 0.234954833984375, 0.24575042724609375, 0.2565460205078125, 0.26734161376953125, 0.27813720703125, 0.28893280029296875, 0.2997283935546875, 0.31052398681640625, 0.321319580078125, 0.33211517333984375, 0.3429107666015625, 0.35370635986328125, 0.364501953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 4.0, 6.0, 5.0, 8.0, 11.0, 10.0, 20.0, 15.0, 17.0, 23.0, 42.0, 40.0, 44.0, 53.0, 59.0, 76.0, 76.0, 81.0, 83.0, 50.0, 39.0, 40.0, 36.0, 33.0, 22.0, 28.0, 16.0, 8.0, 9.0, 7.0, 2.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28076171875, -0.2729034423828125, -0.265045166015625, -0.2571868896484375, -0.24932861328125, -0.2414703369140625, -0.233612060546875, -0.2257537841796875, -0.2178955078125, -0.2100372314453125, -0.202178955078125, -0.1943206787109375, -0.18646240234375, -0.1786041259765625, -0.170745849609375, -0.1628875732421875, -0.155029296875, -0.1471710205078125, -0.139312744140625, -0.1314544677734375, -0.12359619140625, -0.1157379150390625, -0.107879638671875, -0.1000213623046875, -0.0921630859375, -0.0843048095703125, -0.076446533203125, -0.0685882568359375, -0.06072998046875, -0.0528717041015625, -0.045013427734375, -0.0371551513671875, -0.029296875, -0.0214385986328125, -0.013580322265625, -0.0057220458984375, 0.00213623046875, 0.0099945068359375, 0.017852783203125, 0.0257110595703125, 0.0335693359375, 0.0414276123046875, 0.049285888671875, 0.0571441650390625, 0.06500244140625, 0.0728607177734375, 0.080718994140625, 0.0885772705078125, 0.096435546875, 0.1042938232421875, 0.112152099609375, 0.1200103759765625, 0.12786865234375, 0.1357269287109375, 0.143585205078125, 0.1514434814453125, 0.1593017578125, 0.1671600341796875, 0.175018310546875, 0.1828765869140625, 0.19073486328125, 0.1985931396484375, 0.206451416015625, 0.2143096923828125, 0.22216796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 11.0, 23.0, 59.0, 108.0, 201.0, 241.0, 173.0, 97.0, 44.0, 15.0, 8.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.356454849243164, -10.087518692016602, -9.818582534790039, -9.549646377563477, -9.280710220336914, -9.011774063110352, -8.742837905883789, -8.473901748657227, -8.204965591430664, -7.936029434204102, -7.667093276977539, -7.398157119750977, -7.129220962524414, -6.860284805297852, -6.591349124908447, -6.322412967681885, -6.0534772872924805, -5.784541130065918, -5.5156049728393555, -5.246668815612793, -4.9777326583862305, -4.708796501159668, -4.439860820770264, -4.170924663543701, -3.9019885063171387, -3.633052349090576, -3.3641161918640137, -3.0951802730560303, -2.8262441158294678, -2.5573079586029053, -2.288372039794922, -2.0194358825683594, -1.7505006790161133, -1.4815645217895508, -1.2126284837722778, -0.9436923861503601, -0.6747562885284424, -0.4058201313018799, -0.13688409328460693, 0.13205194473266602, 0.4009881019592285, 0.6699241995811462, 0.938860297203064, 1.207796335220337, 1.4767324924468994, 1.745668649673462, 2.0146045684814453, 2.283540725708008, 2.5524768829345703, 2.821413040161133, 3.0903491973876953, 3.3592851161956787, 3.628221273422241, 3.8971574306488037, 4.166093349456787, 4.43502950668335, 4.703965663909912, 4.972901821136475, 5.241837978363037, 5.5107741355896, 5.779709815979004, 6.048645973205566, 6.317582130432129, 6.586518287658691, 6.855454444885254]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 12.0, 13.0, 8.0, 12.0, 22.0, 13.0, 17.0, 27.0, 29.0, 24.0, 36.0, 39.0, 54.0, 51.0, 68.0, 71.0, 73.0, 67.0, 49.0, 46.0, 44.0, 26.0, 31.0, 31.0, 31.0, 19.0, 19.0, 11.0, 14.0, 11.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.709228277206421, -3.574207067489624, -3.439185857772827, -3.3041646480560303, -3.1691434383392334, -3.0341222286224365, -2.8991007804870605, -2.7640795707702637, -2.629058361053467, -2.49403715133667, -2.359015941619873, -2.223994731903076, -2.0889735221862793, -1.9539523124694824, -1.818930983543396, -1.6839097738265991, -1.5488886833190918, -1.413867473602295, -1.278846263885498, -1.1438250541687012, -1.0088038444519043, -0.8737825751304626, -0.738761305809021, -0.6037400960922241, -0.46871888637542725, -0.33369767665863037, -0.1986764371395111, -0.06365519762039185, 0.07136601209640503, 0.2063872218132019, 0.34140849113464355, 0.47642970085144043, 0.6114506721496582, 0.7464718818664551, 0.881493091583252, 1.0165143013000488, 1.1515355110168457, 1.2865567207336426, 1.421578049659729, 1.5565992593765259, 1.6916204690933228, 1.8266416788101196, 1.9616628885269165, 2.096684217453003, 2.2317054271698, 2.3667266368865967, 2.5017478466033936, 2.6367690563201904, 2.7717902660369873, 2.906811475753784, 3.041832685470581, 3.176853895187378, 3.311875104904175, 3.4468963146209717, 3.5819177627563477, 3.7169389724731445, 3.8519601821899414, 3.9869813919067383, 4.122002601623535, 4.257023811340332, 4.392045021057129, 4.527066230773926, 4.662087440490723, 4.7971086502075195, 4.932129859924316]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 18.0, 13.0, 24.0, 42.0, 51.0, 72.0, 123.0, 226.0, 778.0, 7441.0, 2378182.0, 1798728.0, 7054.0, 856.0, 265.0, 130.0, 65.0, 69.0, 42.0, 19.0, 19.0, 10.0, 12.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6281280517578125, -1.575592041015625, -1.5230560302734375, -1.47052001953125, -1.4179840087890625, -1.365447998046875, -1.3129119873046875, -1.2603759765625, -1.2078399658203125, -1.155303955078125, -1.1027679443359375, -1.05023193359375, -0.9976959228515625, -0.945159912109375, -0.8926239013671875, -0.840087890625, -0.7875518798828125, -0.735015869140625, -0.6824798583984375, -0.62994384765625, -0.5774078369140625, -0.524871826171875, -0.4723358154296875, -0.4197998046875, -0.3672637939453125, -0.314727783203125, -0.2621917724609375, -0.20965576171875, -0.1571197509765625, -0.104583740234375, -0.0520477294921875, 0.00048828125, 0.0530242919921875, 0.105560302734375, 0.1580963134765625, 0.21063232421875, 0.2631683349609375, 0.315704345703125, 0.3682403564453125, 0.4207763671875, 0.4733123779296875, 0.525848388671875, 0.5783843994140625, 0.63092041015625, 0.6834564208984375, 0.735992431640625, 0.7885284423828125, 0.841064453125, 0.8936004638671875, 0.946136474609375, 0.9986724853515625, 1.05120849609375, 1.1037445068359375, 1.156280517578125, 1.2088165283203125, 1.2613525390625, 1.3138885498046875, 1.366424560546875, 1.4189605712890625, 1.47149658203125, 1.5240325927734375, 1.576568603515625, 1.6291046142578125, 1.681640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 8.0, 12.0, 14.0, 17.0, 27.0, 32.0, 46.0, 59.0, 49.0, 60.0, 58.0, 67.0, 66.0, 61.0, 74.0, 55.0, 53.0, 50.0, 36.0, 33.0, 27.0, 28.0, 18.0, 11.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217529296875, -0.20933151245117188, -0.20113372802734375, -0.19293594360351562, -0.1847381591796875, -0.17654037475585938, -0.16834259033203125, -0.16014480590820312, -0.151947021484375, -0.14374923706054688, -0.13555145263671875, -0.12735366821289062, -0.1191558837890625, -0.11095809936523438, -0.10276031494140625, -0.09456253051757812, -0.08636474609375, -0.07816696166992188, -0.06996917724609375, -0.061771392822265625, -0.0535736083984375, -0.045375823974609375, -0.03717803955078125, -0.028980255126953125, -0.020782470703125, -0.012584686279296875, -0.00438690185546875, 0.003810882568359375, 0.0120086669921875, 0.020206451416015625, 0.02840423583984375, 0.036602020263671875, 0.0447998046875, 0.052997589111328125, 0.06119537353515625, 0.06939315795898438, 0.0775909423828125, 0.08578872680664062, 0.09398651123046875, 0.10218429565429688, 0.110382080078125, 0.11857986450195312, 0.12677764892578125, 0.13497543334960938, 0.1431732177734375, 0.15137100219726562, 0.15956878662109375, 0.16776657104492188, 0.17596435546875, 0.18416213989257812, 0.19235992431640625, 0.20055770874023438, 0.2087554931640625, 0.21695327758789062, 0.22515106201171875, 0.23334884643554688, 0.241546630859375, 0.24974441528320312, 0.25794219970703125, 0.2661399841308594, 0.2743377685546875, 0.2825355529785156, 0.29073333740234375, 0.2989311218261719, 0.30712890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 4.0, 14.0, 13.0, 30.0, 22.0, 29.0, 51.0, 99.0, 165.0, 293.0, 608.0, 1219.0, 2736.0, 6349.0, 15554.0, 43774.0, 189702.0, 2945377.0, 850390.0, 92443.0, 26969.0, 10156.0, 4333.0, 1910.0, 921.0, 462.0, 237.0, 150.0, 88.0, 53.0, 36.0, 22.0, 15.0, 9.0, 7.0, 12.0, 6.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5046310424804688, -0.4887542724609375, -0.47287750244140625, -0.457000732421875, -0.44112396240234375, -0.4252471923828125, -0.40937042236328125, -0.39349365234375, -0.37761688232421875, -0.3617401123046875, -0.34586334228515625, -0.329986572265625, -0.31410980224609375, -0.2982330322265625, -0.28235626220703125, -0.2664794921875, -0.25060272216796875, -0.2347259521484375, -0.21884918212890625, -0.202972412109375, -0.18709564208984375, -0.1712188720703125, -0.15534210205078125, -0.13946533203125, -0.12358856201171875, -0.1077117919921875, -0.09183502197265625, -0.075958251953125, -0.06008148193359375, -0.0442047119140625, -0.02832794189453125, -0.012451171875, 0.00342559814453125, 0.0193023681640625, 0.03517913818359375, 0.051055908203125, 0.06693267822265625, 0.0828094482421875, 0.09868621826171875, 0.11456298828125, 0.13043975830078125, 0.1463165283203125, 0.16219329833984375, 0.178070068359375, 0.19394683837890625, 0.2098236083984375, 0.22570037841796875, 0.2415771484375, 0.25745391845703125, 0.2733306884765625, 0.28920745849609375, 0.305084228515625, 0.32096099853515625, 0.3368377685546875, 0.35271453857421875, 0.36859130859375, 0.38446807861328125, 0.4003448486328125, 0.41622161865234375, 0.432098388671875, 0.44797515869140625, 0.4638519287109375, 0.47972869873046875, 0.49560546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 6.0, 7.0, 9.0, 10.0, 20.0, 24.0, 24.0, 28.0, 43.0, 75.0, 108.0, 164.0, 314.0, 630.0, 993.0, 686.0, 319.0, 191.0, 106.0, 85.0, 52.0, 34.0, 27.0, 17.0, 16.0, 16.0, 6.0, 9.0, 7.0, 4.0, 9.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5419082641601562, -0.5247344970703125, -0.5075607299804688, -0.490386962890625, -0.47321319580078125, -0.4560394287109375, -0.43886566162109375, -0.42169189453125, -0.40451812744140625, -0.3873443603515625, -0.37017059326171875, -0.352996826171875, -0.33582305908203125, -0.3186492919921875, -0.30147552490234375, -0.2843017578125, -0.26712799072265625, -0.2499542236328125, -0.23278045654296875, -0.215606689453125, -0.19843292236328125, -0.1812591552734375, -0.16408538818359375, -0.14691162109375, -0.12973785400390625, -0.1125640869140625, -0.09539031982421875, -0.078216552734375, -0.06104278564453125, -0.0438690185546875, -0.02669525146484375, -0.009521484375, 0.00765228271484375, 0.0248260498046875, 0.04199981689453125, 0.059173583984375, 0.07634735107421875, 0.0935211181640625, 0.11069488525390625, 0.12786865234375, 0.14504241943359375, 0.1622161865234375, 0.17938995361328125, 0.196563720703125, 0.21373748779296875, 0.2309112548828125, 0.24808502197265625, 0.2652587890625, 0.28243255615234375, 0.2996063232421875, 0.31678009033203125, 0.333953857421875, 0.35112762451171875, 0.3683013916015625, 0.38547515869140625, 0.40264892578125, 0.41982269287109375, 0.4369964599609375, 0.45417022705078125, 0.471343994140625, 0.48851776123046875, 0.5056915283203125, 0.5228652954101562, 0.5400390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 13.0, 18.0, 54.0, 129.0, 260.0, 243.0, 162.0, 54.0, 28.0, 10.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.792000770568848, -7.556621551513672, -7.321242809295654, -7.0858635902404785, -6.850484371185303, -6.615105628967285, -6.379726409912109, -6.144347190856934, -5.908967971801758, -5.673588752746582, -5.4382100105285645, -5.202830791473389, -4.967451572418213, -4.732072830200195, -4.4966936111450195, -4.261314392089844, -4.025935649871826, -3.7905566692352295, -3.5551774501800537, -3.319798469543457, -3.0844192504882812, -2.8490402698516846, -2.613661289215088, -2.378282070159912, -2.1429030895233154, -1.9075239896774292, -1.672144889831543, -1.4367659091949463, -1.20138680934906, -0.9660077095031738, -0.7306287288665771, -0.4952496290206909, -0.2598705291748047, -0.024491459131240845, 0.210887610912323, 0.44626665115356445, 0.6816457509994507, 0.9170248508453369, 1.1524038314819336, 1.3877829313278198, 1.623162031173706, 1.8585411310195923, 2.0939202308654785, 2.329299211502075, 2.564678192138672, 2.8000574111938477, 3.0354363918304443, 3.270815372467041, 3.506194591522217, 3.7415735721588135, 3.9769527912139893, 4.212331771850586, 4.447710990905762, 4.6830902099609375, 4.918468952178955, 5.153848171234131, 5.389226913452148, 5.624606132507324, 5.859984874725342, 6.095364093780518, 6.330743312835693, 6.566122055053711, 6.801501274108887, 7.0368804931640625, 7.272259712219238]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 4.0, 6.0, 12.0, 11.0, 10.0, 11.0, 5.0, 11.0, 22.0, 21.0, 30.0, 22.0, 26.0, 36.0, 36.0, 29.0, 32.0, 37.0, 40.0, 44.0, 46.0, 37.0, 41.0, 40.0, 40.0, 31.0, 41.0, 31.0, 29.0, 30.0, 19.0, 22.0, 26.0, 17.0, 14.0, 8.0, 16.0, 8.0, 9.0, 2.0, 6.0, 9.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.027822256088257, -1.9634045362472534, -1.89898681640625, -1.8345690965652466, -1.7701513767242432, -1.7057336568832397, -1.6413159370422363, -1.576898217201233, -1.5124804973602295, -1.448062777519226, -1.3836450576782227, -1.3192273378372192, -1.2548096179962158, -1.1903918981552124, -1.125974178314209, -1.0615564584732056, -0.9971387386322021, -0.9327210187911987, -0.8683032989501953, -0.8038855791091919, -0.7394678592681885, -0.6750501394271851, -0.6106324195861816, -0.5462146997451782, -0.4817969799041748, -0.4173792600631714, -0.35296154022216797, -0.28854382038116455, -0.22412610054016113, -0.15970838069915771, -0.0952906608581543, -0.03087294101715088, 0.03354454040527344, 0.09796226024627686, 0.16237998008728027, 0.2267976999282837, 0.2912154197692871, 0.3556331396102905, 0.42005085945129395, 0.48446857929229736, 0.5488862991333008, 0.6133040189743042, 0.6777217388153076, 0.742139458656311, 0.8065571784973145, 0.8709748983383179, 0.9353926181793213, 0.9998103380203247, 1.0642280578613281, 1.1286457777023315, 1.193063497543335, 1.2574812173843384, 1.3218989372253418, 1.3863166570663452, 1.4507343769073486, 1.515152096748352, 1.5795698165893555, 1.6439875364303589, 1.7084052562713623, 1.7728229761123657, 1.8372406959533691, 1.9016584157943726, 1.966076135635376, 2.03049373626709, 2.094911575317383]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 3.0, 4.0, 11.0, 9.0, 20.0, 30.0, 40.0, 71.0, 88.0, 148.0, 258.0, 387.0, 605.0, 1158.0, 1998.0, 3731.0, 7177.0, 14897.0, 34069.0, 95264.0, 326651.0, 377093.0, 111514.0, 39534.0, 16713.0, 7827.0, 3956.0, 2143.0, 1217.0, 733.0, 454.0, 313.0, 135.0, 111.0, 59.0, 51.0, 30.0, 18.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3752174377441406, -0.36273956298828125, -0.3502616882324219, -0.3377838134765625, -0.3253059387207031, -0.31282806396484375, -0.3003501892089844, -0.287872314453125, -0.2753944396972656, -0.26291656494140625, -0.2504386901855469, -0.2379608154296875, -0.22548294067382812, -0.21300506591796875, -0.20052719116210938, -0.18804931640625, -0.17557144165039062, -0.16309356689453125, -0.15061569213867188, -0.1381378173828125, -0.12565994262695312, -0.11318206787109375, -0.10070419311523438, -0.088226318359375, -0.07574844360351562, -0.06327056884765625, -0.050792694091796875, -0.0383148193359375, -0.025836944580078125, -0.01335906982421875, -0.000881195068359375, 0.0115966796875, 0.024074554443359375, 0.03655242919921875, 0.049030303955078125, 0.0615081787109375, 0.07398605346679688, 0.08646392822265625, 0.09894180297851562, 0.111419677734375, 0.12389755249023438, 0.13637542724609375, 0.14885330200195312, 0.1613311767578125, 0.17380905151367188, 0.18628692626953125, 0.19876480102539062, 0.21124267578125, 0.22372055053710938, 0.23619842529296875, 0.24867630004882812, 0.2611541748046875, 0.2736320495605469, 0.28610992431640625, 0.2985877990722656, 0.311065673828125, 0.3235435485839844, 0.33602142333984375, 0.3484992980957031, 0.3609771728515625, 0.3734550476074219, 0.38593292236328125, 0.3984107971191406, 0.410888671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 7.0, 7.0, 11.0, 24.0, 21.0, 22.0, 24.0, 31.0, 27.0, 40.0, 49.0, 60.0, 55.0, 59.0, 56.0, 54.0, 50.0, 54.0, 51.0, 52.0, 33.0, 33.0, 36.0, 23.0, 17.0, 26.0, 14.0, 10.0, 15.0, 8.0, 5.0, 5.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.23657608032226562, -0.22913360595703125, -0.22169113159179688, -0.2142486572265625, -0.20680618286132812, -0.19936370849609375, -0.19192123413085938, -0.184478759765625, -0.17703628540039062, -0.16959381103515625, -0.16215133666992188, -0.1547088623046875, -0.14726638793945312, -0.13982391357421875, -0.13238143920898438, -0.12493896484375, -0.11749649047851562, -0.11005401611328125, -0.10261154174804688, -0.0951690673828125, -0.08772659301757812, -0.08028411865234375, -0.07284164428710938, -0.065399169921875, -0.057956695556640625, -0.05051422119140625, -0.043071746826171875, -0.0356292724609375, -0.028186798095703125, -0.02074432373046875, -0.013301849365234375, -0.005859375, 0.001583099365234375, 0.00902557373046875, 0.016468048095703125, 0.0239105224609375, 0.031352996826171875, 0.03879547119140625, 0.046237945556640625, 0.053680419921875, 0.061122894287109375, 0.06856536865234375, 0.07600784301757812, 0.0834503173828125, 0.09089279174804688, 0.09833526611328125, 0.10577774047851562, 0.11322021484375, 0.12066268920898438, 0.12810516357421875, 0.13554763793945312, 0.1429901123046875, 0.15043258666992188, 0.15787506103515625, 0.16531753540039062, 0.172760009765625, 0.18020248413085938, 0.18764495849609375, 0.19508743286132812, 0.2025299072265625, 0.20997238159179688, 0.21741485595703125, 0.22485733032226562, 0.2322998046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 17.0, 14.0, 22.0, 25.0, 34.0, 51.0, 78.0, 97.0, 159.0, 274.0, 451.0, 865.0, 1593.0, 4513.0, 18232.0, 133195.0, 787923.0, 81025.0, 13095.0, 3645.0, 1441.0, 693.0, 422.0, 220.0, 151.0, 86.0, 51.0, 38.0, 33.0, 22.0, 21.0, 16.0, 13.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7446060180664062, -0.7152862548828125, -0.6859664916992188, -0.656646728515625, -0.6273269653320312, -0.5980072021484375, -0.5686874389648438, -0.53936767578125, -0.5100479125976562, -0.4807281494140625, -0.45140838623046875, -0.422088623046875, -0.39276885986328125, -0.3634490966796875, -0.33412933349609375, -0.3048095703125, -0.27548980712890625, -0.2461700439453125, -0.21685028076171875, -0.187530517578125, -0.15821075439453125, -0.1288909912109375, -0.09957122802734375, -0.07025146484375, -0.04093170166015625, -0.0116119384765625, 0.01770782470703125, 0.047027587890625, 0.07634735107421875, 0.1056671142578125, 0.13498687744140625, 0.164306640625, 0.19362640380859375, 0.2229461669921875, 0.25226593017578125, 0.281585693359375, 0.31090545654296875, 0.3402252197265625, 0.36954498291015625, 0.39886474609375, 0.42818450927734375, 0.4575042724609375, 0.48682403564453125, 0.516143798828125, 0.5454635620117188, 0.5747833251953125, 0.6041030883789062, 0.6334228515625, 0.6627426147460938, 0.6920623779296875, 0.7213821411132812, 0.750701904296875, 0.7800216674804688, 0.8093414306640625, 0.8386611938476562, 0.86798095703125, 0.8973007202148438, 0.9266204833984375, 0.9559402465820312, 0.985260009765625, 1.0145797729492188, 1.0438995361328125, 1.0732192993164062, 1.1025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 1.0, 5.0, 8.0, 10.0, 4.0, 18.0, 19.0, 12.0, 26.0, 28.0, 22.0, 37.0, 42.0, 42.0, 52.0, 62.0, 56.0, 59.0, 61.0, 69.0, 56.0, 46.0, 51.0, 37.0, 36.0, 28.0, 21.0, 24.0, 13.0, 6.0, 16.0, 14.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2254409790039062, -1.1920928955078125, -1.1587448120117188, -1.125396728515625, -1.0920486450195312, -1.0587005615234375, -1.0253524780273438, -0.99200439453125, -0.9586563110351562, -0.9253082275390625, -0.8919601440429688, -0.858612060546875, -0.8252639770507812, -0.7919158935546875, -0.7585678100585938, -0.7252197265625, -0.6918716430664062, -0.6585235595703125, -0.6251754760742188, -0.591827392578125, -0.5584793090820312, -0.5251312255859375, -0.49178314208984375, -0.45843505859375, -0.42508697509765625, -0.3917388916015625, -0.35839080810546875, -0.325042724609375, -0.29169464111328125, -0.2583465576171875, -0.22499847412109375, -0.191650390625, -0.15830230712890625, -0.1249542236328125, -0.09160614013671875, -0.058258056640625, -0.02490997314453125, 0.0084381103515625, 0.04178619384765625, 0.07513427734375, 0.10848236083984375, 0.1418304443359375, 0.17517852783203125, 0.208526611328125, 0.24187469482421875, 0.2752227783203125, 0.30857086181640625, 0.3419189453125, 0.37526702880859375, 0.4086151123046875, 0.44196319580078125, 0.475311279296875, 0.5086593627929688, 0.5420074462890625, 0.5753555297851562, 0.60870361328125, 0.6420516967773438, 0.6753997802734375, 0.7087478637695312, 0.742095947265625, 0.7754440307617188, 0.8087921142578125, 0.8421401977539062, 0.87548828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 15.0, 18.0, 31.0, 59.0, 203.0, 625.0, 3319.0, 48707.0, 942639.0, 48514.0, 3393.0, 640.0, 206.0, 80.0, 38.0, 18.0, 15.0, 3.0, 5.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1124954223632812, -1.0863189697265625, -1.0601425170898438, -1.033966064453125, -1.0077896118164062, -0.9816131591796875, -0.9554367065429688, -0.92926025390625, -0.9030838012695312, -0.8769073486328125, -0.8507308959960938, -0.824554443359375, -0.7983779907226562, -0.7722015380859375, -0.7460250854492188, -0.7198486328125, -0.6936721801757812, -0.6674957275390625, -0.6413192749023438, -0.615142822265625, -0.5889663696289062, -0.5627899169921875, -0.5366134643554688, -0.51043701171875, -0.48426055908203125, -0.4580841064453125, -0.43190765380859375, -0.405731201171875, -0.37955474853515625, -0.3533782958984375, -0.32720184326171875, -0.301025390625, -0.27484893798828125, -0.2486724853515625, -0.22249603271484375, -0.196319580078125, -0.17014312744140625, -0.1439666748046875, -0.11779022216796875, -0.09161376953125, -0.06543731689453125, -0.0392608642578125, -0.01308441162109375, 0.013092041015625, 0.03926849365234375, 0.0654449462890625, 0.09162139892578125, 0.1177978515625, 0.14397430419921875, 0.1701507568359375, 0.19632720947265625, 0.222503662109375, 0.24868011474609375, 0.2748565673828125, 0.30103302001953125, 0.32720947265625, 0.35338592529296875, 0.3795623779296875, 0.40573883056640625, 0.431915283203125, 0.45809173583984375, 0.4842681884765625, 0.5104446411132812, 0.53662109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 8.0, 4.0, 6.0, 8.0, 5.0, 14.0, 15.0, 24.0, 46.0, 43.0, 55.0, 76.0, 106.0, 148.0, 107.0, 87.0, 73.0, 55.0, 37.0, 21.0, 17.0, 10.0, 8.0, 9.0, 7.0, 2.0, 0.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00011521577835083008, -0.00011245440691709518, -0.00010969303548336029, -0.0001069316640496254, -0.0001041702926158905, -0.00010140892118215561, -9.864754974842072e-05, -9.588617831468582e-05, -9.312480688095093e-05, -9.036343544721603e-05, -8.760206401348114e-05, -8.484069257974625e-05, -8.207932114601135e-05, -7.931794971227646e-05, -7.655657827854156e-05, -7.379520684480667e-05, -7.103383541107178e-05, -6.827246397733688e-05, -6.551109254360199e-05, -6.27497211098671e-05, -5.99883496761322e-05, -5.722697824239731e-05, -5.4465606808662415e-05, -5.170423537492752e-05, -4.894286394119263e-05, -4.618149250745773e-05, -4.342012107372284e-05, -4.0658749639987946e-05, -3.789737820625305e-05, -3.513600677251816e-05, -3.2374635338783264e-05, -2.961326390504837e-05, -2.6851892471313477e-05, -2.4090521037578583e-05, -2.132914960384369e-05, -1.8567778170108795e-05, -1.58064067363739e-05, -1.3045035302639008e-05, -1.0283663868904114e-05, -7.52229243516922e-06, -4.760921001434326e-06, -1.9995495676994324e-06, 7.618218660354614e-07, 3.5231932997703552e-06, 6.284564733505249e-06, 9.045936167240143e-06, 1.1807307600975037e-05, 1.456867903470993e-05, 1.7330050468444824e-05, 2.0091421902179718e-05, 2.2852793335914612e-05, 2.5614164769649506e-05, 2.83755362033844e-05, 3.113690763711929e-05, 3.389827907085419e-05, 3.665965050458908e-05, 3.9421021938323975e-05, 4.218239337205887e-05, 4.494376480579376e-05, 4.7705136239528656e-05, 5.046650767326355e-05, 5.3227879106998444e-05, 5.598925054073334e-05, 5.875062197446823e-05, 6.151199340820312e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 16.0, 29.0, 68.0, 136.0, 310.0, 892.0, 4120.0, 55132.0, 926837.0, 55316.0, 4161.0, 923.0, 319.0, 154.0, 64.0, 30.0, 13.0, 13.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83056640625, -0.8084182739257812, -0.7862701416015625, -0.7641220092773438, -0.741973876953125, -0.7198257446289062, -0.6976776123046875, -0.6755294799804688, -0.65338134765625, -0.6312332153320312, -0.6090850830078125, -0.5869369506835938, -0.564788818359375, -0.5426406860351562, -0.5204925537109375, -0.49834442138671875, -0.4761962890625, -0.45404815673828125, -0.4319000244140625, -0.40975189208984375, -0.387603759765625, -0.36545562744140625, -0.3433074951171875, -0.32115936279296875, -0.29901123046875, -0.27686309814453125, -0.2547149658203125, -0.23256683349609375, -0.210418701171875, -0.18827056884765625, -0.1661224365234375, -0.14397430419921875, -0.121826171875, -0.09967803955078125, -0.0775299072265625, -0.05538177490234375, -0.033233642578125, -0.01108551025390625, 0.0110626220703125, 0.03321075439453125, 0.05535888671875, 0.07750701904296875, 0.0996551513671875, 0.12180328369140625, 0.143951416015625, 0.16609954833984375, 0.1882476806640625, 0.21039581298828125, 0.2325439453125, 0.25469207763671875, 0.2768402099609375, 0.29898834228515625, 0.321136474609375, 0.34328460693359375, 0.3654327392578125, 0.38758087158203125, 0.40972900390625, 0.43187713623046875, 0.4540252685546875, 0.47617340087890625, 0.498321533203125, 0.5204696655273438, 0.5426177978515625, 0.5647659301757812, 0.5869140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 11.0, 21.0, 26.0, 35.0, 40.0, 75.0, 72.0, 103.0, 111.0, 108.0, 76.0, 66.0, 59.0, 50.0, 29.0, 28.0, 12.0, 11.0, 16.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3193626403808594, -0.30742645263671875, -0.2954902648925781, -0.2835540771484375, -0.2716178894042969, -0.25968170166015625, -0.24774551391601562, -0.235809326171875, -0.22387313842773438, -0.21193695068359375, -0.20000076293945312, -0.1880645751953125, -0.17612838745117188, -0.16419219970703125, -0.15225601196289062, -0.14031982421875, -0.12838363647460938, -0.11644744873046875, -0.10451126098632812, -0.0925750732421875, -0.08063888549804688, -0.06870269775390625, -0.056766510009765625, -0.044830322265625, -0.032894134521484375, -0.02095794677734375, -0.009021759033203125, 0.0029144287109375, 0.014850616455078125, 0.02678680419921875, 0.038722991943359375, 0.0506591796875, 0.06259536743164062, 0.07453155517578125, 0.08646774291992188, 0.0984039306640625, 0.11034011840820312, 0.12227630615234375, 0.13421249389648438, 0.146148681640625, 0.15808486938476562, 0.17002105712890625, 0.18195724487304688, 0.1938934326171875, 0.20582962036132812, 0.21776580810546875, 0.22970199584960938, 0.24163818359375, 0.2535743713378906, 0.26551055908203125, 0.2774467468261719, 0.2893829345703125, 0.3013191223144531, 0.31325531005859375, 0.3251914978027344, 0.337127685546875, 0.3490638732910156, 0.36100006103515625, 0.3729362487792969, 0.3848724365234375, 0.3968086242675781, 0.40874481201171875, 0.4206809997558594, 0.4326171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 8.0, 44.0, 143.0, 327.0, 294.0, 113.0, 39.0, 15.0, 11.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.595186233520508, -13.225724220275879, -12.856261253356934, -12.486799240112305, -12.11733627319336, -11.74787425994873, -11.378412246704102, -11.008949279785156, -10.639486312866211, -10.270024299621582, -9.900561332702637, -9.531099319458008, -9.161636352539062, -8.792174339294434, -8.422712326049805, -8.05324935913086, -7.6837873458862305, -7.314324855804443, -6.944862365722656, -6.575400352478027, -6.205937385559082, -5.836475372314453, -5.467012882232666, -5.097550392150879, -4.728087902069092, -4.358625411987305, -3.9891629219055176, -3.6197006702423096, -3.2502381801605225, -2.8807756900787354, -2.5113134384155273, -2.1418509483337402, -1.7723884582519531, -1.402925968170166, -1.0334635972976685, -0.6640012264251709, -0.2945387363433838, 0.07492375373840332, 0.44438600540161133, 0.8138484954833984, 1.1833109855651855, 1.5527734756469727, 1.9222358465194702, 2.2916982173919678, 2.661160707473755, 3.030623197555542, 3.40008544921875, 3.769547939300537, 4.139010429382324, 4.508472919464111, 4.877935409545898, 5.247397422790527, 5.616860389709473, 5.986322402954102, 6.355784893035889, 6.725247383117676, 7.094709873199463, 7.46417236328125, 7.833634853363037, 8.203097343444824, 8.572559356689453, 8.942022323608398, 9.311484336853027, 9.680946350097656, 10.050409317016602]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 9.0, 14.0, 15.0, 16.0, 23.0, 29.0, 19.0, 34.0, 25.0, 26.0, 47.0, 58.0, 58.0, 60.0, 74.0, 60.0, 54.0, 41.0, 39.0, 38.0, 47.0, 26.0, 28.0, 23.0, 22.0, 23.0, 11.0, 21.0, 12.0, 9.0, 9.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.173884868621826, -4.039281368255615, -3.9046778678894043, -3.7700746059417725, -3.6354711055755615, -3.5008676052093506, -3.3662643432617188, -3.231660842895508, -3.097057342529297, -2.962453842163086, -2.827850341796875, -2.693247079849243, -2.5586435794830322, -2.4240400791168213, -2.2894368171691895, -2.1548333168029785, -2.0202298164367676, -1.8856263160705566, -1.7510229349136353, -1.6164195537567139, -1.481816053390503, -1.347212553024292, -1.2126091718673706, -1.0780057907104492, -0.9434022903442383, -0.8087988495826721, -0.674195408821106, -0.5395919680595398, -0.40498852729797363, -0.27038508653640747, -0.1357816457748413, -0.0011782050132751465, 0.1334247589111328, 0.268028199672699, 0.40263164043426514, 0.5372350811958313, 0.6718385219573975, 0.8064419627189636, 0.9410454034805298, 1.0756487846374512, 1.210252285003662, 1.344855785369873, 1.4794591665267944, 1.6140625476837158, 1.7486660480499268, 1.8832695484161377, 2.0178728103637695, 2.1524763107299805, 2.2870798110961914, 2.4216833114624023, 2.5562868118286133, 2.690890073776245, 2.825493574142456, 2.960097074508667, 3.094700336456299, 3.2293038368225098, 3.3639073371887207, 3.4985108375549316, 3.6331143379211426, 3.7677175998687744, 3.9023211002349854, 4.036924362182617, 4.171527862548828, 4.306131362915039, 4.44073486328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 17.0, 40.0, 50.0, 105.0, 143.0, 208.0, 344.0, 602.0, 1124.0, 2122.0, 4198.0, 8782.0, 19756.0, 51365.0, 170507.0, 854504.0, 2279647.0, 602980.0, 126518.0, 40069.0, 16222.0, 7144.0, 3471.0, 1870.0, 1003.0, 545.0, 316.0, 196.0, 131.0, 89.0, 60.0, 40.0, 23.0, 14.0, 13.0, 15.0, 3.0, 7.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.2316570281982422, -0.22320175170898438, -0.21474647521972656, -0.20629119873046875, -0.19783592224121094, -0.18938064575195312, -0.1809253692626953, -0.1724700927734375, -0.1640148162841797, -0.15555953979492188, -0.14710426330566406, -0.13864898681640625, -0.13019371032714844, -0.12173843383789062, -0.11328315734863281, -0.104827880859375, -0.09637260437011719, -0.08791732788085938, -0.07946205139160156, -0.07100677490234375, -0.06255149841308594, -0.054096221923828125, -0.04564094543457031, -0.0371856689453125, -0.028730392456054688, -0.020275115966796875, -0.011819839477539062, -0.00336456298828125, 0.0050907135009765625, 0.013545989990234375, 0.022001266479492188, 0.03045654296875, 0.03891181945800781, 0.047367095947265625, 0.05582237243652344, 0.06427764892578125, 0.07273292541503906, 0.08118820190429688, 0.08964347839355469, 0.0980987548828125, 0.10655403137207031, 0.11500930786132812, 0.12346458435058594, 0.13191986083984375, 0.14037513732910156, 0.14883041381835938, 0.1572856903076172, 0.165740966796875, 0.1741962432861328, 0.18265151977539062, 0.19110679626464844, 0.19956207275390625, 0.20801734924316406, 0.21647262573242188, 0.2249279022216797, 0.2333831787109375, 0.2418384552001953, 0.2502937316894531, 0.25874900817871094, 0.26720428466796875, 0.27565956115722656, 0.2841148376464844, 0.2925701141357422, 0.301025390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 11.0, 19.0, 15.0, 20.0, 30.0, 39.0, 38.0, 61.0, 66.0, 71.0, 74.0, 91.0, 92.0, 80.0, 81.0, 58.0, 50.0, 34.0, 24.0, 17.0, 17.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15771484375, -0.14758682250976562, -0.13745880126953125, -0.12733078002929688, -0.1172027587890625, -0.10707473754882812, -0.09694671630859375, -0.08681869506835938, -0.076690673828125, -0.06656265258789062, -0.05643463134765625, -0.046306610107421875, -0.0361785888671875, -0.026050567626953125, -0.01592254638671875, -0.005794525146484375, 0.00433349609375, 0.014461517333984375, 0.02458953857421875, 0.034717559814453125, 0.0448455810546875, 0.054973602294921875, 0.06510162353515625, 0.07522964477539062, 0.085357666015625, 0.09548568725585938, 0.10561370849609375, 0.11574172973632812, 0.1258697509765625, 0.13599777221679688, 0.14612579345703125, 0.15625381469726562, 0.1663818359375, 0.17650985717773438, 0.18663787841796875, 0.19676589965820312, 0.2068939208984375, 0.21702194213867188, 0.22714996337890625, 0.23727798461914062, 0.247406005859375, 0.2575340270996094, 0.26766204833984375, 0.2777900695800781, 0.2879180908203125, 0.2980461120605469, 0.30817413330078125, 0.3183021545410156, 0.32843017578125, 0.3385581970214844, 0.34868621826171875, 0.3588142395019531, 0.3689422607421875, 0.3790702819824219, 0.38919830322265625, 0.3993263244628906, 0.409454345703125, 0.4195823669433594, 0.42971038818359375, 0.4398384094238281, 0.4499664306640625, 0.4600944519042969, 0.47022247314453125, 0.4803504943847656, 0.490478515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 10.0, 10.0, 9.0, 12.0, 15.0, 30.0, 31.0, 61.0, 93.0, 164.0, 235.0, 407.0, 675.0, 1338.0, 3037.0, 7986.0, 25472.0, 103899.0, 845978.0, 2868886.0, 260332.0, 51336.0, 14715.0, 5085.0, 2108.0, 1058.0, 491.0, 290.0, 138.0, 116.0, 72.0, 62.0, 33.0, 23.0, 13.0, 18.0, 9.0, 10.0, 5.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.43285369873046875, -0.4169769287109375, -0.40110015869140625, -0.385223388671875, -0.36934661865234375, -0.3534698486328125, -0.33759307861328125, -0.32171630859375, -0.30583953857421875, -0.2899627685546875, -0.27408599853515625, -0.258209228515625, -0.24233245849609375, -0.2264556884765625, -0.21057891845703125, -0.1947021484375, -0.17882537841796875, -0.1629486083984375, -0.14707183837890625, -0.131195068359375, -0.11531829833984375, -0.0994415283203125, -0.08356475830078125, -0.06768798828125, -0.05181121826171875, -0.0359344482421875, -0.02005767822265625, -0.004180908203125, 0.01169586181640625, 0.0275726318359375, 0.04344940185546875, 0.059326171875, 0.07520294189453125, 0.0910797119140625, 0.10695648193359375, 0.122833251953125, 0.13871002197265625, 0.1545867919921875, 0.17046356201171875, 0.18634033203125, 0.20221710205078125, 0.2180938720703125, 0.23397064208984375, 0.249847412109375, 0.26572418212890625, 0.2816009521484375, 0.29747772216796875, 0.3133544921875, 0.32923126220703125, 0.3451080322265625, 0.36098480224609375, 0.376861572265625, 0.39273834228515625, 0.4086151123046875, 0.42449188232421875, 0.44036865234375, 0.45624542236328125, 0.4721221923828125, 0.48799896240234375, 0.503875732421875, 0.5197525024414062, 0.5356292724609375, 0.5515060424804688, 0.5673828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 4.0, 7.0, 18.0, 15.0, 21.0, 26.0, 38.0, 36.0, 65.0, 103.0, 158.0, 208.0, 324.0, 542.0, 698.0, 623.0, 410.0, 246.0, 142.0, 108.0, 65.0, 48.0, 40.0, 28.0, 17.0, 22.0, 13.0, 15.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.607421875, -0.5882797241210938, -0.5691375732421875, -0.5499954223632812, -0.530853271484375, -0.5117111206054688, -0.4925689697265625, -0.47342681884765625, -0.45428466796875, -0.43514251708984375, -0.4160003662109375, -0.39685821533203125, -0.377716064453125, -0.35857391357421875, -0.3394317626953125, -0.32028961181640625, -0.3011474609375, -0.28200531005859375, -0.2628631591796875, -0.24372100830078125, -0.224578857421875, -0.20543670654296875, -0.1862945556640625, -0.16715240478515625, -0.14801025390625, -0.12886810302734375, -0.1097259521484375, -0.09058380126953125, -0.071441650390625, -0.05229949951171875, -0.0331573486328125, -0.01401519775390625, 0.005126953125, 0.02426910400390625, 0.0434112548828125, 0.06255340576171875, 0.081695556640625, 0.10083770751953125, 0.1199798583984375, 0.13912200927734375, 0.15826416015625, 0.17740631103515625, 0.1965484619140625, 0.21569061279296875, 0.234832763671875, 0.25397491455078125, 0.2731170654296875, 0.29225921630859375, 0.3114013671875, 0.33054351806640625, 0.3496856689453125, 0.36882781982421875, 0.387969970703125, 0.40711212158203125, 0.4262542724609375, 0.44539642333984375, 0.46453857421875, 0.48368072509765625, 0.5028228759765625, 0.5219650268554688, 0.541107177734375, 0.5602493286132812, 0.5793914794921875, 0.5985336303710938, 0.61767578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 20.0, 90.0, 337.0, 393.0, 116.0, 30.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.909759521484375, -5.4194464683532715, -4.929133892059326, -4.438820838928223, -3.9485080242156982, -3.458195209503174, -2.9678821563720703, -2.477569341659546, -1.9872565269470215, -1.496943712234497, -1.006630778312683, -0.5163178443908691, -0.026005029678344727, 0.4643077850341797, 0.9546208381652832, 1.4449336528778076, 1.935246467590332, 2.4255592823028564, 2.915872097015381, 3.4061851501464844, 3.896497964859009, 4.386810779571533, 4.877123832702637, 5.367436408996582, 5.8577494621276855, 6.348062515258789, 6.838375091552734, 7.328688144683838, 7.819001197814941, 8.309313774108887, 8.799627304077148, 9.289939880371094, 9.780252456665039, 10.270565032958984, 10.760878562927246, 11.251191139221191, 11.741503715515137, 12.231817245483398, 12.722129821777344, 13.212442398071289, 13.702754974365234, 14.19306755065918, 14.683381080627441, 15.173693656921387, 15.664006233215332, 16.154319763183594, 16.64463233947754, 17.134944915771484, 17.625259399414062, 18.115571975708008, 18.605884552001953, 19.09619903564453, 19.586511611938477, 20.076824188232422, 20.567136764526367, 21.057449340820312, 21.547761917114258, 22.038074493408203, 22.52838706970215, 23.018699645996094, 23.509014129638672, 23.999326705932617, 24.489639282226562, 24.979951858520508, 25.470264434814453]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 5.0, 17.0, 11.0, 24.0, 26.0, 47.0, 46.0, 45.0, 59.0, 70.0, 72.0, 76.0, 71.0, 58.0, 64.0, 64.0, 50.0, 32.0, 38.0, 27.0, 27.0, 12.0, 16.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.914650917053223, -5.772266387939453, -5.629881858825684, -5.487497329711914, -5.3451128005981445, -5.202728271484375, -5.0603437423706055, -4.917959213256836, -4.775574684143066, -4.633190155029297, -4.490805625915527, -4.348421096801758, -4.206036567687988, -4.063652038574219, -3.921267509460449, -3.7788829803466797, -3.63649845123291, -3.4941139221191406, -3.351729393005371, -3.2093448638916016, -3.066960334777832, -2.9245758056640625, -2.782191276550293, -2.6398067474365234, -2.497422218322754, -2.3550376892089844, -2.212653160095215, -2.0702686309814453, -1.9278841018676758, -1.7854995727539062, -1.6431150436401367, -1.5007305145263672, -1.3583455085754395, -1.21596097946167, -1.0735764503479004, -0.9311919212341309, -0.7888073921203613, -0.6464228630065918, -0.5040383338928223, -0.36165380477905273, -0.2192692756652832, -0.07688474655151367, 0.06549978256225586, 0.2078843116760254, 0.3502688407897949, 0.49265336990356445, 0.635037899017334, 0.7774224281311035, 0.919806957244873, 1.0621914863586426, 1.204576015472412, 1.3469605445861816, 1.4893450736999512, 1.6317296028137207, 1.7741141319274902, 1.9164986610412598, 2.0588831901550293, 2.201267719268799, 2.3436522483825684, 2.486036777496338, 2.6284213066101074, 2.770805835723877, 2.9131903648376465, 3.055574893951416, 3.1979594230651855]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 10.0, 12.0, 14.0, 25.0, 27.0, 67.0, 105.0, 139.0, 237.0, 399.0, 723.0, 1327.0, 2660.0, 5630.0, 12510.0, 30212.0, 74504.0, 200475.0, 398908.0, 195003.0, 73011.0, 29407.0, 12238.0, 5428.0, 2518.0, 1246.0, 684.0, 384.0, 248.0, 133.0, 96.0, 46.0, 37.0, 28.0, 22.0, 11.0, 12.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.493408203125, -0.4795036315917969, -0.46559906005859375, -0.4516944885253906, -0.4377899169921875, -0.4238853454589844, -0.40998077392578125, -0.3960762023925781, -0.382171630859375, -0.3682670593261719, -0.35436248779296875, -0.3404579162597656, -0.3265533447265625, -0.3126487731933594, -0.29874420166015625, -0.2848396301269531, -0.27093505859375, -0.2570304870605469, -0.24312591552734375, -0.22922134399414062, -0.2153167724609375, -0.20141220092773438, -0.18750762939453125, -0.17360305786132812, -0.159698486328125, -0.14579391479492188, -0.13188934326171875, -0.11798477172851562, -0.1040802001953125, -0.09017562866210938, -0.07627105712890625, -0.062366485595703125, -0.0484619140625, -0.034557342529296875, -0.02065277099609375, -0.006748199462890625, 0.0071563720703125, 0.021060943603515625, 0.03496551513671875, 0.048870086669921875, 0.062774658203125, 0.07667922973632812, 0.09058380126953125, 0.10448837280273438, 0.1183929443359375, 0.13229751586914062, 0.14620208740234375, 0.16010665893554688, 0.17401123046875, 0.18791580200195312, 0.20182037353515625, 0.21572494506835938, 0.2296295166015625, 0.24353408813476562, 0.25743865966796875, 0.2713432312011719, 0.285247802734375, 0.2991523742675781, 0.31305694580078125, 0.3269615173339844, 0.3408660888671875, 0.3547706604003906, 0.36867523193359375, 0.3825798034667969, 0.396484375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 4.0, 15.0, 10.0, 14.0, 16.0, 19.0, 21.0, 21.0, 29.0, 18.0, 19.0, 49.0, 43.0, 42.0, 40.0, 32.0, 48.0, 36.0, 44.0, 42.0, 36.0, 39.0, 41.0, 41.0, 39.0, 28.0, 32.0, 17.0, 28.0, 23.0, 25.0, 13.0, 13.0, 9.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15927886962890625, -0.1537628173828125, -0.14824676513671875, -0.142730712890625, -0.13721466064453125, -0.1316986083984375, -0.12618255615234375, -0.12066650390625, -0.11515045166015625, -0.1096343994140625, -0.10411834716796875, -0.098602294921875, -0.09308624267578125, -0.0875701904296875, -0.08205413818359375, -0.0765380859375, -0.07102203369140625, -0.0655059814453125, -0.05998992919921875, -0.054473876953125, -0.04895782470703125, -0.0434417724609375, -0.03792572021484375, -0.03240966796875, -0.02689361572265625, -0.0213775634765625, -0.01586151123046875, -0.010345458984375, -0.00482940673828125, 0.0006866455078125, 0.00620269775390625, 0.01171875, 0.01723480224609375, 0.0227508544921875, 0.02826690673828125, 0.033782958984375, 0.03929901123046875, 0.0448150634765625, 0.05033111572265625, 0.05584716796875, 0.06136322021484375, 0.0668792724609375, 0.07239532470703125, 0.077911376953125, 0.08342742919921875, 0.0889434814453125, 0.09445953369140625, 0.0999755859375, 0.10549163818359375, 0.1110076904296875, 0.11652374267578125, 0.122039794921875, 0.12755584716796875, 0.1330718994140625, 0.13858795166015625, 0.14410400390625, 0.14962005615234375, 0.1551361083984375, 0.16065216064453125, 0.166168212890625, 0.17168426513671875, 0.1772003173828125, 0.18271636962890625, 0.188232421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 11.0, 17.0, 18.0, 45.0, 68.0, 82.0, 152.0, 220.0, 425.0, 793.0, 1606.0, 3935.0, 15949.0, 191636.0, 781653.0, 40362.0, 6698.0, 2362.0, 1085.0, 537.0, 321.0, 207.0, 131.0, 58.0, 52.0, 32.0, 28.0, 14.0, 13.0, 13.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2744140625, -1.2335968017578125, -1.192779541015625, -1.1519622802734375, -1.11114501953125, -1.0703277587890625, -1.029510498046875, -0.9886932373046875, -0.9478759765625, -0.9070587158203125, -0.866241455078125, -0.8254241943359375, -0.78460693359375, -0.7437896728515625, -0.702972412109375, -0.6621551513671875, -0.621337890625, -0.5805206298828125, -0.539703369140625, -0.4988861083984375, -0.45806884765625, -0.4172515869140625, -0.376434326171875, -0.3356170654296875, -0.2947998046875, -0.2539825439453125, -0.213165283203125, -0.1723480224609375, -0.13153076171875, -0.0907135009765625, -0.049896240234375, -0.0090789794921875, 0.03173828125, 0.0725555419921875, 0.113372802734375, 0.1541900634765625, 0.19500732421875, 0.2358245849609375, 0.276641845703125, 0.3174591064453125, 0.3582763671875, 0.3990936279296875, 0.439910888671875, 0.4807281494140625, 0.52154541015625, 0.5623626708984375, 0.603179931640625, 0.6439971923828125, 0.684814453125, 0.7256317138671875, 0.766448974609375, 0.8072662353515625, 0.84808349609375, 0.8889007568359375, 0.929718017578125, 0.9705352783203125, 1.0113525390625, 1.0521697998046875, 1.092987060546875, 1.1338043212890625, 1.17462158203125, 1.2154388427734375, 1.256256103515625, 1.2970733642578125, 1.337890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 15.0, 10.0, 13.0, 19.0, 22.0, 32.0, 37.0, 35.0, 40.0, 48.0, 56.0, 71.0, 72.0, 50.0, 54.0, 56.0, 40.0, 48.0, 37.0, 35.0, 48.0, 34.0, 33.0, 19.0, 15.0, 14.0, 18.0, 7.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81689453125, -0.7822494506835938, -0.7476043701171875, -0.7129592895507812, -0.678314208984375, -0.6436691284179688, -0.6090240478515625, -0.5743789672851562, -0.53973388671875, -0.5050888061523438, -0.4704437255859375, -0.43579864501953125, -0.401153564453125, -0.36650848388671875, -0.3318634033203125, -0.29721832275390625, -0.2625732421875, -0.22792816162109375, -0.1932830810546875, -0.15863800048828125, -0.123992919921875, -0.08934783935546875, -0.0547027587890625, -0.02005767822265625, 0.01458740234375, 0.04923248291015625, 0.0838775634765625, 0.11852264404296875, 0.153167724609375, 0.18781280517578125, 0.2224578857421875, 0.25710296630859375, 0.291748046875, 0.32639312744140625, 0.3610382080078125, 0.39568328857421875, 0.430328369140625, 0.46497344970703125, 0.4996185302734375, 0.5342636108398438, 0.56890869140625, 0.6035537719726562, 0.6381988525390625, 0.6728439331054688, 0.707489013671875, 0.7421340942382812, 0.7767791748046875, 0.8114242553710938, 0.8460693359375, 0.8807144165039062, 0.9153594970703125, 0.9500045776367188, 0.984649658203125, 1.0192947387695312, 1.0539398193359375, 1.0885848999023438, 1.12322998046875, 1.1578750610351562, 1.1925201416015625, 1.2271652221679688, 1.261810302734375, 1.2964553833007812, 1.3311004638671875, 1.3657455444335938, 1.400390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 9.0, 16.0, 20.0, 34.0, 35.0, 57.0, 75.0, 109.0, 187.0, 273.0, 447.0, 828.0, 1495.0, 3184.0, 7266.0, 20138.0, 63827.0, 247404.0, 546713.0, 105754.0, 31241.0, 10491.0, 4227.0, 2038.0, 1034.0, 576.0, 363.0, 210.0, 149.0, 91.0, 60.0, 47.0, 32.0, 24.0, 23.0, 14.0, 10.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.226806640625, -0.21997451782226562, -0.21314239501953125, -0.20631027221679688, -0.1994781494140625, -0.19264602661132812, -0.18581390380859375, -0.17898178100585938, -0.172149658203125, -0.16531753540039062, -0.15848541259765625, -0.15165328979492188, -0.1448211669921875, -0.13798904418945312, -0.13115692138671875, -0.12432479858398438, -0.11749267578125, -0.11066055297851562, -0.10382843017578125, -0.09699630737304688, -0.0901641845703125, -0.08333206176757812, -0.07649993896484375, -0.06966781616210938, -0.062835693359375, -0.056003570556640625, -0.04917144775390625, -0.042339324951171875, -0.0355072021484375, -0.028675079345703125, -0.02184295654296875, -0.015010833740234375, -0.0081787109375, -0.001346588134765625, 0.00548553466796875, 0.012317657470703125, 0.0191497802734375, 0.025981903076171875, 0.03281402587890625, 0.039646148681640625, 0.046478271484375, 0.053310394287109375, 0.06014251708984375, 0.06697463989257812, 0.0738067626953125, 0.08063888549804688, 0.08747100830078125, 0.09430313110351562, 0.10113525390625, 0.10796737670898438, 0.11479949951171875, 0.12163162231445312, 0.1284637451171875, 0.13529586791992188, 0.14212799072265625, 0.14896011352539062, 0.155792236328125, 0.16262435913085938, 0.16945648193359375, 0.17628860473632812, 0.1831207275390625, 0.18995285034179688, 0.19678497314453125, 0.20361709594726562, 0.21044921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0, 9.0, 9.0, 13.0, 7.0, 9.0, 16.0, 22.0, 25.0, 18.0, 30.0, 39.0, 49.0, 68.0, 101.0, 124.0, 97.0, 75.0, 67.0, 36.0, 42.0, 26.0, 24.0, 18.0, 16.0, 13.0, 15.0, 12.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-05, -7.543433457612991e-05, -7.278658449649811e-05, -7.01388344168663e-05, -6.74910843372345e-05, -6.484333425760269e-05, -6.219558417797089e-05, -5.954783409833908e-05, -5.6900084018707275e-05, -5.425233393907547e-05, -5.1604583859443665e-05, -4.895683377981186e-05, -4.6309083700180054e-05, -4.366133362054825e-05, -4.101358354091644e-05, -3.836583346128464e-05, -3.571808338165283e-05, -3.3070333302021027e-05, -3.042258322238922e-05, -2.7774833142757416e-05, -2.512708306312561e-05, -2.2479332983493805e-05, -1.9831582903862e-05, -1.7183832824230194e-05, -1.4536082744598389e-05, -1.1888332664966583e-05, -9.240582585334778e-06, -6.592832505702972e-06, -3.945082426071167e-06, -1.2973323464393616e-06, 1.3504177331924438e-06, 3.998167812824249e-06, 6.645917892456055e-06, 9.29366797208786e-06, 1.1941418051719666e-05, 1.4589168131351471e-05, 1.7236918210983276e-05, 1.9884668290615082e-05, 2.2532418370246887e-05, 2.5180168449878693e-05, 2.7827918529510498e-05, 3.0475668609142303e-05, 3.312341868877411e-05, 3.5771168768405914e-05, 3.841891884803772e-05, 4.1066668927669525e-05, 4.371441900730133e-05, 4.6362169086933136e-05, 4.900991916656494e-05, 5.165766924619675e-05, 5.430541932582855e-05, 5.695316940546036e-05, 5.960091948509216e-05, 6.224866956472397e-05, 6.489641964435577e-05, 6.754416972398758e-05, 7.019191980361938e-05, 7.283966988325119e-05, 7.5487419962883e-05, 7.81351700425148e-05, 8.07829201221466e-05, 8.343067020177841e-05, 8.607842028141022e-05, 8.872617036104202e-05, 9.137392044067383e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 12.0, 9.0, 28.0, 23.0, 56.0, 53.0, 124.0, 202.0, 368.0, 547.0, 1120.0, 2506.0, 7279.0, 38860.0, 528763.0, 419353.0, 37340.0, 6986.0, 2471.0, 1076.0, 564.0, 317.0, 181.0, 121.0, 70.0, 35.0, 34.0, 17.0, 9.0, 12.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2854042053222656, -0.27442169189453125, -0.2634391784667969, -0.2524566650390625, -0.24147415161132812, -0.23049163818359375, -0.21950912475585938, -0.208526611328125, -0.19754409790039062, -0.18656158447265625, -0.17557907104492188, -0.1645965576171875, -0.15361404418945312, -0.14263153076171875, -0.13164901733398438, -0.12066650390625, -0.10968399047851562, -0.09870147705078125, -0.08771896362304688, -0.0767364501953125, -0.06575393676757812, -0.05477142333984375, -0.043788909912109375, -0.032806396484375, -0.021823883056640625, -0.01084136962890625, 0.000141143798828125, 0.0111236572265625, 0.022106170654296875, 0.03308868408203125, 0.044071197509765625, 0.0550537109375, 0.06603622436523438, 0.07701873779296875, 0.08800125122070312, 0.0989837646484375, 0.10996627807617188, 0.12094879150390625, 0.13193130493164062, 0.142913818359375, 0.15389633178710938, 0.16487884521484375, 0.17586135864257812, 0.1868438720703125, 0.19782638549804688, 0.20880889892578125, 0.21979141235351562, 0.23077392578125, 0.24175643920898438, 0.25273895263671875, 0.2637214660644531, 0.2747039794921875, 0.2856864929199219, 0.29666900634765625, 0.3076515197753906, 0.318634033203125, 0.3296165466308594, 0.34059906005859375, 0.3515815734863281, 0.3625640869140625, 0.3735466003417969, 0.38452911376953125, 0.3955116271972656, 0.406494140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 2.0, 6.0, 8.0, 2.0, 10.0, 13.0, 16.0, 16.0, 19.0, 27.0, 24.0, 24.0, 37.0, 46.0, 55.0, 52.0, 75.0, 57.0, 74.0, 67.0, 64.0, 51.0, 40.0, 35.0, 25.0, 35.0, 23.0, 20.0, 8.0, 15.0, 11.0, 6.0, 8.0, 12.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.22510147094726562, -0.21753692626953125, -0.20997238159179688, -0.2024078369140625, -0.19484329223632812, -0.18727874755859375, -0.17971420288085938, -0.172149658203125, -0.16458511352539062, -0.15702056884765625, -0.14945602416992188, -0.1418914794921875, -0.13432693481445312, -0.12676239013671875, -0.11919784545898438, -0.11163330078125, -0.10406875610351562, -0.09650421142578125, -0.08893966674804688, -0.0813751220703125, -0.07381057739257812, -0.06624603271484375, -0.058681488037109375, -0.051116943359375, -0.043552398681640625, -0.03598785400390625, -0.028423309326171875, -0.0208587646484375, -0.013294219970703125, -0.00572967529296875, 0.001834869384765625, 0.0093994140625, 0.016963958740234375, 0.02452850341796875, 0.032093048095703125, 0.0396575927734375, 0.047222137451171875, 0.05478668212890625, 0.062351226806640625, 0.069915771484375, 0.07748031616210938, 0.08504486083984375, 0.09260940551757812, 0.1001739501953125, 0.10773849487304688, 0.11530303955078125, 0.12286758422851562, 0.13043212890625, 0.13799667358398438, 0.14556121826171875, 0.15312576293945312, 0.1606903076171875, 0.16825485229492188, 0.17581939697265625, 0.18338394165039062, 0.190948486328125, 0.19851303100585938, 0.20607757568359375, 0.21364212036132812, 0.2212066650390625, 0.22877120971679688, 0.23633575439453125, 0.24390029907226562, 0.25146484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 25.0, 44.0, 119.0, 189.0, 286.0, 170.0, 75.0, 36.0, 17.0, 11.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.636467933654785, -9.363018035888672, -9.089569091796875, -8.816119194030762, -8.542670249938965, -8.269220352172852, -7.9957709312438965, -7.722321510314941, -7.448872089385986, -7.175422668457031, -6.901973247528076, -6.628523826599121, -6.355073928833008, -6.081624984741211, -5.808175086975098, -5.534725666046143, -5.2612762451171875, -4.987826824188232, -4.714377403259277, -4.440927982330322, -4.167478561401367, -3.894028902053833, -3.620579242706299, -3.3471298217773438, -3.0736804008483887, -2.8002309799194336, -2.5267815589904785, -2.2533318996429443, -1.9798824787139893, -1.7064330577850342, -1.4329835176467896, -1.159533977508545, -0.886085033416748, -0.6126355528831482, -0.33918607234954834, -0.06573659181594849, 0.20771288871765137, 0.48116230964660645, 0.7546118497848511, 1.0280613899230957, 1.3015108108520508, 1.5749602317810059, 1.8484097719192505, 2.121859312057495, 2.39530873298645, 2.6687581539154053, 2.9422078132629395, 3.2156572341918945, 3.4891066551208496, 3.7625560760498047, 4.03600549697876, 4.309454917907715, 4.582904815673828, 4.856353759765625, 5.129803657531738, 5.403253078460693, 5.676702499389648, 5.9501519203186035, 6.223601341247559, 6.497050762176514, 6.770500183105469, 7.043950080871582, 7.317399501800537, 7.590848922729492, 7.864298343658447]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 10.0, 7.0, 13.0, 16.0, 12.0, 14.0, 14.0, 33.0, 20.0, 23.0, 25.0, 39.0, 28.0, 28.0, 41.0, 50.0, 56.0, 61.0, 61.0, 49.0, 51.0, 34.0, 30.0, 40.0, 32.0, 26.0, 28.0, 25.0, 22.0, 17.0, 15.0, 9.0, 12.0, 5.0, 11.0, 11.0, 4.0, 2.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4706637859344482, -3.365431785583496, -3.260199546813965, -3.1549675464630127, -3.0497355461120605, -2.9445033073425293, -2.839271306991577, -2.734039306640625, -2.628807306289673, -2.5235753059387207, -2.4183430671691895, -2.3131110668182373, -2.207879066467285, -2.102646827697754, -1.9974148273468018, -1.8921828269958496, -1.786950707435608, -1.6817185878753662, -1.576486587524414, -1.4712544679641724, -1.3660224676132202, -1.2607903480529785, -1.1555583477020264, -1.0503262281417847, -0.9450941681861877, -0.8398621082305908, -0.7346300482749939, -0.629397988319397, -0.5241658687591553, -0.41893380880355835, -0.3137017488479614, -0.2084696888923645, -0.10323762893676758, 0.0019944384694099426, 0.10722650587558746, 0.21245858073234558, 0.3176906406879425, 0.4229227304458618, 0.5281547904014587, 0.6333868503570557, 0.7386189103126526, 0.8438509702682495, 0.9490830302238464, 1.0543150901794434, 1.159547209739685, 1.2647793292999268, 1.370011329650879, 1.475243330001831, 1.5804754495620728, 1.6857075691223145, 1.7909395694732666, 1.8961716890335083, 2.00140380859375, 2.106635808944702, 2.2118678092956543, 2.3171000480651855, 2.4223320484161377, 2.52756404876709, 2.632796287536621, 2.7380282878875732, 2.8432602882385254, 2.9484925270080566, 3.053724527359009, 3.158956527709961, 3.264188528060913]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 15.0, 16.0, 27.0, 30.0, 57.0, 83.0, 127.0, 205.0, 350.0, 750.0, 1256.0, 2286.0, 4524.0, 9601.0, 21822.0, 56463.0, 198282.0, 1026061.0, 2146598.0, 537878.0, 119089.0, 38364.0, 15695.0, 6954.0, 3544.0, 1804.0, 981.0, 528.0, 325.0, 194.0, 122.0, 73.0, 52.0, 32.0, 27.0, 16.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2354736328125, -0.2277050018310547, -0.21993637084960938, -0.21216773986816406, -0.20439910888671875, -0.19663047790527344, -0.18886184692382812, -0.1810932159423828, -0.1733245849609375, -0.1655559539794922, -0.15778732299804688, -0.15001869201660156, -0.14225006103515625, -0.13448143005371094, -0.12671279907226562, -0.11894416809082031, -0.111175537109375, -0.10340690612792969, -0.09563827514648438, -0.08786964416503906, -0.08010101318359375, -0.07233238220214844, -0.06456375122070312, -0.05679512023925781, -0.0490264892578125, -0.04125785827636719, -0.033489227294921875, -0.025720596313476562, -0.01795196533203125, -0.010183334350585938, -0.002414703369140625, 0.0053539276123046875, 0.01312255859375, 0.020891189575195312, 0.028659820556640625, 0.03642845153808594, 0.04419708251953125, 0.05196571350097656, 0.059734344482421875, 0.06750297546386719, 0.0752716064453125, 0.08304023742675781, 0.09080886840820312, 0.09857749938964844, 0.10634613037109375, 0.11411476135253906, 0.12188339233398438, 0.1296520233154297, 0.137420654296875, 0.1451892852783203, 0.15295791625976562, 0.16072654724121094, 0.16849517822265625, 0.17626380920410156, 0.18403244018554688, 0.1918010711669922, 0.1995697021484375, 0.2073383331298828, 0.21510696411132812, 0.22287559509277344, 0.23064422607421875, 0.23841285705566406, 0.24618148803710938, 0.2539501190185547, 0.26171875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 12.0, 9.0, 6.0, 15.0, 13.0, 20.0, 30.0, 23.0, 24.0, 29.0, 25.0, 20.0, 37.0, 37.0, 29.0, 45.0, 46.0, 38.0, 42.0, 37.0, 38.0, 35.0, 48.0, 39.0, 37.0, 31.0, 29.0, 22.0, 19.0, 24.0, 18.0, 22.0, 21.0, 9.0, 10.0, 11.0, 10.0, 8.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.16357421875, -0.15834617614746094, -0.15311813354492188, -0.1478900909423828, -0.14266204833984375, -0.1374340057373047, -0.13220596313476562, -0.12697792053222656, -0.1217498779296875, -0.11652183532714844, -0.11129379272460938, -0.10606575012207031, -0.10083770751953125, -0.09560966491699219, -0.09038162231445312, -0.08515357971191406, -0.079925537109375, -0.07469749450683594, -0.06946945190429688, -0.06424140930175781, -0.05901336669921875, -0.05378532409667969, -0.048557281494140625, -0.04332923889160156, -0.0381011962890625, -0.03287315368652344, -0.027645111083984375, -0.022417068481445312, -0.01718902587890625, -0.011960983276367188, -0.006732940673828125, -0.0015048980712890625, 0.00372314453125, 0.008951187133789062, 0.014179229736328125, 0.019407272338867188, 0.02463531494140625, 0.029863357543945312, 0.035091400146484375, 0.04031944274902344, 0.0455474853515625, 0.05077552795410156, 0.056003570556640625, 0.06123161315917969, 0.06645965576171875, 0.07168769836425781, 0.07691574096679688, 0.08214378356933594, 0.087371826171875, 0.09259986877441406, 0.09782791137695312, 0.10305595397949219, 0.10828399658203125, 0.11351203918457031, 0.11874008178710938, 0.12396812438964844, 0.1291961669921875, 0.13442420959472656, 0.13965225219726562, 0.1448802947998047, 0.15010833740234375, 0.1553363800048828, 0.16056442260742188, 0.16579246520996094, 0.1710205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 8.0, 10.0, 17.0, 29.0, 28.0, 59.0, 110.0, 219.0, 468.0, 1076.0, 3079.0, 11437.0, 60609.0, 929045.0, 3037698.0, 125540.0, 17772.0, 4363.0, 1470.0, 606.0, 256.0, 146.0, 81.0, 52.0, 27.0, 23.0, 11.0, 16.0, 10.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.77197265625, -0.750030517578125, -0.72808837890625, -0.706146240234375, -0.6842041015625, -0.662261962890625, -0.64031982421875, -0.618377685546875, -0.596435546875, -0.574493408203125, -0.55255126953125, -0.530609130859375, -0.5086669921875, -0.486724853515625, -0.46478271484375, -0.442840576171875, -0.4208984375, -0.398956298828125, -0.37701416015625, -0.355072021484375, -0.3331298828125, -0.311187744140625, -0.28924560546875, -0.267303466796875, -0.245361328125, -0.223419189453125, -0.20147705078125, -0.179534912109375, -0.1575927734375, -0.135650634765625, -0.11370849609375, -0.091766357421875, -0.06982421875, -0.047882080078125, -0.02593994140625, -0.003997802734375, 0.0179443359375, 0.039886474609375, 0.06182861328125, 0.083770751953125, 0.105712890625, 0.127655029296875, 0.14959716796875, 0.171539306640625, 0.1934814453125, 0.215423583984375, 0.23736572265625, 0.259307861328125, 0.28125, 0.303192138671875, 0.32513427734375, 0.347076416015625, 0.3690185546875, 0.390960693359375, 0.41290283203125, 0.434844970703125, 0.456787109375, 0.478729248046875, 0.50067138671875, 0.522613525390625, 0.5445556640625, 0.566497802734375, 0.58843994140625, 0.610382080078125, 0.63232421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 12.0, 19.0, 24.0, 26.0, 32.0, 35.0, 75.0, 90.0, 115.0, 228.0, 444.0, 648.0, 786.0, 569.0, 344.0, 190.0, 121.0, 85.0, 53.0, 47.0, 34.0, 25.0, 7.0, 13.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5054855346679688, -0.4855804443359375, -0.46567535400390625, -0.445770263671875, -0.42586517333984375, -0.4059600830078125, -0.38605499267578125, -0.36614990234375, -0.34624481201171875, -0.3263397216796875, -0.30643463134765625, -0.286529541015625, -0.26662445068359375, -0.2467193603515625, -0.22681427001953125, -0.2069091796875, -0.18700408935546875, -0.1670989990234375, -0.14719390869140625, -0.127288818359375, -0.10738372802734375, -0.0874786376953125, -0.06757354736328125, -0.04766845703125, -0.02776336669921875, -0.0078582763671875, 0.01204681396484375, 0.031951904296875, 0.05185699462890625, 0.0717620849609375, 0.09166717529296875, 0.111572265625, 0.13147735595703125, 0.1513824462890625, 0.17128753662109375, 0.191192626953125, 0.21109771728515625, 0.2310028076171875, 0.25090789794921875, 0.27081298828125, 0.29071807861328125, 0.3106231689453125, 0.33052825927734375, 0.350433349609375, 0.37033843994140625, 0.3902435302734375, 0.41014862060546875, 0.4300537109375, 0.44995880126953125, 0.4698638916015625, 0.48976898193359375, 0.509674072265625, 0.5295791625976562, 0.5494842529296875, 0.5693893432617188, 0.58929443359375, 0.6091995239257812, 0.6291046142578125, 0.6490097045898438, 0.668914794921875, 0.6888198852539062, 0.7087249755859375, 0.7286300659179688, 0.74853515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 14.0, 18.0, 48.0, 73.0, 161.0, 188.0, 205.0, 141.0, 59.0, 31.0, 15.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.089385032653809, -7.897246837615967, -7.705108642578125, -7.512970447540283, -7.320832252502441, -7.128694534301758, -6.936555862426758, -6.744418144226074, -6.552279949188232, -6.360141754150391, -6.168003559112549, -5.975865364074707, -5.783727169036865, -5.591588973999023, -5.39945125579834, -5.207313060760498, -5.015174865722656, -4.8230366706848145, -4.630898475646973, -4.438760280609131, -4.246622085571289, -4.0544843673706055, -3.8623459339141846, -3.670207977294922, -3.478069305419922, -3.28593111038208, -3.0937929153442383, -2.9016547203063965, -2.709516763687134, -2.517378568649292, -2.32524037361145, -2.1331024169921875, -1.9409642219543457, -1.748826026916504, -1.5566879510879517, -1.3645497560501099, -1.1724116802215576, -0.9802734851837158, -0.788135290145874, -0.5959972143173218, -0.40385901927948, -0.21172086894512177, -0.01958271861076355, 0.17255544662475586, 0.3646935820579529, 0.5568317174911499, 0.7489699125289917, 0.941107988357544, 1.1332461833953857, 1.3253843784332275, 1.5175224542617798, 1.7096606492996216, 1.9017987251281738, 2.0939369201660156, 2.2860751152038574, 2.478213310241699, 2.670351505279541, 2.862489700317383, 3.0546278953552246, 3.2467660903930664, 3.438904047012329, 3.631042242050171, 3.8231804370880127, 4.015318393707275, 4.207456588745117]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 5.0, 12.0, 7.0, 16.0, 9.0, 20.0, 22.0, 28.0, 36.0, 37.0, 48.0, 47.0, 38.0, 60.0, 53.0, 71.0, 53.0, 56.0, 45.0, 58.0, 45.0, 44.0, 35.0, 32.0, 27.0, 11.0, 15.0, 14.0, 9.0, 8.0, 12.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.811023712158203, -2.7054712772369385, -2.5999186038970947, -2.49436616897583, -2.3888137340545654, -2.283261299133301, -2.177708625793457, -2.0721561908721924, -1.9666036367416382, -1.861051082611084, -1.7554986476898193, -1.6499460935592651, -1.544393539428711, -1.4388411045074463, -1.333288550376892, -1.227735996246338, -1.1221835613250732, -1.016631007194519, -0.9110785722732544, -0.8055260181427002, -0.6999735236167908, -0.5944210290908813, -0.48886847496032715, -0.3833159804344177, -0.2777634859085083, -0.17221097648143768, -0.06665846705436707, 0.038894057273864746, 0.14444655179977417, 0.2499990463256836, 0.3555516004562378, 0.4611040949821472, 0.5666563510894775, 0.672208845615387, 0.7777613401412964, 0.8833138942718506, 0.98886638879776, 1.0944188833236694, 1.1999714374542236, 1.3055238723754883, 1.4110764265060425, 1.5166289806365967, 1.6221814155578613, 1.7277339696884155, 1.8332865238189697, 1.9388389587402344, 2.044391632080078, 2.1499440670013428, 2.2554965019226074, 2.361048936843872, 2.466601610183716, 2.5721540451049805, 2.677706480026245, 2.7832589149475098, 2.8888115882873535, 2.994364023208618, 3.099916458129883, 3.2054688930511475, 3.311021566390991, 3.416574001312256, 3.5221264362335205, 3.627678871154785, 3.733231544494629, 3.8387839794158936, 3.9443366527557373]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 13.0, 16.0, 22.0, 21.0, 46.0, 67.0, 98.0, 156.0, 240.0, 330.0, 533.0, 809.0, 1398.0, 2214.0, 3913.0, 7064.0, 13934.0, 28905.0, 67016.0, 175969.0, 376958.0, 217251.0, 81846.0, 34557.0, 16136.0, 8149.0, 4374.0, 2401.0, 1501.0, 872.0, 562.0, 358.0, 266.0, 175.0, 119.0, 78.0, 63.0, 28.0, 32.0, 27.0, 9.0, 5.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3190574645996094, -0.30828094482421875, -0.2975044250488281, -0.2867279052734375, -0.2759513854980469, -0.26517486572265625, -0.2543983459472656, -0.243621826171875, -0.23284530639648438, -0.22206878662109375, -0.21129226684570312, -0.2005157470703125, -0.18973922729492188, -0.17896270751953125, -0.16818618774414062, -0.15740966796875, -0.14663314819335938, -0.13585662841796875, -0.12508010864257812, -0.1143035888671875, -0.10352706909179688, -0.09275054931640625, -0.08197402954101562, -0.071197509765625, -0.060420989990234375, -0.04964447021484375, -0.038867950439453125, -0.0280914306640625, -0.017314910888671875, -0.00653839111328125, 0.004238128662109375, 0.0150146484375, 0.025791168212890625, 0.03656768798828125, 0.047344207763671875, 0.0581207275390625, 0.06889724731445312, 0.07967376708984375, 0.09045028686523438, 0.101226806640625, 0.11200332641601562, 0.12277984619140625, 0.13355636596679688, 0.1443328857421875, 0.15510940551757812, 0.16588592529296875, 0.17666244506835938, 0.18743896484375, 0.19821548461914062, 0.20899200439453125, 0.21976852416992188, 0.2305450439453125, 0.24132156372070312, 0.25209808349609375, 0.2628746032714844, 0.273651123046875, 0.2844276428222656, 0.29520416259765625, 0.3059806823730469, 0.3167572021484375, 0.3275337219238281, 0.33831024169921875, 0.3490867614746094, 0.35986328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 6.0, 4.0, 4.0, 13.0, 10.0, 20.0, 23.0, 19.0, 26.0, 20.0, 28.0, 28.0, 34.0, 28.0, 41.0, 34.0, 40.0, 38.0, 40.0, 37.0, 36.0, 39.0, 40.0, 40.0, 41.0, 41.0, 37.0, 26.0, 28.0, 22.0, 29.0, 19.0, 12.0, 14.0, 9.0, 14.0, 8.0, 4.0, 6.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1807861328125, -0.17522621154785156, -0.16966629028320312, -0.1641063690185547, -0.15854644775390625, -0.1529865264892578, -0.14742660522460938, -0.14186668395996094, -0.1363067626953125, -0.13074684143066406, -0.12518692016601562, -0.11962699890136719, -0.11406707763671875, -0.10850715637207031, -0.10294723510742188, -0.09738731384277344, -0.091827392578125, -0.08626747131347656, -0.08070755004882812, -0.07514762878417969, -0.06958770751953125, -0.06402778625488281, -0.058467864990234375, -0.05290794372558594, -0.0473480224609375, -0.04178810119628906, -0.036228179931640625, -0.030668258666992188, -0.02510833740234375, -0.019548416137695312, -0.013988494873046875, -0.008428573608398438, -0.00286865234375, 0.0026912689208984375, 0.008251190185546875, 0.013811111450195312, 0.01937103271484375, 0.024930953979492188, 0.030490875244140625, 0.03605079650878906, 0.0416107177734375, 0.04717063903808594, 0.052730560302734375, 0.05829048156738281, 0.06385040283203125, 0.06941032409667969, 0.07497024536132812, 0.08053016662597656, 0.086090087890625, 0.09165000915527344, 0.09720993041992188, 0.10276985168457031, 0.10832977294921875, 0.11388969421386719, 0.11944961547851562, 0.12500953674316406, 0.1305694580078125, 0.13612937927246094, 0.14168930053710938, 0.1472492218017578, 0.15280914306640625, 0.1583690643310547, 0.16392898559570312, 0.16948890686035156, 0.175048828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 2.0, 5.0, 9.0, 17.0, 22.0, 40.0, 48.0, 45.0, 70.0, 116.0, 202.0, 313.0, 528.0, 1003.0, 2219.0, 6539.0, 33606.0, 633257.0, 334903.0, 25942.0, 5377.0, 1930.0, 969.0, 519.0, 282.0, 190.0, 134.0, 72.0, 52.0, 36.0, 26.0, 19.0, 17.0, 13.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.814971923828125, -0.78228759765625, -0.749603271484375, -0.7169189453125, -0.684234619140625, -0.65155029296875, -0.618865966796875, -0.586181640625, -0.553497314453125, -0.52081298828125, -0.488128662109375, -0.4554443359375, -0.422760009765625, -0.39007568359375, -0.357391357421875, -0.32470703125, -0.292022705078125, -0.25933837890625, -0.226654052734375, -0.1939697265625, -0.161285400390625, -0.12860107421875, -0.095916748046875, -0.063232421875, -0.030548095703125, 0.00213623046875, 0.034820556640625, 0.0675048828125, 0.100189208984375, 0.13287353515625, 0.165557861328125, 0.1982421875, 0.230926513671875, 0.26361083984375, 0.296295166015625, 0.3289794921875, 0.361663818359375, 0.39434814453125, 0.427032470703125, 0.459716796875, 0.492401123046875, 0.52508544921875, 0.557769775390625, 0.5904541015625, 0.623138427734375, 0.65582275390625, 0.688507080078125, 0.72119140625, 0.753875732421875, 0.78656005859375, 0.819244384765625, 0.8519287109375, 0.884613037109375, 0.91729736328125, 0.949981689453125, 0.982666015625, 1.015350341796875, 1.04803466796875, 1.080718994140625, 1.1134033203125, 1.146087646484375, 1.17877197265625, 1.211456298828125, 1.244140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 1.0, 6.0, 7.0, 2.0, 12.0, 15.0, 24.0, 25.0, 27.0, 29.0, 39.0, 47.0, 58.0, 56.0, 69.0, 71.0, 79.0, 62.0, 54.0, 47.0, 60.0, 42.0, 43.0, 37.0, 24.0, 10.0, 15.0, 16.0, 6.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.14300537109375, -1.1053466796875, -1.06768798828125, -1.030029296875, -0.99237060546875, -0.9547119140625, -0.91705322265625, -0.87939453125, -0.84173583984375, -0.8040771484375, -0.76641845703125, -0.728759765625, -0.69110107421875, -0.6534423828125, -0.61578369140625, -0.578125, -0.54046630859375, -0.5028076171875, -0.46514892578125, -0.427490234375, -0.38983154296875, -0.3521728515625, -0.31451416015625, -0.27685546875, -0.23919677734375, -0.2015380859375, -0.16387939453125, -0.126220703125, -0.08856201171875, -0.0509033203125, -0.01324462890625, 0.0244140625, 0.06207275390625, 0.0997314453125, 0.13739013671875, 0.175048828125, 0.21270751953125, 0.2503662109375, 0.28802490234375, 0.32568359375, 0.36334228515625, 0.4010009765625, 0.43865966796875, 0.476318359375, 0.51397705078125, 0.5516357421875, 0.58929443359375, 0.626953125, 0.66461181640625, 0.7022705078125, 0.73992919921875, 0.777587890625, 0.81524658203125, 0.8529052734375, 0.89056396484375, 0.92822265625, 0.96588134765625, 1.0035400390625, 1.04119873046875, 1.078857421875, 1.11651611328125, 1.1541748046875, 1.19183349609375, 1.2294921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 6.0, 9.0, 24.0, 28.0, 26.0, 52.0, 85.0, 149.0, 256.0, 432.0, 679.0, 1390.0, 3154.0, 8714.0, 30127.0, 147238.0, 674794.0, 138682.0, 28288.0, 8222.0, 3127.0, 1391.0, 650.0, 414.0, 190.0, 132.0, 81.0, 48.0, 47.0, 29.0, 24.0, 17.0, 5.0, 6.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.261962890625, -0.2541389465332031, -0.24631500244140625, -0.23849105834960938, -0.2306671142578125, -0.22284317016601562, -0.21501922607421875, -0.20719528198242188, -0.199371337890625, -0.19154739379882812, -0.18372344970703125, -0.17589950561523438, -0.1680755615234375, -0.16025161743164062, -0.15242767333984375, -0.14460372924804688, -0.13677978515625, -0.12895584106445312, -0.12113189697265625, -0.11330795288085938, -0.1054840087890625, -0.09766006469726562, -0.08983612060546875, -0.08201217651367188, -0.074188232421875, -0.06636428833007812, -0.05854034423828125, -0.050716400146484375, -0.0428924560546875, -0.035068511962890625, -0.02724456787109375, -0.019420623779296875, -0.0115966796875, -0.003772735595703125, 0.00405120849609375, 0.011875152587890625, 0.0196990966796875, 0.027523040771484375, 0.03534698486328125, 0.043170928955078125, 0.050994873046875, 0.058818817138671875, 0.06664276123046875, 0.07446670532226562, 0.0822906494140625, 0.09011459350585938, 0.09793853759765625, 0.10576248168945312, 0.11358642578125, 0.12141036987304688, 0.12923431396484375, 0.13705825805664062, 0.1448822021484375, 0.15270614624023438, 0.16053009033203125, 0.16835403442382812, 0.176177978515625, 0.18400192260742188, 0.19182586669921875, 0.19964981079101562, 0.2074737548828125, 0.21529769897460938, 0.22312164306640625, 0.23094558715820312, 0.23876953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 5.0, 9.0, 9.0, 13.0, 13.0, 18.0, 18.0, 29.0, 38.0, 46.0, 74.0, 98.0, 121.0, 116.0, 108.0, 74.0, 51.0, 39.0, 35.0, 21.0, 18.0, 12.0, 11.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0001061558723449707, -0.00010344944894313812, -0.00010074302554130554, -9.803660213947296e-05, -9.533017873764038e-05, -9.26237553358078e-05, -8.991733193397522e-05, -8.721090853214264e-05, -8.450448513031006e-05, -8.179806172847748e-05, -7.90916383266449e-05, -7.638521492481232e-05, -7.367879152297974e-05, -7.097236812114716e-05, -6.826594471931458e-05, -6.5559521317482e-05, -6.285309791564941e-05, -6.0146674513816833e-05, -5.744025111198425e-05, -5.473382771015167e-05, -5.202740430831909e-05, -4.932098090648651e-05, -4.661455750465393e-05, -4.390813410282135e-05, -4.120171070098877e-05, -3.849528729915619e-05, -3.578886389732361e-05, -3.308244049549103e-05, -3.0376017093658447e-05, -2.7669593691825867e-05, -2.4963170289993286e-05, -2.2256746888160706e-05, -1.9550323486328125e-05, -1.6843900084495544e-05, -1.4137476682662964e-05, -1.1431053280830383e-05, -8.724629878997803e-06, -6.018206477165222e-06, -3.3117830753326416e-06, -6.05359673500061e-07, 2.1010637283325195e-06, 4.8074871301651e-06, 7.513910531997681e-06, 1.0220333933830261e-05, 1.2926757335662842e-05, 1.5633180737495422e-05, 1.8339604139328003e-05, 2.1046027541160583e-05, 2.3752450942993164e-05, 2.6458874344825745e-05, 2.9165297746658325e-05, 3.1871721148490906e-05, 3.4578144550323486e-05, 3.728456795215607e-05, 3.999099135398865e-05, 4.269741475582123e-05, 4.540383815765381e-05, 4.811026155948639e-05, 5.081668496131897e-05, 5.352310836315155e-05, 5.622953176498413e-05, 5.893595516681671e-05, 6.164237856864929e-05, 6.434880197048187e-05, 6.705522537231445e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 5.0, 0.0, 4.0, 5.0, 5.0, 4.0, 15.0, 13.0, 20.0, 35.0, 33.0, 44.0, 71.0, 134.0, 204.0, 330.0, 515.0, 974.0, 1879.0, 4443.0, 13318.0, 58731.0, 506193.0, 384495.0, 55569.0, 12782.0, 4418.0, 1902.0, 949.0, 558.0, 289.0, 215.0, 146.0, 65.0, 46.0, 46.0, 32.0, 19.0, 15.0, 8.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2410888671875, -0.2337799072265625, -0.226470947265625, -0.2191619873046875, -0.21185302734375, -0.2045440673828125, -0.197235107421875, -0.1899261474609375, -0.1826171875, -0.1753082275390625, -0.167999267578125, -0.1606903076171875, -0.15338134765625, -0.1460723876953125, -0.138763427734375, -0.1314544677734375, -0.1241455078125, -0.1168365478515625, -0.109527587890625, -0.1022186279296875, -0.09490966796875, -0.0876007080078125, -0.080291748046875, -0.0729827880859375, -0.065673828125, -0.0583648681640625, -0.051055908203125, -0.0437469482421875, -0.03643798828125, -0.0291290283203125, -0.021820068359375, -0.0145111083984375, -0.0072021484375, 0.0001068115234375, 0.007415771484375, 0.0147247314453125, 0.02203369140625, 0.0293426513671875, 0.036651611328125, 0.0439605712890625, 0.05126953125, 0.0585784912109375, 0.065887451171875, 0.0731964111328125, 0.08050537109375, 0.0878143310546875, 0.095123291015625, 0.1024322509765625, 0.1097412109375, 0.1170501708984375, 0.124359130859375, 0.1316680908203125, 0.13897705078125, 0.1462860107421875, 0.153594970703125, 0.1609039306640625, 0.168212890625, 0.1755218505859375, 0.182830810546875, 0.1901397705078125, 0.19744873046875, 0.2047576904296875, 0.212066650390625, 0.2193756103515625, 0.2266845703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 4.0, 12.0, 16.0, 13.0, 20.0, 34.0, 41.0, 56.0, 75.0, 101.0, 108.0, 91.0, 109.0, 93.0, 58.0, 44.0, 29.0, 25.0, 20.0, 7.0, 8.0, 7.0, 10.0, 9.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219970703125, -0.21078109741210938, -0.20159149169921875, -0.19240188598632812, -0.1832122802734375, -0.17402267456054688, -0.16483306884765625, -0.15564346313476562, -0.146453857421875, -0.13726425170898438, -0.12807464599609375, -0.11888504028320312, -0.1096954345703125, -0.10050582885742188, -0.09131622314453125, -0.08212661743164062, -0.07293701171875, -0.06374740600585938, -0.05455780029296875, -0.045368194580078125, -0.0361785888671875, -0.026988983154296875, -0.01779937744140625, -0.008609771728515625, 0.000579833984375, 0.009769439697265625, 0.01895904541015625, 0.028148651123046875, 0.0373382568359375, 0.046527862548828125, 0.05571746826171875, 0.06490707397460938, 0.0740966796875, 0.08328628540039062, 0.09247589111328125, 0.10166549682617188, 0.1108551025390625, 0.12004470825195312, 0.12923431396484375, 0.13842391967773438, 0.147613525390625, 0.15680313110351562, 0.16599273681640625, 0.17518234252929688, 0.1843719482421875, 0.19356155395507812, 0.20275115966796875, 0.21194076538085938, 0.22113037109375, 0.23031997680664062, 0.23950958251953125, 0.24869918823242188, 0.2578887939453125, 0.2670783996582031, 0.27626800537109375, 0.2854576110839844, 0.294647216796875, 0.3038368225097656, 0.31302642822265625, 0.3222160339355469, 0.3314056396484375, 0.3405952453613281, 0.34978485107421875, 0.3589744567871094, 0.3681640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 16.0, 31.0, 46.0, 80.0, 104.0, 175.0, 184.0, 126.0, 82.0, 49.0, 29.0, 22.0, 8.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-5.8701324462890625, -5.723775386810303, -5.577418327331543, -5.431060791015625, -5.284703731536865, -5.1383466720581055, -4.9919891357421875, -4.845632076263428, -4.699275016784668, -4.552917957305908, -4.406560897827148, -4.2602033615112305, -4.113846302032471, -3.967489242553711, -3.821131944656372, -3.674774646759033, -3.5284175872802734, -3.3820605278015137, -3.235703229904175, -3.089345932006836, -2.942988872528076, -2.7966318130493164, -2.6502745151519775, -2.5039172172546387, -2.357560157775879, -2.211203098297119, -2.0648458003997803, -1.918488621711731, -1.7721314430236816, -1.6257742643356323, -1.479417085647583, -1.3330599069595337, -1.1867024898529053, -1.040345311164856, -0.8939881324768066, -0.7476309537887573, -0.601273775100708, -0.4549165964126587, -0.3085594177246094, -0.16220223903656006, -0.015845060348510742, 0.13051211833953857, 0.2768692970275879, 0.4232264757156372, 0.5695836544036865, 0.7159408330917358, 0.8622980117797852, 1.0086551904678345, 1.1550123691558838, 1.301369547843933, 1.4477267265319824, 1.5940839052200317, 1.740441083908081, 1.8867982625961304, 2.0331554412841797, 2.1795125007629395, 2.3258697986602783, 2.472227096557617, 2.618584156036377, 2.7649412155151367, 2.9112985134124756, 3.0576558113098145, 3.204012870788574, 3.350369930267334, 3.496727228164673]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 10.0, 11.0, 14.0, 19.0, 11.0, 20.0, 23.0, 23.0, 22.0, 30.0, 38.0, 30.0, 38.0, 32.0, 63.0, 72.0, 84.0, 80.0, 48.0, 48.0, 36.0, 23.0, 26.0, 22.0, 28.0, 20.0, 7.0, 22.0, 11.0, 16.0, 21.0, 6.0, 10.0, 8.0, 2.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.274181365966797, -4.14931058883667, -4.024440288543701, -3.899569511413574, -3.7746989727020264, -3.6498284339904785, -3.5249578952789307, -3.400087356567383, -3.275216579437256, -3.150346040725708, -3.02547550201416, -2.900604724884033, -2.7757341861724854, -2.6508636474609375, -2.5259931087493896, -2.401122570037842, -2.276252031326294, -2.151381492614746, -2.0265109539031982, -1.9016402959823608, -1.7767696380615234, -1.6518990993499756, -1.5270285606384277, -1.4021580219268799, -1.2772873640060425, -1.1524168252944946, -1.0275461673736572, -0.9026756286621094, -0.7778050303459167, -0.6529344320297241, -0.5280638933181763, -0.40319329500198364, -0.278322696685791, -0.15345211327075958, -0.02858152985572815, 0.09628903865814209, 0.22115963697433472, 0.34603023529052734, 0.4709007740020752, 0.5957713723182678, 0.7206419706344604, 0.8455125689506531, 0.9703831672668457, 1.0952537059783936, 1.2201242446899414, 1.3449949026107788, 1.4698654413223267, 1.594736099243164, 1.719606637954712, 1.8444771766662598, 1.9693478345870972, 2.0942182540893555, 2.2190890312194824, 2.3439595699310303, 2.468830108642578, 2.593700647354126, 2.718571186065674, 2.8434417247772217, 2.9683122634887695, 3.0931830406188965, 3.2180535793304443, 3.342924118041992, 3.46779465675354, 3.592665195465088, 3.717535972595215]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 15.0, 19.0, 30.0, 49.0, 61.0, 96.0, 163.0, 250.0, 422.0, 701.0, 1246.0, 2461.0, 5230.0, 12887.0, 38719.0, 181671.0, 1643660.0, 2003345.0, 232041.0, 44923.0, 14368.0, 5787.0, 2743.0, 1391.0, 743.0, 420.0, 276.0, 170.0, 122.0, 78.0, 50.0, 38.0, 20.0, 18.0, 14.0, 9.0, 13.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2666015625, -0.2574272155761719, -0.24825286865234375, -0.23907852172851562, -0.2299041748046875, -0.22072982788085938, -0.21155548095703125, -0.20238113403320312, -0.193206787109375, -0.18403244018554688, -0.17485809326171875, -0.16568374633789062, -0.1565093994140625, -0.14733505249023438, -0.13816070556640625, -0.12898635864257812, -0.11981201171875, -0.11063766479492188, -0.10146331787109375, -0.09228897094726562, -0.0831146240234375, -0.07394027709960938, -0.06476593017578125, -0.055591583251953125, -0.046417236328125, -0.037242889404296875, -0.02806854248046875, -0.018894195556640625, -0.0097198486328125, -0.000545501708984375, 0.00862884521484375, 0.017803192138671875, 0.0269775390625, 0.036151885986328125, 0.04532623291015625, 0.054500579833984375, 0.0636749267578125, 0.07284927368164062, 0.08202362060546875, 0.09119796752929688, 0.100372314453125, 0.10954666137695312, 0.11872100830078125, 0.12789535522460938, 0.1370697021484375, 0.14624404907226562, 0.15541839599609375, 0.16459274291992188, 0.17376708984375, 0.18294143676757812, 0.19211578369140625, 0.20129013061523438, 0.2104644775390625, 0.21963882446289062, 0.22881317138671875, 0.23798751831054688, 0.247161865234375, 0.2563362121582031, 0.26551055908203125, 0.2746849060058594, 0.2838592529296875, 0.2930335998535156, 0.30220794677734375, 0.3113822937011719, 0.320556640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 12.0, 11.0, 12.0, 10.0, 10.0, 25.0, 26.0, 36.0, 41.0, 40.0, 29.0, 33.0, 39.0, 38.0, 48.0, 29.0, 58.0, 46.0, 45.0, 43.0, 36.0, 34.0, 39.0, 35.0, 39.0, 22.0, 19.0, 23.0, 13.0, 21.0, 11.0, 10.0, 11.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.18033218383789062, -0.17450714111328125, -0.16868209838867188, -0.1628570556640625, -0.15703201293945312, -0.15120697021484375, -0.14538192749023438, -0.139556884765625, -0.13373184204101562, -0.12790679931640625, -0.12208175659179688, -0.1162567138671875, -0.11043167114257812, -0.10460662841796875, -0.09878158569335938, -0.09295654296875, -0.08713150024414062, -0.08130645751953125, -0.07548141479492188, -0.0696563720703125, -0.06383132934570312, -0.05800628662109375, -0.052181243896484375, -0.046356201171875, -0.040531158447265625, -0.03470611572265625, -0.028881072998046875, -0.0230560302734375, -0.017230987548828125, -0.01140594482421875, -0.005580902099609375, 0.000244140625, 0.006069183349609375, 0.01189422607421875, 0.017719268798828125, 0.0235443115234375, 0.029369354248046875, 0.03519439697265625, 0.041019439697265625, 0.046844482421875, 0.052669525146484375, 0.05849456787109375, 0.06431961059570312, 0.0701446533203125, 0.07596969604492188, 0.08179473876953125, 0.08761978149414062, 0.09344482421875, 0.09926986694335938, 0.10509490966796875, 0.11091995239257812, 0.1167449951171875, 0.12257003784179688, 0.12839508056640625, 0.13422012329101562, 0.140045166015625, 0.14587020874023438, 0.15169525146484375, 0.15752029418945312, 0.1633453369140625, 0.16917037963867188, 0.17499542236328125, 0.18082046508789062, 0.1866455078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 5.0, 15.0, 33.0, 59.0, 198.0, 649.0, 4825.0, 154960.0, 3994572.0, 36118.0, 2225.0, 407.0, 113.0, 48.0, 23.0, 12.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.9121551513671875, -0.867279052734375, -0.8224029541015625, -0.77752685546875, -0.7326507568359375, -0.687774658203125, -0.6428985595703125, -0.5980224609375, -0.5531463623046875, -0.508270263671875, -0.4633941650390625, -0.41851806640625, -0.3736419677734375, -0.328765869140625, -0.2838897705078125, -0.239013671875, -0.1941375732421875, -0.149261474609375, -0.1043853759765625, -0.05950927734375, -0.0146331787109375, 0.030242919921875, 0.0751190185546875, 0.1199951171875, 0.1648712158203125, 0.209747314453125, 0.2546234130859375, 0.29949951171875, 0.3443756103515625, 0.389251708984375, 0.4341278076171875, 0.47900390625, 0.5238800048828125, 0.568756103515625, 0.6136322021484375, 0.65850830078125, 0.7033843994140625, 0.748260498046875, 0.7931365966796875, 0.8380126953125, 0.8828887939453125, 0.927764892578125, 0.9726409912109375, 1.01751708984375, 1.0623931884765625, 1.107269287109375, 1.1521453857421875, 1.197021484375, 1.2418975830078125, 1.286773681640625, 1.3316497802734375, 1.37652587890625, 1.4214019775390625, 1.466278076171875, 1.5111541748046875, 1.5560302734375, 1.6009063720703125, 1.645782470703125, 1.6906585693359375, 1.73553466796875, 1.7804107666015625, 1.825286865234375, 1.8701629638671875, 1.9150390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 13.0, 18.0, 17.0, 33.0, 43.0, 70.0, 120.0, 194.0, 450.0, 785.0, 1005.0, 591.0, 279.0, 154.0, 94.0, 61.0, 36.0, 29.0, 26.0, 12.0, 3.0, 8.0, 4.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7568359375, -0.7365188598632812, -0.7162017822265625, -0.6958847045898438, -0.675567626953125, -0.6552505493164062, -0.6349334716796875, -0.6146163940429688, -0.59429931640625, -0.5739822387695312, -0.5536651611328125, -0.5333480834960938, -0.513031005859375, -0.49271392822265625, -0.4723968505859375, -0.45207977294921875, -0.4317626953125, -0.41144561767578125, -0.3911285400390625, -0.37081146240234375, -0.350494384765625, -0.33017730712890625, -0.3098602294921875, -0.28954315185546875, -0.26922607421875, -0.24890899658203125, -0.2285919189453125, -0.20827484130859375, -0.187957763671875, -0.16764068603515625, -0.1473236083984375, -0.12700653076171875, -0.106689453125, -0.08637237548828125, -0.0660552978515625, -0.04573822021484375, -0.025421142578125, -0.00510406494140625, 0.0152130126953125, 0.03553009033203125, 0.05584716796875, 0.07616424560546875, 0.0964813232421875, 0.11679840087890625, 0.137115478515625, 0.15743255615234375, 0.1777496337890625, 0.19806671142578125, 0.2183837890625, 0.23870086669921875, 0.2590179443359375, 0.27933502197265625, 0.299652099609375, 0.31996917724609375, 0.3402862548828125, 0.36060333251953125, 0.38092041015625, 0.40123748779296875, 0.4215545654296875, 0.44187164306640625, 0.462188720703125, 0.48250579833984375, 0.5028228759765625, 0.5231399536132812, 0.54345703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 11.0, 44.0, 120.0, 192.0, 230.0, 189.0, 102.0, 47.0, 15.0, 10.0, 9.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.550397872924805, -6.359920978546143, -6.169444561004639, -5.978967666625977, -5.788491249084473, -5.5980143547058105, -5.407537937164307, -5.2170610427856445, -5.026584625244141, -4.8361077308654785, -4.645631313323975, -4.4551544189453125, -4.264678001403809, -4.0742011070251465, -3.8837246894836426, -3.6932477951049805, -3.5027711391448975, -3.3122944831848145, -3.1218178272247314, -2.9313411712646484, -2.7408645153045654, -2.5503878593444824, -2.3599109649658203, -2.1694345474243164, -1.9789577722549438, -1.7884811162948608, -1.5980044603347778, -1.4075276851654053, -1.2170510292053223, -1.0265743732452393, -0.8360977172851562, -0.6456210613250732, -0.45514440536499023, -0.2646677494049072, -0.07419106364250183, 0.11628562211990356, 0.3067622780799866, 0.4972389340400696, 0.6877156496047974, 0.8781923055648804, 1.0686689615249634, 1.2591456174850464, 1.4496222734451294, 1.640099048614502, 1.830575704574585, 2.021052360534668, 2.211529016494751, 2.402005672454834, 2.592482328414917, 2.782958984375, 2.973435640335083, 3.163912296295166, 3.354388952255249, 3.544865608215332, 3.735342502593994, 3.925818920135498, 4.11629581451416, 4.306772708892822, 4.497249126434326, 4.687726020812988, 4.878202438354492, 5.068679332733154, 5.259155750274658, 5.44963264465332, 5.640109062194824]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 8.0, 4.0, 10.0, 10.0, 11.0, 10.0, 12.0, 10.0, 15.0, 26.0, 23.0, 31.0, 35.0, 34.0, 41.0, 37.0, 30.0, 50.0, 59.0, 38.0, 52.0, 59.0, 32.0, 44.0, 31.0, 32.0, 32.0, 25.0, 35.0, 28.0, 19.0, 12.0, 9.0, 14.0, 16.0, 9.0, 14.0, 13.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8522539138793945, -1.790534496307373, -1.7288150787353516, -1.66709566116333, -1.6053762435913086, -1.543656826019287, -1.4819374084472656, -1.4202179908752441, -1.3584985733032227, -1.2967791557312012, -1.2350597381591797, -1.1733403205871582, -1.1116209030151367, -1.0499014854431152, -0.9881820678710938, -0.9264626502990723, -0.864743173122406, -0.8030237555503845, -0.741304337978363, -0.6795849204063416, -0.6178655028343201, -0.5561460256576538, -0.4944266378879547, -0.4327072203159332, -0.37098780274391174, -0.30926838517189026, -0.24754896759986877, -0.1858295351266861, -0.12411011755466461, -0.062390685081481934, -0.0006712675094604492, 0.061048150062561035, 0.12276756763458252, 0.184486985206604, 0.2462064027786255, 0.307925820350647, 0.36964523792266846, 0.43136468529701233, 0.4930841028690338, 0.5548034906387329, 0.6165229082107544, 0.6782423257827759, 0.7399617433547974, 0.8016811609268188, 0.8634005784988403, 0.9251199960708618, 0.9868394136428833, 1.0485588312149048, 1.1102783679962158, 1.1719977855682373, 1.2337172031402588, 1.2954366207122803, 1.3571560382843018, 1.4188754558563232, 1.4805948734283447, 1.5423142910003662, 1.6040337085723877, 1.6657531261444092, 1.7274725437164307, 1.7891919612884521, 1.8509113788604736, 1.9126307964324951, 1.9743502140045166, 2.036069631576538, 2.0977890491485596]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 3.0, 10.0, 16.0, 23.0, 37.0, 52.0, 76.0, 118.0, 206.0, 300.0, 503.0, 966.0, 1734.0, 3367.0, 6964.0, 15491.0, 41145.0, 121494.0, 328344.0, 331524.0, 123616.0, 42001.0, 15986.0, 7148.0, 3396.0, 1738.0, 940.0, 506.0, 322.0, 187.0, 112.0, 77.0, 56.0, 24.0, 22.0, 11.0, 11.0, 8.0, 5.0, 3.0, 4.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29811859130859375, -0.2893524169921875, -0.28058624267578125, -0.271820068359375, -0.26305389404296875, -0.2542877197265625, -0.24552154541015625, -0.23675537109375, -0.22798919677734375, -0.2192230224609375, -0.21045684814453125, -0.201690673828125, -0.19292449951171875, -0.1841583251953125, -0.17539215087890625, -0.1666259765625, -0.15785980224609375, -0.1490936279296875, -0.14032745361328125, -0.131561279296875, -0.12279510498046875, -0.1140289306640625, -0.10526275634765625, -0.09649658203125, -0.08773040771484375, -0.0789642333984375, -0.07019805908203125, -0.061431884765625, -0.05266571044921875, -0.0438995361328125, -0.03513336181640625, -0.0263671875, -0.01760101318359375, -0.0088348388671875, -6.866455078125e-05, 0.008697509765625, 0.01746368408203125, 0.0262298583984375, 0.03499603271484375, 0.04376220703125, 0.05252838134765625, 0.0612945556640625, 0.07006072998046875, 0.078826904296875, 0.08759307861328125, 0.0963592529296875, 0.10512542724609375, 0.1138916015625, 0.12265777587890625, 0.1314239501953125, 0.14019012451171875, 0.148956298828125, 0.15772247314453125, 0.1664886474609375, 0.17525482177734375, 0.18402099609375, 0.19278717041015625, 0.2015533447265625, 0.21031951904296875, 0.219085693359375, 0.22785186767578125, 0.2366180419921875, 0.24538421630859375, 0.254150390625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 13.0, 5.0, 14.0, 20.0, 20.0, 24.0, 20.0, 26.0, 34.0, 34.0, 38.0, 34.0, 28.0, 45.0, 35.0, 39.0, 38.0, 43.0, 49.0, 43.0, 52.0, 34.0, 36.0, 32.0, 31.0, 29.0, 22.0, 23.0, 18.0, 17.0, 19.0, 12.0, 6.0, 13.0, 7.0, 6.0, 6.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.20849609375, -0.2026805877685547, -0.19686508178710938, -0.19104957580566406, -0.18523406982421875, -0.17941856384277344, -0.17360305786132812, -0.1677875518798828, -0.1619720458984375, -0.1561565399169922, -0.15034103393554688, -0.14452552795410156, -0.13871002197265625, -0.13289451599121094, -0.12707901000976562, -0.12126350402832031, -0.115447998046875, -0.10963249206542969, -0.10381698608398438, -0.09800148010253906, -0.09218597412109375, -0.08637046813964844, -0.08055496215820312, -0.07473945617675781, -0.0689239501953125, -0.06310844421386719, -0.057292938232421875, -0.05147743225097656, -0.04566192626953125, -0.03984642028808594, -0.034030914306640625, -0.028215408325195312, -0.02239990234375, -0.016584396362304688, -0.010768890380859375, -0.0049533843994140625, 0.00086212158203125, 0.0066776275634765625, 0.012493133544921875, 0.018308639526367188, 0.0241241455078125, 0.029939651489257812, 0.035755157470703125, 0.04157066345214844, 0.04738616943359375, 0.05320167541503906, 0.059017181396484375, 0.06483268737792969, 0.070648193359375, 0.07646369934082031, 0.08227920532226562, 0.08809471130371094, 0.09391021728515625, 0.09972572326660156, 0.10554122924804688, 0.11135673522949219, 0.1171722412109375, 0.12298774719238281, 0.12880325317382812, 0.13461875915527344, 0.14043426513671875, 0.14624977111816406, 0.15206527709960938, 0.1578807830810547, 0.1636962890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 9.0, 14.0, 20.0, 18.0, 27.0, 45.0, 65.0, 108.0, 188.0, 366.0, 892.0, 2355.0, 8555.0, 55067.0, 707147.0, 242614.0, 23429.0, 4809.0, 1477.0, 655.0, 261.0, 165.0, 80.0, 48.0, 33.0, 29.0, 22.0, 10.0, 11.0, 5.0, 4.0, 3.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.555419921875, -0.5361328125, -0.516845703125, -0.49755859375, -0.478271484375, -0.458984375, -0.439697265625, -0.42041015625, -0.401123046875, -0.3818359375, -0.362548828125, -0.34326171875, -0.323974609375, -0.3046875, -0.285400390625, -0.26611328125, -0.246826171875, -0.2275390625, -0.208251953125, -0.18896484375, -0.169677734375, -0.150390625, -0.131103515625, -0.11181640625, -0.092529296875, -0.0732421875, -0.053955078125, -0.03466796875, -0.015380859375, 0.00390625, 0.023193359375, 0.04248046875, 0.061767578125, 0.0810546875, 0.100341796875, 0.11962890625, 0.138916015625, 0.158203125, 0.177490234375, 0.19677734375, 0.216064453125, 0.2353515625, 0.254638671875, 0.27392578125, 0.293212890625, 0.3125, 0.331787109375, 0.35107421875, 0.370361328125, 0.3896484375, 0.408935546875, 0.42822265625, 0.447509765625, 0.466796875, 0.486083984375, 0.50537109375, 0.524658203125, 0.5439453125, 0.563232421875, 0.58251953125, 0.601806640625, 0.62109375, 0.640380859375, 0.65966796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 7.0, 13.0, 12.0, 18.0, 20.0, 24.0, 23.0, 34.0, 39.0, 50.0, 62.0, 78.0, 72.0, 72.0, 69.0, 83.0, 81.0, 58.0, 48.0, 35.0, 26.0, 14.0, 19.0, 15.0, 11.0, 9.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.26953125, -1.234832763671875, -1.20013427734375, -1.165435791015625, -1.1307373046875, -1.096038818359375, -1.06134033203125, -1.026641845703125, -0.991943359375, -0.957244873046875, -0.92254638671875, -0.887847900390625, -0.8531494140625, -0.818450927734375, -0.78375244140625, -0.749053955078125, -0.71435546875, -0.679656982421875, -0.64495849609375, -0.610260009765625, -0.5755615234375, -0.540863037109375, -0.50616455078125, -0.471466064453125, -0.436767578125, -0.402069091796875, -0.36737060546875, -0.332672119140625, -0.2979736328125, -0.263275146484375, -0.22857666015625, -0.193878173828125, -0.1591796875, -0.124481201171875, -0.08978271484375, -0.055084228515625, -0.0203857421875, 0.014312744140625, 0.04901123046875, 0.083709716796875, 0.118408203125, 0.153106689453125, 0.18780517578125, 0.222503662109375, 0.2572021484375, 0.291900634765625, 0.32659912109375, 0.361297607421875, 0.39599609375, 0.430694580078125, 0.46539306640625, 0.500091552734375, 0.5347900390625, 0.569488525390625, 0.60418701171875, 0.638885498046875, 0.673583984375, 0.708282470703125, 0.74298095703125, 0.777679443359375, 0.8123779296875, 0.847076416015625, 0.88177490234375, 0.916473388671875, 0.951171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 8.0, 20.0, 16.0, 13.0, 32.0, 40.0, 106.0, 116.0, 194.0, 383.0, 922.0, 2554.0, 9414.0, 71371.0, 852835.0, 94550.0, 11164.0, 2796.0, 991.0, 441.0, 245.0, 108.0, 67.0, 48.0, 38.0, 18.0, 16.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.29613494873046875, -0.2853851318359375, -0.27463531494140625, -0.263885498046875, -0.25313568115234375, -0.2423858642578125, -0.23163604736328125, -0.22088623046875, -0.21013641357421875, -0.1993865966796875, -0.18863677978515625, -0.177886962890625, -0.16713714599609375, -0.1563873291015625, -0.14563751220703125, -0.1348876953125, -0.12413787841796875, -0.1133880615234375, -0.10263824462890625, -0.091888427734375, -0.08113861083984375, -0.0703887939453125, -0.05963897705078125, -0.04888916015625, -0.03813934326171875, -0.0273895263671875, -0.01663970947265625, -0.005889892578125, 0.00485992431640625, 0.0156097412109375, 0.02635955810546875, 0.037109375, 0.04785919189453125, 0.0586090087890625, 0.06935882568359375, 0.080108642578125, 0.09085845947265625, 0.1016082763671875, 0.11235809326171875, 0.12310791015625, 0.13385772705078125, 0.1446075439453125, 0.15535736083984375, 0.166107177734375, 0.17685699462890625, 0.1876068115234375, 0.19835662841796875, 0.2091064453125, 0.21985626220703125, 0.2306060791015625, 0.24135589599609375, 0.252105712890625, 0.26285552978515625, 0.2736053466796875, 0.28435516357421875, 0.29510498046875, 0.30585479736328125, 0.3166046142578125, 0.32735443115234375, 0.338104248046875, 0.34885406494140625, 0.3596038818359375, 0.37035369873046875, 0.381103515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 5.0, 10.0, 9.0, 8.0, 26.0, 130.0, 362.0, 312.0, 89.0, 22.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002465248107910156, -0.00024002045392990112, -0.00023351609706878662, -0.00022701174020767212, -0.00022050738334655762, -0.00021400302648544312, -0.0002074986696243286, -0.0002009943127632141, -0.0001944899559020996, -0.0001879855990409851, -0.0001814812421798706, -0.0001749768853187561, -0.0001684725284576416, -0.0001619681715965271, -0.0001554638147354126, -0.0001489594578742981, -0.0001424551010131836, -0.0001359507441520691, -0.0001294463872909546, -0.0001229420304298401, -0.00011643767356872559, -0.00010993331670761108, -0.00010342895984649658, -9.692460298538208e-05, -9.042024612426758e-05, -8.391588926315308e-05, -7.741153240203857e-05, -7.090717554092407e-05, -6.440281867980957e-05, -5.789846181869507e-05, -5.1394104957580566e-05, -4.4889748096466064e-05, -3.838539123535156e-05, -3.188103437423706e-05, -2.537667751312256e-05, -1.8872320652008057e-05, -1.2367963790893555e-05, -5.863606929779053e-06, 6.407499313354492e-07, 7.145106792449951e-06, 1.3649463653564453e-05, 2.0153820514678955e-05, 2.6658177375793457e-05, 3.316253423690796e-05, 3.966689109802246e-05, 4.617124795913696e-05, 5.2675604820251465e-05, 5.917996168136597e-05, 6.568431854248047e-05, 7.218867540359497e-05, 7.869303226470947e-05, 8.519738912582397e-05, 9.170174598693848e-05, 9.820610284805298e-05, 0.00010471045970916748, 0.00011121481657028198, 0.00011771917343139648, 0.00012422353029251099, 0.0001307278871536255, 0.00013723224401474, 0.0001437366008758545, 0.000150240957736969, 0.0001567453145980835, 0.000163249671459198, 0.0001697540283203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 10.0, 21.0, 21.0, 49.0, 54.0, 91.0, 144.0, 277.0, 528.0, 1245.0, 3312.0, 12206.0, 95870.0, 819944.0, 96386.0, 12570.0, 3375.0, 1201.0, 574.0, 272.0, 149.0, 91.0, 53.0, 32.0, 23.0, 15.0, 10.0, 7.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3056640625, -0.2956428527832031, -0.28562164306640625, -0.2756004333496094, -0.2655792236328125, -0.2555580139160156, -0.24553680419921875, -0.23551559448242188, -0.225494384765625, -0.21547317504882812, -0.20545196533203125, -0.19543075561523438, -0.1854095458984375, -0.17538833618164062, -0.16536712646484375, -0.15534591674804688, -0.14532470703125, -0.13530349731445312, -0.12528228759765625, -0.11526107788085938, -0.1052398681640625, -0.09521865844726562, -0.08519744873046875, -0.07517623901367188, -0.065155029296875, -0.055133819580078125, -0.04511260986328125, -0.035091400146484375, -0.0250701904296875, -0.015048980712890625, -0.00502777099609375, 0.004993438720703125, 0.0150146484375, 0.025035858154296875, 0.03505706787109375, 0.045078277587890625, 0.0550994873046875, 0.06512069702148438, 0.07514190673828125, 0.08516311645507812, 0.095184326171875, 0.10520553588867188, 0.11522674560546875, 0.12524795532226562, 0.1352691650390625, 0.14529037475585938, 0.15531158447265625, 0.16533279418945312, 0.17535400390625, 0.18537521362304688, 0.19539642333984375, 0.20541763305664062, 0.2154388427734375, 0.22546005249023438, 0.23548126220703125, 0.24550247192382812, 0.255523681640625, 0.2655448913574219, 0.27556610107421875, 0.2855873107910156, 0.2956085205078125, 0.3056297302246094, 0.31565093994140625, 0.3256721496582031, 0.335693359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 1.0, 5.0, 13.0, 10.0, 11.0, 19.0, 23.0, 44.0, 67.0, 106.0, 110.0, 127.0, 125.0, 97.0, 78.0, 44.0, 34.0, 23.0, 18.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24393463134765625, -0.2356719970703125, -0.22740936279296875, -0.219146728515625, -0.21088409423828125, -0.2026214599609375, -0.19435882568359375, -0.18609619140625, -0.17783355712890625, -0.1695709228515625, -0.16130828857421875, -0.153045654296875, -0.14478302001953125, -0.1365203857421875, -0.12825775146484375, -0.1199951171875, -0.11173248291015625, -0.1034698486328125, -0.09520721435546875, -0.086944580078125, -0.07868194580078125, -0.0704193115234375, -0.06215667724609375, -0.05389404296875, -0.04563140869140625, -0.0373687744140625, -0.02910614013671875, -0.020843505859375, -0.01258087158203125, -0.0043182373046875, 0.00394439697265625, 0.01220703125, 0.02046966552734375, 0.0287322998046875, 0.03699493408203125, 0.045257568359375, 0.05352020263671875, 0.0617828369140625, 0.07004547119140625, 0.07830810546875, 0.08657073974609375, 0.0948333740234375, 0.10309600830078125, 0.111358642578125, 0.11962127685546875, 0.1278839111328125, 0.13614654541015625, 0.1444091796875, 0.15267181396484375, 0.1609344482421875, 0.16919708251953125, 0.177459716796875, 0.18572235107421875, 0.1939849853515625, 0.20224761962890625, 0.21051025390625, 0.21877288818359375, 0.2270355224609375, 0.23529815673828125, 0.243560791015625, 0.25182342529296875, 0.2600860595703125, 0.26834869384765625, 0.276611328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 17.0, 101.0, 475.0, 303.0, 71.0, 22.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0348992347717285, -3.6630659103393555, -3.2912325859069824, -2.9193992614746094, -2.5475659370422363, -2.1757326126098633, -1.8038995265960693, -1.4320662021636963, -1.0602328777313232, -0.6883995532989502, -0.3165662884712219, 0.05526697635650635, 0.4271003007888794, 0.7989336252212524, 1.170766830444336, 1.542600154876709, 1.914433479309082, 2.286266803741455, 2.658100128173828, 3.029933452606201, 3.401766777038574, 3.7736001014709473, 4.14543342590332, 4.517266273498535, 4.889100074768066, 5.2609333992004395, 5.6327667236328125, 6.0046000480651855, 6.376433372497559, 6.748266696929932, 7.120100021362305, 7.4919328689575195, 7.863766670227051, 8.235599517822266, 8.607433319091797, 8.979266166687012, 9.351099967956543, 9.722932815551758, 10.094766616821289, 10.466599464416504, 10.838433265686035, 11.21026611328125, 11.582099914550781, 11.953932762145996, 12.325766563415527, 12.697599411010742, 13.069433212280273, 13.441266059875488, 13.813098907470703, 14.184931755065918, 14.55676555633545, 14.928598403930664, 15.300432205200195, 15.67226505279541, 16.044097900390625, 16.415931701660156, 16.787765502929688, 17.15959930419922, 17.531431198120117, 17.90326499938965, 18.27509880065918, 18.64693260192871, 19.01876449584961, 19.39059829711914, 19.762432098388672]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 6.0, 5.0, 12.0, 16.0, 16.0, 10.0, 11.0, 22.0, 21.0, 23.0, 25.0, 44.0, 34.0, 36.0, 49.0, 58.0, 79.0, 73.0, 66.0, 43.0, 42.0, 33.0, 37.0, 36.0, 23.0, 22.0, 24.0, 14.0, 21.0, 15.0, 11.0, 7.0, 14.0, 11.0, 5.0, 6.0, 3.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.664245843887329, -2.5767669677734375, -2.489287853240967, -2.401808977127075, -2.3143301010131836, -2.226851224899292, -2.1393723487854004, -2.0518932342529297, -1.964414358139038, -1.8769354820251465, -1.7894564867019653, -1.7019774913787842, -1.6144986152648926, -1.527019739151001, -1.4395407438278198, -1.3520617485046387, -1.264582872390747, -1.1771039962768555, -1.0896250009536743, -1.0021460056304932, -0.9146671295166016, -0.8271881937980652, -0.7397092580795288, -0.6522303223609924, -0.564751386642456, -0.4772724509239197, -0.3897935152053833, -0.3023145794868469, -0.21483564376831055, -0.12735670804977417, -0.03987777233123779, 0.047601163387298584, 0.13508033752441406, 0.22255927324295044, 0.3100382089614868, 0.3975171446800232, 0.48499608039855957, 0.572475016117096, 0.6599539518356323, 0.7474328875541687, 0.8349118232727051, 0.9223907589912415, 1.0098696947097778, 1.097348690032959, 1.1848275661468506, 1.2723064422607422, 1.3597854375839233, 1.4472644329071045, 1.534743309020996, 1.6222221851348877, 1.7097011804580688, 1.79718017578125, 1.8846590518951416, 1.9721379280090332, 2.059617042541504, 2.1470959186553955, 2.234574794769287, 2.3220536708831787, 2.4095325469970703, 2.497011661529541, 2.5844905376434326, 2.671969413757324, 2.759448528289795, 2.8469274044036865, 2.934406280517578]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 5.0, 26.0, 34.0, 47.0, 72.0, 155.0, 245.0, 442.0, 781.0, 1533.0, 2988.0, 6471.0, 16255.0, 58563.0, 374553.0, 2556402.0, 1002037.0, 126980.0, 28393.0, 9835.0, 4151.0, 2009.0, 1026.0, 533.0, 315.0, 187.0, 91.0, 51.0, 26.0, 22.0, 16.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.24271011352539062, -0.23395538330078125, -0.22520065307617188, -0.2164459228515625, -0.20769119262695312, -0.19893646240234375, -0.19018173217773438, -0.181427001953125, -0.17267227172851562, -0.16391754150390625, -0.15516281127929688, -0.1464080810546875, -0.13765335083007812, -0.12889862060546875, -0.12014389038085938, -0.11138916015625, -0.10263442993164062, -0.09387969970703125, -0.08512496948242188, -0.0763702392578125, -0.06761550903320312, -0.05886077880859375, -0.050106048583984375, -0.041351318359375, -0.032596588134765625, -0.02384185791015625, -0.015087127685546875, -0.0063323974609375, 0.002422332763671875, 0.01117706298828125, 0.019931793212890625, 0.0286865234375, 0.037441253662109375, 0.04619598388671875, 0.054950714111328125, 0.0637054443359375, 0.07246017456054688, 0.08121490478515625, 0.08996963500976562, 0.098724365234375, 0.10747909545898438, 0.11623382568359375, 0.12498855590820312, 0.1337432861328125, 0.14249801635742188, 0.15125274658203125, 0.16000747680664062, 0.16876220703125, 0.17751693725585938, 0.18627166748046875, 0.19502639770507812, 0.2037811279296875, 0.21253585815429688, 0.22129058837890625, 0.23004531860351562, 0.238800048828125, 0.24755477905273438, 0.25630950927734375, 0.2650642395019531, 0.2738189697265625, 0.2825736999511719, 0.29132843017578125, 0.3000831604003906, 0.308837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 9.0, 12.0, 13.0, 13.0, 18.0, 18.0, 31.0, 28.0, 36.0, 41.0, 37.0, 40.0, 36.0, 39.0, 36.0, 34.0, 43.0, 41.0, 40.0, 40.0, 44.0, 28.0, 30.0, 41.0, 35.0, 26.0, 26.0, 19.0, 20.0, 14.0, 12.0, 16.0, 7.0, 9.0, 10.0, 5.0, 1.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.190185546875, -0.18480491638183594, -0.17942428588867188, -0.1740436553955078, -0.16866302490234375, -0.1632823944091797, -0.15790176391601562, -0.15252113342285156, -0.1471405029296875, -0.14175987243652344, -0.13637924194335938, -0.1309986114501953, -0.12561798095703125, -0.12023735046386719, -0.11485671997070312, -0.10947608947753906, -0.104095458984375, -0.09871482849121094, -0.09333419799804688, -0.08795356750488281, -0.08257293701171875, -0.07719230651855469, -0.07181167602539062, -0.06643104553222656, -0.0610504150390625, -0.05566978454589844, -0.050289154052734375, -0.04490852355957031, -0.03952789306640625, -0.03414726257324219, -0.028766632080078125, -0.023386001586914062, -0.01800537109375, -0.012624740600585938, -0.007244110107421875, -0.0018634796142578125, 0.00351715087890625, 0.008897781372070312, 0.014278411865234375, 0.019659042358398438, 0.0250396728515625, 0.030420303344726562, 0.035800933837890625, 0.04118156433105469, 0.04656219482421875, 0.05194282531738281, 0.057323455810546875, 0.06270408630371094, 0.068084716796875, 0.07346534729003906, 0.07884597778320312, 0.08422660827636719, 0.08960723876953125, 0.09498786926269531, 0.10036849975585938, 0.10574913024902344, 0.1111297607421875, 0.11651039123535156, 0.12189102172851562, 0.1272716522216797, 0.13265228271484375, 0.1380329132080078, 0.14341354370117188, 0.14879417419433594, 0.1541748046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 13.0, 17.0, 22.0, 45.0, 136.0, 428.0, 2143.0, 43832.0, 4103546.0, 41382.0, 2050.0, 392.0, 136.0, 61.0, 34.0, 19.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6181640625, -1.568359375, -1.5185546875, -1.46875, -1.4189453125, -1.369140625, -1.3193359375, -1.26953125, -1.2197265625, -1.169921875, -1.1201171875, -1.0703125, -1.0205078125, -0.970703125, -0.9208984375, -0.87109375, -0.8212890625, -0.771484375, -0.7216796875, -0.671875, -0.6220703125, -0.572265625, -0.5224609375, -0.47265625, -0.4228515625, -0.373046875, -0.3232421875, -0.2734375, -0.2236328125, -0.173828125, -0.1240234375, -0.07421875, -0.0244140625, 0.025390625, 0.0751953125, 0.125, 0.1748046875, 0.224609375, 0.2744140625, 0.32421875, 0.3740234375, 0.423828125, 0.4736328125, 0.5234375, 0.5732421875, 0.623046875, 0.6728515625, 0.72265625, 0.7724609375, 0.822265625, 0.8720703125, 0.921875, 0.9716796875, 1.021484375, 1.0712890625, 1.12109375, 1.1708984375, 1.220703125, 1.2705078125, 1.3203125, 1.3701171875, 1.419921875, 1.4697265625, 1.51953125, 1.5693359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 5.0, 8.0, 2.0, 9.0, 11.0, 12.0, 21.0, 18.0, 42.0, 89.0, 207.0, 381.0, 814.0, 1168.0, 605.0, 292.0, 150.0, 87.0, 60.0, 32.0, 17.0, 16.0, 10.0, 5.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5037384033203125, -0.483062744140625, -0.4623870849609375, -0.44171142578125, -0.4210357666015625, -0.400360107421875, -0.3796844482421875, -0.3590087890625, -0.3383331298828125, -0.317657470703125, -0.2969818115234375, -0.27630615234375, -0.2556304931640625, -0.234954833984375, -0.2142791748046875, -0.193603515625, -0.1729278564453125, -0.152252197265625, -0.1315765380859375, -0.11090087890625, -0.0902252197265625, -0.069549560546875, -0.0488739013671875, -0.0281982421875, -0.0075225830078125, 0.013153076171875, 0.0338287353515625, 0.05450439453125, 0.0751800537109375, 0.095855712890625, 0.1165313720703125, 0.13720703125, 0.1578826904296875, 0.178558349609375, 0.1992340087890625, 0.21990966796875, 0.2405853271484375, 0.261260986328125, 0.2819366455078125, 0.3026123046875, 0.3232879638671875, 0.343963623046875, 0.3646392822265625, 0.38531494140625, 0.4059906005859375, 0.426666259765625, 0.4473419189453125, 0.468017578125, 0.4886932373046875, 0.509368896484375, 0.5300445556640625, 0.55072021484375, 0.5713958740234375, 0.592071533203125, 0.6127471923828125, 0.6334228515625, 0.6540985107421875, 0.674774169921875, 0.6954498291015625, 0.71612548828125, 0.7368011474609375, 0.757476806640625, 0.7781524658203125, 0.798828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 11.0, 25.0, 62.0, 159.0, 249.0, 249.0, 148.0, 53.0, 19.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.129081726074219, -3.9313509464263916, -3.7336199283599854, -3.535889148712158, -3.338158369064331, -3.140427589416504, -2.9426965713500977, -2.7449657917022705, -2.5472350120544434, -2.349504232406616, -2.15177321434021, -1.9540424346923828, -1.7563116550445557, -1.558580756187439, -1.3608498573303223, -1.1631190776824951, -0.9653880596160889, -0.7676572203636169, -0.569926381111145, -0.3721954822540283, -0.1744646430015564, 0.023266196250915527, 0.22099709510803223, 0.4187278747558594, 0.6164587736129761, 0.814189612865448, 1.01192045211792, 1.2096513509750366, 1.4073822498321533, 1.6051130294799805, 1.8028439283370972, 2.0005745887756348, 2.198305606842041, 2.396036386489868, 2.5937674045562744, 2.7914981842041016, 2.9892289638519287, 3.186959743499756, 3.384690761566162, 3.5824215412139893, 3.7801523208618164, 3.9778831005096436, 4.175613880157471, 4.373344898223877, 4.571075916290283, 4.768806457519531, 4.9665374755859375, 5.164268493652344, 5.36199951171875, 5.559730529785156, 5.757461071014404, 5.9551920890808105, 6.152923107147217, 6.350653648376465, 6.548384666442871, 6.746115684509277, 6.943846225738525, 7.141577243804932, 7.33930778503418, 7.537038803100586, 7.734769821166992, 7.93250036239624, 8.130231857299805, 8.327961921691895, 8.5256929397583]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 16.0, 14.0, 14.0, 9.0, 17.0, 23.0, 28.0, 24.0, 35.0, 35.0, 41.0, 33.0, 41.0, 48.0, 41.0, 37.0, 44.0, 40.0, 38.0, 42.0, 41.0, 31.0, 37.0, 34.0, 32.0, 25.0, 22.0, 21.0, 26.0, 10.0, 16.0, 14.0, 6.0, 9.0, 10.0, 7.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.006152391433716, -1.9449986219406128, -1.8838447332382202, -1.8226909637451172, -1.7615370750427246, -1.7003833055496216, -1.6392295360565186, -1.578075647354126, -1.5169217586517334, -1.4557679891586304, -1.3946141004562378, -1.3334603309631348, -1.2723064422607422, -1.2111526727676392, -1.1499989032745361, -1.0888450145721436, -1.0276912450790405, -0.9665374159812927, -0.9053835868835449, -0.8442298173904419, -0.7830759286880493, -0.7219221591949463, -0.6607683300971985, -0.5996145009994507, -0.5384606719017029, -0.4773068428039551, -0.4161530137062073, -0.35499921441078186, -0.29384538531303406, -0.23269155621528625, -0.17153775691986084, -0.11038392782211304, -0.049230098724365234, 0.011923722922801971, 0.07307754456996918, 0.1342313587665558, 0.1953851878643036, 0.2565390169620514, 0.3176928162574768, 0.3788466453552246, 0.4400004744529724, 0.5011543035507202, 0.562308132648468, 0.6234619617462158, 0.6846157312393188, 0.7457696199417114, 0.8069233894348145, 0.8680772185325623, 0.9292310476303101, 0.9903848767280579, 1.0515387058258057, 1.1126924753189087, 1.1738463640213013, 1.2350001335144043, 1.2961540222167969, 1.3573077917099, 1.418461561203003, 1.479615330696106, 1.5407692193984985, 1.6019229888916016, 1.6630768775939941, 1.7242306470870972, 1.7853844165802002, 1.8465383052825928, 1.9076921939849854]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 13.0, 23.0, 30.0, 37.0, 61.0, 64.0, 112.0, 139.0, 218.0, 331.0, 489.0, 721.0, 1132.0, 1857.0, 3113.0, 5342.0, 9656.0, 18495.0, 38947.0, 88148.0, 214720.0, 335047.0, 182651.0, 75474.0, 33646.0, 16700.0, 8685.0, 5004.0, 2901.0, 1737.0, 1051.0, 677.0, 415.0, 275.0, 189.0, 122.0, 97.0, 62.0, 44.0, 41.0, 27.0, 16.0, 15.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.2459716796875, -0.23902511596679688, -0.23207855224609375, -0.22513198852539062, -0.2181854248046875, -0.21123886108398438, -0.20429229736328125, -0.19734573364257812, -0.190399169921875, -0.18345260620117188, -0.17650604248046875, -0.16955947875976562, -0.1626129150390625, -0.15566635131835938, -0.14871978759765625, -0.14177322387695312, -0.13482666015625, -0.12788009643554688, -0.12093353271484375, -0.11398696899414062, -0.1070404052734375, -0.10009384155273438, -0.09314727783203125, -0.08620071411132812, -0.079254150390625, -0.07230758666992188, -0.06536102294921875, -0.058414459228515625, -0.0514678955078125, -0.044521331787109375, -0.03757476806640625, -0.030628204345703125, -0.023681640625, -0.016735076904296875, -0.00978851318359375, -0.002841949462890625, 0.0041046142578125, 0.011051177978515625, 0.01799774169921875, 0.024944305419921875, 0.031890869140625, 0.038837432861328125, 0.04578399658203125, 0.052730560302734375, 0.0596771240234375, 0.06662368774414062, 0.07357025146484375, 0.08051681518554688, 0.08746337890625, 0.09440994262695312, 0.10135650634765625, 0.10830307006835938, 0.1152496337890625, 0.12219619750976562, 0.12914276123046875, 0.13608932495117188, 0.143035888671875, 0.14998245239257812, 0.15692901611328125, 0.16387557983398438, 0.1708221435546875, 0.17776870727539062, 0.18471527099609375, 0.19166183471679688, 0.1986083984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 12.0, 7.0, 13.0, 12.0, 28.0, 29.0, 20.0, 34.0, 24.0, 30.0, 36.0, 46.0, 25.0, 48.0, 44.0, 45.0, 41.0, 38.0, 39.0, 56.0, 40.0, 30.0, 35.0, 35.0, 33.0, 24.0, 32.0, 25.0, 16.0, 18.0, 22.0, 13.0, 5.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.208251953125, -0.2019062042236328, -0.19556045532226562, -0.18921470642089844, -0.18286895751953125, -0.17652320861816406, -0.17017745971679688, -0.1638317108154297, -0.1574859619140625, -0.1511402130126953, -0.14479446411132812, -0.13844871520996094, -0.13210296630859375, -0.12575721740722656, -0.11941146850585938, -0.11306571960449219, -0.106719970703125, -0.10037422180175781, -0.09402847290039062, -0.08768272399902344, -0.08133697509765625, -0.07499122619628906, -0.06864547729492188, -0.06229972839355469, -0.0559539794921875, -0.04960823059082031, -0.043262481689453125, -0.03691673278808594, -0.03057098388671875, -0.024225234985351562, -0.017879486083984375, -0.011533737182617188, -0.00518798828125, 0.0011577606201171875, 0.007503509521484375, 0.013849258422851562, 0.02019500732421875, 0.026540756225585938, 0.032886505126953125, 0.03923225402832031, 0.0455780029296875, 0.05192375183105469, 0.058269500732421875, 0.06461524963378906, 0.07096099853515625, 0.07730674743652344, 0.08365249633789062, 0.08999824523925781, 0.096343994140625, 0.10268974304199219, 0.10903549194335938, 0.11538124084472656, 0.12172698974609375, 0.12807273864746094, 0.13441848754882812, 0.1407642364501953, 0.1471099853515625, 0.1534557342529297, 0.15980148315429688, 0.16614723205566406, 0.17249298095703125, 0.17883872985839844, 0.18518447875976562, 0.1915302276611328, 0.1978759765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 7.0, 15.0, 21.0, 26.0, 31.0, 50.0, 83.0, 90.0, 171.0, 234.0, 398.0, 758.0, 1594.0, 4329.0, 16587.0, 116836.0, 779117.0, 105186.0, 15563.0, 4155.0, 1497.0, 708.0, 373.0, 245.0, 130.0, 93.0, 77.0, 43.0, 21.0, 22.0, 17.0, 16.0, 6.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5008163452148438, -0.4825897216796875, -0.46436309814453125, -0.446136474609375, -0.42790985107421875, -0.4096832275390625, -0.39145660400390625, -0.37322998046875, -0.35500335693359375, -0.3367767333984375, -0.31855010986328125, -0.300323486328125, -0.28209686279296875, -0.2638702392578125, -0.24564361572265625, -0.2274169921875, -0.20919036865234375, -0.1909637451171875, -0.17273712158203125, -0.154510498046875, -0.13628387451171875, -0.1180572509765625, -0.09983062744140625, -0.08160400390625, -0.06337738037109375, -0.0451507568359375, -0.02692413330078125, -0.008697509765625, 0.00952911376953125, 0.0277557373046875, 0.04598236083984375, 0.064208984375, 0.08243560791015625, 0.1006622314453125, 0.11888885498046875, 0.137115478515625, 0.15534210205078125, 0.1735687255859375, 0.19179534912109375, 0.21002197265625, 0.22824859619140625, 0.2464752197265625, 0.26470184326171875, 0.282928466796875, 0.30115509033203125, 0.3193817138671875, 0.33760833740234375, 0.3558349609375, 0.37406158447265625, 0.3922882080078125, 0.41051483154296875, 0.428741455078125, 0.44696807861328125, 0.4651947021484375, 0.48342132568359375, 0.50164794921875, 0.5198745727539062, 0.5381011962890625, 0.5563278198242188, 0.574554443359375, 0.5927810668945312, 0.6110076904296875, 0.6292343139648438, 0.6474609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 11.0, 14.0, 11.0, 13.0, 19.0, 25.0, 25.0, 31.0, 47.0, 58.0, 69.0, 62.0, 68.0, 73.0, 65.0, 60.0, 56.0, 53.0, 37.0, 37.0, 21.0, 24.0, 26.0, 22.0, 19.0, 12.0, 10.0, 8.0, 11.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.22528076171875, -1.1927490234375, -1.16021728515625, -1.127685546875, -1.09515380859375, -1.0626220703125, -1.03009033203125, -0.99755859375, -0.96502685546875, -0.9324951171875, -0.89996337890625, -0.867431640625, -0.83489990234375, -0.8023681640625, -0.76983642578125, -0.7373046875, -0.70477294921875, -0.6722412109375, -0.63970947265625, -0.607177734375, -0.57464599609375, -0.5421142578125, -0.50958251953125, -0.47705078125, -0.44451904296875, -0.4119873046875, -0.37945556640625, -0.346923828125, -0.31439208984375, -0.2818603515625, -0.24932861328125, -0.216796875, -0.18426513671875, -0.1517333984375, -0.11920166015625, -0.086669921875, -0.05413818359375, -0.0216064453125, 0.01092529296875, 0.04345703125, 0.07598876953125, 0.1085205078125, 0.14105224609375, 0.173583984375, 0.20611572265625, 0.2386474609375, 0.27117919921875, 0.3037109375, 0.33624267578125, 0.3687744140625, 0.40130615234375, 0.433837890625, 0.46636962890625, 0.4989013671875, 0.53143310546875, 0.56396484375, 0.59649658203125, 0.6290283203125, 0.66156005859375, 0.694091796875, 0.72662353515625, 0.7591552734375, 0.79168701171875, 0.82421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 10.0, 17.0, 24.0, 46.0, 64.0, 105.0, 200.0, 353.0, 681.0, 1566.0, 4437.0, 17104.0, 157211.0, 809686.0, 44132.0, 8268.0, 2474.0, 1051.0, 496.0, 242.0, 126.0, 80.0, 50.0, 29.0, 19.0, 15.0, 13.0, 14.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.26305389404296875, -0.2534027099609375, -0.24375152587890625, -0.234100341796875, -0.22444915771484375, -0.2147979736328125, -0.20514678955078125, -0.19549560546875, -0.18584442138671875, -0.1761932373046875, -0.16654205322265625, -0.156890869140625, -0.14723968505859375, -0.1375885009765625, -0.12793731689453125, -0.1182861328125, -0.10863494873046875, -0.0989837646484375, -0.08933258056640625, -0.079681396484375, -0.07003021240234375, -0.0603790283203125, -0.05072784423828125, -0.04107666015625, -0.03142547607421875, -0.0217742919921875, -0.01212310791015625, -0.002471923828125, 0.00717926025390625, 0.0168304443359375, 0.02648162841796875, 0.0361328125, 0.04578399658203125, 0.0554351806640625, 0.06508636474609375, 0.074737548828125, 0.08438873291015625, 0.0940399169921875, 0.10369110107421875, 0.11334228515625, 0.12299346923828125, 0.1326446533203125, 0.14229583740234375, 0.151947021484375, 0.16159820556640625, 0.1712493896484375, 0.18090057373046875, 0.1905517578125, 0.20020294189453125, 0.2098541259765625, 0.21950531005859375, 0.229156494140625, 0.23880767822265625, 0.2484588623046875, 0.25811004638671875, 0.26776123046875, 0.27741241455078125, 0.2870635986328125, 0.29671478271484375, 0.306365966796875, 0.31601715087890625, 0.3256683349609375, 0.33531951904296875, 0.344970703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 1.0, 4.0, 5.0, 12.0, 9.0, 15.0, 22.0, 35.0, 54.0, 88.0, 153.0, 209.0, 155.0, 73.0, 55.0, 41.0, 15.0, 10.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594989776611328e-05, -8.311867713928223e-05, -8.028745651245117e-05, -7.745623588562012e-05, -7.462501525878906e-05, -7.179379463195801e-05, -6.896257400512695e-05, -6.61313533782959e-05, -6.330013275146484e-05, -6.046891212463379e-05, -5.7637691497802734e-05, -5.480647087097168e-05, -5.1975250244140625e-05, -4.914402961730957e-05, -4.6312808990478516e-05, -4.348158836364746e-05, -4.0650367736816406e-05, -3.781914710998535e-05, -3.49879264831543e-05, -3.215670585632324e-05, -2.9325485229492188e-05, -2.6494264602661133e-05, -2.3663043975830078e-05, -2.0831823348999023e-05, -1.800060272216797e-05, -1.5169382095336914e-05, -1.233816146850586e-05, -9.506940841674805e-06, -6.67572021484375e-06, -3.844499588012695e-06, -1.0132789611816406e-06, 1.817941665649414e-06, 4.649162292480469e-06, 7.4803829193115234e-06, 1.0311603546142578e-05, 1.3142824172973633e-05, 1.5974044799804688e-05, 1.8805265426635742e-05, 2.1636486053466797e-05, 2.446770668029785e-05, 2.7298927307128906e-05, 3.013014793395996e-05, 3.2961368560791016e-05, 3.579258918762207e-05, 3.8623809814453125e-05, 4.145503044128418e-05, 4.4286251068115234e-05, 4.711747169494629e-05, 4.9948692321777344e-05, 5.27799129486084e-05, 5.561113357543945e-05, 5.844235420227051e-05, 6.127357482910156e-05, 6.410479545593262e-05, 6.693601608276367e-05, 6.976723670959473e-05, 7.259845733642578e-05, 7.542967796325684e-05, 7.826089859008789e-05, 8.109211921691895e-05, 8.392333984375e-05, 8.675456047058105e-05, 8.958578109741211e-05, 9.241700172424316e-05, 9.524822235107422e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 2.0, 9.0, 16.0, 18.0, 33.0, 53.0, 96.0, 147.0, 315.0, 643.0, 1332.0, 3891.0, 14781.0, 125403.0, 831099.0, 56443.0, 9341.0, 2743.0, 1057.0, 491.0, 251.0, 153.0, 79.0, 39.0, 27.0, 26.0, 23.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2442626953125, -0.23462486267089844, -0.22498703002929688, -0.2153491973876953, -0.20571136474609375, -0.1960735321044922, -0.18643569946289062, -0.17679786682128906, -0.1671600341796875, -0.15752220153808594, -0.14788436889648438, -0.1382465362548828, -0.12860870361328125, -0.11897087097167969, -0.10933303833007812, -0.09969520568847656, -0.090057373046875, -0.08041954040527344, -0.07078170776367188, -0.06114387512207031, -0.05150604248046875, -0.04186820983886719, -0.032230377197265625, -0.022592544555664062, -0.0129547119140625, -0.0033168792724609375, 0.006320953369140625, 0.015958786010742188, 0.02559661865234375, 0.03523445129394531, 0.044872283935546875, 0.05451011657714844, 0.06414794921875, 0.07378578186035156, 0.08342361450195312, 0.09306144714355469, 0.10269927978515625, 0.11233711242675781, 0.12197494506835938, 0.13161277770996094, 0.1412506103515625, 0.15088844299316406, 0.16052627563476562, 0.1701641082763672, 0.17980194091796875, 0.1894397735595703, 0.19907760620117188, 0.20871543884277344, 0.218353271484375, 0.22799110412597656, 0.23762893676757812, 0.2472667694091797, 0.25690460205078125, 0.2665424346923828, 0.2761802673339844, 0.28581809997558594, 0.2954559326171875, 0.30509376525878906, 0.3147315979003906, 0.3243694305419922, 0.33400726318359375, 0.3436450958251953, 0.3532829284667969, 0.36292076110839844, 0.37255859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 3.0, 8.0, 11.0, 7.0, 18.0, 21.0, 34.0, 53.0, 65.0, 93.0, 124.0, 135.0, 104.0, 88.0, 64.0, 41.0, 35.0, 23.0, 9.0, 4.0, 6.0, 12.0, 11.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283203125, -0.27541351318359375, -0.2676239013671875, -0.25983428955078125, -0.252044677734375, -0.24425506591796875, -0.2364654541015625, -0.22867584228515625, -0.22088623046875, -0.21309661865234375, -0.2053070068359375, -0.19751739501953125, -0.189727783203125, -0.18193817138671875, -0.1741485595703125, -0.16635894775390625, -0.1585693359375, -0.15077972412109375, -0.1429901123046875, -0.13520050048828125, -0.127410888671875, -0.11962127685546875, -0.1118316650390625, -0.10404205322265625, -0.09625244140625, -0.08846282958984375, -0.0806732177734375, -0.07288360595703125, -0.065093994140625, -0.05730438232421875, -0.0495147705078125, -0.04172515869140625, -0.033935546875, -0.02614593505859375, -0.0183563232421875, -0.01056671142578125, -0.002777099609375, 0.00501251220703125, 0.0128021240234375, 0.02059173583984375, 0.02838134765625, 0.03617095947265625, 0.0439605712890625, 0.05175018310546875, 0.059539794921875, 0.06732940673828125, 0.0751190185546875, 0.08290863037109375, 0.0906982421875, 0.09848785400390625, 0.1062774658203125, 0.11406707763671875, 0.121856689453125, 0.12964630126953125, 0.1374359130859375, 0.14522552490234375, 0.15301513671875, 0.16080474853515625, 0.1685943603515625, 0.17638397216796875, 0.184173583984375, 0.19196319580078125, 0.1997528076171875, 0.20754241943359375, 0.21533203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 12.0, 37.0, 133.0, 423.0, 250.0, 76.0, 38.0, 18.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4286065101623535, -5.153811454772949, -4.879016399383545, -4.604221343994141, -4.329425811767578, -4.054630756378174, -3.7798357009887695, -3.5050406455993652, -3.230245351791382, -2.9554502964019775, -2.680655002593994, -2.40585994720459, -2.1310648918151855, -1.8562695980072021, -1.5814745426177979, -1.306679368019104, -1.0318841934204102, -0.7570890188217163, -0.48229390382766724, -0.20749878883361816, 0.06729638576507568, 0.34209156036376953, 0.6168866157531738, 0.8916817903518677, 1.1664769649505615, 1.4412721395492554, 1.7160673141479492, 1.9908623695373535, 2.265657424926758, 2.540452718734741, 2.8152477741241455, 3.090043067932129, 3.364837646484375, 3.6396327018737793, 3.9144279956817627, 4.189223289489746, 4.46401834487915, 4.738813400268555, 5.013608455657959, 5.288403511047363, 5.563199043273926, 5.83799409866333, 6.112789154052734, 6.387584686279297, 6.662379741668701, 6.9371747970581055, 7.21196985244751, 7.486764907836914, 7.761559963226318, 8.036355018615723, 8.311150550842285, 8.585945129394531, 8.860740661621094, 9.135536193847656, 9.410330772399902, 9.685126304626465, 9.959920883178711, 10.234716415405273, 10.50951099395752, 10.784306526184082, 11.059101104736328, 11.33389663696289, 11.608692169189453, 11.8834867477417, 12.158282279968262]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 9.0, 11.0, 9.0, 17.0, 15.0, 15.0, 22.0, 24.0, 20.0, 19.0, 24.0, 27.0, 34.0, 47.0, 54.0, 65.0, 93.0, 77.0, 68.0, 44.0, 37.0, 41.0, 22.0, 32.0, 20.0, 21.0, 15.0, 20.0, 13.0, 14.0, 12.0, 6.0, 5.0, 7.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0460667610168457, -2.946803569793701, -2.8475406169891357, -2.748277425765991, -2.649014472961426, -2.5497512817382812, -2.450488328933716, -2.3512251377105713, -2.251962184906006, -2.1526989936828613, -2.053436040878296, -1.954172968864441, -1.854909896850586, -1.755646824836731, -1.656383752822876, -1.5571205615997314, -1.4578574895858765, -1.3585944175720215, -1.2593313455581665, -1.1600682735443115, -1.0608052015304565, -0.9615421295166016, -0.8622789978981018, -0.7630159258842468, -0.6637528538703918, -0.5644897818565369, -0.4652267098426819, -0.3659636080265045, -0.26670053601264954, -0.16743746399879456, -0.06817436218261719, 0.031088709831237793, 0.13035178184509277, 0.22961485385894775, 0.32887792587280273, 0.4281410276889801, 0.5274040699005127, 0.6266671419143677, 0.7259302735328674, 0.8251933455467224, 0.9244564175605774, 1.0237195491790771, 1.1229826211929321, 1.222245693206787, 1.321508765220642, 1.420771837234497, 1.520034909248352, 1.619297981262207, 1.718561053276062, 1.817824125289917, 1.917087197303772, 2.016350269317627, 2.1156134605407715, 2.214876413345337, 2.3141396045684814, 2.413402557373047, 2.5126657485961914, 2.611928939819336, 2.7111918926239014, 2.810455083847046, 2.9097180366516113, 3.008981227874756, 3.1082441806793213, 3.207507371902466, 3.3067703247070312]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 8.0, 5.0, 5.0, 7.0, 13.0, 18.0, 27.0, 27.0, 39.0, 47.0, 74.0, 141.0, 220.0, 448.0, 1120.0, 3309.0, 13377.0, 106019.0, 2637079.0, 1357452.0, 61609.0, 9032.0, 2395.0, 864.0, 365.0, 199.0, 99.0, 81.0, 62.0, 25.0, 23.0, 24.0, 16.0, 11.0, 13.0, 5.0, 11.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.423828125, -0.4080657958984375, -0.392303466796875, -0.3765411376953125, -0.36077880859375, -0.3450164794921875, -0.329254150390625, -0.3134918212890625, -0.2977294921875, -0.2819671630859375, -0.266204833984375, -0.2504425048828125, -0.23468017578125, -0.2189178466796875, -0.203155517578125, -0.1873931884765625, -0.171630859375, -0.1558685302734375, -0.140106201171875, -0.1243438720703125, -0.10858154296875, -0.0928192138671875, -0.077056884765625, -0.0612945556640625, -0.0455322265625, -0.0297698974609375, -0.014007568359375, 0.0017547607421875, 0.01751708984375, 0.0332794189453125, 0.049041748046875, 0.0648040771484375, 0.08056640625, 0.0963287353515625, 0.112091064453125, 0.1278533935546875, 0.14361572265625, 0.1593780517578125, 0.175140380859375, 0.1909027099609375, 0.2066650390625, 0.2224273681640625, 0.238189697265625, 0.2539520263671875, 0.26971435546875, 0.2854766845703125, 0.301239013671875, 0.3170013427734375, 0.332763671875, 0.3485260009765625, 0.364288330078125, 0.3800506591796875, 0.39581298828125, 0.4115753173828125, 0.427337646484375, 0.4430999755859375, 0.4588623046875, 0.4746246337890625, 0.490386962890625, 0.5061492919921875, 0.52191162109375, 0.5376739501953125, 0.553436279296875, 0.5691986083984375, 0.5849609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 0.0, 1.0, 6.0, 3.0, 7.0, 5.0, 5.0, 9.0, 6.0, 13.0, 9.0, 6.0, 10.0, 15.0, 26.0, 22.0, 21.0, 26.0, 25.0, 34.0, 38.0, 40.0, 35.0, 43.0, 38.0, 47.0, 42.0, 42.0, 48.0, 43.0, 42.0, 35.0, 34.0, 26.0, 24.0, 22.0, 28.0, 13.0, 28.0, 16.0, 11.0, 10.0, 4.0, 13.0, 8.0, 9.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1660003662109375, -0.160125732421875, -0.1542510986328125, -0.14837646484375, -0.1425018310546875, -0.136627197265625, -0.1307525634765625, -0.1248779296875, -0.1190032958984375, -0.113128662109375, -0.1072540283203125, -0.10137939453125, -0.0955047607421875, -0.089630126953125, -0.0837554931640625, -0.077880859375, -0.0720062255859375, -0.066131591796875, -0.0602569580078125, -0.05438232421875, -0.0485076904296875, -0.042633056640625, -0.0367584228515625, -0.0308837890625, -0.0250091552734375, -0.019134521484375, -0.0132598876953125, -0.00738525390625, -0.0015106201171875, 0.004364013671875, 0.0102386474609375, 0.01611328125, 0.0219879150390625, 0.027862548828125, 0.0337371826171875, 0.03961181640625, 0.0454864501953125, 0.051361083984375, 0.0572357177734375, 0.0631103515625, 0.0689849853515625, 0.074859619140625, 0.0807342529296875, 0.08660888671875, 0.0924835205078125, 0.098358154296875, 0.1042327880859375, 0.110107421875, 0.1159820556640625, 0.121856689453125, 0.1277313232421875, 0.13360595703125, 0.1394805908203125, 0.145355224609375, 0.1512298583984375, 0.1571044921875, 0.1629791259765625, 0.168853759765625, 0.1747283935546875, 0.18060302734375, 0.1864776611328125, 0.192352294921875, 0.1982269287109375, 0.2041015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 25.0, 33.0, 83.0, 164.0, 514.0, 3489.0, 98485.0, 4058333.0, 30444.0, 2037.0, 379.0, 151.0, 48.0, 23.0, 21.0, 10.0, 12.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.64447021484375, -1.6004638671875, -1.55645751953125, -1.512451171875, -1.46844482421875, -1.4244384765625, -1.38043212890625, -1.33642578125, -1.29241943359375, -1.2484130859375, -1.20440673828125, -1.160400390625, -1.11639404296875, -1.0723876953125, -1.02838134765625, -0.984375, -0.94036865234375, -0.8963623046875, -0.85235595703125, -0.808349609375, -0.76434326171875, -0.7203369140625, -0.67633056640625, -0.63232421875, -0.58831787109375, -0.5443115234375, -0.50030517578125, -0.456298828125, -0.41229248046875, -0.3682861328125, -0.32427978515625, -0.2802734375, -0.23626708984375, -0.1922607421875, -0.14825439453125, -0.104248046875, -0.06024169921875, -0.0162353515625, 0.02777099609375, 0.07177734375, 0.11578369140625, 0.1597900390625, 0.20379638671875, 0.247802734375, 0.29180908203125, 0.3358154296875, 0.37982177734375, 0.423828125, 0.46783447265625, 0.5118408203125, 0.55584716796875, 0.599853515625, 0.64385986328125, 0.6878662109375, 0.73187255859375, 0.77587890625, 0.81988525390625, 0.8638916015625, 0.90789794921875, 0.951904296875, 0.99591064453125, 1.0399169921875, 1.08392333984375, 1.1279296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 7.0, 17.0, 18.0, 27.0, 30.0, 52.0, 87.0, 119.0, 209.0, 300.0, 570.0, 806.0, 673.0, 431.0, 249.0, 146.0, 78.0, 51.0, 43.0, 36.0, 29.0, 12.0, 12.0, 12.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4501953125, -0.43506622314453125, -0.4199371337890625, -0.40480804443359375, -0.389678955078125, -0.37454986572265625, -0.3594207763671875, -0.34429168701171875, -0.32916259765625, -0.31403350830078125, -0.2989044189453125, -0.28377532958984375, -0.268646240234375, -0.25351715087890625, -0.2383880615234375, -0.22325897216796875, -0.2081298828125, -0.19300079345703125, -0.1778717041015625, -0.16274261474609375, -0.147613525390625, -0.13248443603515625, -0.1173553466796875, -0.10222625732421875, -0.08709716796875, -0.07196807861328125, -0.0568389892578125, -0.04170989990234375, -0.026580810546875, -0.01145172119140625, 0.0036773681640625, 0.01880645751953125, 0.033935546875, 0.04906463623046875, 0.0641937255859375, 0.07932281494140625, 0.094451904296875, 0.10958099365234375, 0.1247100830078125, 0.13983917236328125, 0.15496826171875, 0.17009735107421875, 0.1852264404296875, 0.20035552978515625, 0.215484619140625, 0.23061370849609375, 0.2457427978515625, 0.26087188720703125, 0.2760009765625, 0.29113006591796875, 0.3062591552734375, 0.32138824462890625, 0.336517333984375, 0.35164642333984375, 0.3667755126953125, 0.38190460205078125, 0.39703369140625, 0.41216278076171875, 0.4272918701171875, 0.44242095947265625, 0.457550048828125, 0.47267913818359375, 0.4878082275390625, 0.5029373168945312, 0.51806640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 14.0, 15.0, 50.0, 64.0, 129.0, 157.0, 187.0, 143.0, 96.0, 53.0, 28.0, 14.0, 12.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.864886283874512, -4.737573623657227, -4.610260486602783, -4.482947826385498, -4.355634689331055, -4.2283220291137695, -4.101008892059326, -3.973696231842041, -3.8463833332061768, -3.7190704345703125, -3.5917575359344482, -3.464444637298584, -3.337131977081299, -3.2098188400268555, -3.0825061798095703, -2.955193281173706, -2.827880382537842, -2.7005674839019775, -2.5732545852661133, -2.445941686630249, -2.3186287879943848, -2.1913161277770996, -2.0640032291412354, -1.936690330505371, -1.8093774318695068, -1.6820645332336426, -1.5547516345977783, -1.4274388551712036, -1.3001259565353394, -1.172813057899475, -1.0455002784729004, -0.9181873798370361, -0.7908740043640137, -0.6635611057281494, -0.5362482666969299, -0.40893539786338806, -0.2816225290298462, -0.15430963039398193, -0.02699679136276245, 0.10031604766845703, 0.2276289463043213, 0.35494181513786316, 0.48225468397140503, 0.6095675230026245, 0.7368804216384888, 0.864193320274353, 0.9915061593055725, 1.118818998336792, 1.2461318969726562, 1.3734447956085205, 1.5007576942443848, 1.6280704736709595, 1.7553833723068237, 1.882696270942688, 2.0100090503692627, 2.137321949005127, 2.264634847640991, 2.3919477462768555, 2.5192606449127197, 2.646573543548584, 2.773886203765869, 2.9011993408203125, 3.0285120010375977, 3.155824899673462, 3.283137798309326]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 11.0, 10.0, 10.0, 16.0, 18.0, 14.0, 25.0, 26.0, 21.0, 32.0, 35.0, 44.0, 54.0, 65.0, 49.0, 61.0, 48.0, 62.0, 46.0, 49.0, 42.0, 34.0, 34.0, 33.0, 29.0, 28.0, 27.0, 12.0, 9.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9927042722702026, -1.9288220405578613, -1.86493980884552, -1.8010575771331787, -1.7371753454208374, -1.673293113708496, -1.6094107627868652, -1.5455286502838135, -1.4816462993621826, -1.4177640676498413, -1.3538818359375, -1.2899996042251587, -1.2261173725128174, -1.162235140800476, -1.0983529090881348, -1.034470558166504, -0.9705884456634521, -0.9067062139511108, -0.8428239822387695, -0.7789417505264282, -0.7150595188140869, -0.6511772871017456, -0.5872949957847595, -0.5234127640724182, -0.4595305323600769, -0.3956483006477356, -0.3317660689353943, -0.2678838074207306, -0.20400157570838928, -0.14011934399604797, -0.07623708248138428, -0.012354850769042969, 0.05152726173400879, 0.1154095008969307, 0.1792917400598526, 0.2431739866733551, 0.3070562183856964, 0.3709384500980377, 0.4348207116127014, 0.4987029433250427, 0.562585175037384, 0.6264674067497253, 0.6903496384620667, 0.7542319297790527, 0.818114161491394, 0.8819963932037354, 0.9458786249160767, 1.009760856628418, 1.0736430883407593, 1.1375253200531006, 1.201407551765442, 1.2652897834777832, 1.3291720151901245, 1.3930542469024658, 1.4569365978240967, 1.5208187103271484, 1.5847010612487793, 1.6485832929611206, 1.712465524673462, 1.7763477563858032, 1.8402299880981445, 1.9041122198104858, 1.9679944515228271, 2.031876802444458, 2.0957589149475098]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 9.0, 19.0, 34.0, 51.0, 93.0, 125.0, 213.0, 432.0, 841.0, 1647.0, 3894.0, 9977.0, 28955.0, 112683.0, 532098.0, 274157.0, 55371.0, 16685.0, 6159.0, 2529.0, 1244.0, 604.0, 296.0, 162.0, 94.0, 66.0, 39.0, 18.0, 9.0, 12.0, 8.0, 3.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.52587890625, -0.5123100280761719, -0.49874114990234375, -0.4851722717285156, -0.4716033935546875, -0.4580345153808594, -0.44446563720703125, -0.4308967590332031, -0.417327880859375, -0.4037590026855469, -0.39019012451171875, -0.3766212463378906, -0.3630523681640625, -0.3494834899902344, -0.33591461181640625, -0.3223457336425781, -0.30877685546875, -0.2952079772949219, -0.28163909912109375, -0.2680702209472656, -0.2545013427734375, -0.24093246459960938, -0.22736358642578125, -0.21379470825195312, -0.200225830078125, -0.18665695190429688, -0.17308807373046875, -0.15951919555664062, -0.1459503173828125, -0.13238143920898438, -0.11881256103515625, -0.10524368286132812, -0.0916748046875, -0.07810592651367188, -0.06453704833984375, -0.050968170166015625, -0.0373992919921875, -0.023830413818359375, -0.01026153564453125, 0.003307342529296875, 0.016876220703125, 0.030445098876953125, 0.04401397705078125, 0.057582855224609375, 0.0711517333984375, 0.08472061157226562, 0.09828948974609375, 0.11185836791992188, 0.12542724609375, 0.13899612426757812, 0.15256500244140625, 0.16613388061523438, 0.1797027587890625, 0.19327163696289062, 0.20684051513671875, 0.22040939331054688, 0.233978271484375, 0.24754714965820312, 0.26111602783203125, 0.2746849060058594, 0.2882537841796875, 0.3018226623535156, 0.31539154052734375, 0.3289604187011719, 0.342529296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 2.0, 7.0, 6.0, 7.0, 13.0, 16.0, 17.0, 18.0, 15.0, 31.0, 37.0, 34.0, 27.0, 30.0, 37.0, 30.0, 32.0, 58.0, 58.0, 51.0, 40.0, 44.0, 36.0, 47.0, 43.0, 35.0, 33.0, 31.0, 16.0, 20.0, 24.0, 19.0, 15.0, 12.0, 8.0, 7.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2117919921875, -0.20538902282714844, -0.19898605346679688, -0.1925830841064453, -0.18618011474609375, -0.1797771453857422, -0.17337417602539062, -0.16697120666503906, -0.1605682373046875, -0.15416526794433594, -0.14776229858398438, -0.1413593292236328, -0.13495635986328125, -0.1285533905029297, -0.12215042114257812, -0.11574745178222656, -0.109344482421875, -0.10294151306152344, -0.09653854370117188, -0.09013557434082031, -0.08373260498046875, -0.07732963562011719, -0.07092666625976562, -0.06452369689941406, -0.0581207275390625, -0.05171775817871094, -0.045314788818359375, -0.03891181945800781, -0.03250885009765625, -0.026105880737304688, -0.019702911376953125, -0.013299942016601562, -0.00689697265625, -0.0004940032958984375, 0.005908966064453125, 0.012311935424804688, 0.01871490478515625, 0.025117874145507812, 0.031520843505859375, 0.03792381286621094, 0.0443267822265625, 0.05072975158691406, 0.057132720947265625, 0.06353569030761719, 0.06993865966796875, 0.07634162902832031, 0.08274459838867188, 0.08914756774902344, 0.095550537109375, 0.10195350646972656, 0.10835647583007812, 0.11475944519042969, 0.12116241455078125, 0.1275653839111328, 0.13396835327148438, 0.14037132263183594, 0.1467742919921875, 0.15317726135253906, 0.15958023071289062, 0.1659832000732422, 0.17238616943359375, 0.1787891387939453, 0.18519210815429688, 0.19159507751464844, 0.197998046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 11.0, 8.0, 12.0, 25.0, 31.0, 55.0, 68.0, 102.0, 209.0, 335.0, 695.0, 1574.0, 4411.0, 19488.0, 222266.0, 753335.0, 35421.0, 6561.0, 2026.0, 852.0, 429.0, 214.0, 135.0, 75.0, 62.0, 35.0, 31.0, 13.0, 16.0, 13.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.814239501953125, -0.79107666015625, -0.767913818359375, -0.7447509765625, -0.721588134765625, -0.69842529296875, -0.675262451171875, -0.652099609375, -0.628936767578125, -0.60577392578125, -0.582611083984375, -0.5594482421875, -0.536285400390625, -0.51312255859375, -0.489959716796875, -0.466796875, -0.443634033203125, -0.42047119140625, -0.397308349609375, -0.3741455078125, -0.350982666015625, -0.32781982421875, -0.304656982421875, -0.281494140625, -0.258331298828125, -0.23516845703125, -0.212005615234375, -0.1888427734375, -0.165679931640625, -0.14251708984375, -0.119354248046875, -0.09619140625, -0.073028564453125, -0.04986572265625, -0.026702880859375, -0.0035400390625, 0.019622802734375, 0.04278564453125, 0.065948486328125, 0.089111328125, 0.112274169921875, 0.13543701171875, 0.158599853515625, 0.1817626953125, 0.204925537109375, 0.22808837890625, 0.251251220703125, 0.2744140625, 0.297576904296875, 0.32073974609375, 0.343902587890625, 0.3670654296875, 0.390228271484375, 0.41339111328125, 0.436553955078125, 0.459716796875, 0.482879638671875, 0.50604248046875, 0.529205322265625, 0.5523681640625, 0.575531005859375, 0.59869384765625, 0.621856689453125, 0.64501953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 13.0, 10.0, 6.0, 18.0, 13.0, 23.0, 23.0, 16.0, 31.0, 37.0, 39.0, 42.0, 59.0, 40.0, 65.0, 47.0, 57.0, 41.0, 55.0, 50.0, 54.0, 38.0, 38.0, 36.0, 26.0, 21.0, 17.0, 10.0, 9.0, 8.0, 7.0, 13.0, 2.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.82373046875, -0.7971115112304688, -0.7704925537109375, -0.7438735961914062, -0.717254638671875, -0.6906356811523438, -0.6640167236328125, -0.6373977661132812, -0.61077880859375, -0.5841598510742188, -0.5575408935546875, -0.5309219360351562, -0.504302978515625, -0.47768402099609375, -0.4510650634765625, -0.42444610595703125, -0.3978271484375, -0.37120819091796875, -0.3445892333984375, -0.31797027587890625, -0.291351318359375, -0.26473236083984375, -0.2381134033203125, -0.21149444580078125, -0.18487548828125, -0.15825653076171875, -0.1316375732421875, -0.10501861572265625, -0.078399658203125, -0.05178070068359375, -0.0251617431640625, 0.00145721435546875, 0.028076171875, 0.05469512939453125, 0.0813140869140625, 0.10793304443359375, 0.134552001953125, 0.16117095947265625, 0.1877899169921875, 0.21440887451171875, 0.24102783203125, 0.26764678955078125, 0.2942657470703125, 0.32088470458984375, 0.347503662109375, 0.37412261962890625, 0.4007415771484375, 0.42736053466796875, 0.4539794921875, 0.48059844970703125, 0.5072174072265625, 0.5338363647460938, 0.560455322265625, 0.5870742797851562, 0.6136932373046875, 0.6403121948242188, 0.66693115234375, 0.6935501098632812, 0.7201690673828125, 0.7467880249023438, 0.773406982421875, 0.8000259399414062, 0.8266448974609375, 0.8532638549804688, 0.8798828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 9.0, 10.0, 18.0, 22.0, 27.0, 51.0, 88.0, 183.0, 326.0, 868.0, 2487.0, 13069.0, 768339.0, 249877.0, 9566.0, 2157.0, 758.0, 333.0, 161.0, 89.0, 44.0, 21.0, 13.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3288688659667969, -0.31618499755859375, -0.3035011291503906, -0.2908172607421875, -0.2781333923339844, -0.26544952392578125, -0.2527656555175781, -0.240081787109375, -0.22739791870117188, -0.21471405029296875, -0.20203018188476562, -0.1893463134765625, -0.17666244506835938, -0.16397857666015625, -0.15129470825195312, -0.13861083984375, -0.12592697143554688, -0.11324310302734375, -0.10055923461914062, -0.0878753662109375, -0.07519149780273438, -0.06250762939453125, -0.049823760986328125, -0.037139892578125, -0.024456024169921875, -0.01177215576171875, 0.000911712646484375, 0.0135955810546875, 0.026279449462890625, 0.03896331787109375, 0.051647186279296875, 0.0643310546875, 0.07701492309570312, 0.08969879150390625, 0.10238265991210938, 0.1150665283203125, 0.12775039672851562, 0.14043426513671875, 0.15311813354492188, 0.165802001953125, 0.17848587036132812, 0.19116973876953125, 0.20385360717773438, 0.2165374755859375, 0.22922134399414062, 0.24190521240234375, 0.2545890808105469, 0.26727294921875, 0.2799568176269531, 0.29264068603515625, 0.3053245544433594, 0.3180084228515625, 0.3306922912597656, 0.34337615966796875, 0.3560600280761719, 0.368743896484375, 0.3814277648925781, 0.39411163330078125, 0.4067955017089844, 0.4194793701171875, 0.4321632385253906, 0.44484710693359375, 0.4575309753417969, 0.47021484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 9.0, 13.0, 31.0, 89.0, 333.0, 362.0, 79.0, 30.0, 17.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00032520294189453125, -0.0003184322267770767, -0.0003116615116596222, -0.00030489079654216766, -0.00029812008142471313, -0.0002913493663072586, -0.0002845786511898041, -0.00027780793607234955, -0.000271037220954895, -0.0002642665058374405, -0.00025749579071998596, -0.00025072507560253143, -0.0002439543604850769, -0.00023718364536762238, -0.00023041293025016785, -0.00022364221513271332, -0.0002168715000152588, -0.00021010078489780426, -0.00020333006978034973, -0.0001965593546628952, -0.00018978863954544067, -0.00018301792442798615, -0.00017624720931053162, -0.0001694764941930771, -0.00016270577907562256, -0.00015593506395816803, -0.0001491643488407135, -0.00014239363372325897, -0.00013562291860580444, -0.00012885220348834991, -0.00012208148837089539, -0.00011531077325344086, -0.00010854005813598633, -0.0001017693430185318, -9.499862790107727e-05, -8.822791278362274e-05, -8.145719766616821e-05, -7.468648254871368e-05, -6.791576743125916e-05, -6.114505231380463e-05, -5.43743371963501e-05, -4.760362207889557e-05, -4.083290696144104e-05, -3.406219184398651e-05, -2.7291476726531982e-05, -2.0520761609077454e-05, -1.3750046491622925e-05, -6.979331374168396e-06, -2.086162567138672e-07, 6.562098860740662e-06, 1.333281397819519e-05, 2.010352909564972e-05, 2.6874244213104248e-05, 3.364495933055878e-05, 4.0415674448013306e-05, 4.7186389565467834e-05, 5.395710468292236e-05, 6.072781980037689e-05, 6.749853491783142e-05, 7.426925003528595e-05, 8.103996515274048e-05, 8.781068027019501e-05, 9.458139538764954e-05, 0.00010135211050510406, 0.0001081228256225586]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 10.0, 15.0, 18.0, 31.0, 54.0, 52.0, 102.0, 160.0, 307.0, 614.0, 1741.0, 6154.0, 79463.0, 926386.0, 27272.0, 3801.0, 1181.0, 500.0, 251.0, 145.0, 100.0, 63.0, 32.0, 21.0, 19.0, 17.0, 6.0, 8.0, 2.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34375, -0.3311767578125, -0.318603515625, -0.3060302734375, -0.29345703125, -0.2808837890625, -0.268310546875, -0.2557373046875, -0.2431640625, -0.2305908203125, -0.218017578125, -0.2054443359375, -0.19287109375, -0.1802978515625, -0.167724609375, -0.1551513671875, -0.142578125, -0.1300048828125, -0.117431640625, -0.1048583984375, -0.09228515625, -0.0797119140625, -0.067138671875, -0.0545654296875, -0.0419921875, -0.0294189453125, -0.016845703125, -0.0042724609375, 0.00830078125, 0.0208740234375, 0.033447265625, 0.0460205078125, 0.05859375, 0.0711669921875, 0.083740234375, 0.0963134765625, 0.10888671875, 0.1214599609375, 0.134033203125, 0.1466064453125, 0.1591796875, 0.1717529296875, 0.184326171875, 0.1968994140625, 0.20947265625, 0.2220458984375, 0.234619140625, 0.2471923828125, 0.259765625, 0.2723388671875, 0.284912109375, 0.2974853515625, 0.31005859375, 0.3226318359375, 0.335205078125, 0.3477783203125, 0.3603515625, 0.3729248046875, 0.385498046875, 0.3980712890625, 0.41064453125, 0.4232177734375, 0.435791015625, 0.4483642578125, 0.4609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 3.0, 5.0, 5.0, 13.0, 24.0, 41.0, 45.0, 114.0, 157.0, 195.0, 156.0, 83.0, 55.0, 34.0, 18.0, 14.0, 10.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.369140625, -0.35950279235839844, -0.3498649597167969, -0.3402271270751953, -0.33058929443359375, -0.3209514617919922, -0.3113136291503906, -0.30167579650878906, -0.2920379638671875, -0.28240013122558594, -0.2727622985839844, -0.2631244659423828, -0.25348663330078125, -0.2438488006591797, -0.23421096801757812, -0.22457313537597656, -0.214935302734375, -0.20529747009277344, -0.19565963745117188, -0.1860218048095703, -0.17638397216796875, -0.1667461395263672, -0.15710830688476562, -0.14747047424316406, -0.1378326416015625, -0.12819480895996094, -0.11855697631835938, -0.10891914367675781, -0.09928131103515625, -0.08964347839355469, -0.08000564575195312, -0.07036781311035156, -0.06072998046875, -0.05109214782714844, -0.041454315185546875, -0.03181648254394531, -0.02217864990234375, -0.012540817260742188, -0.002902984619140625, 0.0067348480224609375, 0.0163726806640625, 0.026010513305664062, 0.035648345947265625, 0.04528617858886719, 0.05492401123046875, 0.06456184387207031, 0.07419967651367188, 0.08383750915527344, 0.093475341796875, 0.10311317443847656, 0.11275100708007812, 0.12238883972167969, 0.13202667236328125, 0.1416645050048828, 0.15130233764648438, 0.16094017028808594, 0.1705780029296875, 0.18021583557128906, 0.18985366821289062, 0.1994915008544922, 0.20912933349609375, 0.2187671661376953, 0.22840499877929688, 0.23804283142089844, 0.2476806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 8.0, 15.0, 58.0, 157.0, 498.0, 190.0, 45.0, 19.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.972320556640625, -10.694829940795898, -10.417340278625488, -10.139849662780762, -9.862359046936035, -9.584869384765625, -9.307378768920898, -9.029888153076172, -8.752397537231445, -8.474906921386719, -8.197417259216309, -7.919926643371582, -7.6424360275268555, -7.364945888519287, -7.087455749511719, -6.809965133666992, -6.532475471496582, -6.254985332489014, -5.977494716644287, -5.700004577636719, -5.422513961791992, -5.145023822784424, -4.8675336837768555, -4.590043067932129, -4.3125529289245605, -4.035062789916992, -3.7575721740722656, -3.4800820350646973, -3.20259165763855, -2.9251012802124023, -2.647611141204834, -2.3701207637786865, -2.0926294326782227, -1.8151390552520752, -1.5376487970352173, -1.2601585388183594, -0.9826681613922119, -0.7051777839660645, -0.42768752574920654, -0.15019726753234863, 0.12729310989379883, 0.4047834277153015, 0.6822737455368042, 0.9597640633583069, 1.2372543811798096, 1.514744758605957, 1.792235016822815, 2.069725275039673, 2.3472156524658203, 2.6247060298919678, 2.9021964073181152, 3.1796865463256836, 3.457176923751831, 3.7346673011779785, 4.012157440185547, 4.289648056030273, 4.567138195037842, 4.84462833404541, 5.122118949890137, 5.399609088897705, 5.677099227905273, 5.95458984375, 6.232079982757568, 6.509570121765137, 6.787060737609863]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 2.0, 8.0, 14.0, 10.0, 18.0, 23.0, 16.0, 19.0, 18.0, 26.0, 30.0, 21.0, 27.0, 54.0, 64.0, 74.0, 86.0, 94.0, 55.0, 49.0, 27.0, 27.0, 22.0, 25.0, 16.0, 16.0, 19.0, 19.0, 11.0, 21.0, 10.0, 8.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.8594861030578613, -2.7713756561279297, -2.683264970779419, -2.5951545238494873, -2.5070438385009766, -2.418933391571045, -2.3308229446411133, -2.2427124977111816, -2.154601812362671, -2.0664913654327393, -1.9783806800842285, -1.8902702331542969, -1.8021596670150757, -1.7140491008758545, -1.6259386539459229, -1.5378280878067017, -1.4497175216674805, -1.3616069555282593, -1.273496389389038, -1.1853859424591064, -1.0972753763198853, -1.009164810180664, -0.9210543036460876, -0.8329437971115112, -0.74483323097229, -0.6567226648330688, -0.5686121582984924, -0.48050162196159363, -0.3923910856246948, -0.304280549287796, -0.21617001295089722, -0.1280595064163208, -0.03994917869567871, 0.04816135764122009, 0.1362718939781189, 0.2243824303150177, 0.3124929666519165, 0.4006035029888153, 0.4887140393257141, 0.5768245458602905, 0.6649351119995117, 0.7530456781387329, 0.8411561846733093, 0.9292666912078857, 1.017377257347107, 1.1054878234863281, 1.1935982704162598, 1.281708836555481, 1.3698194026947021, 1.4579299688339233, 1.5460405349731445, 1.6341509819030762, 1.7222615480422974, 1.8103721141815186, 1.8984825611114502, 1.9865931272506714, 2.0747036933898926, 2.162814140319824, 2.250924825668335, 2.3390352725982666, 2.4271459579467773, 2.515256404876709, 2.6033668518066406, 2.6914772987365723, 2.779587984085083]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 13.0, 8.0, 20.0, 22.0, 39.0, 51.0, 110.0, 126.0, 263.0, 462.0, 788.0, 1591.0, 3555.0, 9040.0, 28942.0, 136104.0, 1023603.0, 2419042.0, 469788.0, 71384.0, 18017.0, 5977.0, 2575.0, 1242.0, 623.0, 317.0, 235.0, 119.0, 72.0, 42.0, 37.0, 17.0, 23.0, 10.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48486328125, -0.4693756103515625, -0.453887939453125, -0.4384002685546875, -0.42291259765625, -0.4074249267578125, -0.391937255859375, -0.3764495849609375, -0.3609619140625, -0.3454742431640625, -0.329986572265625, -0.3144989013671875, -0.29901123046875, -0.2835235595703125, -0.268035888671875, -0.2525482177734375, -0.237060546875, -0.2215728759765625, -0.206085205078125, -0.1905975341796875, -0.17510986328125, -0.1596221923828125, -0.144134521484375, -0.1286468505859375, -0.1131591796875, -0.0976715087890625, -0.082183837890625, -0.0666961669921875, -0.05120849609375, -0.0357208251953125, -0.020233154296875, -0.0047454833984375, 0.0107421875, 0.0262298583984375, 0.041717529296875, 0.0572052001953125, 0.07269287109375, 0.0881805419921875, 0.103668212890625, 0.1191558837890625, 0.1346435546875, 0.1501312255859375, 0.165618896484375, 0.1811065673828125, 0.19659423828125, 0.2120819091796875, 0.227569580078125, 0.2430572509765625, 0.258544921875, 0.2740325927734375, 0.289520263671875, 0.3050079345703125, 0.32049560546875, 0.3359832763671875, 0.351470947265625, 0.3669586181640625, 0.3824462890625, 0.3979339599609375, 0.413421630859375, 0.4289093017578125, 0.44439697265625, 0.4598846435546875, 0.475372314453125, 0.4908599853515625, 0.50634765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 6.0, 16.0, 9.0, 11.0, 20.0, 19.0, 15.0, 43.0, 33.0, 35.0, 41.0, 37.0, 51.0, 59.0, 48.0, 60.0, 60.0, 62.0, 53.0, 44.0, 49.0, 38.0, 29.0, 25.0, 24.0, 28.0, 21.0, 16.0, 10.0, 10.0, 3.0, 6.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.281494140625, -0.2739696502685547, -0.2664451599121094, -0.25892066955566406, -0.25139617919921875, -0.24387168884277344, -0.23634719848632812, -0.2288227081298828, -0.2212982177734375, -0.2137737274169922, -0.20624923706054688, -0.19872474670410156, -0.19120025634765625, -0.18367576599121094, -0.17615127563476562, -0.1686267852783203, -0.161102294921875, -0.1535778045654297, -0.14605331420898438, -0.13852882385253906, -0.13100433349609375, -0.12347984313964844, -0.11595535278320312, -0.10843086242675781, -0.1009063720703125, -0.09338188171386719, -0.08585739135742188, -0.07833290100097656, -0.07080841064453125, -0.06328392028808594, -0.055759429931640625, -0.04823493957519531, -0.04071044921875, -0.03318595886230469, -0.025661468505859375, -0.018136978149414062, -0.01061248779296875, -0.0030879974365234375, 0.004436492919921875, 0.011960983276367188, 0.0194854736328125, 0.027009963989257812, 0.034534454345703125, 0.04205894470214844, 0.04958343505859375, 0.05710792541503906, 0.06463241577148438, 0.07215690612792969, 0.079681396484375, 0.08720588684082031, 0.09473037719726562, 0.10225486755371094, 0.10977935791015625, 0.11730384826660156, 0.12482833862304688, 0.1323528289794922, 0.1398773193359375, 0.1474018096923828, 0.15492630004882812, 0.16245079040527344, 0.16997528076171875, 0.17749977111816406, 0.18502426147460938, 0.1925487518310547, 0.2000732421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 11.0, 15.0, 27.0, 59.0, 111.0, 325.0, 1256.0, 23576.0, 4160329.0, 7361.0, 791.0, 223.0, 100.0, 38.0, 26.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.37890625, -5.24566650390625, -5.1124267578125, -4.97918701171875, -4.845947265625, -4.71270751953125, -4.5794677734375, -4.44622802734375, -4.31298828125, -4.17974853515625, -4.0465087890625, -3.91326904296875, -3.780029296875, -3.64678955078125, -3.5135498046875, -3.38031005859375, -3.2470703125, -3.11383056640625, -2.9805908203125, -2.84735107421875, -2.714111328125, -2.58087158203125, -2.4476318359375, -2.31439208984375, -2.18115234375, -2.04791259765625, -1.9146728515625, -1.78143310546875, -1.648193359375, -1.51495361328125, -1.3817138671875, -1.24847412109375, -1.115234375, -0.98199462890625, -0.8487548828125, -0.71551513671875, -0.582275390625, -0.44903564453125, -0.3157958984375, -0.18255615234375, -0.04931640625, 0.08392333984375, 0.2171630859375, 0.35040283203125, 0.483642578125, 0.61688232421875, 0.7501220703125, 0.88336181640625, 1.0166015625, 1.14984130859375, 1.2830810546875, 1.41632080078125, 1.549560546875, 1.68280029296875, 1.8160400390625, 1.94927978515625, 2.08251953125, 2.21575927734375, 2.3489990234375, 2.48223876953125, 2.615478515625, 2.74871826171875, 2.8819580078125, 3.01519775390625, 3.1484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 16.0, 31.0, 45.0, 92.0, 155.0, 259.0, 503.0, 954.0, 968.0, 497.0, 224.0, 148.0, 59.0, 45.0, 26.0, 11.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1131134033203125, -1.071929931640625, -1.0307464599609375, -0.98956298828125, -0.9483795166015625, -0.907196044921875, -0.8660125732421875, -0.8248291015625, -0.7836456298828125, -0.742462158203125, -0.7012786865234375, -0.66009521484375, -0.6189117431640625, -0.577728271484375, -0.5365447998046875, -0.495361328125, -0.4541778564453125, -0.412994384765625, -0.3718109130859375, -0.33062744140625, -0.2894439697265625, -0.248260498046875, -0.2070770263671875, -0.1658935546875, -0.1247100830078125, -0.083526611328125, -0.0423431396484375, -0.00115966796875, 0.0400238037109375, 0.081207275390625, 0.1223907470703125, 0.16357421875, 0.2047576904296875, 0.245941162109375, 0.2871246337890625, 0.32830810546875, 0.3694915771484375, 0.410675048828125, 0.4518585205078125, 0.4930419921875, 0.5342254638671875, 0.575408935546875, 0.6165924072265625, 0.65777587890625, 0.6989593505859375, 0.740142822265625, 0.7813262939453125, 0.822509765625, 0.8636932373046875, 0.904876708984375, 0.9460601806640625, 0.98724365234375, 1.0284271240234375, 1.069610595703125, 1.1107940673828125, 1.1519775390625, 1.1931610107421875, 1.234344482421875, 1.2755279541015625, 1.31671142578125, 1.3578948974609375, 1.399078369140625, 1.4402618408203125, 1.4814453125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 15.0, 50.0, 236.0, 466.0, 171.0, 41.0, 14.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.747618675231934, -11.972113609313965, -11.196608543395996, -10.421104431152344, -9.645599365234375, -8.870094299316406, -8.094589233398438, -7.319084167480469, -6.5435791015625, -5.768074035644531, -4.9925689697265625, -4.217064380645752, -3.441559314727783, -2.6660542488098145, -1.890549659729004, -1.1150445938110352, -0.3395395278930664, 0.4359654188156128, 1.211470365524292, 1.9869751930236816, 2.7624802589416504, 3.537985324859619, 4.31348991394043, 5.088994979858398, 5.864500045776367, 6.640005111694336, 7.415510177612305, 8.191015243530273, 8.966520309448242, 9.742025375366211, 10.517529487609863, 11.293034553527832, 12.068538665771484, 12.844043731689453, 13.619548797607422, 14.39505386352539, 15.17055892944336, 15.946063995361328, 16.721569061279297, 17.497074127197266, 18.272579193115234, 19.048084259033203, 19.823589324951172, 20.59909439086914, 21.37459945678711, 22.150104522705078, 22.925609588623047, 23.701114654541016, 24.47661781311035, 25.25212287902832, 26.02762794494629, 26.803133010864258, 27.578638076782227, 28.354143142700195, 29.12964630126953, 29.9051513671875, 30.68065643310547, 31.456161499023438, 32.231666564941406, 33.007171630859375, 33.782676696777344, 34.55818176269531, 35.33368682861328, 36.10919189453125, 36.88469696044922]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 6.0, 9.0, 10.0, 9.0, 15.0, 13.0, 14.0, 17.0, 21.0, 38.0, 36.0, 41.0, 38.0, 43.0, 42.0, 61.0, 76.0, 59.0, 50.0, 47.0, 48.0, 49.0, 40.0, 33.0, 31.0, 33.0, 22.0, 20.0, 18.0, 9.0, 13.0, 11.0, 10.0, 6.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.924989700317383, -3.778637170791626, -3.632284641265869, -3.485931873321533, -3.3395793437957764, -3.1932268142700195, -3.0468740463256836, -2.9005215167999268, -2.75416898727417, -2.607816457748413, -2.4614639282226562, -2.3151111602783203, -2.1687586307525635, -2.0224061012268066, -1.8760534524917603, -1.7297008037567139, -1.583348274230957, -1.4369957447052002, -1.2906430959701538, -1.1442904472351074, -0.9979379177093506, -0.851585328578949, -0.7052327394485474, -0.558880090713501, -0.41252756118774414, -0.26617497205734253, -0.11982238292694092, 0.026530206203460693, 0.1728827953338623, 0.3192353844642639, 0.4655879735946655, 0.6119406223297119, 0.7582931518554688, 0.9046457409858704, 1.050998330116272, 1.1973509788513184, 1.3437035083770752, 1.490056037902832, 1.6364086866378784, 1.7827613353729248, 1.9291138648986816, 2.0754663944244385, 2.2218189239501953, 2.3681716918945312, 2.514524221420288, 2.660876750946045, 2.807229518890381, 2.9535820484161377, 3.0999345779418945, 3.2462871074676514, 3.392639636993408, 3.538992404937744, 3.685344934463501, 3.831697463989258, 3.9780502319335938, 4.12440299987793, 4.270755290985107, 4.417108058929443, 4.563460350036621, 4.709813117980957, 4.856165885925293, 5.002518177032471, 5.148870944976807, 5.295223236083984, 5.44157600402832]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 11.0, 8.0, 8.0, 7.0, 16.0, 16.0, 19.0, 34.0, 45.0, 104.0, 305.0, 1134.0, 5583.0, 46435.0, 811663.0, 166800.0, 13263.0, 2161.0, 538.0, 180.0, 73.0, 48.0, 22.0, 13.0, 16.0, 8.0, 9.0, 5.0, 9.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.0400390625, -1.01171875, -0.9833984375, -0.955078125, -0.9267578125, -0.8984375, -0.8701171875, -0.841796875, -0.8134765625, -0.78515625, -0.7568359375, -0.728515625, -0.7001953125, -0.671875, -0.6435546875, -0.615234375, -0.5869140625, -0.55859375, -0.5302734375, -0.501953125, -0.4736328125, -0.4453125, -0.4169921875, -0.388671875, -0.3603515625, -0.33203125, -0.3037109375, -0.275390625, -0.2470703125, -0.21875, -0.1904296875, -0.162109375, -0.1337890625, -0.10546875, -0.0771484375, -0.048828125, -0.0205078125, 0.0078125, 0.0361328125, 0.064453125, 0.0927734375, 0.12109375, 0.1494140625, 0.177734375, 0.2060546875, 0.234375, 0.2626953125, 0.291015625, 0.3193359375, 0.34765625, 0.3759765625, 0.404296875, 0.4326171875, 0.4609375, 0.4892578125, 0.517578125, 0.5458984375, 0.57421875, 0.6025390625, 0.630859375, 0.6591796875, 0.6875, 0.7158203125, 0.744140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 12.0, 29.0, 40.0, 77.0, 96.0, 151.0, 156.0, 144.0, 122.0, 75.0, 47.0, 27.0, 11.0, 11.0, 3.0, 1.0, 7.0], "bins": [-1.677734375, -1.6464385986328125, -1.615142822265625, -1.5838470458984375, -1.55255126953125, -1.5212554931640625, -1.489959716796875, -1.4586639404296875, -1.4273681640625, -1.3960723876953125, -1.364776611328125, -1.3334808349609375, -1.30218505859375, -1.2708892822265625, -1.239593505859375, -1.2082977294921875, -1.177001953125, -1.1457061767578125, -1.114410400390625, -1.0831146240234375, -1.05181884765625, -1.0205230712890625, -0.989227294921875, -0.9579315185546875, -0.9266357421875, -0.8953399658203125, -0.864044189453125, -0.8327484130859375, -0.80145263671875, -0.7701568603515625, -0.738861083984375, -0.7075653076171875, -0.67626953125, -0.6449737548828125, -0.613677978515625, -0.5823822021484375, -0.55108642578125, -0.5197906494140625, -0.488494873046875, -0.4571990966796875, -0.4259033203125, -0.3946075439453125, -0.363311767578125, -0.3320159912109375, -0.30072021484375, -0.2694244384765625, -0.238128662109375, -0.2068328857421875, -0.175537109375, -0.1442413330078125, -0.112945556640625, -0.0816497802734375, -0.05035400390625, -0.0190582275390625, 0.012237548828125, 0.0435333251953125, 0.0748291015625, 0.1061248779296875, 0.137420654296875, 0.1687164306640625, 0.20001220703125, 0.2313079833984375, 0.262603759765625, 0.2938995361328125, 0.3251953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 10.0, 16.0, 25.0, 35.0, 59.0, 79.0, 178.0, 316.0, 761.0, 2056.0, 7994.0, 61268.0, 908799.0, 55750.0, 7774.0, 1943.0, 723.0, 297.0, 184.0, 105.0, 63.0, 41.0, 19.0, 18.0, 7.0, 5.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5624771118164062, -0.5395050048828125, -0.5165328979492188, -0.493560791015625, -0.47058868408203125, -0.4476165771484375, -0.42464447021484375, -0.40167236328125, -0.37870025634765625, -0.3557281494140625, -0.33275604248046875, -0.309783935546875, -0.28681182861328125, -0.2638397216796875, -0.24086761474609375, -0.2178955078125, -0.19492340087890625, -0.1719512939453125, -0.14897918701171875, -0.126007080078125, -0.10303497314453125, -0.0800628662109375, -0.05709075927734375, -0.03411865234375, -0.01114654541015625, 0.0118255615234375, 0.03479766845703125, 0.057769775390625, 0.08074188232421875, 0.1037139892578125, 0.12668609619140625, 0.149658203125, 0.17263031005859375, 0.1956024169921875, 0.21857452392578125, 0.241546630859375, 0.26451873779296875, 0.2874908447265625, 0.31046295166015625, 0.33343505859375, 0.35640716552734375, 0.3793792724609375, 0.40235137939453125, 0.425323486328125, 0.44829559326171875, 0.4712677001953125, 0.49423980712890625, 0.5172119140625, 0.5401840209960938, 0.5631561279296875, 0.5861282348632812, 0.609100341796875, 0.6320724487304688, 0.6550445556640625, 0.6780166625976562, 0.70098876953125, 0.7239608764648438, 0.7469329833984375, 0.7699050903320312, 0.792877197265625, 0.8158493041992188, 0.8388214111328125, 0.8617935180664062, 0.884765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 9.0, 12.0, 6.0, 11.0, 18.0, 13.0, 10.0, 27.0, 23.0, 21.0, 29.0, 44.0, 37.0, 49.0, 64.0, 65.0, 86.0, 72.0, 73.0, 52.0, 54.0, 33.0, 25.0, 27.0, 21.0, 20.0, 12.0, 9.0, 17.0, 10.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.423828125, -1.3787384033203125, -1.333648681640625, -1.2885589599609375, -1.24346923828125, -1.1983795166015625, -1.153289794921875, -1.1082000732421875, -1.0631103515625, -1.0180206298828125, -0.972930908203125, -0.9278411865234375, -0.88275146484375, -0.8376617431640625, -0.792572021484375, -0.7474822998046875, -0.702392578125, -0.6573028564453125, -0.612213134765625, -0.5671234130859375, -0.52203369140625, -0.4769439697265625, -0.431854248046875, -0.3867645263671875, -0.3416748046875, -0.2965850830078125, -0.251495361328125, -0.2064056396484375, -0.16131591796875, -0.1162261962890625, -0.071136474609375, -0.0260467529296875, 0.01904296875, 0.0641326904296875, 0.109222412109375, 0.1543121337890625, 0.19940185546875, 0.2444915771484375, 0.289581298828125, 0.3346710205078125, 0.3797607421875, 0.4248504638671875, 0.469940185546875, 0.5150299072265625, 0.56011962890625, 0.6052093505859375, 0.650299072265625, 0.6953887939453125, 0.740478515625, 0.7855682373046875, 0.830657958984375, 0.8757476806640625, 0.92083740234375, 0.9659271240234375, 1.011016845703125, 1.0561065673828125, 1.1011962890625, 1.1462860107421875, 1.191375732421875, 1.2364654541015625, 1.28155517578125, 1.3266448974609375, 1.371734619140625, 1.4168243408203125, 1.4619140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 9.0, 5.0, 9.0, 16.0, 22.0, 37.0, 46.0, 89.0, 162.0, 294.0, 657.0, 1486.0, 4189.0, 16307.0, 113123.0, 854329.0, 44253.0, 8934.0, 2565.0, 1004.0, 462.0, 214.0, 120.0, 68.0, 46.0, 25.0, 17.0, 22.0, 13.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.13916969299316406, -0.13441848754882812, -0.1296672821044922, -0.12491607666015625, -0.12016487121582031, -0.11541366577148438, -0.11066246032714844, -0.1059112548828125, -0.10116004943847656, -0.09640884399414062, -0.09165763854980469, -0.08690643310546875, -0.08215522766113281, -0.07740402221679688, -0.07265281677246094, -0.067901611328125, -0.06315040588378906, -0.058399200439453125, -0.05364799499511719, -0.04889678955078125, -0.04414558410644531, -0.039394378662109375, -0.03464317321777344, -0.0298919677734375, -0.025140762329101562, -0.020389556884765625, -0.015638351440429688, -0.01088714599609375, -0.0061359405517578125, -0.001384735107421875, 0.0033664703369140625, 0.00811767578125, 0.012868881225585938, 0.017620086669921875, 0.022371292114257812, 0.02712249755859375, 0.03187370300292969, 0.036624908447265625, 0.04137611389160156, 0.0461273193359375, 0.05087852478027344, 0.055629730224609375, 0.06038093566894531, 0.06513214111328125, 0.06988334655761719, 0.07463455200195312, 0.07938575744628906, 0.084136962890625, 0.08888816833496094, 0.09363937377929688, 0.09839057922363281, 0.10314178466796875, 0.10789299011230469, 0.11264419555664062, 0.11739540100097656, 0.1221466064453125, 0.12689781188964844, 0.13164901733398438, 0.1364002227783203, 0.14115142822265625, 0.1459026336669922, 0.15065383911132812, 0.15540504455566406, 0.16015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 3.0, 10.0, 7.0, 7.0, 6.0, 13.0, 21.0, 20.0, 35.0, 30.0, 49.0, 59.0, 80.0, 115.0, 103.0, 91.0, 79.0, 63.0, 45.0, 26.0, 23.0, 15.0, 12.0, 20.0, 10.0, 6.0, 6.0, 10.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.9981136322021484e-05, -2.895388752222061e-05, -2.792663872241974e-05, -2.6899389922618866e-05, -2.5872141122817993e-05, -2.484489232301712e-05, -2.3817643523216248e-05, -2.2790394723415375e-05, -2.1763145923614502e-05, -2.073589712381363e-05, -1.9708648324012756e-05, -1.8681399524211884e-05, -1.765415072441101e-05, -1.6626901924610138e-05, -1.5599653124809265e-05, -1.4572404325008392e-05, -1.354515552520752e-05, -1.2517906725406647e-05, -1.1490657925605774e-05, -1.0463409125804901e-05, -9.436160326004028e-06, -8.408911526203156e-06, -7.381662726402283e-06, -6.35441392660141e-06, -5.327165126800537e-06, -4.299916326999664e-06, -3.2726675271987915e-06, -2.2454187273979187e-06, -1.218169927597046e-06, -1.909211277961731e-07, 8.363276720046997e-07, 1.8635764718055725e-06, 2.8908252716064453e-06, 3.918074071407318e-06, 4.945322871208191e-06, 5.972571671009064e-06, 6.9998204708099365e-06, 8.02706927061081e-06, 9.054318070411682e-06, 1.0081566870212555e-05, 1.1108815670013428e-05, 1.21360644698143e-05, 1.3163313269615173e-05, 1.4190562069416046e-05, 1.5217810869216919e-05, 1.6245059669017792e-05, 1.7272308468818665e-05, 1.8299557268619537e-05, 1.932680606842041e-05, 2.0354054868221283e-05, 2.1381303668022156e-05, 2.240855246782303e-05, 2.34358012676239e-05, 2.4463050067424774e-05, 2.5490298867225647e-05, 2.651754766702652e-05, 2.7544796466827393e-05, 2.8572045266628265e-05, 2.9599294066429138e-05, 3.062654286623001e-05, 3.1653791666030884e-05, 3.2681040465831757e-05, 3.370828926563263e-05, 3.47355380654335e-05, 3.5762786865234375e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 13.0, 11.0, 18.0, 20.0, 41.0, 96.0, 184.0, 451.0, 1779.0, 9885.0, 168127.0, 848172.0, 16293.0, 2450.0, 614.0, 192.0, 75.0, 49.0, 27.0, 15.0, 9.0, 11.0, 6.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259521484375, -0.2509040832519531, -0.24228668212890625, -0.23366928100585938, -0.2250518798828125, -0.21643447875976562, -0.20781707763671875, -0.19919967651367188, -0.190582275390625, -0.18196487426757812, -0.17334747314453125, -0.16473007202148438, -0.1561126708984375, -0.14749526977539062, -0.13887786865234375, -0.13026046752929688, -0.12164306640625, -0.11302566528320312, -0.10440826416015625, -0.09579086303710938, -0.0871734619140625, -0.07855606079101562, -0.06993865966796875, -0.061321258544921875, -0.052703857421875, -0.044086456298828125, -0.03546905517578125, -0.026851654052734375, -0.0182342529296875, -0.009616851806640625, -0.00099945068359375, 0.007617950439453125, 0.0162353515625, 0.024852752685546875, 0.03347015380859375, 0.042087554931640625, 0.0507049560546875, 0.059322357177734375, 0.06793975830078125, 0.07655715942382812, 0.085174560546875, 0.09379196166992188, 0.10240936279296875, 0.11102676391601562, 0.1196441650390625, 0.12826156616210938, 0.13687896728515625, 0.14549636840820312, 0.15411376953125, 0.16273117065429688, 0.17134857177734375, 0.17996597290039062, 0.1885833740234375, 0.19720077514648438, 0.20581817626953125, 0.21443557739257812, 0.223052978515625, 0.23167037963867188, 0.24028778076171875, 0.24890518188476562, 0.2575225830078125, 0.2661399841308594, 0.27475738525390625, 0.2833747863769531, 0.2919921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 3.0, 5.0, 4.0, 9.0, 9.0, 25.0, 25.0, 20.0, 37.0, 41.0, 43.0, 52.0, 64.0, 83.0, 81.0, 88.0, 85.0, 60.0, 60.0, 33.0, 36.0, 34.0, 19.0, 16.0, 12.0, 7.0, 14.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16049575805664062, -0.15558624267578125, -0.15067672729492188, -0.1457672119140625, -0.14085769653320312, -0.13594818115234375, -0.13103866577148438, -0.126129150390625, -0.12121963500976562, -0.11631011962890625, -0.11140060424804688, -0.1064910888671875, -0.10158157348632812, -0.09667205810546875, -0.09176254272460938, -0.08685302734375, -0.08194351196289062, -0.07703399658203125, -0.07212448120117188, -0.0672149658203125, -0.062305450439453125, -0.05739593505859375, -0.052486419677734375, -0.047576904296875, -0.042667388916015625, -0.03775787353515625, -0.032848358154296875, -0.0279388427734375, -0.023029327392578125, -0.01811981201171875, -0.013210296630859375, -0.00830078125, -0.003391265869140625, 0.00151824951171875, 0.006427764892578125, 0.0113372802734375, 0.016246795654296875, 0.02115631103515625, 0.026065826416015625, 0.030975341796875, 0.035884857177734375, 0.04079437255859375, 0.045703887939453125, 0.0506134033203125, 0.055522918701171875, 0.06043243408203125, 0.06534194946289062, 0.07025146484375, 0.07516098022460938, 0.08007049560546875, 0.08498001098632812, 0.0898895263671875, 0.09479904174804688, 0.09970855712890625, 0.10461807250976562, 0.109527587890625, 0.11443710327148438, 0.11934661865234375, 0.12425613403320312, 0.1291656494140625, 0.13407516479492188, 0.13898468017578125, 0.14389419555664062, 0.1488037109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 4.0, 18.0, 35.0, 51.0, 82.0, 327.0, 262.0, 76.0, 51.0, 30.0, 16.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.079756736755371, -3.922390937805176, -3.7650251388549805, -3.607659339904785, -3.45029354095459, -3.2929277420043945, -3.135561943054199, -2.978196144104004, -2.8208303451538086, -2.6634645462036133, -2.506098747253418, -2.3487329483032227, -2.1913671493530273, -2.034001350402832, -1.8766355514526367, -1.7192697525024414, -1.561903953552246, -1.4045381546020508, -1.2471723556518555, -1.0898065567016602, -0.9324407577514648, -0.7750749588012695, -0.6177091598510742, -0.4603433609008789, -0.3029775619506836, -0.14561176300048828, 0.011754035949707031, 0.16911983489990234, 0.32648563385009766, 0.48385143280029297, 0.6412172317504883, 0.7985830307006836, 0.9559488296508789, 1.1133146286010742, 1.2706804275512695, 1.4280462265014648, 1.5854120254516602, 1.7427778244018555, 1.9001436233520508, 2.057509422302246, 2.2148752212524414, 2.3722410202026367, 2.529606819152832, 2.6869726181030273, 2.8443384170532227, 3.001704216003418, 3.1590700149536133, 3.3164358139038086, 3.473801612854004, 3.631167411804199, 3.7885332107543945, 3.94589900970459, 4.103264808654785, 4.2606306076049805, 4.417996406555176, 4.575362205505371, 4.732728004455566, 4.890093803405762, 5.047459602355957, 5.204825401306152, 5.362191200256348, 5.519556999206543, 5.676922798156738, 5.834288597106934, 5.991654396057129]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 5.0, 12.0, 6.0, 9.0, 9.0, 16.0, 12.0, 14.0, 22.0, 13.0, 21.0, 22.0, 27.0, 65.0, 95.0, 114.0, 109.0, 90.0, 84.0, 47.0, 18.0, 20.0, 23.0, 18.0, 20.0, 13.0, 12.0, 7.0, 7.0, 13.0, 5.0, 6.0, 4.0, 4.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.4178333282470703, -3.3118650913238525, -3.205897092819214, -3.099928855895996, -2.9939608573913574, -2.8879926204681396, -2.782024383544922, -2.676056385040283, -2.5700881481170654, -2.4641199111938477, -2.358151912689209, -2.252183675765991, -2.1462154388427734, -2.0402474403381348, -1.934279203414917, -1.8283110857009888, -1.7223429679870605, -1.6163748502731323, -1.510406732559204, -1.4044384956359863, -1.298470377922058, -1.1925022602081299, -1.086534023284912, -0.9805659055709839, -0.8745977878570557, -0.7686296701431274, -0.6626614928245544, -0.5566933155059814, -0.4507251977920532, -0.344757080078125, -0.238788902759552, -0.132820725440979, -0.026852846145629883, 0.07911530137062073, 0.18508344888687134, 0.29105159640312195, 0.39701974391937256, 0.5029878616333008, 0.6089560389518738, 0.7149242162704468, 0.820892333984375, 0.9268604516983032, 1.0328285694122314, 1.1387968063354492, 1.2447649240493774, 1.3507330417633057, 1.4567012786865234, 1.5626693964004517, 1.6686375141143799, 1.774605631828308, 1.8805737495422363, 1.986541986465454, 2.092510223388672, 2.1984782218933105, 2.3044464588165283, 2.410414695739746, 2.5163826942443848, 2.6223509311676025, 2.728318929672241, 2.834287166595459, 2.9402551651000977, 3.0462234020233154, 3.152191638946533, 3.258159637451172, 3.3641278743743896]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 4.0, 9.0, 17.0, 11.0, 18.0, 19.0, 37.0, 35.0, 43.0, 40.0, 65.0, 139.0, 196.0, 84.0, 41.0, 39.0, 38.0, 36.0, 25.0, 13.0, 17.0, 18.0, 14.0, 7.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49169921875, -0.477691650390625, -0.46368408203125, -0.449676513671875, -0.4356689453125, -0.421661376953125, -0.40765380859375, -0.393646240234375, -0.379638671875, -0.365631103515625, -0.35162353515625, -0.337615966796875, -0.3236083984375, -0.309600830078125, -0.29559326171875, -0.281585693359375, -0.267578125, -0.253570556640625, -0.23956298828125, -0.225555419921875, -0.2115478515625, -0.197540283203125, -0.18353271484375, -0.169525146484375, -0.155517578125, -0.141510009765625, -0.12750244140625, -0.113494873046875, -0.0994873046875, -0.085479736328125, -0.07147216796875, -0.057464599609375, -0.04345703125, -0.029449462890625, -0.01544189453125, -0.001434326171875, 0.0125732421875, 0.026580810546875, 0.04058837890625, 0.054595947265625, 0.068603515625, 0.082611083984375, 0.09661865234375, 0.110626220703125, 0.1246337890625, 0.138641357421875, 0.15264892578125, 0.166656494140625, 0.1806640625, 0.194671630859375, 0.20867919921875, 0.222686767578125, 0.2366943359375, 0.250701904296875, 0.26470947265625, 0.278717041015625, 0.292724609375, 0.306732177734375, 0.32073974609375, 0.334747314453125, 0.3487548828125, 0.362762451171875, 0.37677001953125, 0.390777587890625, 0.40478515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 9.0, 7.0, 11.0, 26.0, 45.0, 57.0, 88.0, 162.0, 277.0, 567.0, 1209.0, 3033.0, 11080.0, 801048.0, 7553075.0, 11709.0, 3495.0, 1338.0, 585.0, 259.0, 135.0, 86.0, 60.0, 50.0, 37.0, 27.0, 19.0, 9.0, 2.0, 5.0, 12.0, 5.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0], "bins": [-1.5678791999816895, -1.51895010471344, -1.4700210094451904, -1.4210920333862305, -1.372162938117981, -1.3232338428497314, -1.274304747581482, -1.2253756523132324, -1.1764466762542725, -1.127517580986023, -1.0785884857177734, -1.0296595096588135, -0.980730414390564, -0.9318013191223145, -0.8828722238540649, -0.8339431285858154, -0.7850140333175659, -0.7360849380493164, -0.6871559023857117, -0.6382268071174622, -0.5892977714538574, -0.5403686761856079, -0.4914395809173584, -0.4425105154514313, -0.39358144998550415, -0.344652384519577, -0.2957233190536499, -0.2467942237854004, -0.19786515831947327, -0.14893609285354614, -0.10000699758529663, -0.05107793211936951, -0.002148747444152832, 0.04678032547235489, 0.09570939838886261, 0.14463847875595093, 0.19356754422187805, 0.24249660968780518, 0.2914257049560547, 0.3403547704219818, 0.38928383588790894, 0.43821290135383606, 0.4871419668197632, 0.5360710620880127, 0.5850001573562622, 0.6339291930198669, 0.6828582882881165, 0.7317873239517212, 0.7807164192199707, 0.8296455144882202, 0.878574550151825, 0.9275036454200745, 0.9764326810836792, 1.0253617763519287, 1.0742908716201782, 1.1232199668884277, 1.1721489429473877, 1.2210780382156372, 1.2700071334838867, 1.3189361095428467, 1.3678652048110962, 1.4167943000793457, 1.4657233953475952, 1.5146524906158447, 1.5635815858840942]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 13.0, 4.0, 6.0, 7.0, 5.0, 9.0, 5.0, 11.0, 7.0, 10.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.238897323608398, -10.036127090454102, -9.833356857299805, -9.630587577819824, -9.427817344665527, -9.22504711151123, -9.022276878356934, -8.819507598876953, -8.616737365722656, -8.41396713256836, -8.211196899414062, -8.008427619934082, -7.805657386779785, -7.602887153625488, -7.400116920471191, -7.197347164154053, -6.994576930999756, -6.791806697845459, -6.58903694152832, -6.386266708374023, -6.183496952056885, -5.980726718902588, -5.777956962585449, -5.575186729431152, -5.3724164962768555, -5.169646263122559, -4.96687650680542, -4.764106273651123, -4.561336517333984, -4.3585662841796875, -4.155796051025391, -3.953026294708252, -3.7502570152282715, -3.5474870204925537, -3.344717025756836, -3.141946792602539, -2.9391770362854004, -2.7364068031311035, -2.5336368083953857, -2.330866813659668, -2.12809681892395, -1.9253268241882324, -1.7225568294525146, -1.5197867155075073, -1.3170167207717896, -1.1142467260360718, -0.9114766120910645, -0.7087066173553467, -0.5059366226196289, -0.30316659808158875, -0.10039657354354858, 0.10237348079681396, 0.30514347553253174, 0.5079134702682495, 0.7106835842132568, 0.9134535789489746, 1.1162235736846924, 1.3189935684204102, 1.521763563156128, 1.7245336771011353, 1.927303671836853, 2.1300735473632812, 2.332843780517578, 2.535613775253296, 2.7383837699890137]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 5.0, 24.0, 12.0, 30.0, 35.0, 44.0, 43.0, 70.0, 78.0, 64.0, 60.0, 69.0, 71.0, 73.0, 58.0, 49.0, 49.0, 34.0, 26.0, 13.0, 18.0, 10.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3134765625, -0.3018646240234375, -0.290252685546875, -0.2786407470703125, -0.26702880859375, -0.2554168701171875, -0.243804931640625, -0.2321929931640625, -0.2205810546875, -0.2089691162109375, -0.197357177734375, -0.1857452392578125, -0.17413330078125, -0.1625213623046875, -0.150909423828125, -0.1392974853515625, -0.127685546875, -0.1160736083984375, -0.104461669921875, -0.0928497314453125, -0.08123779296875, -0.0696258544921875, -0.058013916015625, -0.0464019775390625, -0.0347900390625, -0.0231781005859375, -0.011566162109375, 4.57763671875e-05, 0.01165771484375, 0.0232696533203125, 0.034881591796875, 0.0464935302734375, 0.05810546875, 0.0697174072265625, 0.081329345703125, 0.0929412841796875, 0.10455322265625, 0.1161651611328125, 0.127777099609375, 0.1393890380859375, 0.1510009765625, 0.1626129150390625, 0.174224853515625, 0.1858367919921875, 0.19744873046875, 0.2090606689453125, 0.220672607421875, 0.2322845458984375, 0.243896484375, 0.2555084228515625, 0.267120361328125, 0.2787322998046875, 0.29034423828125, 0.3019561767578125, 0.313568115234375, 0.3251800537109375, 0.3367919921875, 0.3484039306640625, 0.360015869140625, 0.3716278076171875, 0.38323974609375, 0.3948516845703125, 0.406463623046875, 0.4180755615234375, 0.4296875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 16.0, 20.0, 29.0, 39.0, 69.0, 112.0, 159.0, 238.0, 419.0, 719.0, 1420.0, 2874.0, 6284.0, 15060.0, 39028.0, 102712.0, 182009.0, 105552.0, 39658.0, 15596.0, 6461.0, 2862.0, 1368.0, 700.0, 320.0, 194.0, 113.0, 80.0, 50.0, 21.0, 22.0, 16.0, 3.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.59765625, -1.551361083984375, -1.50506591796875, -1.458770751953125, -1.4124755859375, -1.366180419921875, -1.31988525390625, -1.273590087890625, -1.227294921875, -1.180999755859375, -1.13470458984375, -1.088409423828125, -1.0421142578125, -0.995819091796875, -0.94952392578125, -0.903228759765625, -0.85693359375, -0.810638427734375, -0.76434326171875, -0.718048095703125, -0.6717529296875, -0.625457763671875, -0.57916259765625, -0.532867431640625, -0.486572265625, -0.440277099609375, -0.39398193359375, -0.347686767578125, -0.3013916015625, -0.255096435546875, -0.20880126953125, -0.162506103515625, -0.1162109375, -0.069915771484375, -0.02362060546875, 0.022674560546875, 0.0689697265625, 0.115264892578125, 0.16156005859375, 0.207855224609375, 0.254150390625, 0.300445556640625, 0.34674072265625, 0.393035888671875, 0.4393310546875, 0.485626220703125, 0.53192138671875, 0.578216552734375, 0.62451171875, 0.670806884765625, 0.71710205078125, 0.763397216796875, 0.8096923828125, 0.855987548828125, 0.90228271484375, 0.948577880859375, 0.994873046875, 1.041168212890625, 1.08746337890625, 1.133758544921875, 1.1800537109375, 1.226348876953125, 1.27264404296875, 1.318939208984375, 1.365234375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 8.0, 4.0, 6.0, 10.0, 6.0, 8.0, 11.0, 17.0, 16.0, 20.0, 25.0, 25.0, 45.0, 35.0, 31.0, 52.0, 50.0, 59.0, 52.0, 55.0, 60.0, 45.0, 54.0, 49.0, 34.0, 33.0, 38.0, 32.0, 23.0, 19.0, 10.0, 8.0, 12.0, 11.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.27734375, -0.2700366973876953, -0.2627296447753906, -0.25542259216308594, -0.24811553955078125, -0.24080848693847656, -0.23350143432617188, -0.2261943817138672, -0.2188873291015625, -0.2115802764892578, -0.20427322387695312, -0.19696617126464844, -0.18965911865234375, -0.18235206604003906, -0.17504501342773438, -0.1677379608154297, -0.160430908203125, -0.1531238555908203, -0.14581680297851562, -0.13850975036621094, -0.13120269775390625, -0.12389564514160156, -0.11658859252929688, -0.10928153991699219, -0.1019744873046875, -0.09466743469238281, -0.08736038208007812, -0.08005332946777344, -0.07274627685546875, -0.06543922424316406, -0.058132171630859375, -0.05082511901855469, -0.04351806640625, -0.03621101379394531, -0.028903961181640625, -0.021596908569335938, -0.01428985595703125, -0.0069828033447265625, 0.000324249267578125, 0.0076313018798828125, 0.0149383544921875, 0.022245407104492188, 0.029552459716796875, 0.03685951232910156, 0.04416656494140625, 0.05147361755371094, 0.058780670166015625, 0.06608772277832031, 0.073394775390625, 0.08070182800292969, 0.08800888061523438, 0.09531593322753906, 0.10262298583984375, 0.10993003845214844, 0.11723709106445312, 0.12454414367675781, 0.1318511962890625, 0.1391582489013672, 0.14646530151367188, 0.15377235412597656, 0.16107940673828125, 0.16838645935058594, 0.17569351196289062, 0.1830005645751953, 0.1903076171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 11.0, 12.0, 11.0, 31.0, 44.0, 76.0, 100.0, 82.0, 44.0, 23.0, 10.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5849573612213135, -2.513430595397949, -2.441904067993164, -2.3703773021698, -2.2988505363464355, -2.2273240089416504, -2.155797243118286, -2.084270477294922, -2.0127439498901367, -1.941217303276062, -1.8696905374526978, -1.798163890838623, -1.7266372442245483, -1.6551105976104736, -1.5835838317871094, -1.5120571851730347, -1.4405304193496704, -1.3690037727355957, -1.2974770069122314, -1.2259503602981567, -1.154423713684082, -1.0828969478607178, -1.011370301246643, -0.9398436546325684, -0.8683169484138489, -0.7967902421951294, -0.7252635955810547, -0.6537368893623352, -0.5822101831436157, -0.510683536529541, -0.43915683031082153, -0.3676301836967468, -0.2961033582687378, -0.2245766818523407, -0.1530499905347824, -0.08152329921722412, -0.009996622800827026, 0.06153005361557007, 0.13305675983428955, 0.20458340644836426, 0.27611011266708374, 0.34763678908348083, 0.41916346549987793, 0.4906901717185974, 0.5622168779373169, 0.6337435245513916, 0.7052702307701111, 0.7767968773841858, 0.8483235836029053, 0.9198502898216248, 0.9913769364356995, 1.062903642654419, 1.1344302892684937, 1.2059569358825684, 1.2774837017059326, 1.3490103483200073, 1.420536994934082, 1.4920636415481567, 1.563590407371521, 1.6351170539855957, 1.7066437005996704, 1.7781703472137451, 1.8496971130371094, 1.921223759651184, 1.9927505254745483]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 8.0, 19.0, 28.0, 50.0, 77.0, 65.0, 59.0, 44.0, 16.0, 17.0, 15.0, 6.0, 7.0, 9.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-1.6058992147445679, -1.5647358894348145, -1.5235724449157715, -1.482409119606018, -1.4412457942962646, -1.4000824689865112, -1.3589191436767578, -1.3177556991577148, -1.2765923738479614, -1.235429048538208, -1.194265604019165, -1.1531022787094116, -1.1119389533996582, -1.0707756280899048, -1.0296123027801514, -0.9884488582611084, -0.947285532951355, -0.9061222076416016, -0.8649588227272034, -0.8237954378128052, -0.7826321125030518, -0.7414687871932983, -0.7003054022789001, -0.659142017364502, -0.6179786920547485, -0.5768153667449951, -0.5356519818305969, -0.4944886267185211, -0.4533252716064453, -0.4121619164943695, -0.3709985613822937, -0.3298352062702179, -0.28867197036743164, -0.24750861525535583, -0.20634526014328003, -0.16518190503120422, -0.12401854991912842, -0.08285519480705261, -0.04169183969497681, -0.000528484582901001, 0.040634870529174805, 0.08179822564125061, 0.12296158075332642, 0.16412493586540222, 0.20528829097747803, 0.24645164608955383, 0.28761500120162964, 0.32877835631370544, 0.36994171142578125, 0.41110506653785706, 0.45226842164993286, 0.49343177676200867, 0.5345951318740845, 0.5757584571838379, 0.6169218420982361, 0.6580852270126343, 0.6992485523223877, 0.7404118776321411, 0.7815752625465393, 0.8227386474609375, 0.8639019727706909, 0.9050652980804443, 0.9462286829948425, 0.9873920679092407, 1.0285553932189941]}, "eval/loss": 0.32974740862846375, "eval/wer": 0.09492264974216581, "eval/runtime": 555.2371, "eval/samples_per_second": 4.758, "eval/steps_per_second": 0.596, "train/train_runtime": 26664.6603, "train/train_samples_per_second": 5.351, "train/train_steps_per_second": 0.084, "train/total_flos": 0.0, "train/train_loss": 1.6266609489166015} \ No newline at end of file