diff --git "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" --- "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" +++ "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 1.9175, "train/learning_rate": 8.159054565325461e-06, "train/epoch": 2.93, "train/global_step": 9500, "_runtime": 92651, "_timestamp": 1651766740, "_step": 9518, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 86.0, 853.0, 78.0], "bins": [-51.6225700378418, -50.79640197753906, -49.97023010253906, -49.14406204223633, -48.31789016723633, -47.491722106933594, -46.665550231933594, -45.83938217163086, -45.01321029663086, -44.187042236328125, -43.360870361328125, -42.53470230102539, -41.70853042602539, -40.882362365722656, -40.056190490722656, -39.23002243041992, -38.40385437011719, -37.57768630981445, -36.75151443481445, -35.92534637451172, -35.09917449951172, -34.273006439208984, -33.446834564208984, -32.62066650390625, -31.79449462890625, -30.968324661254883, -30.142154693603516, -29.31598472595215, -28.48981475830078, -27.663646697998047, -26.837474822998047, -26.011306762695312, -25.185134887695312, -24.358964920043945, -23.532794952392578, -22.70662498474121, -21.880455017089844, -21.05428695678711, -20.22811508178711, -19.401947021484375, -18.575777053833008, -17.74960708618164, -16.923437118530273, -16.097267150878906, -15.271098136901855, -14.444928169250488, -13.618758201599121, -12.79258918762207, -11.966418266296387, -11.14024829864502, -10.314078330993652, -9.487909317016602, -8.661739349365234, -7.835569381713867, -7.0093994140625, -6.183229923248291, -5.357060432434082, -4.530890464782715, -3.704720973968506, -2.8785510063171387, -2.0523812770843506, -1.2262115478515625, -0.4000415802001953, 0.42612791061401367, 1.2522979974746704]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 4.0, 5.0, 7.0, 10.0, 21.0, 12.0, 13.0, 18.0, 28.0, 26.0, 29.0, 33.0, 34.0, 34.0, 40.0, 39.0, 47.0, 44.0, 38.0, 33.0, 42.0, 47.0, 39.0, 36.0, 42.0, 46.0, 29.0, 26.0, 29.0, 19.0, 18.0, 25.0, 10.0, 18.0, 15.0, 10.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5299746990203857, -2.4536519050598145, -2.377329111099243, -2.301006317138672, -2.2246835231781006, -2.1483607292175293, -2.072037935256958, -1.9957151412963867, -1.9193923473358154, -1.8430695533752441, -1.7667467594146729, -1.6904239654541016, -1.6141011714935303, -1.537778377532959, -1.4614555835723877, -1.3851327896118164, -1.3088099956512451, -1.2324872016906738, -1.1561644077301025, -1.0798416137695312, -1.00351881980896, -0.9271960258483887, -0.8508732318878174, -0.7745504379272461, -0.6982276439666748, -0.6219048500061035, -0.5455820560455322, -0.46925926208496094, -0.39293646812438965, -0.31661367416381836, -0.24029088020324707, -0.16396808624267578, -0.08764505386352539, -0.011322259902954102, 0.06500053405761719, 0.14132332801818848, 0.21764612197875977, 0.29396891593933105, 0.37029170989990234, 0.44661450386047363, 0.5229372978210449, 0.5992600917816162, 0.6755828857421875, 0.7519056797027588, 0.8282284736633301, 0.9045512676239014, 0.9808740615844727, 1.057196855545044, 1.1335196495056152, 1.2098424434661865, 1.2861652374267578, 1.362488031387329, 1.4388108253479004, 1.5151336193084717, 1.591456413269043, 1.6677792072296143, 1.7441020011901855, 1.8204247951507568, 1.8967475891113281, 1.9730703830718994, 2.0493931770324707, 2.125715970993042, 2.2020387649536133, 2.2783615589141846, 2.354684352874756]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 7.0, 13.0, 21.0, 17.0, 22.0, 29.0, 48.0, 82.0, 117.0, 162.0, 317.0, 488.0, 835.0, 1465.0, 2579.0, 4827.0, 9063.0, 17758.0, 34332.0, 68316.0, 153998.0, 571725.0, 2492355.0, 544245.0, 152036.0, 67764.0, 34262.0, 17580.0, 9050.0, 4658.0, 2550.0, 1471.0, 810.0, 484.0, 273.0, 167.0, 108.0, 59.0, 58.0, 33.0, 34.0, 23.0, 13.0, 4.0, 6.0, 4.0, 3.0, 10.0, 3.0, 1.0, 2.0], "bins": [-1.970703125, -1.9151611328125, -1.859619140625, -1.8040771484375, -1.74853515625, -1.6929931640625, -1.637451171875, -1.5819091796875, -1.5263671875, -1.4708251953125, -1.415283203125, -1.3597412109375, -1.30419921875, -1.2486572265625, -1.193115234375, -1.1375732421875, -1.08203125, -1.0264892578125, -0.970947265625, -0.9154052734375, -0.85986328125, -0.8043212890625, -0.748779296875, -0.6932373046875, -0.6376953125, -0.5821533203125, -0.526611328125, -0.4710693359375, -0.41552734375, -0.3599853515625, -0.304443359375, -0.2489013671875, -0.193359375, -0.1378173828125, -0.082275390625, -0.0267333984375, 0.02880859375, 0.0843505859375, 0.139892578125, 0.1954345703125, 0.2509765625, 0.3065185546875, 0.362060546875, 0.4176025390625, 0.47314453125, 0.5286865234375, 0.584228515625, 0.6397705078125, 0.6953125, 0.7508544921875, 0.806396484375, 0.8619384765625, 0.91748046875, 0.9730224609375, 1.028564453125, 1.0841064453125, 1.1396484375, 1.1951904296875, 1.250732421875, 1.3062744140625, 1.36181640625, 1.4173583984375, 1.472900390625, 1.5284423828125, 1.583984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 19.0, 16.0, 15.0, 14.0, 28.0, 26.0, 25.0, 43.0, 34.0, 44.0, 43.0, 49.0, 50.0, 50.0, 45.0, 49.0, 45.0, 47.0, 42.0, 47.0, 51.0, 32.0, 36.0, 23.0, 27.0, 21.0, 13.0, 10.0, 14.0, 7.0, 7.0, 2.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.787109375, -3.670928955078125, -3.55474853515625, -3.438568115234375, -3.3223876953125, -3.206207275390625, -3.09002685546875, -2.973846435546875, -2.857666015625, -2.741485595703125, -2.62530517578125, -2.509124755859375, -2.3929443359375, -2.276763916015625, -2.16058349609375, -2.044403076171875, -1.92822265625, -1.812042236328125, -1.69586181640625, -1.579681396484375, -1.4635009765625, -1.347320556640625, -1.23114013671875, -1.114959716796875, -0.998779296875, -0.882598876953125, -0.76641845703125, -0.650238037109375, -0.5340576171875, -0.417877197265625, -0.30169677734375, -0.185516357421875, -0.0693359375, 0.046844482421875, 0.16302490234375, 0.279205322265625, 0.3953857421875, 0.511566162109375, 0.62774658203125, 0.743927001953125, 0.860107421875, 0.976287841796875, 1.09246826171875, 1.208648681640625, 1.3248291015625, 1.441009521484375, 1.55718994140625, 1.673370361328125, 1.78955078125, 1.905731201171875, 2.02191162109375, 2.138092041015625, 2.2542724609375, 2.370452880859375, 2.48663330078125, 2.602813720703125, 2.718994140625, 2.835174560546875, 2.95135498046875, 3.067535400390625, 3.1837158203125, 3.299896240234375, 3.41607666015625, 3.532257080078125, 3.6484375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 13.0, 11.0, 17.0, 22.0, 21.0, 28.0, 44.0, 60.0, 78.0, 179.0, 601.0, 3679726.0, 512441.0, 563.0, 158.0, 96.0, 61.0, 44.0, 15.0, 23.0, 17.0, 16.0, 20.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.1875, -39.85791015625, -38.5283203125, -37.19873046875, -35.869140625, -34.53955078125, -33.2099609375, -31.88037109375, -30.55078125, -29.22119140625, -27.8916015625, -26.56201171875, -25.232421875, -23.90283203125, -22.5732421875, -21.24365234375, -19.9140625, -18.58447265625, -17.2548828125, -15.92529296875, -14.595703125, -13.26611328125, -11.9365234375, -10.60693359375, -9.27734375, -7.94775390625, -6.6181640625, -5.28857421875, -3.958984375, -2.62939453125, -1.2998046875, 0.02978515625, 1.359375, 2.68896484375, 4.0185546875, 5.34814453125, 6.677734375, 8.00732421875, 9.3369140625, 10.66650390625, 11.99609375, 13.32568359375, 14.6552734375, 15.98486328125, 17.314453125, 18.64404296875, 19.9736328125, 21.30322265625, 22.6328125, 23.96240234375, 25.2919921875, 26.62158203125, 27.951171875, 29.28076171875, 30.6103515625, 31.93994140625, 33.26953125, 34.59912109375, 35.9287109375, 37.25830078125, 38.587890625, 39.91748046875, 41.2470703125, 42.57666015625, 43.90625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 6.0, 12.0, 13.0, 21.0, 32.0, 24.0, 39.0, 59.0, 70.0, 147.0, 326.0, 1421.0, 1207.0, 288.0, 111.0, 75.0, 65.0, 35.0, 21.0, 23.0, 19.0, 16.0, 11.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2255859375, -1.18463134765625, -1.1436767578125, -1.10272216796875, -1.061767578125, -1.02081298828125, -0.9798583984375, -0.93890380859375, -0.89794921875, -0.85699462890625, -0.8160400390625, -0.77508544921875, -0.734130859375, -0.69317626953125, -0.6522216796875, -0.61126708984375, -0.5703125, -0.52935791015625, -0.4884033203125, -0.44744873046875, -0.406494140625, -0.36553955078125, -0.3245849609375, -0.28363037109375, -0.24267578125, -0.20172119140625, -0.1607666015625, -0.11981201171875, -0.078857421875, -0.03790283203125, 0.0030517578125, 0.04400634765625, 0.0849609375, 0.12591552734375, 0.1668701171875, 0.20782470703125, 0.248779296875, 0.28973388671875, 0.3306884765625, 0.37164306640625, 0.41259765625, 0.45355224609375, 0.4945068359375, 0.53546142578125, 0.576416015625, 0.61737060546875, 0.6583251953125, 0.69927978515625, 0.740234375, 0.78118896484375, 0.8221435546875, 0.86309814453125, 0.904052734375, 0.94500732421875, 0.9859619140625, 1.02691650390625, 1.06787109375, 1.10882568359375, 1.1497802734375, 1.19073486328125, 1.231689453125, 1.27264404296875, 1.3135986328125, 1.35455322265625, 1.3955078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 13.0, 22.0, 21.0, 43.0, 62.0, 77.0, 110.0, 127.0, 121.0, 100.0, 87.0, 64.0, 56.0, 33.0, 22.0, 19.0, 5.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.543133735656738, -7.349100589752197, -7.155067443847656, -6.961034297943115, -6.767001152038574, -6.572968006134033, -6.378934860229492, -6.184902191162109, -5.99086856842041, -5.796835422515869, -5.602802276611328, -5.408769130706787, -5.214735984802246, -5.020702838897705, -4.826669692993164, -4.632637023925781, -4.43860387802124, -4.244570732116699, -4.050537586212158, -3.856504440307617, -3.662471294403076, -3.468438148498535, -3.2744052410125732, -3.0803720951080322, -2.886338949203491, -2.69230580329895, -2.498272657394409, -2.3042397499084473, -2.1102066040039062, -1.9161733388900757, -1.7221403121948242, -1.5281071662902832, -1.3340744972229004, -1.1400413513183594, -0.9460082650184631, -0.7519751787185669, -0.5579420328140259, -0.36390888690948486, -0.1698758602142334, 0.024157285690307617, 0.21819043159484863, 0.41222354769706726, 0.6062566637992859, 0.8002897500991821, 0.9943228960037231, 1.1883560419082642, 1.3823890686035156, 1.5764222145080566, 1.7704553604125977, 1.9644885063171387, 2.1585216522216797, 2.3525547981262207, 2.5465879440307617, 2.7406210899353027, 2.9346539974212646, 3.1286871433258057, 3.3227202892303467, 3.5167534351348877, 3.7107865810394287, 3.9048194885253906, 4.098852634429932, 4.292885780334473, 4.486918926239014, 4.680952072143555, 4.874985218048096]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 8.0, 10.0, 4.0, 13.0, 10.0, 13.0, 17.0, 12.0, 20.0, 21.0, 29.0, 26.0, 34.0, 35.0, 35.0, 29.0, 36.0, 32.0, 41.0, 41.0, 45.0, 38.0, 38.0, 38.0, 36.0, 38.0, 43.0, 25.0, 31.0, 27.0, 21.0, 23.0, 24.0, 22.0, 17.0, 10.0, 13.0, 9.0, 6.0, 10.0, 9.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.09440279006958, -3.0093836784362793, -2.9243645668029785, -2.8393454551696777, -2.754326343536377, -2.669307231903076, -2.5842881202697754, -2.4992687702178955, -2.4142496585845947, -2.329230546951294, -2.244211435317993, -2.1591923236846924, -2.0741732120513916, -1.9891539812088013, -1.9041348695755005, -1.8191156387329102, -1.734096646308899, -1.6490775346755981, -1.5640584230422974, -1.479039192199707, -1.3940200805664062, -1.3090009689331055, -1.2239818572998047, -1.138962745666504, -1.0539436340332031, -0.9689245223999023, -0.8839053511619568, -0.798886239528656, -0.7138670682907104, -0.6288479566574097, -0.5438288450241089, -0.45880967378616333, -0.3737905025482178, -0.2887713611125946, -0.20375223457813263, -0.11873310804367065, -0.033713966608047485, 0.051305174827575684, 0.13632428646087646, 0.22134345769882202, 0.3063625693321228, 0.39138171076774597, 0.47640085220336914, 0.5614199638366699, 0.6464390754699707, 0.7314582467079163, 0.816477358341217, 0.9014965295791626, 0.9865156412124634, 1.0715347528457642, 1.156553864479065, 1.2415730953216553, 1.326592206954956, 1.4116113185882568, 1.4966304302215576, 1.5816495418548584, 1.6666686534881592, 1.75168776512146, 1.8367068767547607, 1.9217259883880615, 2.0067451000213623, 2.091764450073242, 2.176783561706543, 2.2618026733398438, 2.3468217849731445]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 4.0, 12.0, 16.0, 20.0, 32.0, 45.0, 68.0, 103.0, 124.0, 177.0, 279.0, 419.0, 634.0, 932.0, 1507.0, 2412.0, 3939.0, 6577.0, 11542.0, 20800.0, 38968.0, 76523.0, 157289.0, 263868.0, 222608.0, 114657.0, 56607.0, 29124.0, 16002.0, 9119.0, 5246.0, 3247.0, 1973.0, 1217.0, 846.0, 525.0, 326.0, 245.0, 143.0, 116.0, 73.0, 56.0, 39.0, 29.0, 18.0, 20.0, 10.0, 5.0, 5.0, 0.0, 0.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.92529296875, -0.895233154296875, -0.86517333984375, -0.835113525390625, -0.8050537109375, -0.774993896484375, -0.74493408203125, -0.714874267578125, -0.684814453125, -0.654754638671875, -0.62469482421875, -0.594635009765625, -0.5645751953125, -0.534515380859375, -0.50445556640625, -0.474395751953125, -0.4443359375, -0.414276123046875, -0.38421630859375, -0.354156494140625, -0.3240966796875, -0.294036865234375, -0.26397705078125, -0.233917236328125, -0.203857421875, -0.173797607421875, -0.14373779296875, -0.113677978515625, -0.0836181640625, -0.053558349609375, -0.02349853515625, 0.006561279296875, 0.03662109375, 0.066680908203125, 0.09674072265625, 0.126800537109375, 0.1568603515625, 0.186920166015625, 0.21697998046875, 0.247039794921875, 0.277099609375, 0.307159423828125, 0.33721923828125, 0.367279052734375, 0.3973388671875, 0.427398681640625, 0.45745849609375, 0.487518310546875, 0.517578125, 0.547637939453125, 0.57769775390625, 0.607757568359375, 0.6378173828125, 0.667877197265625, 0.69793701171875, 0.727996826171875, 0.758056640625, 0.788116455078125, 0.81817626953125, 0.848236083984375, 0.8782958984375, 0.908355712890625, 0.93841552734375, 0.968475341796875, 0.99853515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 9.0, 9.0, 8.0, 12.0, 20.0, 21.0, 24.0, 26.0, 29.0, 35.0, 34.0, 52.0, 51.0, 58.0, 51.0, 55.0, 48.0, 51.0, 48.0, 36.0, 44.0, 36.0, 39.0, 36.0, 20.0, 30.0, 23.0, 20.0, 14.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.640411376953125, -2.56207275390625, -2.483734130859375, -2.4053955078125, -2.327056884765625, -2.24871826171875, -2.170379638671875, -2.092041015625, -2.013702392578125, -1.93536376953125, -1.857025146484375, -1.7786865234375, -1.700347900390625, -1.62200927734375, -1.543670654296875, -1.46533203125, -1.386993408203125, -1.30865478515625, -1.230316162109375, -1.1519775390625, -1.073638916015625, -0.99530029296875, -0.916961669921875, -0.838623046875, -0.760284423828125, -0.68194580078125, -0.603607177734375, -0.5252685546875, -0.446929931640625, -0.36859130859375, -0.290252685546875, -0.2119140625, -0.133575439453125, -0.05523681640625, 0.023101806640625, 0.1014404296875, 0.179779052734375, 0.25811767578125, 0.336456298828125, 0.414794921875, 0.493133544921875, 0.57147216796875, 0.649810791015625, 0.7281494140625, 0.806488037109375, 0.88482666015625, 0.963165283203125, 1.04150390625, 1.119842529296875, 1.19818115234375, 1.276519775390625, 1.3548583984375, 1.433197021484375, 1.51153564453125, 1.589874267578125, 1.668212890625, 1.746551513671875, 1.82489013671875, 1.903228759765625, 1.9815673828125, 2.059906005859375, 2.13824462890625, 2.216583251953125, 2.294921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 9.0, 14.0, 16.0, 27.0, 39.0, 37.0, 47.0, 86.0, 128.0, 229.0, 324.0, 578.0, 1161.0, 2493.0, 6813.0, 20603.0, 76424.0, 327205.0, 448920.0, 117582.0, 29767.0, 9352.0, 3428.0, 1476.0, 697.0, 368.0, 219.0, 135.0, 100.0, 75.0, 44.0, 42.0, 24.0, 20.0, 19.0, 13.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7607421875, -1.7091827392578125, -1.657623291015625, -1.6060638427734375, -1.55450439453125, -1.5029449462890625, -1.451385498046875, -1.3998260498046875, -1.3482666015625, -1.2967071533203125, -1.245147705078125, -1.1935882568359375, -1.14202880859375, -1.0904693603515625, -1.038909912109375, -0.9873504638671875, -0.935791015625, -0.8842315673828125, -0.832672119140625, -0.7811126708984375, -0.72955322265625, -0.6779937744140625, -0.626434326171875, -0.5748748779296875, -0.5233154296875, -0.4717559814453125, -0.420196533203125, -0.3686370849609375, -0.31707763671875, -0.2655181884765625, -0.213958740234375, -0.1623992919921875, -0.11083984375, -0.0592803955078125, -0.007720947265625, 0.0438385009765625, 0.09539794921875, 0.1469573974609375, 0.198516845703125, 0.2500762939453125, 0.3016357421875, 0.3531951904296875, 0.404754638671875, 0.4563140869140625, 0.50787353515625, 0.5594329833984375, 0.610992431640625, 0.6625518798828125, 0.714111328125, 0.7656707763671875, 0.817230224609375, 0.8687896728515625, 0.92034912109375, 0.9719085693359375, 1.023468017578125, 1.0750274658203125, 1.1265869140625, 1.1781463623046875, 1.229705810546875, 1.2812652587890625, 1.33282470703125, 1.3843841552734375, 1.435943603515625, 1.4875030517578125, 1.5390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 11.0, 8.0, 17.0, 14.0, 10.0, 24.0, 26.0, 17.0, 28.0, 26.0, 34.0, 43.0, 37.0, 42.0, 38.0, 45.0, 39.0, 47.0, 52.0, 37.0, 45.0, 32.0, 38.0, 35.0, 36.0, 36.0, 22.0, 16.0, 27.0, 18.0, 16.0, 16.0, 6.0, 10.0, 5.0, 10.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.546875, -4.40087890625, -4.2548828125, -4.10888671875, -3.962890625, -3.81689453125, -3.6708984375, -3.52490234375, -3.37890625, -3.23291015625, -3.0869140625, -2.94091796875, -2.794921875, -2.64892578125, -2.5029296875, -2.35693359375, -2.2109375, -2.06494140625, -1.9189453125, -1.77294921875, -1.626953125, -1.48095703125, -1.3349609375, -1.18896484375, -1.04296875, -0.89697265625, -0.7509765625, -0.60498046875, -0.458984375, -0.31298828125, -0.1669921875, -0.02099609375, 0.125, 0.27099609375, 0.4169921875, 0.56298828125, 0.708984375, 0.85498046875, 1.0009765625, 1.14697265625, 1.29296875, 1.43896484375, 1.5849609375, 1.73095703125, 1.876953125, 2.02294921875, 2.1689453125, 2.31494140625, 2.4609375, 2.60693359375, 2.7529296875, 2.89892578125, 3.044921875, 3.19091796875, 3.3369140625, 3.48291015625, 3.62890625, 3.77490234375, 3.9208984375, 4.06689453125, 4.212890625, 4.35888671875, 4.5048828125, 4.65087890625, 4.796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 4.0, 7.0, 14.0, 21.0, 34.0, 49.0, 74.0, 105.0, 166.0, 255.0, 435.0, 633.0, 1046.0, 1825.0, 3531.0, 6779.0, 15190.0, 42872.0, 224689.0, 597089.0, 104320.0, 26873.0, 10947.0, 5074.0, 2677.0, 1508.0, 879.0, 561.0, 310.0, 200.0, 123.0, 78.0, 60.0, 37.0, 22.0, 19.0, 18.0, 18.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73681640625, -0.711669921875, -0.6865234375, -0.661376953125, -0.63623046875, -0.611083984375, -0.5859375, -0.560791015625, -0.53564453125, -0.510498046875, -0.4853515625, -0.460205078125, -0.43505859375, -0.409912109375, -0.384765625, -0.359619140625, -0.33447265625, -0.309326171875, -0.2841796875, -0.259033203125, -0.23388671875, -0.208740234375, -0.18359375, -0.158447265625, -0.13330078125, -0.108154296875, -0.0830078125, -0.057861328125, -0.03271484375, -0.007568359375, 0.017578125, 0.042724609375, 0.06787109375, 0.093017578125, 0.1181640625, 0.143310546875, 0.16845703125, 0.193603515625, 0.21875, 0.243896484375, 0.26904296875, 0.294189453125, 0.3193359375, 0.344482421875, 0.36962890625, 0.394775390625, 0.419921875, 0.445068359375, 0.47021484375, 0.495361328125, 0.5205078125, 0.545654296875, 0.57080078125, 0.595947265625, 0.62109375, 0.646240234375, 0.67138671875, 0.696533203125, 0.7216796875, 0.746826171875, 0.77197265625, 0.797119140625, 0.822265625, 0.847412109375, 0.87255859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 17.0, 34.0, 114.0, 208.0, 297.0, 182.0, 62.0, 31.0, 16.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001049041748046875, -0.0010166317224502563, -0.0009842216968536377, -0.000951811671257019, -0.0009194016456604004, -0.0008869916200637817, -0.0008545815944671631, -0.0008221715688705444, -0.0007897615432739258, -0.0007573515176773071, -0.0007249414920806885, -0.0006925314664840698, -0.0006601214408874512, -0.0006277114152908325, -0.0005953013896942139, -0.0005628913640975952, -0.0005304813385009766, -0.0004980713129043579, -0.00046566128730773926, -0.0004332512617111206, -0.00040084123611450195, -0.0003684312105178833, -0.00033602118492126465, -0.000303611159324646, -0.00027120113372802734, -0.0002387911081314087, -0.00020638108253479004, -0.0001739710569381714, -0.00014156103134155273, -0.00010915100574493408, -7.674098014831543e-05, -4.433095455169678e-05, -1.1920928955078125e-05, 2.0489096641540527e-05, 5.289912223815918e-05, 8.530914783477783e-05, 0.00011771917343139648, 0.00015012919902801514, 0.0001825392246246338, 0.00021494925022125244, 0.0002473592758178711, 0.00027976930141448975, 0.0003121793270111084, 0.00034458935260772705, 0.0003769993782043457, 0.00040940940380096436, 0.000441819429397583, 0.00047422945499420166, 0.0005066394805908203, 0.000539049506187439, 0.0005714595317840576, 0.0006038695573806763, 0.0006362795829772949, 0.0006686896085739136, 0.0007010996341705322, 0.0007335096597671509, 0.0007659196853637695, 0.0007983297109603882, 0.0008307397365570068, 0.0008631497621536255, 0.0008955597877502441, 0.0009279698133468628, 0.0009603798389434814, 0.0009927898645401, 0.0010251998901367188]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 4.0, 8.0, 6.0, 14.0, 12.0, 30.0, 32.0, 70.0, 143.0, 335.0, 1896.0, 16992.0, 871287.0, 149856.0, 6390.0, 936.0, 256.0, 85.0, 47.0, 26.0, 25.0, 16.0, 19.0, 12.0, 10.0, 4.0, 7.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.476318359375, -2.37646484375, -2.276611328125, -2.1767578125, -2.076904296875, -1.97705078125, -1.877197265625, -1.77734375, -1.677490234375, -1.57763671875, -1.477783203125, -1.3779296875, -1.278076171875, -1.17822265625, -1.078369140625, -0.978515625, -0.878662109375, -0.77880859375, -0.678955078125, -0.5791015625, -0.479248046875, -0.37939453125, -0.279541015625, -0.1796875, -0.079833984375, 0.02001953125, 0.119873046875, 0.2197265625, 0.319580078125, 0.41943359375, 0.519287109375, 0.619140625, 0.718994140625, 0.81884765625, 0.918701171875, 1.0185546875, 1.118408203125, 1.21826171875, 1.318115234375, 1.41796875, 1.517822265625, 1.61767578125, 1.717529296875, 1.8173828125, 1.917236328125, 2.01708984375, 2.116943359375, 2.216796875, 2.316650390625, 2.41650390625, 2.516357421875, 2.6162109375, 2.716064453125, 2.81591796875, 2.915771484375, 3.015625, 3.115478515625, 3.21533203125, 3.315185546875, 3.4150390625, 3.514892578125, 3.61474609375, 3.714599609375, 3.814453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 3.0, 8.0, 5.0, 14.0, 10.0, 19.0, 20.0, 30.0, 40.0, 46.0, 76.0, 92.0, 114.0, 115.0, 95.0, 64.0, 58.0, 27.0, 31.0, 18.0, 13.0, 23.0, 15.0, 9.0, 6.0, 7.0, 5.0, 5.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23204994201660156, -0.22276687622070312, -0.2134838104248047, -0.20420074462890625, -0.1949176788330078, -0.18563461303710938, -0.17635154724121094, -0.1670684814453125, -0.15778541564941406, -0.14850234985351562, -0.1392192840576172, -0.12993621826171875, -0.12065315246582031, -0.11137008666992188, -0.10208702087402344, -0.092803955078125, -0.08352088928222656, -0.07423782348632812, -0.06495475769042969, -0.05567169189453125, -0.04638862609863281, -0.037105560302734375, -0.027822494506835938, -0.0185394287109375, -0.009256362915039062, 2.6702880859375e-05, 0.009309768676757812, 0.01859283447265625, 0.027875900268554688, 0.037158966064453125, 0.04644203186035156, 0.05572509765625, 0.06500816345214844, 0.07429122924804688, 0.08357429504394531, 0.09285736083984375, 0.10214042663574219, 0.11142349243164062, 0.12070655822753906, 0.1299896240234375, 0.13927268981933594, 0.14855575561523438, 0.1578388214111328, 0.16712188720703125, 0.1764049530029297, 0.18568801879882812, 0.19497108459472656, 0.204254150390625, 0.21353721618652344, 0.22282028198242188, 0.2321033477783203, 0.24138641357421875, 0.2506694793701172, 0.2599525451660156, 0.26923561096191406, 0.2785186767578125, 0.28780174255371094, 0.2970848083496094, 0.3063678741455078, 0.31565093994140625, 0.3249340057373047, 0.3342170715332031, 0.34350013732910156, 0.352783203125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 17.0, 36.0, 102.0, 320.0, 309.0, 150.0, 46.0, 14.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.670473098754883, -18.246179580688477, -17.82188606262207, -17.397594451904297, -16.97330093383789, -16.549007415771484, -16.124713897705078, -15.700420379638672, -15.276126861572266, -14.85183334350586, -14.42754077911377, -14.003247261047363, -13.578953742980957, -13.154661178588867, -12.730367660522461, -12.306074142456055, -11.881781578063965, -11.457488059997559, -11.033195495605469, -10.608901977539062, -10.184608459472656, -9.76031494140625, -9.33602237701416, -8.911728858947754, -8.487436294555664, -8.063142776489258, -7.63884973526001, -7.214556694030762, -6.7902631759643555, -6.365970134735107, -5.941677093505859, -5.517383575439453, -5.093091011047363, -4.668797969818115, -4.244504451751709, -3.820211410522461, -3.395918130874634, -2.9716248512268066, -2.5473318099975586, -2.1230385303497314, -1.6987452507019043, -1.2744519710540771, -0.8501588106155396, -0.42586565017700195, -0.0015723705291748047, 0.42272090911865234, 0.8470139503479004, 1.2713072299957275, 1.6956005096435547, 2.119893789291382, 2.544187068939209, 2.968480110168457, 3.392773389816284, 3.8170666694641113, 4.241359710693359, 4.665653228759766, 5.089946269989014, 5.514239311218262, 5.938532829284668, 6.362825870513916, 6.787118911743164, 7.21141242980957, 7.635705471038818, 8.059998512268066, 8.484292030334473]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 14.0, 13.0, 15.0, 21.0, 19.0, 30.0, 32.0, 31.0, 37.0, 42.0, 56.0, 58.0, 37.0, 65.0, 48.0, 51.0, 54.0, 47.0, 40.0, 50.0, 43.0, 34.0, 33.0, 24.0, 17.0, 19.0, 18.0, 12.0, 5.0, 7.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.0516724586486816, -2.959702253341675, -2.867732286453247, -2.7757620811462402, -2.6837921142578125, -2.5918219089508057, -2.499851703643799, -2.407881736755371, -2.3159115314483643, -2.2239413261413574, -2.1319713592529297, -2.040001153945923, -1.9480310678482056, -1.8560609817504883, -1.7640907764434814, -1.6721206903457642, -1.5801506042480469, -1.4881805181503296, -1.3962104320526123, -1.3042402267456055, -1.2122701406478882, -1.120300054550171, -1.028329849243164, -0.9363597631454468, -0.8443896770477295, -0.7524195909500122, -0.6604494452476501, -0.5684792995452881, -0.4765092134475708, -0.38453909754753113, -0.29256898164749146, -0.2005988359451294, -0.10862898826599121, -0.016658872365951538, 0.07531124353408813, 0.1672813594341278, 0.2592514753341675, 0.35122159123420715, 0.4431917071342468, 0.5351618528366089, 0.6271319389343262, 0.7191020250320435, 0.8110721707344055, 0.9030423164367676, 0.9950124025344849, 1.0869824886322021, 1.178952693939209, 1.2709227800369263, 1.3628928661346436, 1.4548629522323608, 1.5468330383300781, 1.638803243637085, 1.7307733297348022, 1.8227434158325195, 1.9147136211395264, 2.006683826446533, 2.098653793334961, 2.1906239986419678, 2.2825939655303955, 2.3745641708374023, 2.46653413772583, 2.558504343032837, 2.6504745483398438, 2.7424445152282715, 2.8344147205352783]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 11.0, 22.0, 24.0, 47.0, 62.0, 98.0, 187.0, 329.0, 555.0, 917.0, 1882.0, 3928.0, 8068.0, 18557.0, 47092.0, 137313.0, 395931.0, 284914.0, 90011.0, 32716.0, 13531.0, 6077.0, 2968.0, 1463.0, 768.0, 428.0, 260.0, 151.0, 97.0, 49.0, 35.0, 17.0, 15.0, 10.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0], "bins": [-1.841796875, -1.794342041015625, -1.74688720703125, -1.699432373046875, -1.6519775390625, -1.604522705078125, -1.55706787109375, -1.509613037109375, -1.462158203125, -1.414703369140625, -1.36724853515625, -1.319793701171875, -1.2723388671875, -1.224884033203125, -1.17742919921875, -1.129974365234375, -1.08251953125, -1.035064697265625, -0.98760986328125, -0.940155029296875, -0.8927001953125, -0.845245361328125, -0.79779052734375, -0.750335693359375, -0.702880859375, -0.655426025390625, -0.60797119140625, -0.560516357421875, -0.5130615234375, -0.465606689453125, -0.41815185546875, -0.370697021484375, -0.3232421875, -0.275787353515625, -0.22833251953125, -0.180877685546875, -0.1334228515625, -0.085968017578125, -0.03851318359375, 0.008941650390625, 0.056396484375, 0.103851318359375, 0.15130615234375, 0.198760986328125, 0.2462158203125, 0.293670654296875, 0.34112548828125, 0.388580322265625, 0.43603515625, 0.483489990234375, 0.53094482421875, 0.578399658203125, 0.6258544921875, 0.673309326171875, 0.72076416015625, 0.768218994140625, 0.815673828125, 0.863128662109375, 0.91058349609375, 0.958038330078125, 1.0054931640625, 1.052947998046875, 1.10040283203125, 1.147857666015625, 1.1953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 5.0, 7.0, 10.0, 15.0, 11.0, 15.0, 18.0, 32.0, 17.0, 23.0, 38.0, 34.0, 32.0, 31.0, 36.0, 45.0, 49.0, 40.0, 45.0, 39.0, 48.0, 42.0, 35.0, 27.0, 38.0, 37.0, 24.0, 25.0, 17.0, 26.0, 20.0, 20.0, 16.0, 11.0, 10.0, 11.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-6.984375, -6.776123046875, -6.56787109375, -6.359619140625, -6.1513671875, -5.943115234375, -5.73486328125, -5.526611328125, -5.318359375, -5.110107421875, -4.90185546875, -4.693603515625, -4.4853515625, -4.277099609375, -4.06884765625, -3.860595703125, -3.65234375, -3.444091796875, -3.23583984375, -3.027587890625, -2.8193359375, -2.611083984375, -2.40283203125, -2.194580078125, -1.986328125, -1.778076171875, -1.56982421875, -1.361572265625, -1.1533203125, -0.945068359375, -0.73681640625, -0.528564453125, -0.3203125, -0.112060546875, 0.09619140625, 0.304443359375, 0.5126953125, 0.720947265625, 0.92919921875, 1.137451171875, 1.345703125, 1.553955078125, 1.76220703125, 1.970458984375, 2.1787109375, 2.386962890625, 2.59521484375, 2.803466796875, 3.01171875, 3.219970703125, 3.42822265625, 3.636474609375, 3.8447265625, 4.052978515625, 4.26123046875, 4.469482421875, 4.677734375, 4.885986328125, 5.09423828125, 5.302490234375, 5.5107421875, 5.718994140625, 5.92724609375, 6.135498046875, 6.34375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 8.0, 17.0, 20.0, 25.0, 30.0, 33.0, 48.0, 54.0, 85.0, 115.0, 200.0, 395.0, 1058.0, 10221.0, 785611.0, 244120.0, 4789.0, 779.0, 292.0, 175.0, 123.0, 78.0, 48.0, 34.0, 30.0, 22.0, 27.0, 24.0, 18.0, 8.0, 10.0, 7.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.99609375, -6.76947021484375, -6.5428466796875, -6.31622314453125, -6.089599609375, -5.86297607421875, -5.6363525390625, -5.40972900390625, -5.18310546875, -4.95648193359375, -4.7298583984375, -4.50323486328125, -4.276611328125, -4.04998779296875, -3.8233642578125, -3.59674072265625, -3.3701171875, -3.14349365234375, -2.9168701171875, -2.69024658203125, -2.463623046875, -2.23699951171875, -2.0103759765625, -1.78375244140625, -1.55712890625, -1.33050537109375, -1.1038818359375, -0.87725830078125, -0.650634765625, -0.42401123046875, -0.1973876953125, 0.02923583984375, 0.255859375, 0.48248291015625, 0.7091064453125, 0.93572998046875, 1.162353515625, 1.38897705078125, 1.6156005859375, 1.84222412109375, 2.06884765625, 2.29547119140625, 2.5220947265625, 2.74871826171875, 2.975341796875, 3.20196533203125, 3.4285888671875, 3.65521240234375, 3.8818359375, 4.10845947265625, 4.3350830078125, 4.56170654296875, 4.788330078125, 5.01495361328125, 5.2415771484375, 5.46820068359375, 5.69482421875, 5.92144775390625, 6.1480712890625, 6.37469482421875, 6.601318359375, 6.82794189453125, 7.0545654296875, 7.28118896484375, 7.5078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 9.0, 9.0, 11.0, 17.0, 10.0, 16.0, 18.0, 16.0, 27.0, 24.0, 23.0, 33.0, 30.0, 42.0, 33.0, 34.0, 46.0, 29.0, 42.0, 46.0, 37.0, 41.0, 45.0, 40.0, 26.0, 40.0, 23.0, 27.0, 22.0, 19.0, 14.0, 20.0, 17.0, 14.0, 15.0, 20.0, 17.0, 12.0, 7.0, 4.0, 6.0, 0.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40625, -6.18902587890625, -5.9718017578125, -5.75457763671875, -5.537353515625, -5.32012939453125, -5.1029052734375, -4.88568115234375, -4.66845703125, -4.45123291015625, -4.2340087890625, -4.01678466796875, -3.799560546875, -3.58233642578125, -3.3651123046875, -3.14788818359375, -2.9306640625, -2.71343994140625, -2.4962158203125, -2.27899169921875, -2.061767578125, -1.84454345703125, -1.6273193359375, -1.41009521484375, -1.19287109375, -0.97564697265625, -0.7584228515625, -0.54119873046875, -0.323974609375, -0.10675048828125, 0.1104736328125, 0.32769775390625, 0.544921875, 0.76214599609375, 0.9793701171875, 1.19659423828125, 1.413818359375, 1.63104248046875, 1.8482666015625, 2.06549072265625, 2.28271484375, 2.49993896484375, 2.7171630859375, 2.93438720703125, 3.151611328125, 3.36883544921875, 3.5860595703125, 3.80328369140625, 4.0205078125, 4.23773193359375, 4.4549560546875, 4.67218017578125, 4.889404296875, 5.10662841796875, 5.3238525390625, 5.54107666015625, 5.75830078125, 5.97552490234375, 6.1927490234375, 6.40997314453125, 6.627197265625, 6.84442138671875, 7.0616455078125, 7.27886962890625, 7.49609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 0.0, 2.0, 8.0, 20.0, 23.0, 37.0, 72.0, 142.0, 268.0, 685.0, 2249.0, 11081.0, 120348.0, 836622.0, 66784.0, 7458.0, 1679.0, 585.0, 238.0, 126.0, 45.0, 33.0, 12.0, 13.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.775390625, -0.7470855712890625, -0.718780517578125, -0.6904754638671875, -0.66217041015625, -0.6338653564453125, -0.605560302734375, -0.5772552490234375, -0.5489501953125, -0.5206451416015625, -0.492340087890625, -0.4640350341796875, -0.43572998046875, -0.4074249267578125, -0.379119873046875, -0.3508148193359375, -0.322509765625, -0.2942047119140625, -0.265899658203125, -0.2375946044921875, -0.20928955078125, -0.1809844970703125, -0.152679443359375, -0.1243743896484375, -0.0960693359375, -0.0677642822265625, -0.039459228515625, -0.0111541748046875, 0.01715087890625, 0.0454559326171875, 0.073760986328125, 0.1020660400390625, 0.13037109375, 0.1586761474609375, 0.186981201171875, 0.2152862548828125, 0.24359130859375, 0.2718963623046875, 0.300201416015625, 0.3285064697265625, 0.3568115234375, 0.3851165771484375, 0.413421630859375, 0.4417266845703125, 0.47003173828125, 0.4983367919921875, 0.526641845703125, 0.5549468994140625, 0.583251953125, 0.6115570068359375, 0.639862060546875, 0.6681671142578125, 0.69647216796875, 0.7247772216796875, 0.753082275390625, 0.7813873291015625, 0.8096923828125, 0.8379974365234375, 0.866302490234375, 0.8946075439453125, 0.92291259765625, 0.9512176513671875, 0.979522705078125, 1.0078277587890625, 1.0361328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 9.0, 10.0, 15.0, 27.0, 47.0, 43.0, 91.0, 156.0, 203.0, 138.0, 79.0, 54.0, 32.0, 33.0, 18.0, 13.0, 7.0, 8.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015294551849365234, -0.00014848820865154266, -0.00014403089880943298, -0.0001395735889673233, -0.00013511627912521362, -0.00013065896928310394, -0.00012620165944099426, -0.00012174434959888458, -0.0001172870397567749, -0.00011282972991466522, -0.00010837242007255554, -0.00010391511023044586, -9.945780038833618e-05, -9.50004905462265e-05, -9.054318070411682e-05, -8.608587086200714e-05, -8.162856101989746e-05, -7.717125117778778e-05, -7.27139413356781e-05, -6.825663149356842e-05, -6.379932165145874e-05, -5.934201180934906e-05, -5.488470196723938e-05, -5.04273921251297e-05, -4.597008228302002e-05, -4.151277244091034e-05, -3.705546259880066e-05, -3.259815275669098e-05, -2.81408429145813e-05, -2.368353307247162e-05, -1.922622323036194e-05, -1.4768913388252258e-05, -1.0311603546142578e-05, -5.854293704032898e-06, -1.3969838619232178e-06, 3.0603259801864624e-06, 7.517635822296143e-06, 1.1974945664405823e-05, 1.6432255506515503e-05, 2.0889565348625183e-05, 2.5346875190734863e-05, 2.9804185032844543e-05, 3.4261494874954224e-05, 3.8718804717063904e-05, 4.3176114559173584e-05, 4.7633424401283264e-05, 5.2090734243392944e-05, 5.6548044085502625e-05, 6.1005353927612305e-05, 6.546266376972198e-05, 6.991997361183167e-05, 7.437728345394135e-05, 7.883459329605103e-05, 8.32919031381607e-05, 8.774921298027039e-05, 9.220652282238007e-05, 9.666383266448975e-05, 0.00010112114250659943, 0.0001055784523487091, 0.00011003576219081879, 0.00011449307203292847, 0.00011895038187503815, 0.00012340769171714783, 0.0001278650015592575, 0.0001323223114013672]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 4.0, 7.0, 5.0, 15.0, 10.0, 18.0, 21.0, 35.0, 66.0, 141.0, 305.0, 1092.0, 5738.0, 65162.0, 859744.0, 105897.0, 8172.0, 1357.0, 398.0, 152.0, 73.0, 51.0, 26.0, 20.0, 13.0, 8.0, 8.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2392578125, -1.2071380615234375, -1.175018310546875, -1.1428985595703125, -1.11077880859375, -1.0786590576171875, -1.046539306640625, -1.0144195556640625, -0.9822998046875, -0.9501800537109375, -0.918060302734375, -0.8859405517578125, -0.85382080078125, -0.8217010498046875, -0.789581298828125, -0.7574615478515625, -0.725341796875, -0.6932220458984375, -0.661102294921875, -0.6289825439453125, -0.59686279296875, -0.5647430419921875, -0.532623291015625, -0.5005035400390625, -0.4683837890625, -0.4362640380859375, -0.404144287109375, -0.3720245361328125, -0.33990478515625, -0.3077850341796875, -0.275665283203125, -0.2435455322265625, -0.21142578125, -0.1793060302734375, -0.147186279296875, -0.1150665283203125, -0.08294677734375, -0.0508270263671875, -0.018707275390625, 0.0134124755859375, 0.0455322265625, 0.0776519775390625, 0.109771728515625, 0.1418914794921875, 0.17401123046875, 0.2061309814453125, 0.238250732421875, 0.2703704833984375, 0.302490234375, 0.3346099853515625, 0.366729736328125, 0.3988494873046875, 0.43096923828125, 0.4630889892578125, 0.495208740234375, 0.5273284912109375, 0.5594482421875, 0.5915679931640625, 0.623687744140625, 0.6558074951171875, 0.68792724609375, 0.7200469970703125, 0.752166748046875, 0.7842864990234375, 0.81640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 8.0, 14.0, 10.0, 6.0, 11.0, 22.0, 29.0, 33.0, 32.0, 61.0, 60.0, 106.0, 223.0, 95.0, 49.0, 49.0, 32.0, 25.0, 25.0, 18.0, 18.0, 15.0, 8.0, 10.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.30764007568359375, -0.2996063232421875, -0.29157257080078125, -0.283538818359375, -0.27550506591796875, -0.2674713134765625, -0.25943756103515625, -0.25140380859375, -0.24337005615234375, -0.2353363037109375, -0.22730255126953125, -0.219268798828125, -0.21123504638671875, -0.2032012939453125, -0.19516754150390625, -0.1871337890625, -0.17910003662109375, -0.1710662841796875, -0.16303253173828125, -0.154998779296875, -0.14696502685546875, -0.1389312744140625, -0.13089752197265625, -0.12286376953125, -0.11483001708984375, -0.1067962646484375, -0.09876251220703125, -0.090728759765625, -0.08269500732421875, -0.0746612548828125, -0.06662750244140625, -0.05859375, -0.05055999755859375, -0.0425262451171875, -0.03449249267578125, -0.026458740234375, -0.01842498779296875, -0.0103912353515625, -0.00235748291015625, 0.00567626953125, 0.01371002197265625, 0.0217437744140625, 0.02977752685546875, 0.037811279296875, 0.04584503173828125, 0.0538787841796875, 0.06191253662109375, 0.0699462890625, 0.07798004150390625, 0.0860137939453125, 0.09404754638671875, 0.102081298828125, 0.11011505126953125, 0.1181488037109375, 0.12618255615234375, 0.13421630859375, 0.14225006103515625, 0.1502838134765625, 0.15831756591796875, 0.166351318359375, 0.17438507080078125, 0.1824188232421875, 0.19045257568359375, 0.198486328125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 36.0, 202.0, 505.0, 226.0, 33.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.393667221069336, -17.34039878845215, -16.28713035583496, -15.233861923217773, -14.180593490600586, -13.127325057983398, -12.074055671691895, -11.020787239074707, -9.96751880645752, -8.914250373840332, -7.8609819412231445, -6.807713031768799, -5.754444599151611, -4.701176166534424, -3.647907257080078, -2.5946388244628906, -1.5413703918457031, -0.4881018400192261, 0.565166711807251, 1.6184353828430176, 2.671703815460205, 3.7249722480773926, 4.778241157531738, 5.831509590148926, 6.884778022766113, 7.938046455383301, 8.991314888000488, 10.044584274291992, 11.09785270690918, 12.151121139526367, 13.204389572143555, 14.257658004760742, 15.310924530029297, 16.364192962646484, 17.417461395263672, 18.47072982788086, 19.523998260498047, 20.577266693115234, 21.630535125732422, 22.68380355834961, 23.737071990966797, 24.790340423583984, 25.843608856201172, 26.89687728881836, 27.950145721435547, 29.003414154052734, 30.056682586669922, 31.10995101928711, 32.16322326660156, 33.21649169921875, 34.26976013183594, 35.323028564453125, 36.37629699707031, 37.4295654296875, 38.48283386230469, 39.536102294921875, 40.58937072753906, 41.64263916015625, 42.69590759277344, 43.749176025390625, 44.80244445800781, 45.855712890625, 46.90898132324219, 47.962249755859375, 49.01551818847656]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 8.0, 6.0, 18.0, 16.0, 20.0, 18.0, 27.0, 34.0, 33.0, 38.0, 36.0, 45.0, 44.0, 56.0, 52.0, 57.0, 42.0, 40.0, 52.0, 36.0, 50.0, 38.0, 35.0, 26.0, 27.0, 24.0, 25.0, 20.0, 14.0, 13.0, 8.0, 13.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.071207046508789, -12.654496192932129, -12.237785339355469, -11.821074485778809, -11.404363632202148, -10.987652778625488, -10.570941925048828, -10.154231071472168, -9.737520217895508, -9.320809364318848, -8.904098510742188, -8.487387657165527, -8.070676803588867, -7.653965950012207, -7.237255096435547, -6.820544242858887, -6.403832912445068, -5.987122058868408, -5.570411205291748, -5.153700351715088, -4.736989498138428, -4.320278167724609, -3.9035675525665283, -3.486856698989868, -3.070145845413208, -2.653434991836548, -2.2367241382598877, -1.820013165473938, -1.4033023118972778, -0.9865913391113281, -0.569880485534668, -0.1531696319580078, 0.26354122161865234, 0.6802520751953125, 1.0969629287719727, 1.5136739015579224, 1.9303847551345825, 2.3470957279205322, 2.7638065814971924, 3.1805174350738525, 3.5972282886505127, 4.013939380645752, 4.430650234222412, 4.847361087799072, 5.264071941375732, 5.680782794952393, 6.097493648529053, 6.514204502105713, 6.930915355682373, 7.347626209259033, 7.764337062835693, 8.181048393249512, 8.597759246826172, 9.014470100402832, 9.431180953979492, 9.847891807556152, 10.264602661132812, 10.681313514709473, 11.098024368286133, 11.514735221862793, 11.931446075439453, 12.348156929016113, 12.764867782592773, 13.181578636169434, 13.598289489746094]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 6.0, 8.0, 11.0, 11.0, 21.0, 23.0, 55.0, 70.0, 83.0, 145.0, 254.0, 490.0, 868.0, 1886.0, 4320.0, 11205.0, 35206.0, 152654.0, 1392681.0, 2311467.0, 211938.0, 46058.0, 14744.0, 5470.0, 2274.0, 1086.0, 486.0, 284.0, 161.0, 111.0, 69.0, 31.0, 33.0, 18.0, 15.0, 8.0, 10.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.45611572265625, -3.3516845703125, -3.24725341796875, -3.142822265625, -3.03839111328125, -2.9339599609375, -2.82952880859375, -2.72509765625, -2.62066650390625, -2.5162353515625, -2.41180419921875, -2.307373046875, -2.20294189453125, -2.0985107421875, -1.99407958984375, -1.8896484375, -1.78521728515625, -1.6807861328125, -1.57635498046875, -1.471923828125, -1.36749267578125, -1.2630615234375, -1.15863037109375, -1.05419921875, -0.94976806640625, -0.8453369140625, -0.74090576171875, -0.636474609375, -0.53204345703125, -0.4276123046875, -0.32318115234375, -0.21875, -0.11431884765625, -0.0098876953125, 0.09454345703125, 0.198974609375, 0.30340576171875, 0.4078369140625, 0.51226806640625, 0.61669921875, 0.72113037109375, 0.8255615234375, 0.92999267578125, 1.034423828125, 1.13885498046875, 1.2432861328125, 1.34771728515625, 1.4521484375, 1.55657958984375, 1.6610107421875, 1.76544189453125, 1.869873046875, 1.97430419921875, 2.0787353515625, 2.18316650390625, 2.28759765625, 2.39202880859375, 2.4964599609375, 2.60089111328125, 2.705322265625, 2.80975341796875, 2.9141845703125, 3.01861572265625, 3.123046875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 10.0, 7.0, 19.0, 18.0, 34.0, 30.0, 35.0, 41.0, 44.0, 41.0, 53.0, 55.0, 59.0, 77.0, 74.0, 58.0, 43.0, 33.0, 43.0, 42.0, 36.0, 36.0, 26.0, 22.0, 15.0, 8.0, 4.0, 7.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.716796875, -3.614654541015625, -3.51251220703125, -3.410369873046875, -3.3082275390625, -3.206085205078125, -3.10394287109375, -3.001800537109375, -2.899658203125, -2.797515869140625, -2.69537353515625, -2.593231201171875, -2.4910888671875, -2.388946533203125, -2.28680419921875, -2.184661865234375, -2.08251953125, -1.980377197265625, -1.87823486328125, -1.776092529296875, -1.6739501953125, -1.571807861328125, -1.46966552734375, -1.367523193359375, -1.265380859375, -1.163238525390625, -1.06109619140625, -0.958953857421875, -0.8568115234375, -0.754669189453125, -0.65252685546875, -0.550384521484375, -0.4482421875, -0.346099853515625, -0.24395751953125, -0.141815185546875, -0.0396728515625, 0.062469482421875, 0.16461181640625, 0.266754150390625, 0.368896484375, 0.471038818359375, 0.57318115234375, 0.675323486328125, 0.7774658203125, 0.879608154296875, 0.98175048828125, 1.083892822265625, 1.18603515625, 1.288177490234375, 1.39031982421875, 1.492462158203125, 1.5946044921875, 1.696746826171875, 1.79888916015625, 1.901031494140625, 2.003173828125, 2.105316162109375, 2.20745849609375, 2.309600830078125, 2.4117431640625, 2.513885498046875, 2.61602783203125, 2.718170166015625, 2.8203125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 8.0, 21.0, 33.0, 77.0, 211.0, 605.0, 566910.0, 3625317.0, 683.0, 202.0, 87.0, 49.0, 18.0, 11.0, 6.0, 8.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-40.125, -39.09716796875, -38.0693359375, -37.04150390625, -36.013671875, -34.98583984375, -33.9580078125, -32.93017578125, -31.90234375, -30.87451171875, -29.8466796875, -28.81884765625, -27.791015625, -26.76318359375, -25.7353515625, -24.70751953125, -23.6796875, -22.65185546875, -21.6240234375, -20.59619140625, -19.568359375, -18.54052734375, -17.5126953125, -16.48486328125, -15.45703125, -14.42919921875, -13.4013671875, -12.37353515625, -11.345703125, -10.31787109375, -9.2900390625, -8.26220703125, -7.234375, -6.20654296875, -5.1787109375, -4.15087890625, -3.123046875, -2.09521484375, -1.0673828125, -0.03955078125, 0.98828125, 2.01611328125, 3.0439453125, 4.07177734375, 5.099609375, 6.12744140625, 7.1552734375, 8.18310546875, 9.2109375, 10.23876953125, 11.2666015625, 12.29443359375, 13.322265625, 14.35009765625, 15.3779296875, 16.40576171875, 17.43359375, 18.46142578125, 19.4892578125, 20.51708984375, 21.544921875, 22.57275390625, 23.6005859375, 24.62841796875, 25.65625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 8.0, 11.0, 12.0, 41.0, 70.0, 125.0, 181.0, 332.0, 854.0, 1244.0, 563.0, 239.0, 164.0, 81.0, 58.0, 29.0, 17.0, 13.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.4010162353515625, -1.354766845703125, -1.3085174560546875, -1.26226806640625, -1.2160186767578125, -1.169769287109375, -1.1235198974609375, -1.0772705078125, -1.0310211181640625, -0.984771728515625, -0.9385223388671875, -0.89227294921875, -0.8460235595703125, -0.799774169921875, -0.7535247802734375, -0.707275390625, -0.6610260009765625, -0.614776611328125, -0.5685272216796875, -0.52227783203125, -0.4760284423828125, -0.429779052734375, -0.3835296630859375, -0.3372802734375, -0.2910308837890625, -0.244781494140625, -0.1985321044921875, -0.15228271484375, -0.1060333251953125, -0.059783935546875, -0.0135345458984375, 0.03271484375, 0.0789642333984375, 0.125213623046875, 0.1714630126953125, 0.21771240234375, 0.2639617919921875, 0.310211181640625, 0.3564605712890625, 0.4027099609375, 0.4489593505859375, 0.495208740234375, 0.5414581298828125, 0.58770751953125, 0.6339569091796875, 0.680206298828125, 0.7264556884765625, 0.772705078125, 0.8189544677734375, 0.865203857421875, 0.9114532470703125, 0.95770263671875, 1.0039520263671875, 1.050201416015625, 1.0964508056640625, 1.1427001953125, 1.1889495849609375, 1.235198974609375, 1.2814483642578125, 1.32769775390625, 1.3739471435546875, 1.420196533203125, 1.4664459228515625, 1.5126953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 14.0, 7.0, 16.0, 20.0, 38.0, 53.0, 64.0, 101.0, 123.0, 112.0, 101.0, 120.0, 71.0, 55.0, 33.0, 23.0, 14.0, 15.0, 7.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.647217273712158, -5.4839606285095215, -5.320703506469727, -5.15744686126709, -4.994190216064453, -4.830933094024658, -4.6676764488220215, -4.504419326782227, -4.34116268157959, -4.177906036376953, -4.014648914337158, -3.8513922691345215, -3.6881353855133057, -3.52487850189209, -3.361621856689453, -3.1983649730682373, -3.0351083278656006, -2.8718514442443848, -2.708594799041748, -2.5453379154205322, -2.3820810317993164, -2.2188243865966797, -2.055567502975464, -1.892310619354248, -1.7290538549423218, -1.5657970905303955, -1.4025402069091797, -1.2392834424972534, -1.0760266780853271, -0.9127697944641113, -0.7495130300521851, -0.5862561464309692, -0.42299938201904297, -0.2597425580024719, -0.09648576378822327, 0.06677103042602539, 0.23002785444259644, 0.3932846784591675, 0.5565414428710938, 0.7197983264923096, 0.8830550909042358, 1.046311855316162, 1.209568738937378, 1.3728255033493042, 1.5360822677612305, 1.6993391513824463, 1.8625959157943726, 2.025852680206299, 2.1891095638275146, 2.3523664474487305, 2.515623092651367, 2.678879976272583, 2.842136859893799, 3.0053935050964355, 3.1686503887176514, 3.331907272338867, 3.495163917541504, 3.6584208011627197, 3.8216774463653564, 3.9849343299865723, 4.148190975189209, 4.311448097229004, 4.474704742431641, 4.637961387634277, 4.801218509674072]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 12.0, 10.0, 11.0, 22.0, 21.0, 27.0, 33.0, 32.0, 43.0, 48.0, 51.0, 53.0, 50.0, 58.0, 70.0, 56.0, 69.0, 53.0, 41.0, 39.0, 37.0, 18.0, 30.0, 19.0, 23.0, 17.0, 13.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.8437633514404297, -3.737733840942383, -3.631704330444336, -3.525674819946289, -3.419645309448242, -3.3136157989501953, -3.2075862884521484, -3.1015567779541016, -2.9955272674560547, -2.889497756958008, -2.783468246459961, -2.677438735961914, -2.571409225463867, -2.4653797149658203, -2.3593502044677734, -2.2533206939697266, -2.1472911834716797, -2.041261672973633, -1.935232162475586, -1.829202651977539, -1.7231731414794922, -1.6171436309814453, -1.5111141204833984, -1.4050846099853516, -1.2990550994873047, -1.1930255889892578, -1.086996078491211, -0.9809665679931641, -0.8749370574951172, -0.7689075469970703, -0.6628780364990234, -0.5568485260009766, -0.4508192539215088, -0.3447897434234619, -0.23876023292541504, -0.13273072242736816, -0.02670121192932129, 0.07932829856872559, 0.18535780906677246, 0.29138731956481934, 0.3974168300628662, 0.5034463405609131, 0.60947585105896, 0.7155053615570068, 0.8215348720550537, 0.9275643825531006, 1.0335938930511475, 1.1396234035491943, 1.2456529140472412, 1.351682424545288, 1.457711935043335, 1.5637414455413818, 1.6697709560394287, 1.7758004665374756, 1.8818299770355225, 1.9878594875335693, 2.093888998031616, 2.199918508529663, 2.30594801902771, 2.411977529525757, 2.5180070400238037, 2.6240365505218506, 2.7300660610198975, 2.8360955715179443, 2.942125082015991]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 14.0, 19.0, 18.0, 21.0, 41.0, 54.0, 93.0, 146.0, 231.0, 333.0, 522.0, 881.0, 1416.0, 2432.0, 4339.0, 8180.0, 18209.0, 51675.0, 226552.0, 533469.0, 135119.0, 35715.0, 13613.0, 6595.0, 3535.0, 2072.0, 1159.0, 742.0, 461.0, 281.0, 212.0, 119.0, 93.0, 51.0, 41.0, 27.0, 28.0, 12.0, 12.0, 7.0, 5.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.203125, -1.165924072265625, -1.12872314453125, -1.091522216796875, -1.0543212890625, -1.017120361328125, -0.97991943359375, -0.942718505859375, -0.905517578125, -0.868316650390625, -0.83111572265625, -0.793914794921875, -0.7567138671875, -0.719512939453125, -0.68231201171875, -0.645111083984375, -0.60791015625, -0.570709228515625, -0.53350830078125, -0.496307373046875, -0.4591064453125, -0.421905517578125, -0.38470458984375, -0.347503662109375, -0.310302734375, -0.273101806640625, -0.23590087890625, -0.198699951171875, -0.1614990234375, -0.124298095703125, -0.08709716796875, -0.049896240234375, -0.0126953125, 0.024505615234375, 0.06170654296875, 0.098907470703125, 0.1361083984375, 0.173309326171875, 0.21051025390625, 0.247711181640625, 0.284912109375, 0.322113037109375, 0.35931396484375, 0.396514892578125, 0.4337158203125, 0.470916748046875, 0.50811767578125, 0.545318603515625, 0.58251953125, 0.619720458984375, 0.65692138671875, 0.694122314453125, 0.7313232421875, 0.768524169921875, 0.80572509765625, 0.842926025390625, 0.880126953125, 0.917327880859375, 0.95452880859375, 0.991729736328125, 1.0289306640625, 1.066131591796875, 1.10333251953125, 1.140533447265625, 1.177734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 9.0, 14.0, 23.0, 16.0, 20.0, 48.0, 50.0, 56.0, 59.0, 76.0, 82.0, 74.0, 72.0, 75.0, 75.0, 54.0, 45.0, 33.0, 22.0, 20.0, 22.0, 13.0, 10.0, 7.0, 3.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.123260498046875, -3.02972412109375, -2.936187744140625, -2.8426513671875, -2.749114990234375, -2.65557861328125, -2.562042236328125, -2.468505859375, -2.374969482421875, -2.28143310546875, -2.187896728515625, -2.0943603515625, -2.000823974609375, -1.90728759765625, -1.813751220703125, -1.72021484375, -1.626678466796875, -1.53314208984375, -1.439605712890625, -1.3460693359375, -1.252532958984375, -1.15899658203125, -1.065460205078125, -0.971923828125, -0.878387451171875, -0.78485107421875, -0.691314697265625, -0.5977783203125, -0.504241943359375, -0.41070556640625, -0.317169189453125, -0.2236328125, -0.130096435546875, -0.03656005859375, 0.056976318359375, 0.1505126953125, 0.244049072265625, 0.33758544921875, 0.431121826171875, 0.524658203125, 0.618194580078125, 0.71173095703125, 0.805267333984375, 0.8988037109375, 0.992340087890625, 1.08587646484375, 1.179412841796875, 1.27294921875, 1.366485595703125, 1.46002197265625, 1.553558349609375, 1.6470947265625, 1.740631103515625, 1.83416748046875, 1.927703857421875, 2.021240234375, 2.114776611328125, 2.20831298828125, 2.301849365234375, 2.3953857421875, 2.488922119140625, 2.58245849609375, 2.675994873046875, 2.76953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 7.0, 9.0, 15.0, 18.0, 35.0, 29.0, 47.0, 90.0, 134.0, 287.0, 620.0, 1584.0, 4566.0, 17106.0, 94078.0, 668503.0, 219376.0, 30552.0, 7526.0, 2276.0, 846.0, 359.0, 198.0, 103.0, 62.0, 42.0, 27.0, 19.0, 21.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7490234375, -1.7026214599609375, -1.656219482421875, -1.6098175048828125, -1.56341552734375, -1.5170135498046875, -1.470611572265625, -1.4242095947265625, -1.3778076171875, -1.3314056396484375, -1.285003662109375, -1.2386016845703125, -1.19219970703125, -1.1457977294921875, -1.099395751953125, -1.0529937744140625, -1.006591796875, -0.9601898193359375, -0.913787841796875, -0.8673858642578125, -0.82098388671875, -0.7745819091796875, -0.728179931640625, -0.6817779541015625, -0.6353759765625, -0.5889739990234375, -0.542572021484375, -0.4961700439453125, -0.44976806640625, -0.4033660888671875, -0.356964111328125, -0.3105621337890625, -0.26416015625, -0.2177581787109375, -0.171356201171875, -0.1249542236328125, -0.07855224609375, -0.0321502685546875, 0.014251708984375, 0.0606536865234375, 0.1070556640625, 0.1534576416015625, 0.199859619140625, 0.2462615966796875, 0.29266357421875, 0.3390655517578125, 0.385467529296875, 0.4318695068359375, 0.478271484375, 0.5246734619140625, 0.571075439453125, 0.6174774169921875, 0.66387939453125, 0.7102813720703125, 0.756683349609375, 0.8030853271484375, 0.8494873046875, 0.8958892822265625, 0.942291259765625, 0.9886932373046875, 1.03509521484375, 1.0814971923828125, 1.127899169921875, 1.1743011474609375, 1.220703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 6.0, 8.0, 8.0, 7.0, 13.0, 16.0, 12.0, 20.0, 16.0, 31.0, 18.0, 28.0, 39.0, 45.0, 41.0, 44.0, 47.0, 52.0, 61.0, 47.0, 45.0, 43.0, 37.0, 55.0, 35.0, 31.0, 27.0, 26.0, 24.0, 23.0, 18.0, 19.0, 13.0, 9.0, 8.0, 8.0, 13.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.580078125, -3.468994140625, -3.35791015625, -3.246826171875, -3.1357421875, -3.024658203125, -2.91357421875, -2.802490234375, -2.69140625, -2.580322265625, -2.46923828125, -2.358154296875, -2.2470703125, -2.135986328125, -2.02490234375, -1.913818359375, -1.802734375, -1.691650390625, -1.58056640625, -1.469482421875, -1.3583984375, -1.247314453125, -1.13623046875, -1.025146484375, -0.9140625, -0.802978515625, -0.69189453125, -0.580810546875, -0.4697265625, -0.358642578125, -0.24755859375, -0.136474609375, -0.025390625, 0.085693359375, 0.19677734375, 0.307861328125, 0.4189453125, 0.530029296875, 0.64111328125, 0.752197265625, 0.86328125, 0.974365234375, 1.08544921875, 1.196533203125, 1.3076171875, 1.418701171875, 1.52978515625, 1.640869140625, 1.751953125, 1.863037109375, 1.97412109375, 2.085205078125, 2.1962890625, 2.307373046875, 2.41845703125, 2.529541015625, 2.640625, 2.751708984375, 2.86279296875, 2.973876953125, 3.0849609375, 3.196044921875, 3.30712890625, 3.418212890625, 3.529296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 7.0, 6.0, 18.0, 12.0, 27.0, 15.0, 24.0, 48.0, 72.0, 97.0, 139.0, 243.0, 424.0, 692.0, 1290.0, 2543.0, 5707.0, 15940.0, 72333.0, 697790.0, 206352.0, 28600.0, 8634.0, 3507.0, 1677.0, 924.0, 525.0, 346.0, 172.0, 114.0, 77.0, 70.0, 37.0, 26.0, 20.0, 11.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.479248046875, -0.4613151550292969, -0.44338226318359375, -0.4254493713378906, -0.4075164794921875, -0.3895835876464844, -0.37165069580078125, -0.3537178039550781, -0.335784912109375, -0.3178520202636719, -0.29991912841796875, -0.2819862365722656, -0.2640533447265625, -0.24612045288085938, -0.22818756103515625, -0.21025466918945312, -0.19232177734375, -0.17438888549804688, -0.15645599365234375, -0.13852310180664062, -0.1205902099609375, -0.10265731811523438, -0.08472442626953125, -0.06679153442382812, -0.048858642578125, -0.030925750732421875, -0.01299285888671875, 0.004940032958984375, 0.0228729248046875, 0.040805816650390625, 0.05873870849609375, 0.07667160034179688, 0.0946044921875, 0.11253738403320312, 0.13047027587890625, 0.14840316772460938, 0.1663360595703125, 0.18426895141601562, 0.20220184326171875, 0.22013473510742188, 0.238067626953125, 0.2560005187988281, 0.27393341064453125, 0.2918663024902344, 0.3097991943359375, 0.3277320861816406, 0.34566497802734375, 0.3635978698730469, 0.38153076171875, 0.3994636535644531, 0.41739654541015625, 0.4353294372558594, 0.4532623291015625, 0.4711952209472656, 0.48912811279296875, 0.5070610046386719, 0.524993896484375, 0.5429267883300781, 0.5608596801757812, 0.5787925720214844, 0.5967254638671875, 0.6146583557128906, 0.6325912475585938, 0.6505241394042969, 0.66845703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 19.0, 13.0, 29.0, 72.0, 132.0, 210.0, 234.0, 124.0, 55.0, 37.0, 21.0, 14.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004410743713378906, -0.000428810715675354, -0.0004165470600128174, -0.00040428340435028076, -0.00039201974868774414, -0.0003797560930252075, -0.0003674924373626709, -0.0003552287817001343, -0.00034296512603759766, -0.00033070147037506104, -0.0003184378147125244, -0.0003061741590499878, -0.00029391050338745117, -0.00028164684772491455, -0.00026938319206237793, -0.0002571195363998413, -0.0002448558807373047, -0.00023259222507476807, -0.00022032856941223145, -0.00020806491374969482, -0.0001958012580871582, -0.00018353760242462158, -0.00017127394676208496, -0.00015901029109954834, -0.00014674663543701172, -0.0001344829797744751, -0.00012221932411193848, -0.00010995566844940186, -9.769201278686523e-05, -8.542835712432861e-05, -7.316470146179199e-05, -6.090104579925537e-05, -4.863739013671875e-05, -3.637373447418213e-05, -2.4110078811645508e-05, -1.1846423149108887e-05, 4.172325134277344e-07, 1.2680888175964355e-05, 2.4944543838500977e-05, 3.72081995010376e-05, 4.947185516357422e-05, 6.173551082611084e-05, 7.399916648864746e-05, 8.626282215118408e-05, 9.85264778137207e-05, 0.00011079013347625732, 0.00012305378913879395, 0.00013531744480133057, 0.0001475811004638672, 0.0001598447561264038, 0.00017210841178894043, 0.00018437206745147705, 0.00019663572311401367, 0.0002088993787765503, 0.00022116303443908691, 0.00023342669010162354, 0.00024569034576416016, 0.0002579540014266968, 0.0002702176570892334, 0.00028248131275177, 0.00029474496841430664, 0.00030700862407684326, 0.0003192722797393799, 0.0003315359354019165, 0.0003437995910644531]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 8.0, 14.0, 15.0, 40.0, 45.0, 98.0, 250.0, 717.0, 2182.0, 8583.0, 81037.0, 913858.0, 33897.0, 5430.0, 1538.0, 460.0, 158.0, 91.0, 35.0, 19.0, 12.0, 25.0, 8.0, 9.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1625518798828125, -1.122955322265625, -1.0833587646484375, -1.04376220703125, -1.0041656494140625, -0.964569091796875, -0.9249725341796875, -0.8853759765625, -0.8457794189453125, -0.806182861328125, -0.7665863037109375, -0.72698974609375, -0.6873931884765625, -0.647796630859375, -0.6082000732421875, -0.568603515625, -0.5290069580078125, -0.489410400390625, -0.4498138427734375, -0.41021728515625, -0.3706207275390625, -0.331024169921875, -0.2914276123046875, -0.2518310546875, -0.2122344970703125, -0.172637939453125, -0.1330413818359375, -0.09344482421875, -0.0538482666015625, -0.014251708984375, 0.0253448486328125, 0.06494140625, 0.1045379638671875, 0.144134521484375, 0.1837310791015625, 0.22332763671875, 0.2629241943359375, 0.302520751953125, 0.3421173095703125, 0.3817138671875, 0.4213104248046875, 0.460906982421875, 0.5005035400390625, 0.54010009765625, 0.5796966552734375, 0.619293212890625, 0.6588897705078125, 0.698486328125, 0.7380828857421875, 0.777679443359375, 0.8172760009765625, 0.85687255859375, 0.8964691162109375, 0.936065673828125, 0.9756622314453125, 1.0152587890625, 1.0548553466796875, 1.094451904296875, 1.1340484619140625, 1.17364501953125, 1.2132415771484375, 1.252838134765625, 1.2924346923828125, 1.33203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 16.0, 22.0, 38.0, 97.0, 166.0, 260.0, 159.0, 92.0, 53.0, 27.0, 16.0, 12.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.21135711669921875, -0.2042083740234375, -0.19705963134765625, -0.189910888671875, -0.18276214599609375, -0.1756134033203125, -0.16846466064453125, -0.16131591796875, -0.15416717529296875, -0.1470184326171875, -0.13986968994140625, -0.132720947265625, -0.12557220458984375, -0.1184234619140625, -0.11127471923828125, -0.1041259765625, -0.09697723388671875, -0.0898284912109375, -0.08267974853515625, -0.075531005859375, -0.06838226318359375, -0.0612335205078125, -0.05408477783203125, -0.04693603515625, -0.03978729248046875, -0.0326385498046875, -0.02548980712890625, -0.018341064453125, -0.01119232177734375, -0.0040435791015625, 0.00310516357421875, 0.01025390625, 0.01740264892578125, 0.0245513916015625, 0.03170013427734375, 0.038848876953125, 0.04599761962890625, 0.0531463623046875, 0.06029510498046875, 0.06744384765625, 0.07459259033203125, 0.0817413330078125, 0.08889007568359375, 0.096038818359375, 0.10318756103515625, 0.1103363037109375, 0.11748504638671875, 0.1246337890625, 0.13178253173828125, 0.1389312744140625, 0.14608001708984375, 0.153228759765625, 0.16037750244140625, 0.1675262451171875, 0.17467498779296875, 0.18182373046875, 0.18897247314453125, 0.1961212158203125, 0.20326995849609375, 0.210418701171875, 0.21756744384765625, 0.2247161865234375, 0.23186492919921875, 0.239013671875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 14.0, 12.0, 1.0, 30.0, 44.0, 81.0, 137.0, 168.0, 167.0, 153.0, 79.0, 47.0, 21.0, 20.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.365777015686035, -3.2193212509155273, -3.0728654861450195, -2.9264097213745117, -2.779953956604004, -2.633498191833496, -2.487042188644409, -2.3405864238739014, -2.1941306591033936, -2.0476748943328857, -1.901219129562378, -1.7547632455825806, -1.6083074808120728, -1.461851716041565, -1.3153958320617676, -1.1689400672912598, -1.022484302520752, -0.8760285377502441, -0.7295727133750916, -0.583116888999939, -0.43666112422943115, -0.29020535945892334, -0.14374953508377075, 0.002706289291381836, 0.14916205406188965, 0.29561784863471985, 0.44207364320755005, 0.5885294675827026, 0.7349852323532104, 0.8814409971237183, 1.0278968811035156, 1.1743526458740234, 1.3208084106445312, 1.467264175415039, 1.6137199401855469, 1.7601758241653442, 1.906631588935852, 2.0530872344970703, 2.1995432376861572, 2.345999002456665, 2.492454767227173, 2.6389105319976807, 2.7853662967681885, 2.9318220615386963, 3.078278064727783, 3.224733829498291, 3.371189594268799, 3.5176453590393066, 3.6641011238098145, 3.8105568885803223, 3.95701265335083, 4.103468418121338, 4.249924182891846, 4.3963799476623535, 4.542835712432861, 4.689291954040527, 4.835747718811035, 4.982203483581543, 5.128659248352051, 5.275115013122559, 5.421570777893066, 5.568026542663574, 5.714482307434082, 5.86093807220459, 6.007393836975098]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 6.0, 12.0, 16.0, 17.0, 22.0, 32.0, 41.0, 38.0, 55.0, 53.0, 63.0, 75.0, 71.0, 72.0, 72.0, 65.0, 62.0, 47.0, 37.0, 29.0, 23.0, 24.0, 18.0, 14.0, 7.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.069934368133545, -2.981529951095581, -2.893125295639038, -2.804720878601074, -2.7163162231445312, -2.6279118061065674, -2.5395071506500244, -2.4511027336120605, -2.3626980781555176, -2.2742936611175537, -2.1858890056610107, -2.097484588623047, -2.009079933166504, -1.9206753969192505, -1.832270860671997, -1.7438664436340332, -1.6554619073867798, -1.5670573711395264, -1.478652834892273, -1.3902482986450195, -1.3018437623977661, -1.2134392261505127, -1.1250348091125488, -1.0366301536560059, -0.9482256770133972, -0.8598211407661438, -0.7714166045188904, -0.6830121278762817, -0.5946075916290283, -0.5062030553817749, -0.4177985191345215, -0.32939398288726807, -0.24098944664001465, -0.15258491039276123, -0.064180389046669, 0.024224132299423218, 0.11262866854667664, 0.20103320479393005, 0.2894377112388611, 0.3778422474861145, 0.4662467837333679, 0.5546513199806213, 0.6430558562278748, 0.7314603328704834, 0.8198648691177368, 0.9082694053649902, 0.9966739416122437, 1.085078477859497, 1.1734830141067505, 1.261887550354004, 1.3502920866012573, 1.4386966228485107, 1.5271011590957642, 1.6155056953430176, 1.7039101123809814, 1.7923147678375244, 1.8807191848754883, 1.9691237211227417, 2.057528257369995, 2.145932674407959, 2.234337329864502, 2.322741746902466, 2.411146402359009, 2.4995508193969727, 2.5879554748535156]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 5.0, 4.0, 9.0, 16.0, 19.0, 39.0, 43.0, 79.0, 124.0, 197.0, 352.0, 627.0, 1144.0, 2192.0, 4446.0, 9925.0, 25233.0, 93276.0, 647462.0, 199837.0, 37833.0, 13390.0, 6102.0, 2830.0, 1423.0, 826.0, 411.0, 252.0, 158.0, 101.0, 53.0, 37.0, 32.0, 15.0, 18.0, 14.0, 8.0, 8.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.53515625, -2.462066650390625, -2.38897705078125, -2.315887451171875, -2.2427978515625, -2.169708251953125, -2.09661865234375, -2.023529052734375, -1.950439453125, -1.877349853515625, -1.80426025390625, -1.731170654296875, -1.6580810546875, -1.584991455078125, -1.51190185546875, -1.438812255859375, -1.36572265625, -1.292633056640625, -1.21954345703125, -1.146453857421875, -1.0733642578125, -1.000274658203125, -0.92718505859375, -0.854095458984375, -0.781005859375, -0.707916259765625, -0.63482666015625, -0.561737060546875, -0.4886474609375, -0.415557861328125, -0.34246826171875, -0.269378662109375, -0.1962890625, -0.123199462890625, -0.05010986328125, 0.022979736328125, 0.0960693359375, 0.169158935546875, 0.24224853515625, 0.315338134765625, 0.388427734375, 0.461517333984375, 0.53460693359375, 0.607696533203125, 0.6807861328125, 0.753875732421875, 0.82696533203125, 0.900054931640625, 0.97314453125, 1.046234130859375, 1.11932373046875, 1.192413330078125, 1.2655029296875, 1.338592529296875, 1.41168212890625, 1.484771728515625, 1.557861328125, 1.630950927734375, 1.70404052734375, 1.777130126953125, 1.8502197265625, 1.923309326171875, 1.99639892578125, 2.069488525390625, 2.142578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 13.0, 10.0, 13.0, 16.0, 14.0, 37.0, 35.0, 42.0, 40.0, 38.0, 65.0, 57.0, 51.0, 57.0, 59.0, 53.0, 55.0, 48.0, 36.0, 35.0, 35.0, 34.0, 20.0, 25.0, 18.0, 13.0, 12.0, 9.0, 14.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.652099609375, -4.49560546875, -4.339111328125, -4.1826171875, -4.026123046875, -3.86962890625, -3.713134765625, -3.556640625, -3.400146484375, -3.24365234375, -3.087158203125, -2.9306640625, -2.774169921875, -2.61767578125, -2.461181640625, -2.3046875, -2.148193359375, -1.99169921875, -1.835205078125, -1.6787109375, -1.522216796875, -1.36572265625, -1.209228515625, -1.052734375, -0.896240234375, -0.73974609375, -0.583251953125, -0.4267578125, -0.270263671875, -0.11376953125, 0.042724609375, 0.19921875, 0.355712890625, 0.51220703125, 0.668701171875, 0.8251953125, 0.981689453125, 1.13818359375, 1.294677734375, 1.451171875, 1.607666015625, 1.76416015625, 1.920654296875, 2.0771484375, 2.233642578125, 2.39013671875, 2.546630859375, 2.703125, 2.859619140625, 3.01611328125, 3.172607421875, 3.3291015625, 3.485595703125, 3.64208984375, 3.798583984375, 3.955078125, 4.111572265625, 4.26806640625, 4.424560546875, 4.5810546875, 4.737548828125, 4.89404296875, 5.050537109375, 5.20703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 14.0, 9.0, 11.0, 22.0, 23.0, 33.0, 44.0, 55.0, 57.0, 80.0, 160.0, 1212.0, 1020384.0, 25589.0, 388.0, 102.0, 76.0, 69.0, 54.0, 36.0, 23.0, 18.0, 16.0, 17.0, 10.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.65966796875, -18.0537109375, -17.44775390625, -16.841796875, -16.23583984375, -15.6298828125, -15.02392578125, -14.41796875, -13.81201171875, -13.2060546875, -12.60009765625, -11.994140625, -11.38818359375, -10.7822265625, -10.17626953125, -9.5703125, -8.96435546875, -8.3583984375, -7.75244140625, -7.146484375, -6.54052734375, -5.9345703125, -5.32861328125, -4.72265625, -4.11669921875, -3.5107421875, -2.90478515625, -2.298828125, -1.69287109375, -1.0869140625, -0.48095703125, 0.125, 0.73095703125, 1.3369140625, 1.94287109375, 2.548828125, 3.15478515625, 3.7607421875, 4.36669921875, 4.97265625, 5.57861328125, 6.1845703125, 6.79052734375, 7.396484375, 8.00244140625, 8.6083984375, 9.21435546875, 9.8203125, 10.42626953125, 11.0322265625, 11.63818359375, 12.244140625, 12.85009765625, 13.4560546875, 14.06201171875, 14.66796875, 15.27392578125, 15.8798828125, 16.48583984375, 17.091796875, 17.69775390625, 18.3037109375, 18.90966796875, 19.515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 3.0, 9.0, 5.0, 15.0, 10.0, 7.0, 16.0, 26.0, 23.0, 33.0, 40.0, 45.0, 58.0, 56.0, 40.0, 49.0, 53.0, 78.0, 54.0, 63.0, 56.0, 65.0, 37.0, 37.0, 28.0, 19.0, 17.0, 16.0, 11.0, 10.0, 10.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.71173095703125, -6.4937744140625, -6.27581787109375, -6.057861328125, -5.83990478515625, -5.6219482421875, -5.40399169921875, -5.18603515625, -4.96807861328125, -4.7501220703125, -4.53216552734375, -4.314208984375, -4.09625244140625, -3.8782958984375, -3.66033935546875, -3.4423828125, -3.22442626953125, -3.0064697265625, -2.78851318359375, -2.570556640625, -2.35260009765625, -2.1346435546875, -1.91668701171875, -1.69873046875, -1.48077392578125, -1.2628173828125, -1.04486083984375, -0.826904296875, -0.60894775390625, -0.3909912109375, -0.17303466796875, 0.044921875, 0.26287841796875, 0.4808349609375, 0.69879150390625, 0.916748046875, 1.13470458984375, 1.3526611328125, 1.57061767578125, 1.78857421875, 2.00653076171875, 2.2244873046875, 2.44244384765625, 2.660400390625, 2.87835693359375, 3.0963134765625, 3.31427001953125, 3.5322265625, 3.75018310546875, 3.9681396484375, 4.18609619140625, 4.404052734375, 4.62200927734375, 4.8399658203125, 5.05792236328125, 5.27587890625, 5.49383544921875, 5.7117919921875, 5.92974853515625, 6.147705078125, 6.36566162109375, 6.5836181640625, 6.80157470703125, 7.01953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 14.0, 11.0, 26.0, 37.0, 51.0, 96.0, 292.0, 928.0, 5982.0, 80152.0, 926090.0, 30784.0, 3084.0, 593.0, 186.0, 103.0, 34.0, 26.0, 16.0, 8.0, 15.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.1880340576171875, -1.134857177734375, -1.0816802978515625, -1.02850341796875, -0.9753265380859375, -0.922149658203125, -0.8689727783203125, -0.8157958984375, -0.7626190185546875, -0.709442138671875, -0.6562652587890625, -0.60308837890625, -0.5499114990234375, -0.496734619140625, -0.4435577392578125, -0.390380859375, -0.3372039794921875, -0.284027099609375, -0.2308502197265625, -0.17767333984375, -0.1244964599609375, -0.071319580078125, -0.0181427001953125, 0.0350341796875, 0.0882110595703125, 0.141387939453125, 0.1945648193359375, 0.24774169921875, 0.3009185791015625, 0.354095458984375, 0.4072723388671875, 0.46044921875, 0.5136260986328125, 0.566802978515625, 0.6199798583984375, 0.67315673828125, 0.7263336181640625, 0.779510498046875, 0.8326873779296875, 0.8858642578125, 0.9390411376953125, 0.992218017578125, 1.0453948974609375, 1.09857177734375, 1.1517486572265625, 1.204925537109375, 1.2581024169921875, 1.311279296875, 1.3644561767578125, 1.417633056640625, 1.4708099365234375, 1.52398681640625, 1.5771636962890625, 1.630340576171875, 1.6835174560546875, 1.7366943359375, 1.7898712158203125, 1.843048095703125, 1.8962249755859375, 1.94940185546875, 2.0025787353515625, 2.055755615234375, 2.1089324951171875, 2.162109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 22.0, 15.0, 21.0, 36.0, 33.0, 72.0, 114.0, 217.0, 134.0, 88.0, 58.0, 35.0, 19.0, 25.0, 20.0, 14.0, 10.0, 6.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00014865398406982422, -0.0001450013369321823, -0.0001413486897945404, -0.0001376960426568985, -0.0001340433955192566, -0.00013039074838161469, -0.00012673810124397278, -0.00012308545410633087, -0.00011943280696868896, -0.00011578015983104706, -0.00011212751269340515, -0.00010847486555576324, -0.00010482221841812134, -0.00010116957128047943, -9.751692414283752e-05, -9.386427700519562e-05, -9.021162986755371e-05, -8.65589827299118e-05, -8.29063355922699e-05, -7.925368845462799e-05, -7.560104131698608e-05, -7.194839417934418e-05, -6.829574704170227e-05, -6.464309990406036e-05, -6.099045276641846e-05, -5.733780562877655e-05, -5.3685158491134644e-05, -5.003251135349274e-05, -4.637986421585083e-05, -4.272721707820892e-05, -3.9074569940567017e-05, -3.542192280292511e-05, -3.17692756652832e-05, -2.8116628527641296e-05, -2.446398138999939e-05, -2.0811334252357483e-05, -1.7158687114715576e-05, -1.350603997707367e-05, -9.853392839431763e-06, -6.200745701789856e-06, -2.5480985641479492e-06, 1.1045485734939575e-06, 4.757195711135864e-06, 8.409842848777771e-06, 1.2062489986419678e-05, 1.5715137124061584e-05, 1.936778426170349e-05, 2.3020431399345398e-05, 2.6673078536987305e-05, 3.032572567462921e-05, 3.397837281227112e-05, 3.7631019949913025e-05, 4.128366708755493e-05, 4.493631422519684e-05, 4.8588961362838745e-05, 5.224160850048065e-05, 5.589425563812256e-05, 5.9546902775764465e-05, 6.319954991340637e-05, 6.685219705104828e-05, 7.050484418869019e-05, 7.415749132633209e-05, 7.7810138463974e-05, 8.14627856016159e-05, 8.511543273925781e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 6.0, 15.0, 21.0, 33.0, 52.0, 106.0, 250.0, 663.0, 2213.0, 10604.0, 90233.0, 881892.0, 52658.0, 7246.0, 1615.0, 488.0, 209.0, 99.0, 49.0, 28.0, 28.0, 5.0, 14.0, 8.0, 3.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93505859375, -0.8950881958007812, -0.8551177978515625, -0.8151473999023438, -0.775177001953125, -0.7352066040039062, -0.6952362060546875, -0.6552658081054688, -0.61529541015625, -0.5753250122070312, -0.5353546142578125, -0.49538421630859375, -0.455413818359375, -0.41544342041015625, -0.3754730224609375, -0.33550262451171875, -0.2955322265625, -0.25556182861328125, -0.2155914306640625, -0.17562103271484375, -0.135650634765625, -0.09568023681640625, -0.0557098388671875, -0.01573944091796875, 0.02423095703125, 0.06420135498046875, 0.1041717529296875, 0.14414215087890625, 0.184112548828125, 0.22408294677734375, 0.2640533447265625, 0.30402374267578125, 0.343994140625, 0.38396453857421875, 0.4239349365234375, 0.46390533447265625, 0.503875732421875, 0.5438461303710938, 0.5838165283203125, 0.6237869262695312, 0.66375732421875, 0.7037277221679688, 0.7436981201171875, 0.7836685180664062, 0.823638916015625, 0.8636093139648438, 0.9035797119140625, 0.9435501098632812, 0.9835205078125, 1.0234909057617188, 1.0634613037109375, 1.1034317016601562, 1.143402099609375, 1.1833724975585938, 1.2233428955078125, 1.2633132934570312, 1.30328369140625, 1.3432540893554688, 1.3832244873046875, 1.4231948852539062, 1.463165283203125, 1.5031356811523438, 1.5431060791015625, 1.5830764770507812, 1.623046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 4.0, 5.0, 12.0, 13.0, 18.0, 19.0, 43.0, 61.0, 158.0, 360.0, 107.0, 68.0, 37.0, 24.0, 15.0, 11.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49560546875, -0.4819984436035156, -0.46839141845703125, -0.4547843933105469, -0.4411773681640625, -0.4275703430175781, -0.41396331787109375, -0.4003562927246094, -0.386749267578125, -0.3731422424316406, -0.35953521728515625, -0.3459281921386719, -0.3323211669921875, -0.3187141418457031, -0.30510711669921875, -0.2915000915527344, -0.27789306640625, -0.2642860412597656, -0.25067901611328125, -0.23707199096679688, -0.2234649658203125, -0.20985794067382812, -0.19625091552734375, -0.18264389038085938, -0.169036865234375, -0.15542984008789062, -0.14182281494140625, -0.12821578979492188, -0.1146087646484375, -0.10100173950195312, -0.08739471435546875, -0.07378768920898438, -0.0601806640625, -0.046573638916015625, -0.03296661376953125, -0.019359588623046875, -0.0057525634765625, 0.007854461669921875, 0.02146148681640625, 0.035068511962890625, 0.048675537109375, 0.062282562255859375, 0.07588958740234375, 0.08949661254882812, 0.1031036376953125, 0.11671066284179688, 0.13031768798828125, 0.14392471313476562, 0.15753173828125, 0.17113876342773438, 0.18474578857421875, 0.19835281372070312, 0.2119598388671875, 0.22556686401367188, 0.23917388916015625, 0.2527809143066406, 0.266387939453125, 0.2799949645996094, 0.29360198974609375, 0.3072090148925781, 0.3208160400390625, 0.3344230651855469, 0.34803009033203125, 0.3616371154785156, 0.375244140625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 34.0, 98.0, 507.0, 309.0, 52.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.406114101409912, -5.458986282348633, -4.511858940124512, -3.5647313594818115, -2.6176037788391113, -1.6704764366149902, -0.7233486175537109, 0.22377920150756836, 1.1709065437316895, 2.1180341243743896, 3.06516170501709, 4.012289047241211, 4.95941686630249, 5.906544208526611, 6.853672027587891, 7.80079984664917, 8.747926712036133, 9.695054054260254, 10.642181396484375, 11.589309692382812, 12.536437034606934, 13.483564376831055, 14.430692672729492, 15.377820014953613, 16.324947357177734, 17.272075653076172, 18.219202041625977, 19.166330337524414, 20.11345672607422, 21.060585021972656, 22.007713317871094, 22.95484161376953, 23.90196990966797, 24.849098205566406, 25.79622459411621, 26.74335289001465, 27.690479278564453, 28.63760757446289, 29.584735870361328, 30.531864166259766, 31.47899055480957, 32.426116943359375, 33.37324523925781, 34.32037353515625, 35.26750183105469, 36.214630126953125, 37.1617546081543, 38.108882904052734, 39.05601119995117, 40.00313949584961, 40.95026779174805, 41.89739227294922, 42.844520568847656, 43.791648864746094, 44.73877716064453, 45.68590545654297, 46.633033752441406, 47.580162048339844, 48.52729034423828, 49.47441482543945, 50.42154312133789, 51.36867141723633, 52.315799713134766, 53.2629280090332, 54.210052490234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 15.0, 15.0, 12.0, 19.0, 26.0, 28.0, 29.0, 33.0, 38.0, 43.0, 39.0, 31.0, 50.0, 49.0, 53.0, 60.0, 38.0, 50.0, 37.0, 35.0, 31.0, 39.0, 30.0, 36.0, 31.0, 25.0, 22.0, 12.0, 13.0, 11.0, 10.0, 6.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.511725425720215, -9.23253059387207, -8.953335762023926, -8.674140930175781, -8.394946098327637, -8.115751266479492, -7.836556434631348, -7.557361602783203, -7.278166770935059, -6.998971939086914, -6.7197771072387695, -6.440582275390625, -6.1613874435424805, -5.882192611694336, -5.602997779846191, -5.323802947998047, -5.044608116149902, -4.765413284301758, -4.486218452453613, -4.207023620605469, -3.927828788757324, -3.6486339569091797, -3.369439125061035, -3.0902442932128906, -2.811049461364746, -2.5318546295166016, -2.252659797668457, -1.9734649658203125, -1.694270133972168, -1.4150753021240234, -1.135880470275879, -0.8566856384277344, -0.5774908065795898, -0.2982959747314453, -0.01910114288330078, 0.26009368896484375, 0.5392885208129883, 0.8184833526611328, 1.0976781845092773, 1.3768730163574219, 1.6560678482055664, 1.935262680053711, 2.2144575119018555, 2.49365234375, 2.7728471755981445, 3.052042007446289, 3.3312368392944336, 3.610431671142578, 3.8896265029907227, 4.168821334838867, 4.448016166687012, 4.727210998535156, 5.006405830383301, 5.285600662231445, 5.56479549407959, 5.843990325927734, 6.123185157775879, 6.402379989624023, 6.681574821472168, 6.9607696533203125, 7.239964485168457, 7.519159317016602, 7.798354148864746, 8.07754898071289, 8.356743812561035]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 1.0, 4.0, 7.0, 6.0, 8.0, 20.0, 14.0, 13.0, 14.0, 21.0, 36.0, 52.0, 53.0, 77.0, 133.0, 228.0, 332.0, 608.0, 1268.0, 2865.0, 7697.0, 25458.0, 123665.0, 2094890.0, 1779917.0, 118254.0, 25326.0, 7751.0, 2829.0, 1252.0, 592.0, 289.0, 171.0, 107.0, 77.0, 59.0, 41.0, 22.0, 25.0, 15.0, 16.0, 16.0, 10.0, 11.0, 4.0, 11.0, 1.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.553375244140625, -3.43487548828125, -3.316375732421875, -3.1978759765625, -3.079376220703125, -2.96087646484375, -2.842376708984375, -2.723876953125, -2.605377197265625, -2.48687744140625, -2.368377685546875, -2.2498779296875, -2.131378173828125, -2.01287841796875, -1.894378662109375, -1.77587890625, -1.657379150390625, -1.53887939453125, -1.420379638671875, -1.3018798828125, -1.183380126953125, -1.06488037109375, -0.946380615234375, -0.827880859375, -0.709381103515625, -0.59088134765625, -0.472381591796875, -0.3538818359375, -0.235382080078125, -0.11688232421875, 0.001617431640625, 0.1201171875, 0.238616943359375, 0.35711669921875, 0.475616455078125, 0.5941162109375, 0.712615966796875, 0.83111572265625, 0.949615478515625, 1.068115234375, 1.186614990234375, 1.30511474609375, 1.423614501953125, 1.5421142578125, 1.660614013671875, 1.77911376953125, 1.897613525390625, 2.01611328125, 2.134613037109375, 2.25311279296875, 2.371612548828125, 2.4901123046875, 2.608612060546875, 2.72711181640625, 2.845611572265625, 2.964111328125, 3.082611083984375, 3.20111083984375, 3.319610595703125, 3.4381103515625, 3.556610107421875, 3.67510986328125, 3.793609619140625, 3.912109375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 18.0, 15.0, 18.0, 31.0, 34.0, 45.0, 63.0, 62.0, 73.0, 72.0, 77.0, 96.0, 88.0, 64.0, 56.0, 39.0, 36.0, 27.0, 21.0, 15.0, 10.0, 8.0, 10.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.125, -4.01141357421875, -3.8978271484375, -3.78424072265625, -3.670654296875, -3.55706787109375, -3.4434814453125, -3.32989501953125, -3.21630859375, -3.10272216796875, -2.9891357421875, -2.87554931640625, -2.761962890625, -2.64837646484375, -2.5347900390625, -2.42120361328125, -2.3076171875, -2.19403076171875, -2.0804443359375, -1.96685791015625, -1.853271484375, -1.73968505859375, -1.6260986328125, -1.51251220703125, -1.39892578125, -1.28533935546875, -1.1717529296875, -1.05816650390625, -0.944580078125, -0.83099365234375, -0.7174072265625, -0.60382080078125, -0.490234375, -0.37664794921875, -0.2630615234375, -0.14947509765625, -0.035888671875, 0.07769775390625, 0.1912841796875, 0.30487060546875, 0.41845703125, 0.53204345703125, 0.6456298828125, 0.75921630859375, 0.872802734375, 0.98638916015625, 1.0999755859375, 1.21356201171875, 1.3271484375, 1.44073486328125, 1.5543212890625, 1.66790771484375, 1.781494140625, 1.89508056640625, 2.0086669921875, 2.12225341796875, 2.23583984375, 2.34942626953125, 2.4630126953125, 2.57659912109375, 2.690185546875, 2.80377197265625, 2.9173583984375, 3.03094482421875, 3.14453125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 13.0, 54.0, 407.0, 4143470.0, 50064.0, 225.0, 30.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -13.80517578125, -12.6416015625, -11.47802734375, -10.314453125, -9.15087890625, -7.9873046875, -6.82373046875, -5.66015625, -4.49658203125, -3.3330078125, -2.16943359375, -1.005859375, 0.15771484375, 1.3212890625, 2.48486328125, 3.6484375, 4.81201171875, 5.9755859375, 7.13916015625, 8.302734375, 9.46630859375, 10.6298828125, 11.79345703125, 12.95703125, 14.12060546875, 15.2841796875, 16.44775390625, 17.611328125, 18.77490234375, 19.9384765625, 21.10205078125, 22.265625, 23.42919921875, 24.5927734375, 25.75634765625, 26.919921875, 28.08349609375, 29.2470703125, 30.41064453125, 31.57421875, 32.73779296875, 33.9013671875, 35.06494140625, 36.228515625, 37.39208984375, 38.5556640625, 39.71923828125, 40.8828125, 42.04638671875, 43.2099609375, 44.37353515625, 45.537109375, 46.70068359375, 47.8642578125, 49.02783203125, 50.19140625, 51.35498046875, 52.5185546875, 53.68212890625, 54.845703125, 56.00927734375, 57.1728515625, 58.33642578125, 59.5]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 5.0, 6.0, 12.0, 7.0, 15.0, 16.0, 30.0, 26.0, 36.0, 39.0, 60.0, 105.0, 132.0, 172.0, 294.0, 526.0, 923.0, 564.0, 344.0, 222.0, 152.0, 98.0, 84.0, 51.0, 30.0, 33.0, 17.0, 20.0, 20.0, 6.0, 10.0, 3.0, 1.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.657440185546875, -0.63275146484375, -0.608062744140625, -0.5833740234375, -0.558685302734375, -0.53399658203125, -0.509307861328125, -0.484619140625, -0.459930419921875, -0.43524169921875, -0.410552978515625, -0.3858642578125, -0.361175537109375, -0.33648681640625, -0.311798095703125, -0.287109375, -0.262420654296875, -0.23773193359375, -0.213043212890625, -0.1883544921875, -0.163665771484375, -0.13897705078125, -0.114288330078125, -0.089599609375, -0.064910888671875, -0.04022216796875, -0.015533447265625, 0.0091552734375, 0.033843994140625, 0.05853271484375, 0.083221435546875, 0.10791015625, 0.132598876953125, 0.15728759765625, 0.181976318359375, 0.2066650390625, 0.231353759765625, 0.25604248046875, 0.280731201171875, 0.305419921875, 0.330108642578125, 0.35479736328125, 0.379486083984375, 0.4041748046875, 0.428863525390625, 0.45355224609375, 0.478240966796875, 0.5029296875, 0.527618408203125, 0.55230712890625, 0.576995849609375, 0.6016845703125, 0.626373291015625, 0.65106201171875, 0.675750732421875, 0.700439453125, 0.725128173828125, 0.74981689453125, 0.774505615234375, 0.7991943359375, 0.823883056640625, 0.84857177734375, 0.873260498046875, 0.89794921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 10.0, 17.0, 24.0, 31.0, 54.0, 90.0, 122.0, 144.0, 148.0, 128.0, 90.0, 52.0, 19.0, 16.0, 8.0, 8.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0028815269470215, -4.835790157318115, -4.668698787689209, -4.501607418060303, -4.334516525268555, -4.167425155639648, -4.000333786010742, -3.833242416381836, -3.6661510467529297, -3.4990596771240234, -3.331968307495117, -3.16487717628479, -2.997785806655884, -2.8306944370269775, -2.6636033058166504, -2.496511936187744, -2.329420566558838, -2.1623291969299316, -1.995237946510315, -1.8281466960906982, -1.661055326461792, -1.4939639568328857, -1.326872706413269, -1.1597814559936523, -0.9926900863647461, -0.8255987763404846, -0.6585074663162231, -0.49141615629196167, -0.3243248462677002, -0.15723353624343872, 0.009857773780822754, 0.17694902420043945, 0.3440399169921875, 0.511131227016449, 0.6782225370407104, 0.8453138470649719, 1.0124051570892334, 1.1794965267181396, 1.3465877771377563, 1.513679027557373, 1.6807703971862793, 1.8478617668151855, 2.014953136444092, 2.182044267654419, 2.349135637283325, 2.5162270069122314, 2.6833181381225586, 2.850409507751465, 3.017500877380371, 3.1845922470092773, 3.3516836166381836, 3.5187747478485107, 3.685866117477417, 3.8529574871063232, 4.02004861831665, 4.187139987945557, 4.354231357574463, 4.521322727203369, 4.688414096832275, 4.855505466461182, 5.02259635925293, 5.189687728881836, 5.356779098510742, 5.523870468139648, 5.690961837768555]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 10.0, 8.0, 15.0, 20.0, 19.0, 25.0, 35.0, 43.0, 57.0, 62.0, 58.0, 56.0, 86.0, 74.0, 80.0, 62.0, 65.0, 54.0, 40.0, 30.0, 28.0, 21.0, 14.0, 15.0, 6.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.085511684417725, -3.9650323390960693, -3.844552993774414, -3.724073648452759, -3.6035943031311035, -3.483114719390869, -3.362635374069214, -3.2421560287475586, -3.1216766834259033, -3.001197338104248, -2.8807179927825928, -2.7602386474609375, -2.639759063720703, -2.519279956817627, -2.3988003730773926, -2.2783210277557373, -2.157841682434082, -2.0373623371124268, -1.9168829917907715, -1.7964035272598267, -1.6759241819381714, -1.5554448366165161, -1.4349653720855713, -1.314486026763916, -1.1940066814422607, -1.0735273361206055, -0.9530479311943054, -0.8325685262680054, -0.7120891809463501, -0.5916098356246948, -0.4711304306983948, -0.3506510257720947, -0.23017168045043945, -0.10969230532646179, 0.01078706979751587, 0.13126644492149353, 0.2517458200454712, 0.37222516536712646, 0.4927045702934265, 0.6131839752197266, 0.7336633205413818, 0.8541426658630371, 0.9746220707893372, 1.0951014757156372, 1.2155808210372925, 1.3360601663589478, 1.4565396308898926, 1.5770189762115479, 1.6974983215332031, 1.8179776668548584, 1.9384570121765137, 2.058936357498169, 2.179415702819824, 2.2998952865600586, 2.420374631881714, 2.540853977203369, 2.6613333225250244, 2.7818126678466797, 2.902292013168335, 3.0227713584899902, 3.1432509422302246, 3.263730049133301, 3.384209632873535, 3.5046889781951904, 3.6251683235168457]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 17.0, 11.0, 30.0, 32.0, 60.0, 101.0, 143.0, 239.0, 411.0, 784.0, 1623.0, 3310.0, 7801.0, 23626.0, 147542.0, 718508.0, 110759.0, 20344.0, 6959.0, 3074.0, 1421.0, 762.0, 402.0, 224.0, 127.0, 72.0, 65.0, 36.0, 19.0, 13.0, 10.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0810546875, -1.0477294921875, -1.014404296875, -0.9810791015625, -0.94775390625, -0.9144287109375, -0.881103515625, -0.8477783203125, -0.814453125, -0.7811279296875, -0.747802734375, -0.7144775390625, -0.68115234375, -0.6478271484375, -0.614501953125, -0.5811767578125, -0.5478515625, -0.5145263671875, -0.481201171875, -0.4478759765625, -0.41455078125, -0.3812255859375, -0.347900390625, -0.3145751953125, -0.28125, -0.2479248046875, -0.214599609375, -0.1812744140625, -0.14794921875, -0.1146240234375, -0.081298828125, -0.0479736328125, -0.0146484375, 0.0186767578125, 0.052001953125, 0.0853271484375, 0.11865234375, 0.1519775390625, 0.185302734375, 0.2186279296875, 0.251953125, 0.2852783203125, 0.318603515625, 0.3519287109375, 0.38525390625, 0.4185791015625, 0.451904296875, 0.4852294921875, 0.5185546875, 0.5518798828125, 0.585205078125, 0.6185302734375, 0.65185546875, 0.6851806640625, 0.718505859375, 0.7518310546875, 0.78515625, 0.8184814453125, 0.851806640625, 0.8851318359375, 0.91845703125, 0.9517822265625, 0.985107421875, 1.0184326171875, 1.0517578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 9.0, 16.0, 9.0, 21.0, 31.0, 36.0, 42.0, 57.0, 64.0, 75.0, 112.0, 104.0, 91.0, 79.0, 59.0, 62.0, 38.0, 25.0, 16.0, 15.0, 14.0, 9.0, 5.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.897735595703125, -2.80523681640625, -2.712738037109375, -2.6202392578125, -2.527740478515625, -2.43524169921875, -2.342742919921875, -2.250244140625, -2.157745361328125, -2.06524658203125, -1.972747802734375, -1.8802490234375, -1.787750244140625, -1.69525146484375, -1.602752685546875, -1.51025390625, -1.417755126953125, -1.32525634765625, -1.232757568359375, -1.1402587890625, -1.047760009765625, -0.95526123046875, -0.862762451171875, -0.770263671875, -0.677764892578125, -0.58526611328125, -0.492767333984375, -0.4002685546875, -0.307769775390625, -0.21527099609375, -0.122772216796875, -0.0302734375, 0.062225341796875, 0.15472412109375, 0.247222900390625, 0.3397216796875, 0.432220458984375, 0.52471923828125, 0.617218017578125, 0.709716796875, 0.802215576171875, 0.89471435546875, 0.987213134765625, 1.0797119140625, 1.172210693359375, 1.26470947265625, 1.357208251953125, 1.44970703125, 1.542205810546875, 1.63470458984375, 1.727203369140625, 1.8197021484375, 1.912200927734375, 2.00469970703125, 2.097198486328125, 2.189697265625, 2.282196044921875, 2.37469482421875, 2.467193603515625, 2.5596923828125, 2.652191162109375, 2.74468994140625, 2.837188720703125, 2.9296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 2.0, 9.0, 10.0, 12.0, 20.0, 23.0, 37.0, 58.0, 105.0, 160.0, 323.0, 644.0, 1491.0, 3677.0, 12203.0, 68263.0, 750578.0, 181545.0, 20167.0, 5453.0, 1919.0, 865.0, 429.0, 208.0, 103.0, 73.0, 57.0, 25.0, 33.0, 18.0, 6.0, 8.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.04296875, -1.00897216796875, -0.9749755859375, -0.94097900390625, -0.906982421875, -0.87298583984375, -0.8389892578125, -0.80499267578125, -0.77099609375, -0.73699951171875, -0.7030029296875, -0.66900634765625, -0.635009765625, -0.60101318359375, -0.5670166015625, -0.53302001953125, -0.4990234375, -0.46502685546875, -0.4310302734375, -0.39703369140625, -0.363037109375, -0.32904052734375, -0.2950439453125, -0.26104736328125, -0.22705078125, -0.19305419921875, -0.1590576171875, -0.12506103515625, -0.091064453125, -0.05706787109375, -0.0230712890625, 0.01092529296875, 0.044921875, 0.07891845703125, 0.1129150390625, 0.14691162109375, 0.180908203125, 0.21490478515625, 0.2489013671875, 0.28289794921875, 0.31689453125, 0.35089111328125, 0.3848876953125, 0.41888427734375, 0.452880859375, 0.48687744140625, 0.5208740234375, 0.55487060546875, 0.5888671875, 0.62286376953125, 0.6568603515625, 0.69085693359375, 0.724853515625, 0.75885009765625, 0.7928466796875, 0.82684326171875, 0.86083984375, 0.89483642578125, 0.9288330078125, 0.96282958984375, 0.996826171875, 1.03082275390625, 1.0648193359375, 1.09881591796875, 1.1328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 2.0, 7.0, 3.0, 13.0, 10.0, 10.0, 16.0, 18.0, 27.0, 25.0, 36.0, 34.0, 38.0, 31.0, 38.0, 44.0, 36.0, 51.0, 44.0, 48.0, 43.0, 45.0, 35.0, 49.0, 41.0, 35.0, 30.0, 29.0, 30.0, 26.0, 18.0, 18.0, 16.0, 15.0, 4.0, 4.0, 9.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.322265625, -3.22381591796875, -3.1253662109375, -3.02691650390625, -2.928466796875, -2.83001708984375, -2.7315673828125, -2.63311767578125, -2.53466796875, -2.43621826171875, -2.3377685546875, -2.23931884765625, -2.140869140625, -2.04241943359375, -1.9439697265625, -1.84552001953125, -1.7470703125, -1.64862060546875, -1.5501708984375, -1.45172119140625, -1.353271484375, -1.25482177734375, -1.1563720703125, -1.05792236328125, -0.95947265625, -0.86102294921875, -0.7625732421875, -0.66412353515625, -0.565673828125, -0.46722412109375, -0.3687744140625, -0.27032470703125, -0.171875, -0.07342529296875, 0.0250244140625, 0.12347412109375, 0.221923828125, 0.32037353515625, 0.4188232421875, 0.51727294921875, 0.61572265625, 0.71417236328125, 0.8126220703125, 0.91107177734375, 1.009521484375, 1.10797119140625, 1.2064208984375, 1.30487060546875, 1.4033203125, 1.50177001953125, 1.6002197265625, 1.69866943359375, 1.797119140625, 1.89556884765625, 1.9940185546875, 2.09246826171875, 2.19091796875, 2.28936767578125, 2.3878173828125, 2.48626708984375, 2.584716796875, 2.68316650390625, 2.7816162109375, 2.88006591796875, 2.978515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 5.0, 3.0, 6.0, 8.0, 9.0, 14.0, 19.0, 17.0, 19.0, 38.0, 52.0, 76.0, 146.0, 239.0, 404.0, 769.0, 1703.0, 3704.0, 9100.0, 29768.0, 295973.0, 637208.0, 47866.0, 12272.0, 4822.0, 2126.0, 999.0, 457.0, 278.0, 166.0, 83.0, 64.0, 30.0, 26.0, 20.0, 19.0, 13.0, 4.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.455322265625, -0.4411582946777344, -0.42699432373046875, -0.4128303527832031, -0.3986663818359375, -0.3845024108886719, -0.37033843994140625, -0.3561744689941406, -0.342010498046875, -0.3278465270996094, -0.31368255615234375, -0.2995185852050781, -0.2853546142578125, -0.2711906433105469, -0.25702667236328125, -0.24286270141601562, -0.22869873046875, -0.21453475952148438, -0.20037078857421875, -0.18620681762695312, -0.1720428466796875, -0.15787887573242188, -0.14371490478515625, -0.12955093383789062, -0.115386962890625, -0.10122299194335938, -0.08705902099609375, -0.07289505004882812, -0.0587310791015625, -0.044567108154296875, -0.03040313720703125, -0.016239166259765625, -0.0020751953125, 0.012088775634765625, 0.02625274658203125, 0.040416717529296875, 0.0545806884765625, 0.06874465942382812, 0.08290863037109375, 0.09707260131835938, 0.111236572265625, 0.12540054321289062, 0.13956451416015625, 0.15372848510742188, 0.1678924560546875, 0.18205642700195312, 0.19622039794921875, 0.21038436889648438, 0.22454833984375, 0.23871231079101562, 0.25287628173828125, 0.2670402526855469, 0.2812042236328125, 0.2953681945800781, 0.30953216552734375, 0.3236961364746094, 0.337860107421875, 0.3520240783691406, 0.36618804931640625, 0.3803520202636719, 0.3945159912109375, 0.4086799621582031, 0.42284393310546875, 0.4370079040527344, 0.451171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 8.0, 8.0, 17.0, 19.0, 41.0, 78.0, 107.0, 171.0, 162.0, 129.0, 76.0, 60.0, 28.0, 23.0, 13.0, 15.0, 6.0, 8.0, 7.0, 2.0, 3.0, 0.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001876354217529297, -0.00018078461289405823, -0.00017393380403518677, -0.0001670829951763153, -0.00016023218631744385, -0.0001533813774585724, -0.00014653056859970093, -0.00013967975974082947, -0.000132828950881958, -0.00012597814202308655, -0.00011912733316421509, -0.00011227652430534363, -0.00010542571544647217, -9.857490658760071e-05, -9.172409772872925e-05, -8.487328886985779e-05, -7.802248001098633e-05, -7.117167115211487e-05, -6.432086229324341e-05, -5.747005343437195e-05, -5.061924457550049e-05, -4.376843571662903e-05, -3.691762685775757e-05, -3.006681799888611e-05, -2.321600914001465e-05, -1.636520028114319e-05, -9.514391422271729e-06, -2.6635825634002686e-06, 4.187226295471191e-06, 1.1038035154342651e-05, 1.788884401321411e-05, 2.473965287208557e-05, 3.159046173095703e-05, 3.844127058982849e-05, 4.529207944869995e-05, 5.214288830757141e-05, 5.899369716644287e-05, 6.584450602531433e-05, 7.269531488418579e-05, 7.954612374305725e-05, 8.639693260192871e-05, 9.324774146080017e-05, 0.00010009855031967163, 0.00010694935917854309, 0.00011380016803741455, 0.00012065097689628601, 0.00012750178575515747, 0.00013435259461402893, 0.0001412034034729004, 0.00014805421233177185, 0.0001549050211906433, 0.00016175583004951477, 0.00016860663890838623, 0.0001754574477672577, 0.00018230825662612915, 0.0001891590654850006, 0.00019600987434387207, 0.00020286068320274353, 0.000209711492061615, 0.00021656230092048645, 0.0002234131097793579, 0.00023026391863822937, 0.00023711472749710083, 0.0002439655363559723, 0.00025081634521484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 14.0, 22.0, 19.0, 48.0, 64.0, 137.0, 209.0, 393.0, 919.0, 2227.0, 6292.0, 23458.0, 229220.0, 716720.0, 52066.0, 10637.0, 3512.0, 1313.0, 597.0, 281.0, 148.0, 91.0, 50.0, 29.0, 19.0, 20.0, 10.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5341796875, -0.519012451171875, -0.50384521484375, -0.488677978515625, -0.4735107421875, -0.458343505859375, -0.44317626953125, -0.428009033203125, -0.412841796875, -0.397674560546875, -0.38250732421875, -0.367340087890625, -0.3521728515625, -0.337005615234375, -0.32183837890625, -0.306671142578125, -0.29150390625, -0.276336669921875, -0.26116943359375, -0.246002197265625, -0.2308349609375, -0.215667724609375, -0.20050048828125, -0.185333251953125, -0.170166015625, -0.154998779296875, -0.13983154296875, -0.124664306640625, -0.1094970703125, -0.094329833984375, -0.07916259765625, -0.063995361328125, -0.048828125, -0.033660888671875, -0.01849365234375, -0.003326416015625, 0.0118408203125, 0.027008056640625, 0.04217529296875, 0.057342529296875, 0.072509765625, 0.087677001953125, 0.10284423828125, 0.118011474609375, 0.1331787109375, 0.148345947265625, 0.16351318359375, 0.178680419921875, 0.19384765625, 0.209014892578125, 0.22418212890625, 0.239349365234375, 0.2545166015625, 0.269683837890625, 0.28485107421875, 0.300018310546875, 0.315185546875, 0.330352783203125, 0.34552001953125, 0.360687255859375, 0.3758544921875, 0.391021728515625, 0.40618896484375, 0.421356201171875, 0.4365234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 4.0, 10.0, 10.0, 16.0, 36.0, 32.0, 59.0, 115.0, 137.0, 150.0, 127.0, 90.0, 68.0, 43.0, 23.0, 14.0, 9.0, 6.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11468505859375, -0.11144638061523438, -0.10820770263671875, -0.10496902465820312, -0.1017303466796875, -0.09849166870117188, -0.09525299072265625, -0.09201431274414062, -0.088775634765625, -0.08553695678710938, -0.08229827880859375, -0.07905960083007812, -0.0758209228515625, -0.07258224487304688, -0.06934356689453125, -0.06610488891601562, -0.0628662109375, -0.059627532958984375, -0.05638885498046875, -0.053150177001953125, -0.0499114990234375, -0.046672821044921875, -0.04343414306640625, -0.040195465087890625, -0.036956787109375, -0.033718109130859375, -0.03047943115234375, -0.027240753173828125, -0.0240020751953125, -0.020763397216796875, -0.01752471923828125, -0.014286041259765625, -0.01104736328125, -0.007808685302734375, -0.00457000732421875, -0.001331329345703125, 0.0019073486328125, 0.005146026611328125, 0.00838470458984375, 0.011623382568359375, 0.014862060546875, 0.018100738525390625, 0.02133941650390625, 0.024578094482421875, 0.0278167724609375, 0.031055450439453125, 0.03429412841796875, 0.037532806396484375, 0.040771484375, 0.044010162353515625, 0.04724884033203125, 0.050487518310546875, 0.0537261962890625, 0.056964874267578125, 0.06020355224609375, 0.06344223022460938, 0.066680908203125, 0.06991958618164062, 0.07315826416015625, 0.07639694213867188, 0.0796356201171875, 0.08287429809570312, 0.08611297607421875, 0.08935165405273438, 0.09259033203125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 19.0, 22.0, 50.0, 91.0, 163.0, 207.0, 203.0, 105.0, 59.0, 23.0, 9.0, 16.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6511712074279785, -3.50333833694458, -3.3555057048797607, -3.2076730728149414, -3.059840202331543, -2.9120073318481445, -2.764174699783325, -2.616342067718506, -2.4685091972351074, -2.320676326751709, -2.1728436946868896, -2.0250110626220703, -1.8771781921386719, -1.729345440864563, -1.581512689590454, -1.4336799383163452, -1.2858471870422363, -1.1380144357681274, -0.9901816844940186, -0.8423489332199097, -0.6945161819458008, -0.5466834306716919, -0.398850679397583, -0.2510179281234741, -0.10318517684936523, 0.04464757442474365, 0.19248032569885254, 0.3403130769729614, 0.4881458282470703, 0.6359785795211792, 0.7838113307952881, 0.931644082069397, 1.0794763565063477, 1.2273091077804565, 1.3751418590545654, 1.5229746103286743, 1.6708073616027832, 1.818640112876892, 1.966472864151001, 2.1143054962158203, 2.2621383666992188, 2.409971237182617, 2.5578038692474365, 2.705636501312256, 2.8534693717956543, 3.0013022422790527, 3.149134874343872, 3.2969675064086914, 3.44480037689209, 3.5926332473754883, 3.7404658794403076, 3.888298511505127, 4.036131381988525, 4.183964252471924, 4.331796646118164, 4.4796295166015625, 4.627462387084961, 4.775295257568359, 4.923128128051758, 5.070960521697998, 5.2187933921813965, 5.366626262664795, 5.514458656311035, 5.662291526794434, 5.810124397277832]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 15.0, 35.0, 26.0, 42.0, 60.0, 74.0, 76.0, 98.0, 103.0, 88.0, 102.0, 72.0, 49.0, 43.0, 30.0, 12.0, 23.0, 8.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3646490573883057, -3.2696259021759033, -3.17460298538208, -3.0795798301696777, -2.9845566749572754, -2.889533519744873, -2.7945103645324707, -2.6994874477386475, -2.604464292526245, -2.5094411373138428, -2.4144182205200195, -2.319395065307617, -2.224371910095215, -2.1293487548828125, -2.03432559967041, -1.939302682876587, -1.8442795276641846, -1.7492563724517822, -1.6542333364486694, -1.5592103004455566, -1.4641871452331543, -1.369163990020752, -1.2741409540176392, -1.1791179180145264, -1.084094762802124, -0.9890716671943665, -0.8940485715866089, -0.7990254759788513, -0.7040023803710938, -0.6089792847633362, -0.5139561891555786, -0.41893309354782104, -0.3239097595214844, -0.2288866639137268, -0.13386356830596924, -0.03884047269821167, 0.0561826229095459, 0.15120571851730347, 0.24622881412506104, 0.3412519097328186, 0.43627500534057617, 0.5312981009483337, 0.6263211965560913, 0.7213442921638489, 0.8163673877716064, 0.911390483379364, 1.0064135789871216, 1.1014366149902344, 1.1964597702026367, 1.291482925415039, 1.3865059614181519, 1.4815289974212646, 1.576552152633667, 1.6715753078460693, 1.7665983438491821, 1.861621379852295, 1.9566445350646973, 2.0516676902770996, 2.146690845489502, 2.241713762283325, 2.3367369174957275, 2.43176007270813, 2.526782989501953, 2.6218061447143555, 2.716829299926758]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 3.0, 8.0, 9.0, 14.0, 18.0, 20.0, 49.0, 66.0, 117.0, 188.0, 310.0, 578.0, 1129.0, 2369.0, 5469.0, 14337.0, 45729.0, 219618.0, 596235.0, 115395.0, 29093.0, 9928.0, 4055.0, 1769.0, 901.0, 459.0, 255.0, 147.0, 96.0, 60.0, 36.0, 27.0, 16.0, 9.0, 13.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.05078125, -1.99102783203125, -1.9312744140625, -1.87152099609375, -1.811767578125, -1.75201416015625, -1.6922607421875, -1.63250732421875, -1.57275390625, -1.51300048828125, -1.4532470703125, -1.39349365234375, -1.333740234375, -1.27398681640625, -1.2142333984375, -1.15447998046875, -1.0947265625, -1.03497314453125, -0.9752197265625, -0.91546630859375, -0.855712890625, -0.79595947265625, -0.7362060546875, -0.67645263671875, -0.61669921875, -0.55694580078125, -0.4971923828125, -0.43743896484375, -0.377685546875, -0.31793212890625, -0.2581787109375, -0.19842529296875, -0.138671875, -0.07891845703125, -0.0191650390625, 0.04058837890625, 0.100341796875, 0.16009521484375, 0.2198486328125, 0.27960205078125, 0.33935546875, 0.39910888671875, 0.4588623046875, 0.51861572265625, 0.578369140625, 0.63812255859375, 0.6978759765625, 0.75762939453125, 0.8173828125, 0.87713623046875, 0.9368896484375, 0.99664306640625, 1.056396484375, 1.11614990234375, 1.1759033203125, 1.23565673828125, 1.29541015625, 1.35516357421875, 1.4149169921875, 1.47467041015625, 1.534423828125, 1.59417724609375, 1.6539306640625, 1.71368408203125, 1.7734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 14.0, 10.0, 24.0, 17.0, 34.0, 42.0, 66.0, 55.0, 74.0, 75.0, 106.0, 85.0, 90.0, 66.0, 55.0, 48.0, 36.0, 33.0, 14.0, 15.0, 9.0, 8.0, 8.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.1224365234375, -6.905029296875, -6.6876220703125, -6.47021484375, -6.2528076171875, -6.035400390625, -5.8179931640625, -5.6005859375, -5.3831787109375, -5.165771484375, -4.9483642578125, -4.73095703125, -4.5135498046875, -4.296142578125, -4.0787353515625, -3.861328125, -3.6439208984375, -3.426513671875, -3.2091064453125, -2.99169921875, -2.7742919921875, -2.556884765625, -2.3394775390625, -2.1220703125, -1.9046630859375, -1.687255859375, -1.4698486328125, -1.25244140625, -1.0350341796875, -0.817626953125, -0.6002197265625, -0.3828125, -0.1654052734375, 0.052001953125, 0.2694091796875, 0.48681640625, 0.7042236328125, 0.921630859375, 1.1390380859375, 1.3564453125, 1.5738525390625, 1.791259765625, 2.0086669921875, 2.22607421875, 2.4434814453125, 2.660888671875, 2.8782958984375, 3.095703125, 3.3131103515625, 3.530517578125, 3.7479248046875, 3.96533203125, 4.1827392578125, 4.400146484375, 4.6175537109375, 4.8349609375, 5.0523681640625, 5.269775390625, 5.4871826171875, 5.70458984375, 5.9219970703125, 6.139404296875, 6.3568115234375, 6.57421875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 14.0, 9.0, 7.0, 17.0, 18.0, 24.0, 29.0, 27.0, 31.0, 35.0, 36.0, 38.0, 38.0, 53.0, 135.0, 3330.0, 1038608.0, 5539.0, 153.0, 52.0, 34.0, 52.0, 35.0, 22.0, 40.0, 32.0, 24.0, 20.0, 14.0, 12.0, 15.0, 6.0, 9.0, 9.0, 10.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.734375, -14.307861328125, -13.88134765625, -13.454833984375, -13.0283203125, -12.601806640625, -12.17529296875, -11.748779296875, -11.322265625, -10.895751953125, -10.46923828125, -10.042724609375, -9.6162109375, -9.189697265625, -8.76318359375, -8.336669921875, -7.91015625, -7.483642578125, -7.05712890625, -6.630615234375, -6.2041015625, -5.777587890625, -5.35107421875, -4.924560546875, -4.498046875, -4.071533203125, -3.64501953125, -3.218505859375, -2.7919921875, -2.365478515625, -1.93896484375, -1.512451171875, -1.0859375, -0.659423828125, -0.23291015625, 0.193603515625, 0.6201171875, 1.046630859375, 1.47314453125, 1.899658203125, 2.326171875, 2.752685546875, 3.17919921875, 3.605712890625, 4.0322265625, 4.458740234375, 4.88525390625, 5.311767578125, 5.73828125, 6.164794921875, 6.59130859375, 7.017822265625, 7.4443359375, 7.870849609375, 8.29736328125, 8.723876953125, 9.150390625, 9.576904296875, 10.00341796875, 10.429931640625, 10.8564453125, 11.282958984375, 11.70947265625, 12.135986328125, 12.5625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 16.0, 8.0, 12.0, 13.0, 24.0, 13.0, 30.0, 32.0, 29.0, 32.0, 31.0, 44.0, 33.0, 41.0, 50.0, 36.0, 36.0, 42.0, 57.0, 42.0, 40.0, 41.0, 38.0, 26.0, 28.0, 37.0, 25.0, 25.0, 20.0, 9.0, 15.0, 7.0, 14.0, 6.0, 11.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.25, -5.098876953125, -4.94775390625, -4.796630859375, -4.6455078125, -4.494384765625, -4.34326171875, -4.192138671875, -4.041015625, -3.889892578125, -3.73876953125, -3.587646484375, -3.4365234375, -3.285400390625, -3.13427734375, -2.983154296875, -2.83203125, -2.680908203125, -2.52978515625, -2.378662109375, -2.2275390625, -2.076416015625, -1.92529296875, -1.774169921875, -1.623046875, -1.471923828125, -1.32080078125, -1.169677734375, -1.0185546875, -0.867431640625, -0.71630859375, -0.565185546875, -0.4140625, -0.262939453125, -0.11181640625, 0.039306640625, 0.1904296875, 0.341552734375, 0.49267578125, 0.643798828125, 0.794921875, 0.946044921875, 1.09716796875, 1.248291015625, 1.3994140625, 1.550537109375, 1.70166015625, 1.852783203125, 2.00390625, 2.155029296875, 2.30615234375, 2.457275390625, 2.6083984375, 2.759521484375, 2.91064453125, 3.061767578125, 3.212890625, 3.364013671875, 3.51513671875, 3.666259765625, 3.8173828125, 3.968505859375, 4.11962890625, 4.270751953125, 4.421875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 9.0, 14.0, 16.0, 30.0, 73.0, 164.0, 399.0, 1223.0, 6854.0, 109695.0, 882835.0, 42026.0, 3896.0, 839.0, 263.0, 102.0, 50.0, 32.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1339874267578125, -1.089263916015625, -1.0445404052734375, -0.99981689453125, -0.9550933837890625, -0.910369873046875, -0.8656463623046875, -0.8209228515625, -0.7761993408203125, -0.731475830078125, -0.6867523193359375, -0.64202880859375, -0.5973052978515625, -0.552581787109375, -0.5078582763671875, -0.463134765625, -0.4184112548828125, -0.373687744140625, -0.3289642333984375, -0.28424072265625, -0.2395172119140625, -0.194793701171875, -0.1500701904296875, -0.1053466796875, -0.0606231689453125, -0.015899658203125, 0.0288238525390625, 0.07354736328125, 0.1182708740234375, 0.162994384765625, 0.2077178955078125, 0.25244140625, 0.2971649169921875, 0.341888427734375, 0.3866119384765625, 0.43133544921875, 0.4760589599609375, 0.520782470703125, 0.5655059814453125, 0.6102294921875, 0.6549530029296875, 0.699676513671875, 0.7444000244140625, 0.78912353515625, 0.8338470458984375, 0.878570556640625, 0.9232940673828125, 0.968017578125, 1.0127410888671875, 1.057464599609375, 1.1021881103515625, 1.14691162109375, 1.1916351318359375, 1.236358642578125, 1.2810821533203125, 1.3258056640625, 1.3705291748046875, 1.415252685546875, 1.4599761962890625, 1.50469970703125, 1.5494232177734375, 1.594146728515625, 1.6388702392578125, 1.68359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 6.0, 6.0, 13.0, 17.0, 12.0, 19.0, 34.0, 46.0, 36.0, 56.0, 80.0, 104.0, 114.0, 78.0, 74.0, 73.0, 64.0, 41.0, 38.0, 25.0, 17.0, 10.0, 10.0, 7.0, 7.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010943412780761719, -0.00010620895773172379, -0.00010298378765583038, -9.975861757993698e-05, -9.653344750404358e-05, -9.330827742815018e-05, -9.008310735225677e-05, -8.685793727636337e-05, -8.363276720046997e-05, -8.040759712457657e-05, -7.718242704868317e-05, -7.395725697278976e-05, -7.073208689689636e-05, -6.750691682100296e-05, -6.428174674510956e-05, -6.105657666921616e-05, -5.7831406593322754e-05, -5.460623651742935e-05, -5.138106644153595e-05, -4.815589636564255e-05, -4.4930726289749146e-05, -4.1705556213855743e-05, -3.848038613796234e-05, -3.525521606206894e-05, -3.203004598617554e-05, -2.8804875910282135e-05, -2.5579705834388733e-05, -2.235453575849533e-05, -1.912936568260193e-05, -1.5904195606708527e-05, -1.2679025530815125e-05, -9.453855454921722e-06, -6.22868537902832e-06, -3.0035153031349182e-06, 2.2165477275848389e-07, 3.446824848651886e-06, 6.671994924545288e-06, 9.89716500043869e-06, 1.3122335076332092e-05, 1.6347505152225494e-05, 1.9572675228118896e-05, 2.27978453040123e-05, 2.60230153799057e-05, 2.9248185455799103e-05, 3.2473355531692505e-05, 3.569852560758591e-05, 3.892369568347931e-05, 4.214886575937271e-05, 4.537403583526611e-05, 4.8599205911159515e-05, 5.182437598705292e-05, 5.504954606294632e-05, 5.827471613883972e-05, 6.149988621473312e-05, 6.472505629062653e-05, 6.795022636651993e-05, 7.117539644241333e-05, 7.440056651830673e-05, 7.762573659420013e-05, 8.085090667009354e-05, 8.407607674598694e-05, 8.730124682188034e-05, 9.052641689777374e-05, 9.375158697366714e-05, 9.697675704956055e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 6.0, 12.0, 12.0, 25.0, 32.0, 52.0, 81.0, 184.0, 301.0, 608.0, 1345.0, 3201.0, 9941.0, 36634.0, 187932.0, 650743.0, 119978.0, 25722.0, 7155.0, 2435.0, 1049.0, 490.0, 277.0, 124.0, 70.0, 46.0, 35.0, 20.0, 12.0, 7.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62451171875, -0.6039505004882812, -0.5833892822265625, -0.5628280639648438, -0.542266845703125, -0.5217056274414062, -0.5011444091796875, -0.48058319091796875, -0.46002197265625, -0.43946075439453125, -0.4188995361328125, -0.39833831787109375, -0.377777099609375, -0.35721588134765625, -0.3366546630859375, -0.31609344482421875, -0.2955322265625, -0.27497100830078125, -0.2544097900390625, -0.23384857177734375, -0.213287353515625, -0.19272613525390625, -0.1721649169921875, -0.15160369873046875, -0.13104248046875, -0.11048126220703125, -0.0899200439453125, -0.06935882568359375, -0.048797607421875, -0.02823638916015625, -0.0076751708984375, 0.01288604736328125, 0.033447265625, 0.05400848388671875, 0.0745697021484375, 0.09513092041015625, 0.115692138671875, 0.13625335693359375, 0.1568145751953125, 0.17737579345703125, 0.19793701171875, 0.21849822998046875, 0.2390594482421875, 0.25962066650390625, 0.280181884765625, 0.30074310302734375, 0.3213043212890625, 0.34186553955078125, 0.3624267578125, 0.38298797607421875, 0.4035491943359375, 0.42411041259765625, 0.444671630859375, 0.46523284912109375, 0.4857940673828125, 0.5063552856445312, 0.52691650390625, 0.5474777221679688, 0.5680389404296875, 0.5886001586914062, 0.609161376953125, 0.6297225952148438, 0.6502838134765625, 0.6708450317382812, 0.69140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 4.0, 16.0, 23.0, 16.0, 21.0, 38.0, 49.0, 103.0, 171.0, 167.0, 129.0, 78.0, 56.0, 45.0, 20.0, 22.0, 8.0, 8.0, 10.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.498779296875, -0.4841804504394531, -0.46958160400390625, -0.4549827575683594, -0.4403839111328125, -0.4257850646972656, -0.41118621826171875, -0.3965873718261719, -0.381988525390625, -0.3673896789550781, -0.35279083251953125, -0.3381919860839844, -0.3235931396484375, -0.3089942932128906, -0.29439544677734375, -0.2797966003417969, -0.26519775390625, -0.2505989074707031, -0.23600006103515625, -0.22140121459960938, -0.2068023681640625, -0.19220352172851562, -0.17760467529296875, -0.16300582885742188, -0.148406982421875, -0.13380813598632812, -0.11920928955078125, -0.10461044311523438, -0.0900115966796875, -0.07541275024414062, -0.06081390380859375, -0.046215057373046875, -0.0316162109375, -0.017017364501953125, -0.00241851806640625, 0.012180328369140625, 0.0267791748046875, 0.041378021240234375, 0.05597686767578125, 0.07057571411132812, 0.085174560546875, 0.09977340698242188, 0.11437225341796875, 0.12897109985351562, 0.1435699462890625, 0.15816879272460938, 0.17276763916015625, 0.18736648559570312, 0.20196533203125, 0.21656417846679688, 0.23116302490234375, 0.24576187133789062, 0.2603607177734375, 0.2749595642089844, 0.28955841064453125, 0.3041572570800781, 0.318756103515625, 0.3333549499511719, 0.34795379638671875, 0.3625526428222656, 0.3771514892578125, 0.3917503356933594, 0.40634918212890625, 0.4209480285644531, 0.435546875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 14.0, 80.0, 723.0, 180.0, 14.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.078995227813721, -3.6878089904785156, -2.2966229915618896, -0.9054369926452637, 0.4857492446899414, 1.8769354820251465, 3.2681212425231934, 4.659307956695557, 6.0504937171936035, 7.441679954528809, 8.832865715026855, 10.224052429199219, 11.615238189697266, 13.006423950195312, 14.39760971069336, 15.788797378540039, 17.179983139038086, 18.571168899536133, 19.96235466003418, 21.35354232788086, 22.744728088378906, 24.135913848876953, 25.527099609375, 26.918285369873047, 28.309471130371094, 29.70065689086914, 31.091842651367188, 32.483028411865234, 33.87421417236328, 35.265403747558594, 36.656585693359375, 38.04777526855469, 39.438961029052734, 40.83014678955078, 42.22133255004883, 43.612518310546875, 45.00370407104492, 46.39488983154297, 47.78607940673828, 49.17726516723633, 50.568450927734375, 51.95963668823242, 53.35082244873047, 54.742008209228516, 56.13319396972656, 57.524383544921875, 58.915565490722656, 60.30675506591797, 61.69793701171875, 63.0891227722168, 64.48030853271484, 65.87149810791016, 67.26268005371094, 68.65386962890625, 70.04505157470703, 71.43624114990234, 72.82743072509766, 74.21862030029297, 75.60980224609375, 77.00099182128906, 78.39217376708984, 79.78336334228516, 81.17454528808594, 82.56573486328125, 83.95691680908203]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 9.0, 10.0, 10.0, 17.0, 26.0, 26.0, 37.0, 42.0, 46.0, 53.0, 63.0, 70.0, 59.0, 66.0, 69.0, 58.0, 58.0, 48.0, 46.0, 44.0, 35.0, 25.0, 12.0, 17.0, 14.0, 14.0, 6.0, 7.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.776616096496582, -11.457667350769043, -11.138718605041504, -10.819770812988281, -10.500822067260742, -10.181873321533203, -9.862924575805664, -9.543975830078125, -9.225027084350586, -8.906078338623047, -8.587129592895508, -8.268181800842285, -7.949233055114746, -7.630284309387207, -7.311335563659668, -6.992386817932129, -6.673439025878906, -6.354490280151367, -6.035542011260986, -5.716593265533447, -5.397644996643066, -5.078696250915527, -4.759747505187988, -4.440798759460449, -4.121850490570068, -3.8029019832611084, -3.4839534759521484, -3.1650047302246094, -2.8460562229156494, -2.5271077156066895, -2.2081589698791504, -1.8892104625701904, -1.5702619552612305, -1.2513134479522705, -0.932364821434021, -0.6134162545204163, -0.2944676876068115, 0.024480819702148438, 0.34342944622039795, 0.6623780727386475, 0.9813265800476074, 1.3002750873565674, 1.619223713874817, 1.9381723403930664, 2.2571208477020264, 2.5760693550109863, 2.8950181007385254, 3.2139666080474854, 3.5329151153564453, 3.8518636226654053, 4.170812129974365, 4.489760875701904, 4.808709144592285, 5.127657890319824, 5.446606636047363, 5.765555381774902, 6.084503650665283, 6.403452396392822, 6.722400665283203, 7.041349411010742, 7.360298156738281, 7.679246425628662, 7.998195171356201, 8.317143440246582, 8.636092185974121]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 4.0, 11.0, 14.0, 15.0, 24.0, 20.0, 42.0, 63.0, 97.0, 209.0, 656.0, 2716.0, 25138.0, 2708189.0, 1432462.0, 21213.0, 2406.0, 508.0, 191.0, 85.0, 52.0, 37.0, 25.0, 22.0, 14.0, 14.0, 12.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.80853271484375, -8.5701904296875, -8.33184814453125, -8.093505859375, -7.85516357421875, -7.6168212890625, -7.37847900390625, -7.14013671875, -6.90179443359375, -6.6634521484375, -6.42510986328125, -6.186767578125, -5.94842529296875, -5.7100830078125, -5.47174072265625, -5.2333984375, -4.99505615234375, -4.7567138671875, -4.51837158203125, -4.280029296875, -4.04168701171875, -3.8033447265625, -3.56500244140625, -3.32666015625, -3.08831787109375, -2.8499755859375, -2.61163330078125, -2.373291015625, -2.13494873046875, -1.8966064453125, -1.65826416015625, -1.419921875, -1.18157958984375, -0.9432373046875, -0.70489501953125, -0.466552734375, -0.22821044921875, 0.0101318359375, 0.24847412109375, 0.48681640625, 0.72515869140625, 0.9635009765625, 1.20184326171875, 1.440185546875, 1.67852783203125, 1.9168701171875, 2.15521240234375, 2.3935546875, 2.63189697265625, 2.8702392578125, 3.10858154296875, 3.346923828125, 3.58526611328125, 3.8236083984375, 4.06195068359375, 4.30029296875, 4.53863525390625, 4.7769775390625, 5.01531982421875, 5.253662109375, 5.49200439453125, 5.7303466796875, 5.96868896484375, 6.20703125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 27.0, 37.0, 56.0, 71.0, 86.0, 95.0, 131.0, 131.0, 120.0, 60.0, 52.0, 32.0, 26.0, 14.0, 14.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.92401123046875, -4.7855224609375, -4.64703369140625, -4.508544921875, -4.37005615234375, -4.2315673828125, -4.09307861328125, -3.95458984375, -3.81610107421875, -3.6776123046875, -3.53912353515625, -3.400634765625, -3.26214599609375, -3.1236572265625, -2.98516845703125, -2.8466796875, -2.70819091796875, -2.5697021484375, -2.43121337890625, -2.292724609375, -2.15423583984375, -2.0157470703125, -1.87725830078125, -1.73876953125, -1.60028076171875, -1.4617919921875, -1.32330322265625, -1.184814453125, -1.04632568359375, -0.9078369140625, -0.76934814453125, -0.630859375, -0.49237060546875, -0.3538818359375, -0.21539306640625, -0.076904296875, 0.06158447265625, 0.2000732421875, 0.33856201171875, 0.47705078125, 0.61553955078125, 0.7540283203125, 0.89251708984375, 1.031005859375, 1.16949462890625, 1.3079833984375, 1.44647216796875, 1.5849609375, 1.72344970703125, 1.8619384765625, 2.00042724609375, 2.138916015625, 2.27740478515625, 2.4158935546875, 2.55438232421875, 2.69287109375, 2.83135986328125, 2.9698486328125, 3.10833740234375, 3.246826171875, 3.38531494140625, 3.5238037109375, 3.66229248046875, 3.80078125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 9.0, 8.0, 23.0, 27.0, 51.0, 80.0, 119.0, 233.0, 823.0, 5991.0, 594345.0, 3579707.0, 11145.0, 1048.0, 302.0, 140.0, 86.0, 46.0, 27.0, 19.0, 11.0, 10.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -12.0968017578125, -11.795166015625, -11.4935302734375, -11.19189453125, -10.8902587890625, -10.588623046875, -10.2869873046875, -9.9853515625, -9.6837158203125, -9.382080078125, -9.0804443359375, -8.77880859375, -8.4771728515625, -8.175537109375, -7.8739013671875, -7.572265625, -7.2706298828125, -6.968994140625, -6.6673583984375, -6.36572265625, -6.0640869140625, -5.762451171875, -5.4608154296875, -5.1591796875, -4.8575439453125, -4.555908203125, -4.2542724609375, -3.95263671875, -3.6510009765625, -3.349365234375, -3.0477294921875, -2.74609375, -2.4444580078125, -2.142822265625, -1.8411865234375, -1.53955078125, -1.2379150390625, -0.936279296875, -0.6346435546875, -0.3330078125, -0.0313720703125, 0.270263671875, 0.5718994140625, 0.87353515625, 1.1751708984375, 1.476806640625, 1.7784423828125, 2.080078125, 2.3817138671875, 2.683349609375, 2.9849853515625, 3.28662109375, 3.5882568359375, 3.889892578125, 4.1915283203125, 4.4931640625, 4.7947998046875, 5.096435546875, 5.3980712890625, 5.69970703125, 6.0013427734375, 6.302978515625, 6.6046142578125, 6.90625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 6.0, 2.0, 6.0, 9.0, 9.0, 20.0, 24.0, 26.0, 49.0, 49.0, 63.0, 79.0, 111.0, 177.0, 258.0, 395.0, 642.0, 785.0, 422.0, 284.0, 188.0, 122.0, 88.0, 50.0, 53.0, 52.0, 24.0, 20.0, 17.0, 16.0, 5.0, 7.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.726165771484375, -0.70281982421875, -0.679473876953125, -0.6561279296875, -0.632781982421875, -0.60943603515625, -0.586090087890625, -0.562744140625, -0.539398193359375, -0.51605224609375, -0.492706298828125, -0.4693603515625, -0.446014404296875, -0.42266845703125, -0.399322509765625, -0.3759765625, -0.352630615234375, -0.32928466796875, -0.305938720703125, -0.2825927734375, -0.259246826171875, -0.23590087890625, -0.212554931640625, -0.189208984375, -0.165863037109375, -0.14251708984375, -0.119171142578125, -0.0958251953125, -0.072479248046875, -0.04913330078125, -0.025787353515625, -0.00244140625, 0.020904541015625, 0.04425048828125, 0.067596435546875, 0.0909423828125, 0.114288330078125, 0.13763427734375, 0.160980224609375, 0.184326171875, 0.207672119140625, 0.23101806640625, 0.254364013671875, 0.2777099609375, 0.301055908203125, 0.32440185546875, 0.347747802734375, 0.37109375, 0.394439697265625, 0.41778564453125, 0.441131591796875, 0.4644775390625, 0.487823486328125, 0.51116943359375, 0.534515380859375, 0.557861328125, 0.581207275390625, 0.60455322265625, 0.627899169921875, 0.6512451171875, 0.674591064453125, 0.69793701171875, 0.721282958984375, 0.74462890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 10.0, 12.0, 20.0, 20.0, 42.0, 60.0, 91.0, 99.0, 124.0, 116.0, 106.0, 83.0, 66.0, 43.0, 25.0, 14.0, 16.0, 9.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7563977241516113, -3.636451244354248, -3.5165047645568848, -3.3965582847595215, -3.276611804962158, -3.156665325164795, -3.0367190837860107, -2.9167726039886475, -2.796826124191284, -2.676879644393921, -2.5569331645965576, -2.4369866847991943, -2.31704044342041, -2.197093963623047, -2.0771474838256836, -1.9572010040283203, -1.837254524230957, -1.7173080444335938, -1.5973615646362305, -1.4774152040481567, -1.3574687242507935, -1.2375222444534302, -1.1175758838653564, -0.9976294040679932, -0.8776829242706299, -0.7577364444732666, -0.6377900242805481, -0.5178436040878296, -0.3978971242904663, -0.277950644493103, -0.15800422430038452, -0.038057804107666016, 0.08188843727111816, 0.20183488726615906, 0.32178133726119995, 0.44172778725624084, 0.5616742372512817, 0.681620717048645, 0.8015671372413635, 0.921513557434082, 1.0414600372314453, 1.1614065170288086, 1.2813529968261719, 1.4012993574142456, 1.5212458372116089, 1.6411923170089722, 1.761138677597046, 1.8810851573944092, 2.0010316371917725, 2.1209781169891357, 2.240924596786499, 2.3608710765838623, 2.4808173179626465, 2.6007637977600098, 2.720710277557373, 2.8406567573547363, 2.9606032371520996, 3.080549716949463, 3.200496196746826, 3.3204426765441895, 3.4403891563415527, 3.560335636138916, 3.6802818775177, 3.8002283573150635, 3.9201748371124268]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 16.0, 20.0, 34.0, 45.0, 40.0, 54.0, 67.0, 83.0, 104.0, 91.0, 107.0, 83.0, 67.0, 55.0, 45.0, 27.0, 17.0, 13.0, 4.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.689472675323486, -4.55390739440918, -4.418341636657715, -4.28277587890625, -4.147210597991943, -4.011645317077637, -3.876079559326172, -3.740514039993286, -3.6049485206604004, -3.4693830013275146, -3.333817481994629, -3.198251962661743, -3.0626864433288574, -2.9271209239959717, -2.791555404663086, -2.6559898853302, -2.5204243659973145, -2.3848588466644287, -2.249293327331543, -2.1137278079986572, -1.9781622886657715, -1.8425967693328857, -1.70703125, -1.5714657306671143, -1.4359002113342285, -1.3003346920013428, -1.164769172668457, -1.0292036533355713, -0.8936381340026855, -0.7580726146697998, -0.6225070953369141, -0.4869415760040283, -0.3513755798339844, -0.21581006050109863, -0.08024454116821289, 0.05532097816467285, 0.1908864974975586, 0.32645201683044434, 0.4620175361633301, 0.5975830554962158, 0.7331485748291016, 0.8687140941619873, 1.004279613494873, 1.1398451328277588, 1.2754106521606445, 1.4109761714935303, 1.546541690826416, 1.6821072101593018, 1.8176727294921875, 1.9532382488250732, 2.088803768157959, 2.2243692874908447, 2.3599348068237305, 2.495500326156616, 2.631065845489502, 2.7666313648223877, 2.9021968841552734, 3.037762403488159, 3.173327922821045, 3.3088934421539307, 3.4444589614868164, 3.580024480819702, 3.715590000152588, 3.8511555194854736, 3.9867210388183594]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 3.0, 8.0, 10.0, 24.0, 29.0, 58.0, 96.0, 154.0, 301.0, 631.0, 1514.0, 4182.0, 16518.0, 151244.0, 784434.0, 72696.0, 11238.0, 3126.0, 1169.0, 526.0, 262.0, 139.0, 66.0, 53.0, 27.0, 16.0, 14.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.230621337890625, -1.19854736328125, -1.166473388671875, -1.1343994140625, -1.102325439453125, -1.07025146484375, -1.038177490234375, -1.006103515625, -0.974029541015625, -0.94195556640625, -0.909881591796875, -0.8778076171875, -0.845733642578125, -0.81365966796875, -0.781585693359375, -0.74951171875, -0.717437744140625, -0.68536376953125, -0.653289794921875, -0.6212158203125, -0.589141845703125, -0.55706787109375, -0.524993896484375, -0.492919921875, -0.460845947265625, -0.42877197265625, -0.396697998046875, -0.3646240234375, -0.332550048828125, -0.30047607421875, -0.268402099609375, -0.236328125, -0.204254150390625, -0.17218017578125, -0.140106201171875, -0.1080322265625, -0.075958251953125, -0.04388427734375, -0.011810302734375, 0.020263671875, 0.052337646484375, 0.08441162109375, 0.116485595703125, 0.1485595703125, 0.180633544921875, 0.21270751953125, 0.244781494140625, 0.27685546875, 0.308929443359375, 0.34100341796875, 0.373077392578125, 0.4051513671875, 0.437225341796875, 0.46929931640625, 0.501373291015625, 0.533447265625, 0.565521240234375, 0.59759521484375, 0.629669189453125, 0.6617431640625, 0.693817138671875, 0.72589111328125, 0.757965087890625, 0.7900390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 24.0, 15.0, 44.0, 48.0, 65.0, 84.0, 110.0, 130.0, 147.0, 101.0, 76.0, 55.0, 36.0, 23.0, 10.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.776153564453125, -3.66363525390625, -3.551116943359375, -3.4385986328125, -3.326080322265625, -3.21356201171875, -3.101043701171875, -2.988525390625, -2.876007080078125, -2.76348876953125, -2.650970458984375, -2.5384521484375, -2.425933837890625, -2.31341552734375, -2.200897216796875, -2.08837890625, -1.975860595703125, -1.86334228515625, -1.750823974609375, -1.6383056640625, -1.525787353515625, -1.41326904296875, -1.300750732421875, -1.188232421875, -1.075714111328125, -0.96319580078125, -0.850677490234375, -0.7381591796875, -0.625640869140625, -0.51312255859375, -0.400604248046875, -0.2880859375, -0.175567626953125, -0.06304931640625, 0.049468994140625, 0.1619873046875, 0.274505615234375, 0.38702392578125, 0.499542236328125, 0.612060546875, 0.724578857421875, 0.83709716796875, 0.949615478515625, 1.0621337890625, 1.174652099609375, 1.28717041015625, 1.399688720703125, 1.51220703125, 1.624725341796875, 1.73724365234375, 1.849761962890625, 1.9622802734375, 2.074798583984375, 2.18731689453125, 2.299835205078125, 2.412353515625, 2.524871826171875, 2.63739013671875, 2.749908447265625, 2.8624267578125, 2.974945068359375, 3.08746337890625, 3.199981689453125, 3.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 13.0, 14.0, 14.0, 21.0, 42.0, 51.0, 65.0, 88.0, 166.0, 295.0, 557.0, 1229.0, 3136.0, 11346.0, 87362.0, 774015.0, 148442.0, 14858.0, 3885.0, 1441.0, 678.0, 301.0, 174.0, 110.0, 71.0, 61.0, 29.0, 17.0, 11.0, 8.0, 6.0, 9.0, 3.0, 7.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.9970703125, -0.96905517578125, -0.9410400390625, -0.91302490234375, -0.885009765625, -0.85699462890625, -0.8289794921875, -0.80096435546875, -0.77294921875, -0.74493408203125, -0.7169189453125, -0.68890380859375, -0.660888671875, -0.63287353515625, -0.6048583984375, -0.57684326171875, -0.548828125, -0.52081298828125, -0.4927978515625, -0.46478271484375, -0.436767578125, -0.40875244140625, -0.3807373046875, -0.35272216796875, -0.32470703125, -0.29669189453125, -0.2686767578125, -0.24066162109375, -0.212646484375, -0.18463134765625, -0.1566162109375, -0.12860107421875, -0.1005859375, -0.07257080078125, -0.0445556640625, -0.01654052734375, 0.011474609375, 0.03948974609375, 0.0675048828125, 0.09552001953125, 0.12353515625, 0.15155029296875, 0.1795654296875, 0.20758056640625, 0.235595703125, 0.26361083984375, 0.2916259765625, 0.31964111328125, 0.34765625, 0.37567138671875, 0.4036865234375, 0.43170166015625, 0.459716796875, 0.48773193359375, 0.5157470703125, 0.54376220703125, 0.57177734375, 0.59979248046875, 0.6278076171875, 0.65582275390625, 0.683837890625, 0.71185302734375, 0.7398681640625, 0.76788330078125, 0.7958984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 16.0, 16.0, 21.0, 23.0, 18.0, 26.0, 22.0, 31.0, 36.0, 21.0, 35.0, 46.0, 44.0, 47.0, 39.0, 41.0, 58.0, 41.0, 46.0, 39.0, 37.0, 24.0, 40.0, 29.0, 23.0, 36.0, 21.0, 13.0, 20.0, 12.0, 7.0, 16.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.552825927734375, -2.46112060546875, -2.369415283203125, -2.2777099609375, -2.186004638671875, -2.09429931640625, -2.002593994140625, -1.910888671875, -1.819183349609375, -1.72747802734375, -1.635772705078125, -1.5440673828125, -1.452362060546875, -1.36065673828125, -1.268951416015625, -1.17724609375, -1.085540771484375, -0.99383544921875, -0.902130126953125, -0.8104248046875, -0.718719482421875, -0.62701416015625, -0.535308837890625, -0.443603515625, -0.351898193359375, -0.26019287109375, -0.168487548828125, -0.0767822265625, 0.014923095703125, 0.10662841796875, 0.198333740234375, 0.2900390625, 0.381744384765625, 0.47344970703125, 0.565155029296875, 0.6568603515625, 0.748565673828125, 0.84027099609375, 0.931976318359375, 1.023681640625, 1.115386962890625, 1.20709228515625, 1.298797607421875, 1.3905029296875, 1.482208251953125, 1.57391357421875, 1.665618896484375, 1.75732421875, 1.849029541015625, 1.94073486328125, 2.032440185546875, 2.1241455078125, 2.215850830078125, 2.30755615234375, 2.399261474609375, 2.490966796875, 2.582672119140625, 2.67437744140625, 2.766082763671875, 2.8577880859375, 2.949493408203125, 3.04119873046875, 3.132904052734375, 3.224609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 7.0, 2.0, 11.0, 13.0, 13.0, 18.0, 22.0, 34.0, 46.0, 58.0, 88.0, 117.0, 200.0, 357.0, 519.0, 843.0, 1423.0, 2506.0, 4960.0, 11007.0, 32529.0, 206491.0, 671300.0, 79506.0, 19912.0, 7830.0, 3665.0, 1998.0, 1094.0, 710.0, 443.0, 272.0, 160.0, 124.0, 80.0, 42.0, 42.0, 21.0, 20.0, 20.0, 13.0, 6.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.31298828125, -0.3026542663574219, -0.29232025146484375, -0.2819862365722656, -0.2716522216796875, -0.2613182067871094, -0.25098419189453125, -0.24065017700195312, -0.230316162109375, -0.21998214721679688, -0.20964813232421875, -0.19931411743164062, -0.1889801025390625, -0.17864608764648438, -0.16831207275390625, -0.15797805786132812, -0.14764404296875, -0.13731002807617188, -0.12697601318359375, -0.11664199829101562, -0.1063079833984375, -0.09597396850585938, -0.08563995361328125, -0.07530593872070312, -0.064971923828125, -0.054637908935546875, -0.04430389404296875, -0.033969879150390625, -0.0236358642578125, -0.013301849365234375, -0.00296783447265625, 0.007366180419921875, 0.0177001953125, 0.028034210205078125, 0.03836822509765625, 0.048702239990234375, 0.0590362548828125, 0.06937026977539062, 0.07970428466796875, 0.09003829956054688, 0.100372314453125, 0.11070632934570312, 0.12104034423828125, 0.13137435913085938, 0.1417083740234375, 0.15204238891601562, 0.16237640380859375, 0.17271041870117188, 0.18304443359375, 0.19337844848632812, 0.20371246337890625, 0.21404647827148438, 0.2243804931640625, 0.23471450805664062, 0.24504852294921875, 0.2553825378417969, 0.265716552734375, 0.2760505676269531, 0.28638458251953125, 0.2967185974121094, 0.3070526123046875, 0.3173866271972656, 0.32772064208984375, 0.3380546569824219, 0.348388671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 9.0, 8.0, 6.0, 23.0, 35.0, 42.0, 74.0, 91.0, 139.0, 176.0, 130.0, 78.0, 55.0, 34.0, 22.0, 18.0, 9.0, 9.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00016808509826660156, -0.00016343966126441956, -0.00015879422426223755, -0.00015414878726005554, -0.00014950335025787354, -0.00014485791325569153, -0.00014021247625350952, -0.00013556703925132751, -0.0001309216022491455, -0.0001262761652469635, -0.0001216307282447815, -0.00011698529124259949, -0.00011233985424041748, -0.00010769441723823547, -0.00010304898023605347, -9.840354323387146e-05, -9.375810623168945e-05, -8.911266922950745e-05, -8.446723222732544e-05, -7.982179522514343e-05, -7.517635822296143e-05, -7.053092122077942e-05, -6.588548421859741e-05, -6.12400472164154e-05, -5.65946102142334e-05, -5.194917321205139e-05, -4.7303736209869385e-05, -4.265829920768738e-05, -3.801286220550537e-05, -3.3367425203323364e-05, -2.8721988201141357e-05, -2.407655119895935e-05, -1.9431114196777344e-05, -1.4785677194595337e-05, -1.014024019241333e-05, -5.494803190231323e-06, -8.493661880493164e-07, 3.7960708141326904e-06, 8.441507816314697e-06, 1.3086944818496704e-05, 1.773238182067871e-05, 2.2377818822860718e-05, 2.7023255825042725e-05, 3.166869282722473e-05, 3.631412982940674e-05, 4.0959566831588745e-05, 4.560500383377075e-05, 5.025044083595276e-05, 5.4895877838134766e-05, 5.954131484031677e-05, 6.418675184249878e-05, 6.883218884468079e-05, 7.347762584686279e-05, 7.81230628490448e-05, 8.27684998512268e-05, 8.741393685340881e-05, 9.205937385559082e-05, 9.670481085777283e-05, 0.00010135024785995483, 0.00010599568486213684, 0.00011064112186431885, 0.00011528655886650085, 0.00011993199586868286, 0.00012457743287086487, 0.00012922286987304688]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 10.0, 2.0, 8.0, 14.0, 7.0, 18.0, 35.0, 64.0, 127.0, 248.0, 563.0, 1303.0, 3483.0, 12767.0, 146447.0, 844301.0, 29656.0, 5963.0, 2032.0, 779.0, 352.0, 164.0, 85.0, 47.0, 26.0, 7.0, 11.0, 8.0, 3.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.538818359375, -0.515625, -0.492431640625, -0.46923828125, -0.446044921875, -0.4228515625, -0.399658203125, -0.37646484375, -0.353271484375, -0.330078125, -0.306884765625, -0.28369140625, -0.260498046875, -0.2373046875, -0.214111328125, -0.19091796875, -0.167724609375, -0.14453125, -0.121337890625, -0.09814453125, -0.074951171875, -0.0517578125, -0.028564453125, -0.00537109375, 0.017822265625, 0.041015625, 0.064208984375, 0.08740234375, 0.110595703125, 0.1337890625, 0.156982421875, 0.18017578125, 0.203369140625, 0.2265625, 0.249755859375, 0.27294921875, 0.296142578125, 0.3193359375, 0.342529296875, 0.36572265625, 0.388916015625, 0.412109375, 0.435302734375, 0.45849609375, 0.481689453125, 0.5048828125, 0.528076171875, 0.55126953125, 0.574462890625, 0.59765625, 0.620849609375, 0.64404296875, 0.667236328125, 0.6904296875, 0.713623046875, 0.73681640625, 0.760009765625, 0.783203125, 0.806396484375, 0.82958984375, 0.852783203125, 0.8759765625, 0.899169921875, 0.92236328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 7.0, 8.0, 15.0, 25.0, 28.0, 45.0, 81.0, 163.0, 233.0, 151.0, 88.0, 44.0, 26.0, 19.0, 14.0, 12.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1685791015625, -0.16419601440429688, -0.15981292724609375, -0.15542984008789062, -0.1510467529296875, -0.14666366577148438, -0.14228057861328125, -0.13789749145507812, -0.133514404296875, -0.12913131713867188, -0.12474822998046875, -0.12036514282226562, -0.1159820556640625, -0.11159896850585938, -0.10721588134765625, -0.10283279418945312, -0.09844970703125, -0.09406661987304688, -0.08968353271484375, -0.08530044555664062, -0.0809173583984375, -0.07653427124023438, -0.07215118408203125, -0.06776809692382812, -0.063385009765625, -0.059001922607421875, -0.05461883544921875, -0.050235748291015625, -0.0458526611328125, -0.041469573974609375, -0.03708648681640625, -0.032703399658203125, -0.0283203125, -0.023937225341796875, -0.01955413818359375, -0.015171051025390625, -0.0107879638671875, -0.006404876708984375, -0.00202178955078125, 0.002361297607421875, 0.006744384765625, 0.011127471923828125, 0.01551055908203125, 0.019893646240234375, 0.0242767333984375, 0.028659820556640625, 0.03304290771484375, 0.037425994873046875, 0.04180908203125, 0.046192169189453125, 0.05057525634765625, 0.054958343505859375, 0.0593414306640625, 0.06372451782226562, 0.06810760498046875, 0.07249069213867188, 0.076873779296875, 0.08125686645507812, 0.08563995361328125, 0.09002304077148438, 0.0944061279296875, 0.09878921508789062, 0.10317230224609375, 0.10755538940429688, 0.1119384765625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 6.0, 12.0, 20.0, 33.0, 50.0, 83.0, 140.0, 153.0, 159.0, 130.0, 75.0, 40.0, 28.0, 14.0, 17.0, 7.0, 7.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.749243974685669, -2.6477582454681396, -2.5462722778320312, -2.444786548614502, -2.3433008193969727, -2.2418148517608643, -2.140329122543335, -2.0388431549072266, -1.9373574256896973, -1.8358715772628784, -1.7343857288360596, -1.6328999996185303, -1.5314141511917114, -1.4299283027648926, -1.3284425735473633, -1.2269567251205444, -1.1254708766937256, -1.0239850282669067, -0.9224992394447327, -0.8210134506225586, -0.7195276021957397, -0.6180417537689209, -0.5165559649467468, -0.41507017612457275, -0.3135843276977539, -0.21209850907325745, -0.11061269044876099, -0.009126871824264526, 0.09235894680023193, 0.19384479522705078, 0.29533058404922485, 0.3968163728713989, 0.49830198287963867, 0.5997878313064575, 0.7012736201286316, 0.8027594089508057, 0.9042452573776245, 1.0057311058044434, 1.1072168350219727, 1.2087026834487915, 1.3101885318756104, 1.4116743803024292, 1.513160228729248, 1.6146459579467773, 1.7161318063735962, 1.817617654800415, 1.9191033840179443, 2.0205893516540527, 2.122075080871582, 2.2235608100891113, 2.3250467777252197, 2.426532506942749, 2.5280184745788574, 2.6295042037963867, 2.730989933013916, 2.8324756622314453, 2.9339616298675537, 3.035447359085083, 3.1369333267211914, 3.2384190559387207, 3.33990478515625, 3.4413907527923584, 3.5428764820098877, 3.644362449645996, 3.7458481788635254]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 12.0, 21.0, 27.0, 47.0, 57.0, 69.0, 107.0, 123.0, 140.0, 107.0, 104.0, 71.0, 47.0, 22.0, 20.0, 9.0, 2.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9631612300872803, -3.850487470626831, -3.737813949584961, -3.6251401901245117, -3.5124664306640625, -3.3997926712036133, -3.287118911743164, -3.174445390701294, -3.0617716312408447, -2.9490978717803955, -2.8364243507385254, -2.723750591278076, -2.611076831817627, -2.4984030723571777, -2.3857293128967285, -2.2730557918548584, -2.160382032394409, -2.04770827293396, -1.9350346326828003, -1.8223609924316406, -1.7096872329711914, -1.5970134735107422, -1.4843398332595825, -1.3716661930084229, -1.2589924335479736, -1.1463186740875244, -1.0336450338363647, -0.9209713339805603, -0.8082976341247559, -0.6956239342689514, -0.582950234413147, -0.47027653455734253, -0.357602596282959, -0.24492889642715454, -0.1322551965713501, -0.019581496715545654, 0.09309220314025879, 0.20576590299606323, 0.3184396028518677, 0.4311133027076721, 0.5437870025634766, 0.656460702419281, 0.7691344022750854, 0.8818081021308899, 0.9944818019866943, 1.1071555614471436, 1.2198292016983032, 1.332502841949463, 1.445176601409912, 1.5578503608703613, 1.670524001121521, 1.7831976413726807, 1.8958714008331299, 2.008545160293579, 2.121218681335449, 2.2338924407958984, 2.3465662002563477, 2.459239959716797, 2.571913719177246, 2.684587240219116, 2.7972609996795654, 2.9099347591400146, 3.0226082801818848, 3.135282039642334, 3.247955799102783]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 6.0, 11.0, 16.0, 12.0, 23.0, 38.0, 49.0, 84.0, 155.0, 202.0, 332.0, 558.0, 1016.0, 1706.0, 3312.0, 6783.0, 15354.0, 38539.0, 114875.0, 394203.0, 321612.0, 91989.0, 31974.0, 12946.0, 5933.0, 2999.0, 1558.0, 825.0, 522.0, 323.0, 195.0, 133.0, 89.0, 49.0, 29.0, 27.0, 20.0, 12.0, 14.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9278564453125, -1.865478515625, -1.8031005859375, -1.74072265625, -1.6783447265625, -1.615966796875, -1.5535888671875, -1.4912109375, -1.4288330078125, -1.366455078125, -1.3040771484375, -1.24169921875, -1.1793212890625, -1.116943359375, -1.0545654296875, -0.9921875, -0.9298095703125, -0.867431640625, -0.8050537109375, -0.74267578125, -0.6802978515625, -0.617919921875, -0.5555419921875, -0.4931640625, -0.4307861328125, -0.368408203125, -0.3060302734375, -0.24365234375, -0.1812744140625, -0.118896484375, -0.0565185546875, 0.005859375, 0.0682373046875, 0.130615234375, 0.1929931640625, 0.25537109375, 0.3177490234375, 0.380126953125, 0.4425048828125, 0.5048828125, 0.5672607421875, 0.629638671875, 0.6920166015625, 0.75439453125, 0.8167724609375, 0.879150390625, 0.9415283203125, 1.00390625, 1.0662841796875, 1.128662109375, 1.1910400390625, 1.25341796875, 1.3157958984375, 1.378173828125, 1.4405517578125, 1.5029296875, 1.5653076171875, 1.627685546875, 1.6900634765625, 1.75244140625, 1.8148193359375, 1.877197265625, 1.9395751953125, 2.001953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 15.0, 12.0, 22.0, 31.0, 46.0, 66.0, 96.0, 118.0, 102.0, 141.0, 119.0, 75.0, 51.0, 43.0, 24.0, 14.0, 13.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6328125, -9.377197265625, -9.12158203125, -8.865966796875, -8.6103515625, -8.354736328125, -8.09912109375, -7.843505859375, -7.587890625, -7.332275390625, -7.07666015625, -6.821044921875, -6.5654296875, -6.309814453125, -6.05419921875, -5.798583984375, -5.54296875, -5.287353515625, -5.03173828125, -4.776123046875, -4.5205078125, -4.264892578125, -4.00927734375, -3.753662109375, -3.498046875, -3.242431640625, -2.98681640625, -2.731201171875, -2.4755859375, -2.219970703125, -1.96435546875, -1.708740234375, -1.453125, -1.197509765625, -0.94189453125, -0.686279296875, -0.4306640625, -0.175048828125, 0.08056640625, 0.336181640625, 0.591796875, 0.847412109375, 1.10302734375, 1.358642578125, 1.6142578125, 1.869873046875, 2.12548828125, 2.381103515625, 2.63671875, 2.892333984375, 3.14794921875, 3.403564453125, 3.6591796875, 3.914794921875, 4.17041015625, 4.426025390625, 4.681640625, 4.937255859375, 5.19287109375, 5.448486328125, 5.7041015625, 5.959716796875, 6.21533203125, 6.470947265625, 6.7265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 13.0, 7.0, 19.0, 14.0, 19.0, 24.0, 33.0, 33.0, 33.0, 41.0, 55.0, 61.0, 132.0, 498.0, 12456.0, 1012842.0, 21059.0, 625.0, 146.0, 90.0, 66.0, 46.0, 32.0, 20.0, 35.0, 25.0, 14.0, 16.0, 18.0, 5.0, 11.0, 14.0, 7.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-12.59375, -12.2183837890625, -11.843017578125, -11.4676513671875, -11.09228515625, -10.7169189453125, -10.341552734375, -9.9661865234375, -9.5908203125, -9.2154541015625, -8.840087890625, -8.4647216796875, -8.08935546875, -7.7139892578125, -7.338623046875, -6.9632568359375, -6.587890625, -6.2125244140625, -5.837158203125, -5.4617919921875, -5.08642578125, -4.7110595703125, -4.335693359375, -3.9603271484375, -3.5849609375, -3.2095947265625, -2.834228515625, -2.4588623046875, -2.08349609375, -1.7081298828125, -1.332763671875, -0.9573974609375, -0.58203125, -0.2066650390625, 0.168701171875, 0.5440673828125, 0.91943359375, 1.2947998046875, 1.670166015625, 2.0455322265625, 2.4208984375, 2.7962646484375, 3.171630859375, 3.5469970703125, 3.92236328125, 4.2977294921875, 4.673095703125, 5.0484619140625, 5.423828125, 5.7991943359375, 6.174560546875, 6.5499267578125, 6.92529296875, 7.3006591796875, 7.676025390625, 8.0513916015625, 8.4267578125, 8.8021240234375, 9.177490234375, 9.5528564453125, 9.92822265625, 10.3035888671875, 10.678955078125, 11.0543212890625, 11.4296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 1.0, 3.0, 4.0, 3.0, 7.0, 9.0, 11.0, 17.0, 16.0, 14.0, 16.0, 32.0, 37.0, 24.0, 32.0, 46.0, 40.0, 35.0, 34.0, 45.0, 49.0, 53.0, 41.0, 62.0, 37.0, 48.0, 41.0, 36.0, 23.0, 16.0, 34.0, 23.0, 15.0, 19.0, 15.0, 9.0, 12.0, 5.0, 7.0, 6.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.48828125, -4.359893798828125, -4.23150634765625, -4.103118896484375, -3.9747314453125, -3.846343994140625, -3.71795654296875, -3.589569091796875, -3.461181640625, -3.332794189453125, -3.20440673828125, -3.076019287109375, -2.9476318359375, -2.819244384765625, -2.69085693359375, -2.562469482421875, -2.43408203125, -2.305694580078125, -2.17730712890625, -2.048919677734375, -1.9205322265625, -1.792144775390625, -1.66375732421875, -1.535369873046875, -1.406982421875, -1.278594970703125, -1.15020751953125, -1.021820068359375, -0.8934326171875, -0.765045166015625, -0.63665771484375, -0.508270263671875, -0.3798828125, -0.251495361328125, -0.12310791015625, 0.005279541015625, 0.1336669921875, 0.262054443359375, 0.39044189453125, 0.518829345703125, 0.647216796875, 0.775604248046875, 0.90399169921875, 1.032379150390625, 1.1607666015625, 1.289154052734375, 1.41754150390625, 1.545928955078125, 1.67431640625, 1.802703857421875, 1.93109130859375, 2.059478759765625, 2.1878662109375, 2.316253662109375, 2.44464111328125, 2.573028564453125, 2.701416015625, 2.829803466796875, 2.95819091796875, 3.086578369140625, 3.2149658203125, 3.343353271484375, 3.47174072265625, 3.600128173828125, 3.728515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 5.0, 5.0, 7.0, 12.0, 22.0, 28.0, 41.0, 56.0, 100.0, 193.0, 390.0, 787.0, 1947.0, 5759.0, 20442.0, 98711.0, 534094.0, 313317.0, 53956.0, 12326.0, 3768.0, 1364.0, 581.0, 265.0, 129.0, 71.0, 71.0, 32.0, 22.0, 20.0, 4.0, 10.0, 5.0, 2.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6963729858398438, -0.6730194091796875, -0.6496658325195312, -0.626312255859375, -0.6029586791992188, -0.5796051025390625, -0.5562515258789062, -0.53289794921875, -0.5095443725585938, -0.4861907958984375, -0.46283721923828125, -0.439483642578125, -0.41613006591796875, -0.3927764892578125, -0.36942291259765625, -0.3460693359375, -0.32271575927734375, -0.2993621826171875, -0.27600860595703125, -0.252655029296875, -0.22930145263671875, -0.2059478759765625, -0.18259429931640625, -0.15924072265625, -0.13588714599609375, -0.1125335693359375, -0.08917999267578125, -0.065826416015625, -0.04247283935546875, -0.0191192626953125, 0.00423431396484375, 0.027587890625, 0.05094146728515625, 0.0742950439453125, 0.09764862060546875, 0.121002197265625, 0.14435577392578125, 0.1677093505859375, 0.19106292724609375, 0.21441650390625, 0.23777008056640625, 0.2611236572265625, 0.28447723388671875, 0.307830810546875, 0.33118438720703125, 0.3545379638671875, 0.37789154052734375, 0.4012451171875, 0.42459869384765625, 0.4479522705078125, 0.47130584716796875, 0.494659423828125, 0.5180130004882812, 0.5413665771484375, 0.5647201538085938, 0.58807373046875, 0.6114273071289062, 0.6347808837890625, 0.6581344604492188, 0.681488037109375, 0.7048416137695312, 0.7281951904296875, 0.7515487670898438, 0.77490234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 10.0, 6.0, 12.0, 21.0, 17.0, 31.0, 58.0, 66.0, 87.0, 83.0, 129.0, 107.0, 102.0, 82.0, 53.0, 44.0, 28.0, 16.0, 12.0, 12.0, 7.0, 10.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001430511474609375, -0.00013811886310577393, -0.00013318657875061035, -0.00012825429439544678, -0.0001233220100402832, -0.00011838972568511963, -0.00011345744132995605, -0.00010852515697479248, -0.0001035928726196289, -9.866058826446533e-05, -9.372830390930176e-05, -8.879601955413818e-05, -8.386373519897461e-05, -7.893145084381104e-05, -7.399916648864746e-05, -6.906688213348389e-05, -6.413459777832031e-05, -5.920231342315674e-05, -5.4270029067993164e-05, -4.933774471282959e-05, -4.4405460357666016e-05, -3.947317600250244e-05, -3.454089164733887e-05, -2.9608607292175293e-05, -2.467632293701172e-05, -1.9744038581848145e-05, -1.481175422668457e-05, -9.879469871520996e-06, -4.947185516357422e-06, -1.4901161193847656e-08, 4.9173831939697266e-06, 9.8496675491333e-06, 1.4781951904296875e-05, 1.971423625946045e-05, 2.4646520614624023e-05, 2.9578804969787598e-05, 3.451108932495117e-05, 3.9443373680114746e-05, 4.437565803527832e-05, 4.9307942390441895e-05, 5.424022674560547e-05, 5.917251110076904e-05, 6.410479545593262e-05, 6.903707981109619e-05, 7.396936416625977e-05, 7.890164852142334e-05, 8.383393287658691e-05, 8.876621723175049e-05, 9.369850158691406e-05, 9.863078594207764e-05, 0.00010356307029724121, 0.00010849535465240479, 0.00011342763900756836, 0.00011835992336273193, 0.0001232922077178955, 0.00012822449207305908, 0.00013315677642822266, 0.00013808906078338623, 0.0001430213451385498, 0.00014795362949371338, 0.00015288591384887695, 0.00015781819820404053, 0.0001627504825592041, 0.00016768276691436768, 0.00017261505126953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 3.0, 4.0, 11.0, 5.0, 12.0, 15.0, 10.0, 21.0, 27.0, 70.0, 117.0, 196.0, 373.0, 631.0, 1351.0, 3141.0, 8336.0, 25735.0, 100358.0, 426267.0, 364169.0, 83018.0, 22273.0, 7001.0, 2812.0, 1230.0, 596.0, 314.0, 173.0, 107.0, 50.0, 46.0, 20.0, 19.0, 12.0, 8.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5625, -0.543060302734375, -0.52362060546875, -0.504180908203125, -0.4847412109375, -0.465301513671875, -0.44586181640625, -0.426422119140625, -0.406982421875, -0.387542724609375, -0.36810302734375, -0.348663330078125, -0.3292236328125, -0.309783935546875, -0.29034423828125, -0.270904541015625, -0.25146484375, -0.232025146484375, -0.21258544921875, -0.193145751953125, -0.1737060546875, -0.154266357421875, -0.13482666015625, -0.115386962890625, -0.095947265625, -0.076507568359375, -0.05706787109375, -0.037628173828125, -0.0181884765625, 0.001251220703125, 0.02069091796875, 0.040130615234375, 0.0595703125, 0.079010009765625, 0.09844970703125, 0.117889404296875, 0.1373291015625, 0.156768798828125, 0.17620849609375, 0.195648193359375, 0.215087890625, 0.234527587890625, 0.25396728515625, 0.273406982421875, 0.2928466796875, 0.312286376953125, 0.33172607421875, 0.351165771484375, 0.37060546875, 0.390045166015625, 0.40948486328125, 0.428924560546875, 0.4483642578125, 0.467803955078125, 0.48724365234375, 0.506683349609375, 0.526123046875, 0.545562744140625, 0.56500244140625, 0.584442138671875, 0.6038818359375, 0.623321533203125, 0.64276123046875, 0.662200927734375, 0.681640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 2.0, 6.0, 3.0, 2.0, 5.0, 13.0, 11.0, 9.0, 12.0, 17.0, 27.0, 36.0, 29.0, 34.0, 38.0, 42.0, 64.0, 55.0, 59.0, 66.0, 74.0, 59.0, 56.0, 40.0, 44.0, 36.0, 29.0, 33.0, 19.0, 18.0, 19.0, 7.0, 8.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.29541015625, -0.2868461608886719, -0.27828216552734375, -0.2697181701660156, -0.2611541748046875, -0.2525901794433594, -0.24402618408203125, -0.23546218872070312, -0.226898193359375, -0.21833419799804688, -0.20977020263671875, -0.20120620727539062, -0.1926422119140625, -0.18407821655273438, -0.17551422119140625, -0.16695022583007812, -0.15838623046875, -0.14982223510742188, -0.14125823974609375, -0.13269424438476562, -0.1241302490234375, -0.11556625366210938, -0.10700225830078125, -0.09843826293945312, -0.089874267578125, -0.08131027221679688, -0.07274627685546875, -0.06418228149414062, -0.0556182861328125, -0.047054290771484375, -0.03849029541015625, -0.029926300048828125, -0.0213623046875, -0.012798309326171875, -0.00423431396484375, 0.004329681396484375, 0.0128936767578125, 0.021457672119140625, 0.03002166748046875, 0.038585662841796875, 0.047149658203125, 0.055713653564453125, 0.06427764892578125, 0.07284164428710938, 0.0814056396484375, 0.08996963500976562, 0.09853363037109375, 0.10709762573242188, 0.11566162109375, 0.12422561645507812, 0.13278961181640625, 0.14135360717773438, 0.1499176025390625, 0.15848159790039062, 0.16704559326171875, 0.17560958862304688, 0.184173583984375, 0.19273757934570312, 0.20130157470703125, 0.20986557006835938, 0.2184295654296875, 0.22699356079101562, 0.23555755615234375, 0.24412155151367188, 0.252685546875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 14.0, 74.0, 641.0, 255.0, 23.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.353118896484375, -4.227870941162109, -3.102623224258423, -1.9773755073547363, -0.8521275520324707, 0.2731204032897949, 1.3983678817749023, 2.523615837097168, 3.6488637924194336, 4.774111747741699, 5.899359703063965, 7.024607181549072, 8.14985466003418, 9.275102615356445, 10.400350570678711, 11.525598526000977, 12.650846481323242, 13.776094436645508, 14.901342391967773, 16.02659034729004, 17.151838302612305, 18.27708625793457, 19.402332305908203, 20.52758026123047, 21.652828216552734, 22.778076171875, 23.903324127197266, 25.02857208251953, 26.153820037841797, 27.279067993164062, 28.404315948486328, 29.529563903808594, 30.65481185913086, 31.780059814453125, 32.90530776977539, 34.030555725097656, 35.15580368041992, 36.28105163574219, 37.40629959106445, 38.53154754638672, 39.656795501708984, 40.78204345703125, 41.907291412353516, 43.03253936767578, 44.15778732299805, 45.28303527832031, 46.40828323364258, 47.533531188964844, 48.658775329589844, 49.78402328491211, 50.909271240234375, 52.03451919555664, 53.159767150878906, 54.28501510620117, 55.41026306152344, 56.5355110168457, 57.66075897216797, 58.786006927490234, 59.9112548828125, 61.036502838134766, 62.16175079345703, 63.2869987487793, 64.41224670410156, 65.53749084472656, 66.6627426147461]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 14.0, 11.0, 15.0, 23.0, 34.0, 33.0, 42.0, 59.0, 53.0, 64.0, 59.0, 68.0, 65.0, 65.0, 77.0, 49.0, 58.0, 51.0, 37.0, 24.0, 20.0, 18.0, 13.0, 8.0, 10.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.233388900756836, -12.895090103149414, -12.556790351867676, -12.218491554260254, -11.880191802978516, -11.541893005371094, -11.203594207763672, -10.86529541015625, -10.526995658874512, -10.18869686126709, -9.850397109985352, -9.51209831237793, -9.173799514770508, -8.83549976348877, -8.497200965881348, -8.15890121459961, -7.8206024169921875, -7.482303142547607, -7.144003868103027, -6.8057050704956055, -6.467405796051025, -6.129106521606445, -5.790807723999023, -5.452508449554443, -5.114209175109863, -4.775909900665283, -4.437610626220703, -4.099311828613281, -3.761012554168701, -3.422713279724121, -3.08441424369812, -2.746115207672119, -2.407815933227539, -2.069516658782959, -1.731217622756958, -1.3929184675216675, -1.054619312286377, -0.7163201570510864, -0.3780210018157959, -0.03972196578979492, 0.29857730865478516, 0.6368764638900757, 0.9751756191253662, 1.3134747743606567, 1.6517739295959473, 1.9900730848312378, 2.3283722400665283, 2.6666712760925293, 3.0049705505371094, 3.3432698249816895, 3.6815688610076904, 4.019867897033691, 4.3581671714782715, 4.696466445922852, 5.034765243530273, 5.3730645179748535, 5.711363792419434, 6.049663066864014, 6.387962341308594, 6.726261138916016, 7.064560413360596, 7.402859687805176, 7.741158485412598, 8.079458236694336, 8.417757034301758]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 16.0, 6.0, 16.0, 21.0, 27.0, 40.0, 45.0, 73.0, 140.0, 278.0, 931.0, 4120.0, 35780.0, 3374217.0, 754974.0, 19435.0, 2910.0, 662.0, 230.0, 113.0, 59.0, 45.0, 31.0, 21.0, 13.0, 18.0, 13.0, 9.0, 7.0, 8.0, 4.0, 0.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-7.55078125, -7.3565673828125, -7.162353515625, -6.9681396484375, -6.77392578125, -6.5797119140625, -6.385498046875, -6.1912841796875, -5.9970703125, -5.8028564453125, -5.608642578125, -5.4144287109375, -5.22021484375, -5.0260009765625, -4.831787109375, -4.6375732421875, -4.443359375, -4.2491455078125, -4.054931640625, -3.8607177734375, -3.66650390625, -3.4722900390625, -3.278076171875, -3.0838623046875, -2.8896484375, -2.6954345703125, -2.501220703125, -2.3070068359375, -2.11279296875, -1.9185791015625, -1.724365234375, -1.5301513671875, -1.3359375, -1.1417236328125, -0.947509765625, -0.7532958984375, -0.55908203125, -0.3648681640625, -0.170654296875, 0.0235595703125, 0.2177734375, 0.4119873046875, 0.606201171875, 0.8004150390625, 0.99462890625, 1.1888427734375, 1.383056640625, 1.5772705078125, 1.771484375, 1.9656982421875, 2.159912109375, 2.3541259765625, 2.54833984375, 2.7425537109375, 2.936767578125, 3.1309814453125, 3.3251953125, 3.5194091796875, 3.713623046875, 3.9078369140625, 4.10205078125, 4.2962646484375, 4.490478515625, 4.6846923828125, 4.87890625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 16.0, 27.0, 34.0, 51.0, 63.0, 116.0, 121.0, 133.0, 131.0, 90.0, 74.0, 49.0, 26.0, 22.0, 15.0, 8.0, 2.0, 5.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.292266845703125, -5.14703369140625, -5.001800537109375, -4.8565673828125, -4.711334228515625, -4.56610107421875, -4.420867919921875, -4.275634765625, -4.130401611328125, -3.98516845703125, -3.839935302734375, -3.6947021484375, -3.549468994140625, -3.40423583984375, -3.259002685546875, -3.11376953125, -2.968536376953125, -2.82330322265625, -2.678070068359375, -2.5328369140625, -2.387603759765625, -2.24237060546875, -2.097137451171875, -1.951904296875, -1.806671142578125, -1.66143798828125, -1.516204833984375, -1.3709716796875, -1.225738525390625, -1.08050537109375, -0.935272216796875, -0.7900390625, -0.644805908203125, -0.49957275390625, -0.354339599609375, -0.2091064453125, -0.063873291015625, 0.08135986328125, 0.226593017578125, 0.371826171875, 0.517059326171875, 0.66229248046875, 0.807525634765625, 0.9527587890625, 1.097991943359375, 1.24322509765625, 1.388458251953125, 1.53369140625, 1.678924560546875, 1.82415771484375, 1.969390869140625, 2.1146240234375, 2.259857177734375, 2.40509033203125, 2.550323486328125, 2.695556640625, 2.840789794921875, 2.98602294921875, 3.131256103515625, 3.2764892578125, 3.421722412109375, 3.56695556640625, 3.712188720703125, 3.857421875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 18.0, 21.0, 68.0, 285.0, 28789.0, 4164340.0, 596.0, 116.0, 25.0, 17.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -32.094970703125, -31.12744140625, -30.159912109375, -29.1923828125, -28.224853515625, -27.25732421875, -26.289794921875, -25.322265625, -24.354736328125, -23.38720703125, -22.419677734375, -21.4521484375, -20.484619140625, -19.51708984375, -18.549560546875, -17.58203125, -16.614501953125, -15.64697265625, -14.679443359375, -13.7119140625, -12.744384765625, -11.77685546875, -10.809326171875, -9.841796875, -8.874267578125, -7.90673828125, -6.939208984375, -5.9716796875, -5.004150390625, -4.03662109375, -3.069091796875, -2.1015625, -1.134033203125, -0.16650390625, 0.801025390625, 1.7685546875, 2.736083984375, 3.70361328125, 4.671142578125, 5.638671875, 6.606201171875, 7.57373046875, 8.541259765625, 9.5087890625, 10.476318359375, 11.44384765625, 12.411376953125, 13.37890625, 14.346435546875, 15.31396484375, 16.281494140625, 17.2490234375, 18.216552734375, 19.18408203125, 20.151611328125, 21.119140625, 22.086669921875, 23.05419921875, 24.021728515625, 24.9892578125, 25.956787109375, 26.92431640625, 27.891845703125, 28.859375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 14.0, 21.0, 30.0, 48.0, 69.0, 78.0, 156.0, 239.0, 416.0, 999.0, 947.0, 426.0, 225.0, 131.0, 89.0, 54.0, 27.0, 23.0, 20.0, 15.0, 10.0, 3.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6817855834960938, -0.6555633544921875, -0.6293411254882812, -0.603118896484375, -0.5768966674804688, -0.5506744384765625, -0.5244522094726562, -0.49822998046875, -0.47200775146484375, -0.4457855224609375, -0.41956329345703125, -0.393341064453125, -0.36711883544921875, -0.3408966064453125, -0.31467437744140625, -0.2884521484375, -0.26222991943359375, -0.2360076904296875, -0.20978546142578125, -0.183563232421875, -0.15734100341796875, -0.1311187744140625, -0.10489654541015625, -0.07867431640625, -0.05245208740234375, -0.0262298583984375, -7.62939453125e-06, 0.026214599609375, 0.05243682861328125, 0.0786590576171875, 0.10488128662109375, 0.131103515625, 0.15732574462890625, 0.1835479736328125, 0.20977020263671875, 0.235992431640625, 0.26221466064453125, 0.2884368896484375, 0.31465911865234375, 0.34088134765625, 0.36710357666015625, 0.3933258056640625, 0.41954803466796875, 0.445770263671875, 0.47199249267578125, 0.4982147216796875, 0.5244369506835938, 0.5506591796875, 0.5768814086914062, 0.6031036376953125, 0.6293258666992188, 0.655548095703125, 0.6817703247070312, 0.7079925537109375, 0.7342147827148438, 0.76043701171875, 0.7866592407226562, 0.8128814697265625, 0.8391036987304688, 0.865325927734375, 0.8915481567382812, 0.9177703857421875, 0.9439926147460938, 0.97021484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 8.0, 5.0, 5.0, 11.0, 14.0, 24.0, 37.0, 83.0, 121.0, 182.0, 175.0, 144.0, 74.0, 50.0, 23.0, 18.0, 10.0, 6.0, 9.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.773680210113525, -4.615267753601074, -4.456855297088623, -4.29844331741333, -4.140030860900879, -3.9816184043884277, -3.8232059478759766, -3.6647934913635254, -3.5063812732696533, -3.347968816757202, -3.18955659866333, -3.031144142150879, -2.8727316856384277, -2.7143194675445557, -2.5559070110321045, -2.3974947929382324, -2.2390823364257812, -2.08066987991333, -1.922257661819458, -1.7638452053070068, -1.6054328680038452, -1.4470205307006836, -1.2886080741882324, -1.1301957368850708, -0.9717833995819092, -0.8133710622787476, -0.6549586653709412, -0.49654629826545715, -0.33813393115997314, -0.17972159385681152, -0.021309196949005127, 0.13710319995880127, 0.2955150604248047, 0.4539274275302887, 0.6123397946357727, 0.7707521915435791, 0.9291645288467407, 1.0875768661499023, 1.2459893226623535, 1.4044016599655151, 1.5628139972686768, 1.7212263345718384, 1.879638671875, 2.038051128387451, 2.1964635848999023, 2.3548758029937744, 2.5132882595062256, 2.6717004776000977, 2.830112934112549, 2.988525390625, 3.146937608718872, 3.3053500652313232, 3.4637622833251953, 3.6221747398376465, 3.7805871963500977, 3.938999652862549, 4.097412109375, 4.255824565887451, 4.414237022399902, 4.572649002075195, 4.7310614585876465, 4.889473915100098, 5.047886371612549, 5.206298828125, 5.364710807800293]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 4.0, 10.0, 26.0, 26.0, 36.0, 57.0, 76.0, 93.0, 121.0, 127.0, 94.0, 86.0, 90.0, 46.0, 41.0, 31.0, 14.0, 11.0, 9.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2591705322265625, -5.109409332275391, -4.959648609161377, -4.809887409210205, -4.660126686096191, -4.5103654861450195, -4.360604763031006, -4.210843563079834, -4.06108283996582, -3.9113218784332275, -3.7615609169006348, -3.611799955368042, -3.462038993835449, -3.3122780323028564, -3.1625170707702637, -3.012755870819092, -2.862994909286499, -2.7132339477539062, -2.5634729862213135, -2.4137120246887207, -2.263951063156128, -2.114190101623535, -1.9644290208816528, -1.81466805934906, -1.6649070978164673, -1.5151461362838745, -1.3653851747512817, -1.2156240940093994, -1.0658631324768066, -0.9161022305488586, -0.7663412094116211, -0.6165802478790283, -0.46681928634643555, -0.3170583248138428, -0.1672973334789276, -0.01753634214401245, 0.13222461938858032, 0.2819855809211731, 0.43174660205841064, 0.5815075635910034, 0.7312685251235962, 0.881029486656189, 1.0307904481887817, 1.180551528930664, 1.3303124904632568, 1.4800734519958496, 1.6298344135284424, 1.7795953750610352, 1.929356336593628, 2.0791172981262207, 2.2288782596588135, 2.3786392211914062, 2.528400182723999, 2.678161144256592, 2.8279223442077637, 2.9776830673217773, 3.127444267272949, 3.277205228805542, 3.4269661903381348, 3.5767271518707275, 3.7264881134033203, 3.876249074935913, 4.026010036468506, 4.175771236419678, 4.325531959533691]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 9.0, 10.0, 18.0, 29.0, 47.0, 150.0, 367.0, 1405.0, 8084.0, 92338.0, 816030.0, 118070.0, 9777.0, 1553.0, 388.0, 128.0, 75.0, 36.0, 20.0, 15.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.671875, -0.6491317749023438, -0.6263885498046875, -0.6036453247070312, -0.580902099609375, -0.5581588745117188, -0.5354156494140625, -0.5126724243164062, -0.48992919921875, -0.46718597412109375, -0.4444427490234375, -0.42169952392578125, -0.398956298828125, -0.37621307373046875, -0.3534698486328125, -0.33072662353515625, -0.3079833984375, -0.28524017333984375, -0.2624969482421875, -0.23975372314453125, -0.217010498046875, -0.19426727294921875, -0.1715240478515625, -0.14878082275390625, -0.12603759765625, -0.10329437255859375, -0.0805511474609375, -0.05780792236328125, -0.035064697265625, -0.01232147216796875, 0.0104217529296875, 0.03316497802734375, 0.055908203125, 0.07865142822265625, 0.1013946533203125, 0.12413787841796875, 0.146881103515625, 0.16962432861328125, 0.1923675537109375, 0.21511077880859375, 0.23785400390625, 0.26059722900390625, 0.2833404541015625, 0.30608367919921875, 0.328826904296875, 0.35157012939453125, 0.3743133544921875, 0.39705657958984375, 0.4197998046875, 0.44254302978515625, 0.4652862548828125, 0.48802947998046875, 0.510772705078125, 0.5335159301757812, 0.5562591552734375, 0.5790023803710938, 0.60174560546875, 0.6244888305664062, 0.6472320556640625, 0.6699752807617188, 0.692718505859375, 0.7154617309570312, 0.7382049560546875, 0.7609481811523438, 0.78369140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 13.0, 15.0, 28.0, 28.0, 77.0, 87.0, 142.0, 158.0, 135.0, 107.0, 84.0, 57.0, 30.0, 13.0, 11.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40234375, -4.27886962890625, -4.1553955078125, -4.03192138671875, -3.908447265625, -3.78497314453125, -3.6614990234375, -3.53802490234375, -3.41455078125, -3.29107666015625, -3.1676025390625, -3.04412841796875, -2.920654296875, -2.79718017578125, -2.6737060546875, -2.55023193359375, -2.4267578125, -2.30328369140625, -2.1798095703125, -2.05633544921875, -1.932861328125, -1.80938720703125, -1.6859130859375, -1.56243896484375, -1.43896484375, -1.31549072265625, -1.1920166015625, -1.06854248046875, -0.945068359375, -0.82159423828125, -0.6981201171875, -0.57464599609375, -0.451171875, -0.32769775390625, -0.2042236328125, -0.08074951171875, 0.042724609375, 0.16619873046875, 0.2896728515625, 0.41314697265625, 0.53662109375, 0.66009521484375, 0.7835693359375, 0.90704345703125, 1.030517578125, 1.15399169921875, 1.2774658203125, 1.40093994140625, 1.5244140625, 1.64788818359375, 1.7713623046875, 1.89483642578125, 2.018310546875, 2.14178466796875, 2.2652587890625, 2.38873291015625, 2.51220703125, 2.63568115234375, 2.7591552734375, 2.88262939453125, 3.006103515625, 3.12957763671875, 3.2530517578125, 3.37652587890625, 3.5]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 3.0, 12.0, 14.0, 7.0, 20.0, 28.0, 43.0, 88.0, 96.0, 156.0, 327.0, 717.0, 1959.0, 7250.0, 40566.0, 323723.0, 565456.0, 89604.0, 13327.0, 3060.0, 1056.0, 406.0, 235.0, 131.0, 70.0, 59.0, 32.0, 27.0, 20.0, 9.0, 8.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394287109375, -0.3792381286621094, -0.36418914794921875, -0.3491401672363281, -0.3340911865234375, -0.3190422058105469, -0.30399322509765625, -0.2889442443847656, -0.273895263671875, -0.2588462829589844, -0.24379730224609375, -0.22874832153320312, -0.2136993408203125, -0.19865036010742188, -0.18360137939453125, -0.16855239868164062, -0.15350341796875, -0.13845443725585938, -0.12340545654296875, -0.10835647583007812, -0.0933074951171875, -0.07825851440429688, -0.06320953369140625, -0.048160552978515625, -0.033111572265625, -0.018062591552734375, -0.00301361083984375, 0.012035369873046875, 0.0270843505859375, 0.042133331298828125, 0.05718231201171875, 0.07223129272460938, 0.0872802734375, 0.10232925415039062, 0.11737823486328125, 0.13242721557617188, 0.1474761962890625, 0.16252517700195312, 0.17757415771484375, 0.19262313842773438, 0.207672119140625, 0.22272109985351562, 0.23777008056640625, 0.2528190612792969, 0.2678680419921875, 0.2829170227050781, 0.29796600341796875, 0.3130149841308594, 0.32806396484375, 0.3431129455566406, 0.35816192626953125, 0.3732109069824219, 0.3882598876953125, 0.4033088684082031, 0.41835784912109375, 0.4334068298339844, 0.448455810546875, 0.4635047912597656, 0.47855377197265625, 0.4936027526855469, 0.5086517333984375, 0.5237007141113281, 0.5387496948242188, 0.5537986755371094, 0.56884765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 9.0, 9.0, 12.0, 11.0, 16.0, 24.0, 35.0, 29.0, 30.0, 42.0, 36.0, 38.0, 50.0, 56.0, 39.0, 64.0, 54.0, 46.0, 52.0, 40.0, 51.0, 49.0, 23.0, 37.0, 21.0, 21.0, 21.0, 24.0, 17.0, 14.0, 8.0, 5.0, 2.0, 7.0, 4.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.080078125, -2.964019775390625, -2.84796142578125, -2.731903076171875, -2.6158447265625, -2.499786376953125, -2.38372802734375, -2.267669677734375, -2.151611328125, -2.035552978515625, -1.91949462890625, -1.803436279296875, -1.6873779296875, -1.571319580078125, -1.45526123046875, -1.339202880859375, -1.22314453125, -1.107086181640625, -0.99102783203125, -0.874969482421875, -0.7589111328125, -0.642852783203125, -0.52679443359375, -0.410736083984375, -0.294677734375, -0.178619384765625, -0.06256103515625, 0.053497314453125, 0.1695556640625, 0.285614013671875, 0.40167236328125, 0.517730712890625, 0.6337890625, 0.749847412109375, 0.86590576171875, 0.981964111328125, 1.0980224609375, 1.214080810546875, 1.33013916015625, 1.446197509765625, 1.562255859375, 1.678314208984375, 1.79437255859375, 1.910430908203125, 2.0264892578125, 2.142547607421875, 2.25860595703125, 2.374664306640625, 2.49072265625, 2.606781005859375, 2.72283935546875, 2.838897705078125, 2.9549560546875, 3.071014404296875, 3.18707275390625, 3.303131103515625, 3.419189453125, 3.535247802734375, 3.65130615234375, 3.767364501953125, 3.8834228515625, 3.999481201171875, 4.11553955078125, 4.231597900390625, 4.34765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 14.0, 10.0, 19.0, 54.0, 111.0, 276.0, 1083.0, 9813.0, 870221.0, 162484.0, 3437.0, 614.0, 212.0, 88.0, 44.0, 30.0, 8.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66357421875, -0.6445159912109375, -0.625457763671875, -0.6063995361328125, -0.58734130859375, -0.5682830810546875, -0.549224853515625, -0.5301666259765625, -0.5111083984375, -0.4920501708984375, -0.472991943359375, -0.4539337158203125, -0.43487548828125, -0.4158172607421875, -0.396759033203125, -0.3777008056640625, -0.358642578125, -0.3395843505859375, -0.320526123046875, -0.3014678955078125, -0.28240966796875, -0.2633514404296875, -0.244293212890625, -0.2252349853515625, -0.2061767578125, -0.1871185302734375, -0.168060302734375, -0.1490020751953125, -0.12994384765625, -0.1108856201171875, -0.091827392578125, -0.0727691650390625, -0.0537109375, -0.0346527099609375, -0.015594482421875, 0.0034637451171875, 0.02252197265625, 0.0415802001953125, 0.060638427734375, 0.0796966552734375, 0.0987548828125, 0.1178131103515625, 0.136871337890625, 0.1559295654296875, 0.17498779296875, 0.1940460205078125, 0.213104248046875, 0.2321624755859375, 0.251220703125, 0.2702789306640625, 0.289337158203125, 0.3083953857421875, 0.32745361328125, 0.3465118408203125, 0.365570068359375, 0.3846282958984375, 0.4036865234375, 0.4227447509765625, 0.441802978515625, 0.4608612060546875, 0.47991943359375, 0.4989776611328125, 0.518035888671875, 0.5370941162109375, 0.55615234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 18.0, 15.0, 33.0, 66.0, 82.0, 182.0, 210.0, 159.0, 115.0, 50.0, 32.0, 18.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00023066997528076172, -0.00022581685334444046, -0.0002209637314081192, -0.00021611060947179794, -0.00021125748753547668, -0.00020640436559915543, -0.00020155124366283417, -0.0001966981217265129, -0.00019184499979019165, -0.0001869918778538704, -0.00018213875591754913, -0.00017728563398122787, -0.00017243251204490662, -0.00016757939010858536, -0.0001627262681722641, -0.00015787314623594284, -0.00015302002429962158, -0.00014816690236330032, -0.00014331378042697906, -0.0001384606584906578, -0.00013360753655433655, -0.0001287544146180153, -0.00012390129268169403, -0.00011904817074537277, -0.00011419504880905151, -0.00010934192687273026, -0.000104488804936409, -9.963568300008774e-05, -9.478256106376648e-05, -8.992943912744522e-05, -8.507631719112396e-05, -8.02231952548027e-05, -7.537007331848145e-05, -7.051695138216019e-05, -6.566382944583893e-05, -6.081070750951767e-05, -5.595758557319641e-05, -5.110446363687515e-05, -4.6251341700553894e-05, -4.1398219764232635e-05, -3.654509782791138e-05, -3.169197589159012e-05, -2.683885395526886e-05, -2.19857320189476e-05, -1.7132610082626343e-05, -1.2279488146305084e-05, -7.426366209983826e-06, -2.573244273662567e-06, 2.2798776626586914e-06, 7.13299959897995e-06, 1.1986121535301208e-05, 1.6839243471622467e-05, 2.1692365407943726e-05, 2.6545487344264984e-05, 3.139860928058624e-05, 3.62517312169075e-05, 4.110485315322876e-05, 4.595797508955002e-05, 5.081109702587128e-05, 5.5664218962192535e-05, 6.0517340898513794e-05, 6.537046283483505e-05, 7.022358477115631e-05, 7.507670670747757e-05, 7.992982864379883e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 11.0, 10.0, 21.0, 33.0, 49.0, 117.0, 264.0, 971.0, 6134.0, 151033.0, 865688.0, 21467.0, 1948.0, 451.0, 166.0, 71.0, 40.0, 22.0, 15.0, 9.0, 9.0, 7.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390380859375, -0.3760490417480469, -0.36171722412109375, -0.3473854064941406, -0.3330535888671875, -0.3187217712402344, -0.30438995361328125, -0.2900581359863281, -0.275726318359375, -0.2613945007324219, -0.24706268310546875, -0.23273086547851562, -0.2183990478515625, -0.20406723022460938, -0.18973541259765625, -0.17540359497070312, -0.16107177734375, -0.14673995971679688, -0.13240814208984375, -0.11807632446289062, -0.1037445068359375, -0.08941268920898438, -0.07508087158203125, -0.060749053955078125, -0.046417236328125, -0.032085418701171875, -0.01775360107421875, -0.003421783447265625, 0.0109100341796875, 0.025241851806640625, 0.03957366943359375, 0.053905487060546875, 0.0682373046875, 0.08256912231445312, 0.09690093994140625, 0.11123275756835938, 0.1255645751953125, 0.13989639282226562, 0.15422821044921875, 0.16856002807617188, 0.182891845703125, 0.19722366333007812, 0.21155548095703125, 0.22588729858398438, 0.2402191162109375, 0.2545509338378906, 0.26888275146484375, 0.2832145690917969, 0.29754638671875, 0.3118782043457031, 0.32621002197265625, 0.3405418395996094, 0.3548736572265625, 0.3692054748535156, 0.38353729248046875, 0.3978691101074219, 0.412200927734375, 0.4265327453613281, 0.44086456298828125, 0.4551963806152344, 0.4695281982421875, 0.4838600158691406, 0.49819183349609375, 0.5125236511230469, 0.52685546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 5.0, 2.0, 12.0, 9.0, 17.0, 18.0, 22.0, 35.0, 58.0, 106.0, 154.0, 217.0, 112.0, 86.0, 48.0, 27.0, 19.0, 15.0, 15.0, 11.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08740234375, -0.08499336242675781, -0.08258438110351562, -0.08017539978027344, -0.07776641845703125, -0.07535743713378906, -0.07294845581054688, -0.07053947448730469, -0.0681304931640625, -0.06572151184082031, -0.06331253051757812, -0.06090354919433594, -0.05849456787109375, -0.05608558654785156, -0.053676605224609375, -0.05126762390136719, -0.048858642578125, -0.04644966125488281, -0.044040679931640625, -0.04163169860839844, -0.03922271728515625, -0.03681373596191406, -0.034404754638671875, -0.03199577331542969, -0.0295867919921875, -0.027177810668945312, -0.024768829345703125, -0.022359848022460938, -0.01995086669921875, -0.017541885375976562, -0.015132904052734375, -0.012723922729492188, -0.01031494140625, -0.007905960083007812, -0.005496978759765625, -0.0030879974365234375, -0.00067901611328125, 0.0017299652099609375, 0.004138946533203125, 0.0065479278564453125, 0.0089569091796875, 0.011365890502929688, 0.013774871826171875, 0.016183853149414062, 0.01859283447265625, 0.021001815795898438, 0.023410797119140625, 0.025819778442382812, 0.028228759765625, 0.030637741088867188, 0.033046722412109375, 0.03545570373535156, 0.03786468505859375, 0.04027366638183594, 0.042682647705078125, 0.04509162902832031, 0.0475006103515625, 0.04990959167480469, 0.052318572998046875, 0.05472755432128906, 0.05713653564453125, 0.05954551696777344, 0.061954498291015625, 0.06436347961425781, 0.0667724609375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 12.0, 18.0, 42.0, 102.0, 213.0, 273.0, 166.0, 81.0, 36.0, 20.0, 9.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2689971923828125, -4.1184234619140625, -3.9678499698638916, -3.8172764778137207, -3.6667027473449707, -3.5161292552948, -3.365555763244629, -3.214982032775879, -3.064408302307129, -2.913834810256958, -2.763261079788208, -2.612687587738037, -2.462113857269287, -2.311540365219116, -2.1609668731689453, -2.0103931427001953, -1.8598196506500244, -1.709246039390564, -1.5586724281311035, -1.4080989360809326, -1.2575252056121826, -1.1069517135620117, -0.9563781023025513, -0.8058044910430908, -0.6552308797836304, -0.5046572685241699, -0.35408368706703186, -0.2035101056098938, -0.05293649435043335, 0.0976371169090271, 0.24821066856384277, 0.3987842798233032, 0.5493578910827637, 0.6999315023422241, 0.8505051136016846, 1.0010786056518555, 1.1516523361206055, 1.3022258281707764, 1.4527994394302368, 1.6033730506896973, 1.7539466619491577, 1.9045202732086182, 2.055093765258789, 2.205667495727539, 2.35624098777771, 2.50681471824646, 2.657388210296631, 2.807961940765381, 2.9585354328155518, 3.1091089248657227, 3.2596826553344727, 3.4102561473846436, 3.5608298778533936, 3.7114033699035645, 3.8619771003723145, 4.012550354003906, 4.163124084472656, 4.313697814941406, 4.464271068572998, 4.614844799041748, 4.765418529510498, 4.915992259979248, 5.06656551361084, 5.21713924407959, 5.36771297454834]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 19.0, 41.0, 42.0, 73.0, 114.0, 149.0, 158.0, 137.0, 87.0, 66.0, 43.0, 26.0, 16.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.244857311248779, -4.124806880950928, -4.004756927490234, -3.884706735610962, -3.7646565437316895, -3.644606113433838, -3.5245561599731445, -3.404505729675293, -3.2844555377960205, -3.164405345916748, -3.0443551540374756, -2.924304962158203, -2.8042547702789307, -2.684204578399658, -2.5641541481018066, -2.444103956222534, -2.3240537643432617, -2.2040035724639893, -2.083953380584717, -1.9639031887054443, -1.8438528776168823, -1.7238026857376099, -1.6037524938583374, -1.4837021827697754, -1.363652229309082, -1.2436020374298096, -1.123551845550537, -1.0035016536712646, -0.8834513425827026, -0.7634011507034302, -0.6433509588241577, -0.5233007073402405, -0.40325045585632324, -0.2832002341747284, -0.16315002739429474, -0.043099820613861084, 0.07695040106773376, 0.1970006227493286, 0.3170508146286011, 0.4371010661125183, 0.5571512579917908, 0.6772014498710632, 0.7972517013549805, 0.9173018932342529, 1.0373520851135254, 1.1574022769927979, 1.2774524688720703, 1.3975027799606323, 1.5175529718399048, 1.6376031637191772, 1.7576533555984497, 1.8777036666870117, 1.9977538585662842, 2.1178040504455566, 2.237854242324829, 2.3579044342041016, 2.477954626083374, 2.5980048179626465, 2.718055009841919, 2.8381052017211914, 2.958155393600464, 3.0782055854797363, 3.198256015777588, 3.3183062076568604, 3.438356399536133]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 7.0, 8.0, 11.0, 11.0, 20.0, 20.0, 35.0, 89.0, 248.0, 711.0, 3096.0, 22294.0, 388823.0, 596741.0, 31045.0, 4013.0, 873.0, 277.0, 98.0, 56.0, 24.0, 21.0, 12.0, 5.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.798095703125, -2.65869140625, -2.519287109375, -2.3798828125, -2.240478515625, -2.10107421875, -1.961669921875, -1.822265625, -1.682861328125, -1.54345703125, -1.404052734375, -1.2646484375, -1.125244140625, -0.98583984375, -0.846435546875, -0.70703125, -0.567626953125, -0.42822265625, -0.288818359375, -0.1494140625, -0.010009765625, 0.12939453125, 0.268798828125, 0.408203125, 0.547607421875, 0.68701171875, 0.826416015625, 0.9658203125, 1.105224609375, 1.24462890625, 1.384033203125, 1.5234375, 1.662841796875, 1.80224609375, 1.941650390625, 2.0810546875, 2.220458984375, 2.35986328125, 2.499267578125, 2.638671875, 2.778076171875, 2.91748046875, 3.056884765625, 3.1962890625, 3.335693359375, 3.47509765625, 3.614501953125, 3.75390625, 3.893310546875, 4.03271484375, 4.172119140625, 4.3115234375, 4.450927734375, 4.59033203125, 4.729736328125, 4.869140625, 5.008544921875, 5.14794921875, 5.287353515625, 5.4267578125, 5.566162109375, 5.70556640625, 5.844970703125, 5.984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 8.0, 4.0, 9.0, 6.0, 14.0, 14.0, 23.0, 40.0, 58.0, 65.0, 84.0, 132.0, 122.0, 106.0, 92.0, 76.0, 55.0, 29.0, 28.0, 13.0, 10.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.88018798828125, -7.6510009765625, -7.42181396484375, -7.192626953125, -6.96343994140625, -6.7342529296875, -6.50506591796875, -6.27587890625, -6.04669189453125, -5.8175048828125, -5.58831787109375, -5.359130859375, -5.12994384765625, -4.9007568359375, -4.67156982421875, -4.4423828125, -4.21319580078125, -3.9840087890625, -3.75482177734375, -3.525634765625, -3.29644775390625, -3.0672607421875, -2.83807373046875, -2.60888671875, -2.37969970703125, -2.1505126953125, -1.92132568359375, -1.692138671875, -1.46295166015625, -1.2337646484375, -1.00457763671875, -0.775390625, -0.54620361328125, -0.3170166015625, -0.08782958984375, 0.141357421875, 0.37054443359375, 0.5997314453125, 0.82891845703125, 1.05810546875, 1.28729248046875, 1.5164794921875, 1.74566650390625, 1.974853515625, 2.20404052734375, 2.4332275390625, 2.66241455078125, 2.8916015625, 3.12078857421875, 3.3499755859375, 3.57916259765625, 3.808349609375, 4.03753662109375, 4.2667236328125, 4.49591064453125, 4.72509765625, 4.95428466796875, 5.1834716796875, 5.41265869140625, 5.641845703125, 5.87103271484375, 6.1002197265625, 6.32940673828125, 6.55859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 12.0, 7.0, 16.0, 18.0, 18.0, 17.0, 26.0, 40.0, 46.0, 52.0, 53.0, 60.0, 87.0, 135.0, 215.0, 527.0, 2399.0, 24841.0, 792609.0, 215820.0, 9007.0, 1376.0, 388.0, 186.0, 110.0, 92.0, 73.0, 40.0, 53.0, 40.0, 30.0, 25.0, 21.0, 14.0, 17.0, 13.0, 17.0, 10.0, 10.0, 3.0, 2.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.85546875, -4.70281982421875, -4.5501708984375, -4.39752197265625, -4.244873046875, -4.09222412109375, -3.9395751953125, -3.78692626953125, -3.63427734375, -3.48162841796875, -3.3289794921875, -3.17633056640625, -3.023681640625, -2.87103271484375, -2.7183837890625, -2.56573486328125, -2.4130859375, -2.26043701171875, -2.1077880859375, -1.95513916015625, -1.802490234375, -1.64984130859375, -1.4971923828125, -1.34454345703125, -1.19189453125, -1.03924560546875, -0.8865966796875, -0.73394775390625, -0.581298828125, -0.42864990234375, -0.2760009765625, -0.12335205078125, 0.029296875, 0.18194580078125, 0.3345947265625, 0.48724365234375, 0.639892578125, 0.79254150390625, 0.9451904296875, 1.09783935546875, 1.25048828125, 1.40313720703125, 1.5557861328125, 1.70843505859375, 1.861083984375, 2.01373291015625, 2.1663818359375, 2.31903076171875, 2.4716796875, 2.62432861328125, 2.7769775390625, 2.92962646484375, 3.082275390625, 3.23492431640625, 3.3875732421875, 3.54022216796875, 3.69287109375, 3.84552001953125, 3.9981689453125, 4.15081787109375, 4.303466796875, 4.45611572265625, 4.6087646484375, 4.76141357421875, 4.9140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 7.0, 11.0, 6.0, 19.0, 12.0, 11.0, 17.0, 18.0, 24.0, 27.0, 26.0, 33.0, 24.0, 43.0, 43.0, 46.0, 50.0, 33.0, 47.0, 37.0, 43.0, 32.0, 34.0, 44.0, 37.0, 28.0, 24.0, 23.0, 36.0, 29.0, 18.0, 13.0, 18.0, 11.0, 18.0, 11.0, 10.0, 2.0, 10.0, 3.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.77734375, -3.655517578125, -3.53369140625, -3.411865234375, -3.2900390625, -3.168212890625, -3.04638671875, -2.924560546875, -2.802734375, -2.680908203125, -2.55908203125, -2.437255859375, -2.3154296875, -2.193603515625, -2.07177734375, -1.949951171875, -1.828125, -1.706298828125, -1.58447265625, -1.462646484375, -1.3408203125, -1.218994140625, -1.09716796875, -0.975341796875, -0.853515625, -0.731689453125, -0.60986328125, -0.488037109375, -0.3662109375, -0.244384765625, -0.12255859375, -0.000732421875, 0.12109375, 0.242919921875, 0.36474609375, 0.486572265625, 0.6083984375, 0.730224609375, 0.85205078125, 0.973876953125, 1.095703125, 1.217529296875, 1.33935546875, 1.461181640625, 1.5830078125, 1.704833984375, 1.82666015625, 1.948486328125, 2.0703125, 2.192138671875, 2.31396484375, 2.435791015625, 2.5576171875, 2.679443359375, 2.80126953125, 2.923095703125, 3.044921875, 3.166748046875, 3.28857421875, 3.410400390625, 3.5322265625, 3.654052734375, 3.77587890625, 3.897705078125, 4.01953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 8.0, 9.0, 8.0, 20.0, 29.0, 44.0, 78.0, 102.0, 171.0, 383.0, 652.0, 1527.0, 3733.0, 10886.0, 37397.0, 160646.0, 558304.0, 207685.0, 45965.0, 12796.0, 4576.0, 1798.0, 785.0, 396.0, 208.0, 135.0, 82.0, 47.0, 29.0, 18.0, 15.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4970703125, -0.48133087158203125, -0.4655914306640625, -0.44985198974609375, -0.434112548828125, -0.41837310791015625, -0.4026336669921875, -0.38689422607421875, -0.37115478515625, -0.35541534423828125, -0.3396759033203125, -0.32393646240234375, -0.308197021484375, -0.29245758056640625, -0.2767181396484375, -0.26097869873046875, -0.2452392578125, -0.22949981689453125, -0.2137603759765625, -0.19802093505859375, -0.182281494140625, -0.16654205322265625, -0.1508026123046875, -0.13506317138671875, -0.11932373046875, -0.10358428955078125, -0.0878448486328125, -0.07210540771484375, -0.056365966796875, -0.04062652587890625, -0.0248870849609375, -0.00914764404296875, 0.006591796875, 0.02233123779296875, 0.0380706787109375, 0.05381011962890625, 0.069549560546875, 0.08528900146484375, 0.1010284423828125, 0.11676788330078125, 0.13250732421875, 0.14824676513671875, 0.1639862060546875, 0.17972564697265625, 0.195465087890625, 0.21120452880859375, 0.2269439697265625, 0.24268341064453125, 0.2584228515625, 0.27416229248046875, 0.2899017333984375, 0.30564117431640625, 0.321380615234375, 0.33712005615234375, 0.3528594970703125, 0.36859893798828125, 0.38433837890625, 0.40007781982421875, 0.4158172607421875, 0.43155670166015625, 0.447296142578125, 0.46303558349609375, 0.4787750244140625, 0.49451446533203125, 0.51025390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 6.0, 3.0, 3.0, 3.0, 12.0, 12.0, 8.0, 15.0, 14.0, 17.0, 16.0, 21.0, 23.0, 33.0, 42.0, 51.0, 63.0, 52.0, 77.0, 84.0, 70.0, 63.0, 48.0, 51.0, 44.0, 21.0, 32.0, 25.0, 20.0, 19.0, 5.0, 11.0, 8.0, 5.0, 8.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-9.393692016601562e-05, -9.143166244029999e-05, -8.892640471458435e-05, -8.642114698886871e-05, -8.391588926315308e-05, -8.141063153743744e-05, -7.89053738117218e-05, -7.640011608600616e-05, -7.389485836029053e-05, -7.138960063457489e-05, -6.888434290885925e-05, -6.637908518314362e-05, -6.387382745742798e-05, -6.136856973171234e-05, -5.8863312005996704e-05, -5.635805428028107e-05, -5.385279655456543e-05, -5.134753882884979e-05, -4.8842281103134155e-05, -4.633702337741852e-05, -4.383176565170288e-05, -4.1326507925987244e-05, -3.8821250200271606e-05, -3.631599247455597e-05, -3.381073474884033e-05, -3.1305477023124695e-05, -2.8800219297409058e-05, -2.629496157169342e-05, -2.3789703845977783e-05, -2.1284446120262146e-05, -1.877918839454651e-05, -1.627393066883087e-05, -1.3768672943115234e-05, -1.1263415217399597e-05, -8.75815749168396e-06, -6.252899765968323e-06, -3.7476420402526855e-06, -1.2423843145370483e-06, 1.2628734111785889e-06, 3.768131136894226e-06, 6.273388862609863e-06, 8.7786465883255e-06, 1.1283904314041138e-05, 1.3789162039756775e-05, 1.6294419765472412e-05, 1.879967749118805e-05, 2.1304935216903687e-05, 2.3810192942619324e-05, 2.631545066833496e-05, 2.8820708394050598e-05, 3.1325966119766235e-05, 3.383122384548187e-05, 3.633648157119751e-05, 3.884173929691315e-05, 4.1346997022628784e-05, 4.385225474834442e-05, 4.635751247406006e-05, 4.8862770199775696e-05, 5.136802792549133e-05, 5.387328565120697e-05, 5.637854337692261e-05, 5.8883801102638245e-05, 6.138905882835388e-05, 6.389431655406952e-05, 6.639957427978516e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 10.0, 5.0, 5.0, 10.0, 15.0, 16.0, 23.0, 37.0, 50.0, 86.0, 134.0, 236.0, 412.0, 887.0, 1988.0, 4659.0, 13821.0, 52804.0, 275021.0, 544251.0, 114778.0, 25913.0, 7789.0, 2864.0, 1298.0, 632.0, 319.0, 168.0, 115.0, 59.0, 48.0, 26.0, 24.0, 11.0, 10.0, 13.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5256576538085938, -0.5088348388671875, -0.49201202392578125, -0.475189208984375, -0.45836639404296875, -0.4415435791015625, -0.42472076416015625, -0.40789794921875, -0.39107513427734375, -0.3742523193359375, -0.35742950439453125, -0.340606689453125, -0.32378387451171875, -0.3069610595703125, -0.29013824462890625, -0.2733154296875, -0.25649261474609375, -0.2396697998046875, -0.22284698486328125, -0.206024169921875, -0.18920135498046875, -0.1723785400390625, -0.15555572509765625, -0.13873291015625, -0.12191009521484375, -0.1050872802734375, -0.08826446533203125, -0.071441650390625, -0.05461883544921875, -0.0377960205078125, -0.02097320556640625, -0.004150390625, 0.01267242431640625, 0.0294952392578125, 0.04631805419921875, 0.063140869140625, 0.07996368408203125, 0.0967864990234375, 0.11360931396484375, 0.13043212890625, 0.14725494384765625, 0.1640777587890625, 0.18090057373046875, 0.197723388671875, 0.21454620361328125, 0.2313690185546875, 0.24819183349609375, 0.2650146484375, 0.28183746337890625, 0.2986602783203125, 0.31548309326171875, 0.332305908203125, 0.34912872314453125, 0.3659515380859375, 0.38277435302734375, 0.39959716796875, 0.41641998291015625, 0.4332427978515625, 0.45006561279296875, 0.466888427734375, 0.48371124267578125, 0.5005340576171875, 0.5173568725585938, 0.5341796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 13.0, 15.0, 17.0, 22.0, 29.0, 30.0, 31.0, 37.0, 64.0, 59.0, 75.0, 95.0, 77.0, 86.0, 53.0, 41.0, 51.0, 29.0, 35.0, 34.0, 19.0, 13.0, 12.0, 11.0, 10.0, 8.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.26278114318847656, -0.2548103332519531, -0.2468395233154297, -0.23886871337890625, -0.2308979034423828, -0.22292709350585938, -0.21495628356933594, -0.2069854736328125, -0.19901466369628906, -0.19104385375976562, -0.1830730438232422, -0.17510223388671875, -0.1671314239501953, -0.15916061401367188, -0.15118980407714844, -0.143218994140625, -0.13524818420410156, -0.12727737426757812, -0.11930656433105469, -0.11133575439453125, -0.10336494445800781, -0.09539413452148438, -0.08742332458496094, -0.0794525146484375, -0.07148170471191406, -0.06351089477539062, -0.05554008483886719, -0.04756927490234375, -0.03959846496582031, -0.031627655029296875, -0.023656845092773438, -0.01568603515625, -0.0077152252197265625, 0.000255584716796875, 0.008226394653320312, 0.01619720458984375, 0.024168014526367188, 0.032138824462890625, 0.04010963439941406, 0.0480804443359375, 0.05605125427246094, 0.06402206420898438, 0.07199287414550781, 0.07996368408203125, 0.08793449401855469, 0.09590530395507812, 0.10387611389160156, 0.111846923828125, 0.11981773376464844, 0.12778854370117188, 0.1357593536376953, 0.14373016357421875, 0.1517009735107422, 0.15967178344726562, 0.16764259338378906, 0.1756134033203125, 0.18358421325683594, 0.19155502319335938, 0.1995258331298828, 0.20749664306640625, 0.2154674530029297, 0.22343826293945312, 0.23140907287597656, 0.2393798828125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 31.0, 90.0, 390.0, 343.0, 102.0, 27.0, 10.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.983829021453857, -5.384790420532227, -4.785751819610596, -4.186713218688965, -3.587674617767334, -2.988636016845703, -2.3895974159240723, -1.7905588150024414, -1.1915202140808105, -0.5924816131591797, 0.006556987762451172, 0.605595588684082, 1.204634189605713, 1.8036727905273438, 2.4027113914489746, 3.0017499923706055, 3.6007885932922363, 4.199827194213867, 4.798865795135498, 5.397904396057129, 5.99694299697876, 6.595981597900391, 7.1950201988220215, 7.794058799743652, 8.393096923828125, 8.992136001586914, 9.591174125671387, 10.19021224975586, 10.789251327514648, 11.388290405273438, 11.98732852935791, 12.586366653442383, 13.185405731201172, 13.784444808959961, 14.383482933044434, 14.982521057128906, 15.581560134887695, 16.180599212646484, 16.77963638305664, 17.37867546081543, 17.97771453857422, 18.576753616333008, 19.175792694091797, 19.774829864501953, 20.373868942260742, 20.97290802001953, 21.571945190429688, 22.170984268188477, 22.770023345947266, 23.369062423706055, 23.968101501464844, 24.567138671875, 25.16617774963379, 25.765216827392578, 26.364253997802734, 26.963293075561523, 27.562332153320312, 28.1613712310791, 28.76041030883789, 29.359447479248047, 29.958486557006836, 30.557525634765625, 31.15656280517578, 31.75560188293457, 32.35464096069336]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 11.0, 2.0, 7.0, 12.0, 21.0, 13.0, 28.0, 37.0, 44.0, 49.0, 50.0, 62.0, 69.0, 70.0, 59.0, 61.0, 62.0, 63.0, 51.0, 53.0, 35.0, 43.0, 18.0, 26.0, 18.0, 11.0, 7.0, 9.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.288092613220215, -12.947009086608887, -12.605925559997559, -12.264842987060547, -11.923759460449219, -11.58267593383789, -11.241592407226562, -10.900508880615234, -10.559425354003906, -10.218341827392578, -9.87725830078125, -9.536174774169922, -9.19509220123291, -8.854008674621582, -8.512925148010254, -8.171841621398926, -7.830759048461914, -7.489675521850586, -7.148592472076416, -6.807508945465088, -6.466425895690918, -6.12534236907959, -5.784258842468262, -5.443175315856934, -5.102092266082764, -4.7610087394714355, -4.419925689697266, -4.0788421630859375, -3.7377588748931885, -3.3966755867004395, -3.0555920600891113, -2.7145087718963623, -2.3734264373779297, -2.0323431491851807, -1.691259741783142, -1.3501763343811035, -1.0090930461883545, -0.6680097579956055, -0.32692623138427734, 0.01415705680847168, 0.3552403450012207, 0.6963236927986145, 1.0374070405960083, 1.3784904479980469, 1.719573736190796, 2.060657024383545, 2.401740550994873, 2.742823839187622, 3.083907127380371, 3.42499041557312, 3.766073703765869, 4.107157230377197, 4.448240280151367, 4.789323806762695, 5.130407333374023, 5.471490859985352, 5.8125739097595215, 6.15365743637085, 6.4947404861450195, 6.835824012756348, 7.176907539367676, 7.517990589141846, 7.859074115753174, 8.200157165527344, 8.541240692138672]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 23.0, 20.0, 38.0, 34.0, 65.0, 72.0, 121.0, 189.0, 388.0, 762.0, 2227.0, 8645.0, 57694.0, 2888569.0, 1181393.0, 42710.0, 7485.0, 2079.0, 783.0, 311.0, 212.0, 99.0, 81.0, 54.0, 33.0, 26.0, 25.0, 17.0, 16.0, 11.0, 10.0, 8.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-3.955078125, -3.834991455078125, -3.71490478515625, -3.594818115234375, -3.4747314453125, -3.354644775390625, -3.23455810546875, -3.114471435546875, -2.994384765625, -2.874298095703125, -2.75421142578125, -2.634124755859375, -2.5140380859375, -2.393951416015625, -2.27386474609375, -2.153778076171875, -2.03369140625, -1.913604736328125, -1.79351806640625, -1.673431396484375, -1.5533447265625, -1.433258056640625, -1.31317138671875, -1.193084716796875, -1.072998046875, -0.952911376953125, -0.83282470703125, -0.712738037109375, -0.5926513671875, -0.472564697265625, -0.35247802734375, -0.232391357421875, -0.1123046875, 0.007781982421875, 0.12786865234375, 0.247955322265625, 0.3680419921875, 0.488128662109375, 0.60821533203125, 0.728302001953125, 0.848388671875, 0.968475341796875, 1.08856201171875, 1.208648681640625, 1.3287353515625, 1.448822021484375, 1.56890869140625, 1.688995361328125, 1.80908203125, 1.929168701171875, 2.04925537109375, 2.169342041015625, 2.2894287109375, 2.409515380859375, 2.52960205078125, 2.649688720703125, 2.769775390625, 2.889862060546875, 3.00994873046875, 3.130035400390625, 3.2501220703125, 3.370208740234375, 3.49029541015625, 3.610382080078125, 3.73046875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 8.0, 15.0, 18.0, 28.0, 34.0, 70.0, 88.0, 137.0, 162.0, 140.0, 100.0, 69.0, 47.0, 31.0, 22.0, 13.0, 10.0, 1.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.33856201171875, -5.1927490234375, -5.04693603515625, -4.901123046875, -4.75531005859375, -4.6094970703125, -4.46368408203125, -4.31787109375, -4.17205810546875, -4.0262451171875, -3.88043212890625, -3.734619140625, -3.58880615234375, -3.4429931640625, -3.29718017578125, -3.1513671875, -3.00555419921875, -2.8597412109375, -2.71392822265625, -2.568115234375, -2.42230224609375, -2.2764892578125, -2.13067626953125, -1.98486328125, -1.83905029296875, -1.6932373046875, -1.54742431640625, -1.401611328125, -1.25579833984375, -1.1099853515625, -0.96417236328125, -0.818359375, -0.67254638671875, -0.5267333984375, -0.38092041015625, -0.235107421875, -0.08929443359375, 0.0565185546875, 0.20233154296875, 0.34814453125, 0.49395751953125, 0.6397705078125, 0.78558349609375, 0.931396484375, 1.07720947265625, 1.2230224609375, 1.36883544921875, 1.5146484375, 1.66046142578125, 1.8062744140625, 1.95208740234375, 2.097900390625, 2.24371337890625, 2.3895263671875, 2.53533935546875, 2.68115234375, 2.82696533203125, 2.9727783203125, 3.11859130859375, 3.264404296875, 3.41021728515625, 3.5560302734375, 3.70184326171875, 3.84765625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 8.0, 9.0, 11.0, 14.0, 19.0, 45.0, 58.0, 113.0, 300.0, 2708.0, 3240567.0, 947562.0, 2243.0, 328.0, 122.0, 64.0, 45.0, 20.0, 7.0, 11.0, 11.0, 7.0, 2.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5859375, -12.2154541015625, -11.844970703125, -11.4744873046875, -11.10400390625, -10.7335205078125, -10.363037109375, -9.9925537109375, -9.6220703125, -9.2515869140625, -8.881103515625, -8.5106201171875, -8.14013671875, -7.7696533203125, -7.399169921875, -7.0286865234375, -6.658203125, -6.2877197265625, -5.917236328125, -5.5467529296875, -5.17626953125, -4.8057861328125, -4.435302734375, -4.0648193359375, -3.6943359375, -3.3238525390625, -2.953369140625, -2.5828857421875, -2.21240234375, -1.8419189453125, -1.471435546875, -1.1009521484375, -0.73046875, -0.3599853515625, 0.010498046875, 0.3809814453125, 0.75146484375, 1.1219482421875, 1.492431640625, 1.8629150390625, 2.2333984375, 2.6038818359375, 2.974365234375, 3.3448486328125, 3.71533203125, 4.0858154296875, 4.456298828125, 4.8267822265625, 5.197265625, 5.5677490234375, 5.938232421875, 6.3087158203125, 6.67919921875, 7.0496826171875, 7.420166015625, 7.7906494140625, 8.1611328125, 8.5316162109375, 8.902099609375, 9.2725830078125, 9.64306640625, 10.0135498046875, 10.384033203125, 10.7545166015625, 11.125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 7.0, 16.0, 16.0, 21.0, 25.0, 44.0, 46.0, 112.0, 127.0, 251.0, 417.0, 1224.0, 888.0, 341.0, 164.0, 124.0, 75.0, 54.0, 31.0, 19.0, 20.0, 14.0, 12.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.90087890625, -0.8770980834960938, -0.8533172607421875, -0.8295364379882812, -0.805755615234375, -0.7819747924804688, -0.7581939697265625, -0.7344131469726562, -0.71063232421875, -0.6868515014648438, -0.6630706787109375, -0.6392898559570312, -0.615509033203125, -0.5917282104492188, -0.5679473876953125, -0.5441665649414062, -0.5203857421875, -0.49660491943359375, -0.4728240966796875, -0.44904327392578125, -0.425262451171875, -0.40148162841796875, -0.3777008056640625, -0.35391998291015625, -0.33013916015625, -0.30635833740234375, -0.2825775146484375, -0.25879669189453125, -0.235015869140625, -0.21123504638671875, -0.1874542236328125, -0.16367340087890625, -0.139892578125, -0.11611175537109375, -0.0923309326171875, -0.06855010986328125, -0.044769287109375, -0.02098846435546875, 0.0027923583984375, 0.02657318115234375, 0.05035400390625, 0.07413482666015625, 0.0979156494140625, 0.12169647216796875, 0.145477294921875, 0.16925811767578125, 0.1930389404296875, 0.21681976318359375, 0.2406005859375, 0.26438140869140625, 0.2881622314453125, 0.31194305419921875, 0.335723876953125, 0.35950469970703125, 0.3832855224609375, 0.40706634521484375, 0.43084716796875, 0.45462799072265625, 0.4784088134765625, 0.5021896362304688, 0.525970458984375, 0.5497512817382812, 0.5735321044921875, 0.5973129272460938, 0.62109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 7.0, 10.0, 14.0, 20.0, 31.0, 39.0, 93.0, 154.0, 199.0, 162.0, 98.0, 53.0, 33.0, 24.0, 17.0, 9.0, 9.0, 10.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.267861366271973, -4.12433385848999, -3.980806589126587, -3.8372790813446045, -3.693751811981201, -3.5502243041992188, -3.4066967964172363, -3.263169288635254, -3.1196420192718506, -2.976114511489868, -2.832587242126465, -2.6890597343444824, -2.5455322265625, -2.4020049571990967, -2.2584774494171143, -2.114950180053711, -1.9714226722717285, -1.8278952836990356, -1.6843678951263428, -1.5408403873443604, -1.3973129987716675, -1.2537856101989746, -1.1102581024169922, -0.9667307138442993, -0.8232033252716064, -0.6796759366989136, -0.5361484885215759, -0.39262107014656067, -0.2490936517715454, -0.10556626319885254, 0.03796118497848511, 0.18148863315582275, 0.3250155448913574, 0.4685429632663727, 0.6120703816413879, 0.7555978298187256, 0.8991252183914185, 1.0426526069641113, 1.1861801147460938, 1.3297075033187866, 1.4732348918914795, 1.6167622804641724, 1.7602896690368652, 1.9038171768188477, 2.04734468460083, 2.1908719539642334, 2.334399461746216, 2.477926731109619, 2.6214542388916016, 2.764981746673584, 2.9085090160369873, 3.0520365238189697, 3.195563793182373, 3.3390913009643555, 3.482618808746338, 3.6261463165283203, 3.7696735858917236, 3.913201093673706, 4.056728363037109, 4.200255870819092, 4.343783378601074, 4.487310409545898, 4.630837917327881, 4.774365425109863, 4.917892932891846]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 14.0, 8.0, 22.0, 41.0, 48.0, 70.0, 82.0, 105.0, 123.0, 113.0, 95.0, 87.0, 67.0, 37.0, 24.0, 25.0, 14.0, 9.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.006866931915283, -4.865267276763916, -4.723667144775391, -4.582067489624023, -4.440467834472656, -4.298868179321289, -4.157268524169922, -4.0156683921813965, -3.8740687370300293, -3.732469081878662, -3.590869188308716, -3.4492692947387695, -3.3076696395874023, -3.166069984436035, -3.024470090866089, -2.8828701972961426, -2.7412705421447754, -2.599670886993408, -2.458070993423462, -2.3164710998535156, -2.1748714447021484, -2.0332717895507812, -1.891671895980835, -1.7500721216201782, -1.6084723472595215, -1.4668725728988647, -1.325272798538208, -1.1836730241775513, -1.0420732498168945, -0.9004734754562378, -0.758873701095581, -0.6172739267349243, -0.4756746292114258, -0.33407485485076904, -0.1924750804901123, -0.050875306129455566, 0.09072446823120117, 0.2323242425918579, 0.37392401695251465, 0.5155237913131714, 0.6571235656738281, 0.7987233400344849, 0.9403231143951416, 1.0819228887557983, 1.223522663116455, 1.3651224374771118, 1.5067222118377686, 1.6483219861984253, 1.789921760559082, 1.9315215349197388, 2.0731213092803955, 2.214721202850342, 2.356320858001709, 2.497920513153076, 2.6395204067230225, 2.7811203002929688, 2.922719955444336, 3.064319610595703, 3.2059195041656494, 3.3475193977355957, 3.489119052886963, 3.63071870803833, 3.7723186016082764, 3.9139184951782227, 4.05551815032959]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 11.0, 6.0, 12.0, 18.0, 21.0, 33.0, 33.0, 45.0, 87.0, 123.0, 193.0, 288.0, 509.0, 802.0, 1622.0, 3128.0, 7129.0, 17756.0, 55946.0, 231047.0, 493615.0, 167286.0, 42696.0, 14209.0, 5864.0, 2754.0, 1355.0, 741.0, 447.0, 261.0, 151.0, 103.0, 91.0, 53.0, 38.0, 23.0, 20.0, 11.0, 10.0, 3.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.307373046875, -0.2984352111816406, -0.28949737548828125, -0.2805595397949219, -0.2716217041015625, -0.2626838684082031, -0.25374603271484375, -0.24480819702148438, -0.235870361328125, -0.22693252563476562, -0.21799468994140625, -0.20905685424804688, -0.2001190185546875, -0.19118118286132812, -0.18224334716796875, -0.17330551147460938, -0.16436767578125, -0.15542984008789062, -0.14649200439453125, -0.13755416870117188, -0.1286163330078125, -0.11967849731445312, -0.11074066162109375, -0.10180282592773438, -0.092864990234375, -0.08392715454101562, -0.07498931884765625, -0.06605148315429688, -0.0571136474609375, -0.048175811767578125, -0.03923797607421875, -0.030300140380859375, -0.0213623046875, -0.012424468994140625, -0.00348663330078125, 0.005451202392578125, 0.0143890380859375, 0.023326873779296875, 0.03226470947265625, 0.041202545166015625, 0.050140380859375, 0.059078216552734375, 0.06801605224609375, 0.07695388793945312, 0.0858917236328125, 0.09482955932617188, 0.10376739501953125, 0.11270523071289062, 0.12164306640625, 0.13058090209960938, 0.13951873779296875, 0.14845657348632812, 0.1573944091796875, 0.16633224487304688, 0.17527008056640625, 0.18420791625976562, 0.193145751953125, 0.20208358764648438, 0.21102142333984375, 0.21995925903320312, 0.2288970947265625, 0.23783493041992188, 0.24677276611328125, 0.2557106018066406, 0.2646484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 20.0, 29.0, 45.0, 39.0, 85.0, 95.0, 130.0, 125.0, 114.0, 104.0, 72.0, 39.0, 30.0, 17.0, 21.0, 6.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.615234375, -3.50970458984375, -3.4041748046875, -3.29864501953125, -3.193115234375, -3.08758544921875, -2.9820556640625, -2.87652587890625, -2.77099609375, -2.66546630859375, -2.5599365234375, -2.45440673828125, -2.348876953125, -2.24334716796875, -2.1378173828125, -2.03228759765625, -1.9267578125, -1.82122802734375, -1.7156982421875, -1.61016845703125, -1.504638671875, -1.39910888671875, -1.2935791015625, -1.18804931640625, -1.08251953125, -0.97698974609375, -0.8714599609375, -0.76593017578125, -0.660400390625, -0.55487060546875, -0.4493408203125, -0.34381103515625, -0.23828125, -0.13275146484375, -0.0272216796875, 0.07830810546875, 0.183837890625, 0.28936767578125, 0.3948974609375, 0.50042724609375, 0.60595703125, 0.71148681640625, 0.8170166015625, 0.92254638671875, 1.028076171875, 1.13360595703125, 1.2391357421875, 1.34466552734375, 1.4501953125, 1.55572509765625, 1.6612548828125, 1.76678466796875, 1.872314453125, 1.97784423828125, 2.0833740234375, 2.18890380859375, 2.29443359375, 2.39996337890625, 2.5054931640625, 2.61102294921875, 2.716552734375, 2.82208251953125, 2.9276123046875, 3.03314208984375, 3.138671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 16.0, 25.0, 22.0, 47.0, 94.0, 135.0, 267.0, 589.0, 1417.0, 4589.0, 21052.0, 195697.0, 686903.0, 117439.0, 14443.0, 3600.0, 1124.0, 468.0, 254.0, 129.0, 70.0, 47.0, 36.0, 23.0, 12.0, 9.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.4181060791015625, -0.401641845703125, -0.3851776123046875, -0.36871337890625, -0.3522491455078125, -0.335784912109375, -0.3193206787109375, -0.3028564453125, -0.2863922119140625, -0.269927978515625, -0.2534637451171875, -0.23699951171875, -0.2205352783203125, -0.204071044921875, -0.1876068115234375, -0.171142578125, -0.1546783447265625, -0.138214111328125, -0.1217498779296875, -0.10528564453125, -0.0888214111328125, -0.072357177734375, -0.0558929443359375, -0.0394287109375, -0.0229644775390625, -0.006500244140625, 0.0099639892578125, 0.02642822265625, 0.0428924560546875, 0.059356689453125, 0.0758209228515625, 0.09228515625, 0.1087493896484375, 0.125213623046875, 0.1416778564453125, 0.15814208984375, 0.1746063232421875, 0.191070556640625, 0.2075347900390625, 0.2239990234375, 0.2404632568359375, 0.256927490234375, 0.2733917236328125, 0.28985595703125, 0.3063201904296875, 0.322784423828125, 0.3392486572265625, 0.355712890625, 0.3721771240234375, 0.388641357421875, 0.4051055908203125, 0.42156982421875, 0.4380340576171875, 0.454498291015625, 0.4709625244140625, 0.4874267578125, 0.5038909912109375, 0.520355224609375, 0.5368194580078125, 0.55328369140625, 0.5697479248046875, 0.586212158203125, 0.6026763916015625, 0.619140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 15.0, 10.0, 12.0, 12.0, 14.0, 23.0, 33.0, 20.0, 33.0, 49.0, 36.0, 39.0, 44.0, 47.0, 56.0, 44.0, 48.0, 42.0, 54.0, 35.0, 43.0, 38.0, 37.0, 28.0, 27.0, 17.0, 23.0, 21.0, 16.0, 18.0, 11.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.306915283203125, -3.19586181640625, -3.084808349609375, -2.9737548828125, -2.862701416015625, -2.75164794921875, -2.640594482421875, -2.529541015625, -2.418487548828125, -2.30743408203125, -2.196380615234375, -2.0853271484375, -1.974273681640625, -1.86322021484375, -1.752166748046875, -1.64111328125, -1.530059814453125, -1.41900634765625, -1.307952880859375, -1.1968994140625, -1.085845947265625, -0.97479248046875, -0.863739013671875, -0.752685546875, -0.641632080078125, -0.53057861328125, -0.419525146484375, -0.3084716796875, -0.197418212890625, -0.08636474609375, 0.024688720703125, 0.1357421875, 0.246795654296875, 0.35784912109375, 0.468902587890625, 0.5799560546875, 0.691009521484375, 0.80206298828125, 0.913116455078125, 1.024169921875, 1.135223388671875, 1.24627685546875, 1.357330322265625, 1.4683837890625, 1.579437255859375, 1.69049072265625, 1.801544189453125, 1.91259765625, 2.023651123046875, 2.13470458984375, 2.245758056640625, 2.3568115234375, 2.467864990234375, 2.57891845703125, 2.689971923828125, 2.801025390625, 2.912078857421875, 3.02313232421875, 3.134185791015625, 3.2452392578125, 3.356292724609375, 3.46734619140625, 3.578399658203125, 3.689453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 0.0, 7.0, 7.0, 11.0, 13.0, 23.0, 31.0, 56.0, 95.0, 230.0, 616.0, 1902.0, 9202.0, 130589.0, 846922.0, 51255.0, 5407.0, 1359.0, 418.0, 181.0, 90.0, 42.0, 27.0, 27.0, 6.0, 9.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.44384765625, -0.4328498840332031, -0.42185211181640625, -0.4108543395996094, -0.3998565673828125, -0.3888587951660156, -0.37786102294921875, -0.3668632507324219, -0.355865478515625, -0.3448677062988281, -0.33386993408203125, -0.3228721618652344, -0.3118743896484375, -0.3008766174316406, -0.28987884521484375, -0.2788810729980469, -0.26788330078125, -0.2568855285644531, -0.24588775634765625, -0.23488998413085938, -0.2238922119140625, -0.21289443969726562, -0.20189666748046875, -0.19089889526367188, -0.179901123046875, -0.16890335083007812, -0.15790557861328125, -0.14690780639648438, -0.1359100341796875, -0.12491226196289062, -0.11391448974609375, -0.10291671752929688, -0.0919189453125, -0.08092117309570312, -0.06992340087890625, -0.058925628662109375, -0.0479278564453125, -0.036930084228515625, -0.02593231201171875, -0.014934539794921875, -0.003936767578125, 0.007061004638671875, 0.01805877685546875, 0.029056549072265625, 0.0400543212890625, 0.051052093505859375, 0.06204986572265625, 0.07304763793945312, 0.08404541015625, 0.09504318237304688, 0.10604095458984375, 0.11703872680664062, 0.1280364990234375, 0.13903427124023438, 0.15003204345703125, 0.16102981567382812, 0.172027587890625, 0.18302536010742188, 0.19402313232421875, 0.20502090454101562, 0.2160186767578125, 0.22701644897460938, 0.23801422119140625, 0.24901199340820312, 0.260009765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 3.0, 7.0, 18.0, 19.0, 28.0, 22.0, 33.0, 47.0, 63.0, 81.0, 87.0, 93.0, 106.0, 77.0, 65.0, 56.0, 49.0, 44.0, 19.0, 25.0, 16.0, 12.0, 11.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00010395050048828125, -0.00010140985250473022, -9.88692045211792e-05, -9.632855653762817e-05, -9.378790855407715e-05, -9.124726057052612e-05, -8.87066125869751e-05, -8.616596460342407e-05, -8.362531661987305e-05, -8.108466863632202e-05, -7.8544020652771e-05, -7.600337266921997e-05, -7.346272468566895e-05, -7.092207670211792e-05, -6.83814287185669e-05, -6.584078073501587e-05, -6.330013275146484e-05, -6.075948476791382e-05, -5.821883678436279e-05, -5.567818880081177e-05, -5.313754081726074e-05, -5.059689283370972e-05, -4.805624485015869e-05, -4.5515596866607666e-05, -4.297494888305664e-05, -4.0434300899505615e-05, -3.789365291595459e-05, -3.5353004932403564e-05, -3.281235694885254e-05, -3.0271708965301514e-05, -2.7731060981750488e-05, -2.5190412998199463e-05, -2.2649765014648438e-05, -2.0109117031097412e-05, -1.7568469047546387e-05, -1.5027821063995361e-05, -1.2487173080444336e-05, -9.94652509689331e-06, -7.405877113342285e-06, -4.86522912979126e-06, -2.3245811462402344e-06, 2.1606683731079102e-07, 2.7567148208618164e-06, 5.297362804412842e-06, 7.838010787963867e-06, 1.0378658771514893e-05, 1.2919306755065918e-05, 1.5459954738616943e-05, 1.800060272216797e-05, 2.0541250705718994e-05, 2.308189868927002e-05, 2.5622546672821045e-05, 2.816319465637207e-05, 3.0703842639923096e-05, 3.324449062347412e-05, 3.5785138607025146e-05, 3.832578659057617e-05, 4.08664345741272e-05, 4.340708255767822e-05, 4.594773054122925e-05, 4.8488378524780273e-05, 5.10290265083313e-05, 5.3569674491882324e-05, 5.611032247543335e-05, 5.8650970458984375e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 15.0, 16.0, 39.0, 33.0, 47.0, 91.0, 206.0, 713.0, 4024.0, 75751.0, 919059.0, 44644.0, 2979.0, 535.0, 159.0, 72.0, 43.0, 24.0, 14.0, 16.0, 18.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36328125, -0.3509368896484375, -0.338592529296875, -0.3262481689453125, -0.31390380859375, -0.3015594482421875, -0.289215087890625, -0.2768707275390625, -0.2645263671875, -0.2521820068359375, -0.239837646484375, -0.2274932861328125, -0.21514892578125, -0.2028045654296875, -0.190460205078125, -0.1781158447265625, -0.165771484375, -0.1534271240234375, -0.141082763671875, -0.1287384033203125, -0.11639404296875, -0.1040496826171875, -0.091705322265625, -0.0793609619140625, -0.0670166015625, -0.0546722412109375, -0.042327880859375, -0.0299835205078125, -0.01763916015625, -0.0052947998046875, 0.007049560546875, 0.0193939208984375, 0.03173828125, 0.0440826416015625, 0.056427001953125, 0.0687713623046875, 0.08111572265625, 0.0934600830078125, 0.105804443359375, 0.1181488037109375, 0.1304931640625, 0.1428375244140625, 0.155181884765625, 0.1675262451171875, 0.17987060546875, 0.1922149658203125, 0.204559326171875, 0.2169036865234375, 0.229248046875, 0.2415924072265625, 0.253936767578125, 0.2662811279296875, 0.27862548828125, 0.2909698486328125, 0.303314208984375, 0.3156585693359375, 0.3280029296875, 0.3403472900390625, 0.352691650390625, 0.3650360107421875, 0.37738037109375, 0.3897247314453125, 0.402069091796875, 0.4144134521484375, 0.4267578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 6.0, 9.0, 15.0, 18.0, 23.0, 35.0, 36.0, 44.0, 71.0, 91.0, 130.0, 111.0, 93.0, 69.0, 54.0, 43.0, 29.0, 31.0, 14.0, 22.0, 15.0, 5.0, 4.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055145263671875, -0.05336809158325195, -0.051590919494628906, -0.04981374740600586, -0.04803657531738281, -0.046259403228759766, -0.04448223114013672, -0.04270505905151367, -0.040927886962890625, -0.03915071487426758, -0.03737354278564453, -0.035596370697021484, -0.03381919860839844, -0.03204202651977539, -0.030264854431152344, -0.028487682342529297, -0.02671051025390625, -0.024933338165283203, -0.023156166076660156, -0.02137899398803711, -0.019601821899414062, -0.017824649810791016, -0.01604747772216797, -0.014270305633544922, -0.012493133544921875, -0.010715961456298828, -0.008938789367675781, -0.007161617279052734, -0.0053844451904296875, -0.0036072731018066406, -0.0018301010131835938, -5.2928924560546875e-05, 0.0017242431640625, 0.003501415252685547, 0.005278587341308594, 0.007055759429931641, 0.008832931518554688, 0.010610103607177734, 0.012387275695800781, 0.014164447784423828, 0.015941619873046875, 0.017718791961669922, 0.01949596405029297, 0.021273136138916016, 0.023050308227539062, 0.02482748031616211, 0.026604652404785156, 0.028381824493408203, 0.03015899658203125, 0.0319361686706543, 0.033713340759277344, 0.03549051284790039, 0.03726768493652344, 0.039044857025146484, 0.04082202911376953, 0.04259920120239258, 0.044376373291015625, 0.04615354537963867, 0.04793071746826172, 0.049707889556884766, 0.05148506164550781, 0.05326223373413086, 0.055039405822753906, 0.05681657791137695, 0.05859375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 13.0, 8.0, 26.0, 34.0, 69.0, 184.0, 281.0, 167.0, 98.0, 45.0, 23.0, 18.0, 11.0, 7.0, 0.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.300103187561035, -3.1663310527801514, -3.0325589179992676, -2.898787021636963, -2.765014886856079, -2.6312427520751953, -2.4974708557128906, -2.363698720932007, -2.229926586151123, -2.0961544513702393, -1.962382435798645, -1.8286104202270508, -1.694838285446167, -1.5610661506652832, -1.427294135093689, -1.2935221195220947, -1.159749984741211, -1.0259778499603271, -0.8922058343887329, -0.7584337592124939, -0.6246616840362549, -0.49088960886001587, -0.35711753368377686, -0.22334545850753784, -0.08957338333129883, 0.044198691844940186, 0.1779707670211792, 0.3117428421974182, 0.4455149173736572, 0.5792869925498962, 0.7130590677261353, 0.8468311429023743, 0.9806027412414551, 1.1143748760223389, 1.248146891593933, 1.3819189071655273, 1.5156910419464111, 1.649463176727295, 1.7832351922988892, 1.9170072078704834, 2.050779342651367, 2.184551477432251, 2.3183236122131348, 2.4520955085754395, 2.5858676433563232, 2.719639778137207, 2.8534116744995117, 2.9871838092803955, 3.1209559440612793, 3.254728078842163, 3.388500213623047, 3.5222721099853516, 3.6560442447662354, 3.789816379547119, 3.923588275909424, 4.057360649108887, 4.191132545471191, 4.324904441833496, 4.458676815032959, 4.592448711395264, 4.726221084594727, 4.859992980957031, 4.993764877319336, 5.127537250518799, 5.2613091468811035]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 19.0, 28.0, 57.0, 76.0, 94.0, 138.0, 159.0, 139.0, 94.0, 54.0, 50.0, 26.0, 22.0, 5.0, 12.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.127928733825684, -4.012039661407471, -3.896150827407837, -3.780261754989624, -3.664372682571411, -3.5484838485717773, -3.4325947761535645, -3.3167057037353516, -3.2008166313171387, -3.084927558898926, -2.969038724899292, -2.853149652481079, -2.737260580062866, -2.6213717460632324, -2.5054826736450195, -2.3895936012268066, -2.273704767227173, -2.15781569480896, -2.041926860809326, -1.9260377883911133, -1.8101487159729004, -1.694259762763977, -1.5783708095550537, -1.4624817371368408, -1.3465927839279175, -1.2307038307189941, -1.1148147583007812, -0.9989258050918579, -0.8830367922782898, -0.7671477794647217, -0.6512588262557983, -0.5353698134422302, -0.4194810390472412, -0.3035920262336731, -0.18770304322242737, -0.07181406021118164, 0.044074952602386475, 0.1599639654159546, 0.27585291862487793, 0.39174193143844604, 0.5076309442520142, 0.6235199570655823, 0.7394089698791504, 0.8552979230880737, 0.9711869359016418, 1.08707594871521, 1.2029649019241333, 1.3188538551330566, 1.4347429275512695, 1.5506318807601929, 1.6665209531784058, 1.782409906387329, 1.898298978805542, 2.014187812805176, 2.1300768852233887, 2.2459659576416016, 2.3618550300598145, 2.4777441024780273, 2.593632936477661, 2.709522008895874, 2.825411081314087, 2.9412999153137207, 3.0571889877319336, 3.1730780601501465, 3.2889668941497803]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 7.0, 9.0, 18.0, 17.0, 30.0, 56.0, 78.0, 147.0, 242.0, 469.0, 1022.0, 2485.0, 6854.0, 24768.0, 131785.0, 672813.0, 165559.0, 29289.0, 7819.0, 2724.0, 1097.0, 524.0, 272.0, 147.0, 98.0, 65.0, 28.0, 20.0, 24.0, 13.0, 9.0, 7.0, 6.0, 1.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.171875, -2.100799560546875, -2.02972412109375, -1.958648681640625, -1.8875732421875, -1.816497802734375, -1.74542236328125, -1.674346923828125, -1.603271484375, -1.532196044921875, -1.46112060546875, -1.390045166015625, -1.3189697265625, -1.247894287109375, -1.17681884765625, -1.105743408203125, -1.03466796875, -0.963592529296875, -0.89251708984375, -0.821441650390625, -0.7503662109375, -0.679290771484375, -0.60821533203125, -0.537139892578125, -0.466064453125, -0.394989013671875, -0.32391357421875, -0.252838134765625, -0.1817626953125, -0.110687255859375, -0.03961181640625, 0.031463623046875, 0.1025390625, 0.173614501953125, 0.24468994140625, 0.315765380859375, 0.3868408203125, 0.457916259765625, 0.52899169921875, 0.600067138671875, 0.671142578125, 0.742218017578125, 0.81329345703125, 0.884368896484375, 0.9554443359375, 1.026519775390625, 1.09759521484375, 1.168670654296875, 1.23974609375, 1.310821533203125, 1.38189697265625, 1.452972412109375, 1.5240478515625, 1.595123291015625, 1.66619873046875, 1.737274169921875, 1.808349609375, 1.879425048828125, 1.95050048828125, 2.021575927734375, 2.0926513671875, 2.163726806640625, 2.23480224609375, 2.305877685546875, 2.376953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 13.0, 8.0, 15.0, 33.0, 46.0, 82.0, 137.0, 145.0, 163.0, 135.0, 80.0, 57.0, 32.0, 22.0, 12.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.1751708984375, -10.881591796875, -10.5880126953125, -10.29443359375, -10.0008544921875, -9.707275390625, -9.4136962890625, -9.1201171875, -8.8265380859375, -8.532958984375, -8.2393798828125, -7.94580078125, -7.6522216796875, -7.358642578125, -7.0650634765625, -6.771484375, -6.4779052734375, -6.184326171875, -5.8907470703125, -5.59716796875, -5.3035888671875, -5.010009765625, -4.7164306640625, -4.4228515625, -4.1292724609375, -3.835693359375, -3.5421142578125, -3.24853515625, -2.9549560546875, -2.661376953125, -2.3677978515625, -2.07421875, -1.7806396484375, -1.487060546875, -1.1934814453125, -0.89990234375, -0.6063232421875, -0.312744140625, -0.0191650390625, 0.2744140625, 0.5679931640625, 0.861572265625, 1.1551513671875, 1.44873046875, 1.7423095703125, 2.035888671875, 2.3294677734375, 2.623046875, 2.9166259765625, 3.210205078125, 3.5037841796875, 3.79736328125, 4.0909423828125, 4.384521484375, 4.6781005859375, 4.9716796875, 5.2652587890625, 5.558837890625, 5.8524169921875, 6.14599609375, 6.4395751953125, 6.733154296875, 7.0267333984375, 7.3203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 0.0, 4.0, 8.0, 14.0, 13.0, 26.0, 31.0, 55.0, 77.0, 97.0, 199.0, 349.0, 1036.0, 4103.0, 32152.0, 712972.0, 277626.0, 15720.0, 2548.0, 736.0, 314.0, 170.0, 94.0, 58.0, 59.0, 30.0, 15.0, 13.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.259765625, -3.166229248046875, -3.07269287109375, -2.979156494140625, -2.8856201171875, -2.792083740234375, -2.69854736328125, -2.605010986328125, -2.511474609375, -2.417938232421875, -2.32440185546875, -2.230865478515625, -2.1373291015625, -2.043792724609375, -1.95025634765625, -1.856719970703125, -1.76318359375, -1.669647216796875, -1.57611083984375, -1.482574462890625, -1.3890380859375, -1.295501708984375, -1.20196533203125, -1.108428955078125, -1.014892578125, -0.921356201171875, -0.82781982421875, -0.734283447265625, -0.6407470703125, -0.547210693359375, -0.45367431640625, -0.360137939453125, -0.2666015625, -0.173065185546875, -0.07952880859375, 0.014007568359375, 0.1075439453125, 0.201080322265625, 0.29461669921875, 0.388153076171875, 0.481689453125, 0.575225830078125, 0.66876220703125, 0.762298583984375, 0.8558349609375, 0.949371337890625, 1.04290771484375, 1.136444091796875, 1.22998046875, 1.323516845703125, 1.41705322265625, 1.510589599609375, 1.6041259765625, 1.697662353515625, 1.79119873046875, 1.884735107421875, 1.978271484375, 2.071807861328125, 2.16534423828125, 2.258880615234375, 2.3524169921875, 2.445953369140625, 2.53948974609375, 2.633026123046875, 2.7265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 3.0, 6.0, 16.0, 18.0, 13.0, 29.0, 32.0, 26.0, 35.0, 46.0, 45.0, 51.0, 71.0, 53.0, 61.0, 65.0, 51.0, 51.0, 41.0, 44.0, 51.0, 39.0, 36.0, 23.0, 22.0, 16.0, 9.0, 11.0, 11.0, 6.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.453125, -5.2777099609375, -5.102294921875, -4.9268798828125, -4.75146484375, -4.5760498046875, -4.400634765625, -4.2252197265625, -4.0498046875, -3.8743896484375, -3.698974609375, -3.5235595703125, -3.34814453125, -3.1727294921875, -2.997314453125, -2.8218994140625, -2.646484375, -2.4710693359375, -2.295654296875, -2.1202392578125, -1.94482421875, -1.7694091796875, -1.593994140625, -1.4185791015625, -1.2431640625, -1.0677490234375, -0.892333984375, -0.7169189453125, -0.54150390625, -0.3660888671875, -0.190673828125, -0.0152587890625, 0.16015625, 0.3355712890625, 0.510986328125, 0.6864013671875, 0.86181640625, 1.0372314453125, 1.212646484375, 1.3880615234375, 1.5634765625, 1.7388916015625, 1.914306640625, 2.0897216796875, 2.26513671875, 2.4405517578125, 2.615966796875, 2.7913818359375, 2.966796875, 3.1422119140625, 3.317626953125, 3.4930419921875, 3.66845703125, 3.8438720703125, 4.019287109375, 4.1947021484375, 4.3701171875, 4.5455322265625, 4.720947265625, 4.8963623046875, 5.07177734375, 5.2471923828125, 5.422607421875, 5.5980224609375, 5.7734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 7.0, 14.0, 21.0, 44.0, 85.0, 159.0, 361.0, 1037.0, 3536.0, 17382.0, 166304.0, 771478.0, 74438.0, 9948.0, 2381.0, 800.0, 294.0, 117.0, 65.0, 38.0, 23.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.13275146484375, -1.1024169921875, -1.07208251953125, -1.041748046875, -1.01141357421875, -0.9810791015625, -0.95074462890625, -0.92041015625, -0.89007568359375, -0.8597412109375, -0.82940673828125, -0.799072265625, -0.76873779296875, -0.7384033203125, -0.70806884765625, -0.677734375, -0.64739990234375, -0.6170654296875, -0.58673095703125, -0.556396484375, -0.52606201171875, -0.4957275390625, -0.46539306640625, -0.43505859375, -0.40472412109375, -0.3743896484375, -0.34405517578125, -0.313720703125, -0.28338623046875, -0.2530517578125, -0.22271728515625, -0.1923828125, -0.16204833984375, -0.1317138671875, -0.10137939453125, -0.071044921875, -0.04071044921875, -0.0103759765625, 0.01995849609375, 0.05029296875, 0.08062744140625, 0.1109619140625, 0.14129638671875, 0.171630859375, 0.20196533203125, 0.2322998046875, 0.26263427734375, 0.29296875, 0.32330322265625, 0.3536376953125, 0.38397216796875, 0.414306640625, 0.44464111328125, 0.4749755859375, 0.50531005859375, 0.53564453125, 0.56597900390625, 0.5963134765625, 0.62664794921875, 0.656982421875, 0.68731689453125, 0.7176513671875, 0.74798583984375, 0.7783203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 11.0, 3.0, 6.0, 3.0, 9.0, 14.0, 8.0, 15.0, 17.0, 32.0, 38.0, 48.0, 83.0, 98.0, 103.0, 129.0, 85.0, 78.0, 47.0, 26.0, 30.0, 37.0, 24.0, 15.0, 8.0, 10.0, 4.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011944770812988281, -0.00011593848466873169, -0.00011242926120758057, -0.00010892003774642944, -0.00010541081428527832, -0.0001019015908241272, -9.839236736297607e-05, -9.488314390182495e-05, -9.137392044067383e-05, -8.78646969795227e-05, -8.435547351837158e-05, -8.084625005722046e-05, -7.733702659606934e-05, -7.382780313491821e-05, -7.031857967376709e-05, -6.680935621261597e-05, -6.330013275146484e-05, -5.979090929031372e-05, -5.62816858291626e-05, -5.2772462368011475e-05, -4.926323890686035e-05, -4.575401544570923e-05, -4.2244791984558105e-05, -3.873556852340698e-05, -3.522634506225586e-05, -3.1717121601104736e-05, -2.8207898139953613e-05, -2.469867467880249e-05, -2.1189451217651367e-05, -1.7680227756500244e-05, -1.4171004295349121e-05, -1.0661780834197998e-05, -7.152557373046875e-06, -3.643333911895752e-06, -1.341104507446289e-07, 3.375113010406494e-06, 6.884336471557617e-06, 1.039355993270874e-05, 1.3902783393859863e-05, 1.7412006855010986e-05, 2.092123031616211e-05, 2.4430453777313232e-05, 2.7939677238464355e-05, 3.144890069961548e-05, 3.49581241607666e-05, 3.8467347621917725e-05, 4.197657108306885e-05, 4.548579454421997e-05, 4.8995018005371094e-05, 5.250424146652222e-05, 5.601346492767334e-05, 5.952268838882446e-05, 6.303191184997559e-05, 6.654113531112671e-05, 7.005035877227783e-05, 7.355958223342896e-05, 7.706880569458008e-05, 8.05780291557312e-05, 8.408725261688232e-05, 8.759647607803345e-05, 9.110569953918457e-05, 9.46149230003357e-05, 9.812414646148682e-05, 0.00010163336992263794, 0.00010514259338378906]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 18.0, 29.0, 49.0, 90.0, 175.0, 384.0, 1198.0, 4716.0, 33475.0, 670636.0, 312933.0, 20204.0, 3188.0, 813.0, 326.0, 152.0, 66.0, 37.0, 23.0, 15.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9736328125, -0.938720703125, -0.90380859375, -0.868896484375, -0.833984375, -0.799072265625, -0.76416015625, -0.729248046875, -0.6943359375, -0.659423828125, -0.62451171875, -0.589599609375, -0.5546875, -0.519775390625, -0.48486328125, -0.449951171875, -0.4150390625, -0.380126953125, -0.34521484375, -0.310302734375, -0.275390625, -0.240478515625, -0.20556640625, -0.170654296875, -0.1357421875, -0.100830078125, -0.06591796875, -0.031005859375, 0.00390625, 0.038818359375, 0.07373046875, 0.108642578125, 0.1435546875, 0.178466796875, 0.21337890625, 0.248291015625, 0.283203125, 0.318115234375, 0.35302734375, 0.387939453125, 0.4228515625, 0.457763671875, 0.49267578125, 0.527587890625, 0.5625, 0.597412109375, 0.63232421875, 0.667236328125, 0.7021484375, 0.737060546875, 0.77197265625, 0.806884765625, 0.841796875, 0.876708984375, 0.91162109375, 0.946533203125, 0.9814453125, 1.016357421875, 1.05126953125, 1.086181640625, 1.12109375, 1.156005859375, 1.19091796875, 1.225830078125, 1.2607421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 11.0, 13.0, 15.0, 26.0, 33.0, 34.0, 55.0, 102.0, 157.0, 163.0, 101.0, 79.0, 57.0, 36.0, 31.0, 20.0, 16.0, 9.0, 12.0, 9.0, 8.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.51611328125, -0.50146484375, -0.48681640625, -0.47216796875, -0.45751953125, -0.44287109375, -0.42822265625, -0.41357421875, -0.39892578125, -0.38427734375, -0.36962890625, -0.35498046875, -0.34033203125, -0.32568359375, -0.31103515625, -0.29638671875, -0.28173828125, -0.26708984375, -0.25244140625, -0.23779296875, -0.22314453125, -0.20849609375, -0.19384765625, -0.17919921875, -0.16455078125, -0.14990234375, -0.13525390625, -0.12060546875, -0.10595703125, -0.09130859375, -0.07666015625, -0.06201171875, -0.04736328125, -0.03271484375, -0.01806640625, -0.00341796875, 0.01123046875, 0.02587890625, 0.04052734375, 0.05517578125, 0.06982421875, 0.08447265625, 0.09912109375, 0.11376953125, 0.12841796875, 0.14306640625, 0.15771484375, 0.17236328125, 0.18701171875, 0.20166015625, 0.21630859375, 0.23095703125, 0.24560546875, 0.26025390625, 0.27490234375, 0.28955078125, 0.30419921875, 0.31884765625, 0.33349609375, 0.34814453125, 0.36279296875, 0.37744140625, 0.39208984375, 0.40673828125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 33.0, 151.0, 615.0, 154.0, 31.0, 11.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.06016731262207, -23.27197265625, -22.483779907226562, -21.695585250854492, -20.907392501831055, -20.119197845458984, -19.331005096435547, -18.542810440063477, -17.754615783691406, -16.966421127319336, -16.1782283782959, -15.390033721923828, -14.601840019226074, -13.81364631652832, -13.025452613830566, -12.237258911132812, -11.449065208435059, -10.660871505737305, -9.87267780303955, -9.084484100341797, -8.296289443969727, -7.508095741271973, -6.719902038574219, -5.931707859039307, -5.143514156341553, -4.355320453643799, -3.5671262741088867, -2.778932571411133, -1.9907386302947998, -1.2025446891784668, -0.4143509864807129, 0.3738431930541992, 1.1620368957519531, 1.9502308368682861, 2.738424777984619, 3.526618480682373, 4.314812660217285, 5.103006362915039, 5.891200065612793, 6.679394245147705, 7.467587947845459, 8.255782127380371, 9.043975830078125, 9.832169532775879, 10.620363235473633, 11.408557891845703, 12.19675064086914, 12.984945297241211, 13.773138999938965, 14.561332702636719, 15.349526405334473, 16.137720108032227, 16.925914764404297, 17.714107513427734, 18.502302169799805, 19.290496826171875, 20.078689575195312, 20.866884231567383, 21.65507698059082, 22.44327163696289, 23.231464385986328, 24.0196590423584, 24.80785369873047, 25.596046447753906, 26.384241104125977]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 6.0, 17.0, 15.0, 15.0, 32.0, 30.0, 52.0, 48.0, 59.0, 63.0, 75.0, 71.0, 67.0, 54.0, 79.0, 65.0, 55.0, 41.0, 35.0, 29.0, 32.0, 22.0, 16.0, 5.0, 11.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-19.0388240814209, -18.607173919677734, -18.175525665283203, -17.74387550354004, -17.312227249145508, -16.880577087402344, -16.448928833007812, -16.01727867126465, -15.585630416870117, -15.15398120880127, -14.722332000732422, -14.290682792663574, -13.859033584594727, -13.427384376525879, -12.995735168457031, -12.564085006713867, -12.13243579864502, -11.700786590576172, -11.269137382507324, -10.837488174438477, -10.405838966369629, -9.974189758300781, -9.542539596557617, -9.110891342163086, -8.679241180419922, -8.247591972351074, -7.815942764282227, -7.384293556213379, -6.952644348144531, -6.520995140075684, -6.089345455169678, -5.65769624710083, -5.226047515869141, -4.794398307800293, -4.362749099731445, -3.9310996532440186, -3.499450445175171, -3.0678012371063232, -2.6361517906188965, -2.204502582550049, -1.7728533744812012, -1.3412041664123535, -0.9095548391342163, -0.4779055118560791, -0.046256303787231445, 0.3853929042816162, 0.817042350769043, 1.2486915588378906, 1.6803407669067383, 2.111989974975586, 2.5436391830444336, 2.9752886295318604, 3.406937837600708, 3.8385870456695557, 4.270236492156982, 4.70188570022583, 5.133534908294678, 5.565184116363525, 5.996833324432373, 6.428483009338379, 6.860132217407227, 7.291781425476074, 7.723430633544922, 8.15507984161377, 8.586729049682617]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 11.0, 5.0, 9.0, 18.0, 18.0, 25.0, 51.0, 58.0, 83.0, 106.0, 176.0, 275.0, 433.0, 787.0, 1635.0, 3922.0, 11812.0, 52886.0, 654220.0, 3308668.0, 126026.0, 21697.0, 6349.0, 2436.0, 1081.0, 523.0, 323.0, 232.0, 139.0, 81.0, 49.0, 42.0, 19.0, 25.0, 17.0, 11.0, 7.0, 8.0, 5.0, 9.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.451171875, -3.35589599609375, -3.2606201171875, -3.16534423828125, -3.070068359375, -2.97479248046875, -2.8795166015625, -2.78424072265625, -2.68896484375, -2.59368896484375, -2.4984130859375, -2.40313720703125, -2.307861328125, -2.21258544921875, -2.1173095703125, -2.02203369140625, -1.9267578125, -1.83148193359375, -1.7362060546875, -1.64093017578125, -1.545654296875, -1.45037841796875, -1.3551025390625, -1.25982666015625, -1.16455078125, -1.06927490234375, -0.9739990234375, -0.87872314453125, -0.783447265625, -0.68817138671875, -0.5928955078125, -0.49761962890625, -0.40234375, -0.30706787109375, -0.2117919921875, -0.11651611328125, -0.021240234375, 0.07403564453125, 0.1693115234375, 0.26458740234375, 0.35986328125, 0.45513916015625, 0.5504150390625, 0.64569091796875, 0.740966796875, 0.83624267578125, 0.9315185546875, 1.02679443359375, 1.1220703125, 1.21734619140625, 1.3126220703125, 1.40789794921875, 1.503173828125, 1.59844970703125, 1.6937255859375, 1.78900146484375, 1.88427734375, 1.97955322265625, 2.0748291015625, 2.17010498046875, 2.265380859375, 2.36065673828125, 2.4559326171875, 2.55120849609375, 2.646484375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 5.0, 9.0, 13.0, 9.0, 9.0, 31.0, 48.0, 73.0, 77.0, 117.0, 118.0, 149.0, 90.0, 83.0, 58.0, 29.0, 27.0, 17.0, 15.0, 10.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.893524169921875, -3.77532958984375, -3.657135009765625, -3.5389404296875, -3.420745849609375, -3.30255126953125, -3.184356689453125, -3.066162109375, -2.947967529296875, -2.82977294921875, -2.711578369140625, -2.5933837890625, -2.475189208984375, -2.35699462890625, -2.238800048828125, -2.12060546875, -2.002410888671875, -1.88421630859375, -1.766021728515625, -1.6478271484375, -1.529632568359375, -1.41143798828125, -1.293243408203125, -1.175048828125, -1.056854248046875, -0.93865966796875, -0.820465087890625, -0.7022705078125, -0.584075927734375, -0.46588134765625, -0.347686767578125, -0.2294921875, -0.111297607421875, 0.00689697265625, 0.125091552734375, 0.2432861328125, 0.361480712890625, 0.47967529296875, 0.597869873046875, 0.716064453125, 0.834259033203125, 0.95245361328125, 1.070648193359375, 1.1888427734375, 1.307037353515625, 1.42523193359375, 1.543426513671875, 1.66162109375, 1.779815673828125, 1.89801025390625, 2.016204833984375, 2.1343994140625, 2.252593994140625, 2.37078857421875, 2.488983154296875, 2.607177734375, 2.725372314453125, 2.84356689453125, 2.961761474609375, 3.0799560546875, 3.198150634765625, 3.31634521484375, 3.434539794921875, 3.552734375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 4.0, 21.0, 22.0, 32.0, 51.0, 55.0, 109.0, 173.0, 336.0, 688.0, 1964.0, 7000.0, 46334.0, 3254172.0, 846412.0, 28718.0, 5199.0, 1591.0, 628.0, 291.0, 154.0, 103.0, 69.0, 34.0, 33.0, 12.0, 12.0, 14.0, 3.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.9881591796875, -3.866943359375, -3.7457275390625, -3.62451171875, -3.5032958984375, -3.382080078125, -3.2608642578125, -3.1396484375, -3.0184326171875, -2.897216796875, -2.7760009765625, -2.65478515625, -2.5335693359375, -2.412353515625, -2.2911376953125, -2.169921875, -2.0487060546875, -1.927490234375, -1.8062744140625, -1.68505859375, -1.5638427734375, -1.442626953125, -1.3214111328125, -1.2001953125, -1.0789794921875, -0.957763671875, -0.8365478515625, -0.71533203125, -0.5941162109375, -0.472900390625, -0.3516845703125, -0.23046875, -0.1092529296875, 0.011962890625, 0.1331787109375, 0.25439453125, 0.3756103515625, 0.496826171875, 0.6180419921875, 0.7392578125, 0.8604736328125, 0.981689453125, 1.1029052734375, 1.22412109375, 1.3453369140625, 1.466552734375, 1.5877685546875, 1.708984375, 1.8302001953125, 1.951416015625, 2.0726318359375, 2.19384765625, 2.3150634765625, 2.436279296875, 2.5574951171875, 2.6787109375, 2.7999267578125, 2.921142578125, 3.0423583984375, 3.16357421875, 3.2847900390625, 3.406005859375, 3.5272216796875, 3.6484375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 18.0, 12.0, 22.0, 32.0, 51.0, 69.0, 111.0, 163.0, 275.0, 573.0, 1208.0, 655.0, 330.0, 174.0, 108.0, 60.0, 60.0, 34.0, 26.0, 20.0, 13.0, 9.0, 2.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5662307739257812, -0.5440826416015625, -0.5219345092773438, -0.499786376953125, -0.47763824462890625, -0.4554901123046875, -0.43334197998046875, -0.41119384765625, -0.38904571533203125, -0.3668975830078125, -0.34474945068359375, -0.322601318359375, -0.30045318603515625, -0.2783050537109375, -0.25615692138671875, -0.2340087890625, -0.21186065673828125, -0.1897125244140625, -0.16756439208984375, -0.145416259765625, -0.12326812744140625, -0.1011199951171875, -0.07897186279296875, -0.05682373046875, -0.03467559814453125, -0.0125274658203125, 0.00962066650390625, 0.031768798828125, 0.05391693115234375, 0.0760650634765625, 0.09821319580078125, 0.120361328125, 0.14250946044921875, 0.1646575927734375, 0.18680572509765625, 0.208953857421875, 0.23110198974609375, 0.2532501220703125, 0.27539825439453125, 0.29754638671875, 0.31969451904296875, 0.3418426513671875, 0.36399078369140625, 0.386138916015625, 0.40828704833984375, 0.4304351806640625, 0.45258331298828125, 0.4747314453125, 0.49687957763671875, 0.5190277099609375, 0.5411758422851562, 0.563323974609375, 0.5854721069335938, 0.6076202392578125, 0.6297683715820312, 0.65191650390625, 0.6740646362304688, 0.6962127685546875, 0.7183609008789062, 0.740509033203125, 0.7626571655273438, 0.7848052978515625, 0.8069534301757812, 0.8291015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 4.0, 6.0, 13.0, 16.0, 30.0, 42.0, 116.0, 166.0, 240.0, 146.0, 93.0, 61.0, 21.0, 8.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.859816551208496, -4.710173606872559, -4.560530662536621, -4.410887718200684, -4.261244773864746, -4.111601829528809, -3.961958885192871, -3.8123159408569336, -3.662672996520996, -3.5130300521850586, -3.363387107849121, -3.2137441635131836, -3.064101219177246, -2.9144582748413086, -2.764815330505371, -2.6151723861694336, -2.465529441833496, -2.3158864974975586, -2.166243553161621, -2.0166006088256836, -1.866957664489746, -1.7173147201538086, -1.567671775817871, -1.4180288314819336, -1.268385887145996, -1.1187429428100586, -0.9690999984741211, -0.8194570541381836, -0.6698141098022461, -0.5201711654663086, -0.3705282211303711, -0.2208852767944336, -0.07124185562133789, 0.07840108871459961, 0.2280440330505371, 0.3776869773864746, 0.5273299217224121, 0.6769728660583496, 0.8266158103942871, 0.9762587547302246, 1.125901699066162, 1.2755446434020996, 1.425187587738037, 1.5748305320739746, 1.724473476409912, 1.8741164207458496, 2.023759365081787, 2.1734023094177246, 2.323045253753662, 2.4726881980895996, 2.622331142425537, 2.7719740867614746, 2.921617031097412, 3.0712599754333496, 3.220902919769287, 3.3705458641052246, 3.520188808441162, 3.6698317527770996, 3.819474697113037, 3.9691176414489746, 4.118760585784912, 4.26840353012085, 4.418046474456787, 4.567689418792725, 4.717332363128662]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 3.0, 16.0, 21.0, 46.0, 66.0, 78.0, 93.0, 114.0, 134.0, 115.0, 86.0, 64.0, 57.0, 35.0, 21.0, 16.0, 12.0, 10.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.220878601074219, -5.086127758026123, -4.951376914978027, -4.81662654876709, -4.681875705718994, -4.547124862670898, -4.412374496459961, -4.277623653411865, -4.1428728103637695, -4.008121967315674, -3.8733713626861572, -3.7386207580566406, -3.603869915008545, -3.469119071960449, -3.3343684673309326, -3.199617862701416, -3.0648670196533203, -2.9301161766052246, -2.795365571975708, -2.6606149673461914, -2.5258641242980957, -2.39111328125, -2.2563626766204834, -2.121612071990967, -1.986861228942871, -1.852110505104065, -1.7173597812652588, -1.5826090574264526, -1.4478583335876465, -1.3131076097488403, -1.1783568859100342, -1.043606162071228, -0.9088551998138428, -0.7741044759750366, -0.6393537521362305, -0.5046030282974243, -0.36985230445861816, -0.235101580619812, -0.10035085678100586, 0.03439986705780029, 0.16915059089660645, 0.3039013147354126, 0.43865203857421875, 0.5734027624130249, 0.708153486251831, 0.8429042100906372, 0.9776549339294434, 1.1124056577682495, 1.2471563816070557, 1.3819071054458618, 1.516657829284668, 1.6514085531234741, 1.7861592769622803, 1.9209100008010864, 2.0556607246398926, 2.1904115676879883, 2.325162172317505, 2.4599127769470215, 2.594663619995117, 2.729414463043213, 2.8641650676727295, 2.998915672302246, 3.133666515350342, 3.2684173583984375, 3.403167963027954]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 13.0, 10.0, 29.0, 27.0, 58.0, 102.0, 184.0, 404.0, 933.0, 2928.0, 12352.0, 81451.0, 640148.0, 271237.0, 29923.0, 5987.0, 1597.0, 573.0, 289.0, 95.0, 82.0, 45.0, 23.0, 11.0, 14.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.403564453125, -0.39044189453125, -0.3773193359375, -0.36419677734375, -0.35107421875, -0.33795166015625, -0.3248291015625, -0.31170654296875, -0.298583984375, -0.28546142578125, -0.2723388671875, -0.25921630859375, -0.24609375, -0.23297119140625, -0.2198486328125, -0.20672607421875, -0.193603515625, -0.18048095703125, -0.1673583984375, -0.15423583984375, -0.14111328125, -0.12799072265625, -0.1148681640625, -0.10174560546875, -0.088623046875, -0.07550048828125, -0.0623779296875, -0.04925537109375, -0.0361328125, -0.02301025390625, -0.0098876953125, 0.00323486328125, 0.016357421875, 0.02947998046875, 0.0426025390625, 0.05572509765625, 0.06884765625, 0.08197021484375, 0.0950927734375, 0.10821533203125, 0.121337890625, 0.13446044921875, 0.1475830078125, 0.16070556640625, 0.173828125, 0.18695068359375, 0.2000732421875, 0.21319580078125, 0.226318359375, 0.23944091796875, 0.2525634765625, 0.26568603515625, 0.27880859375, 0.29193115234375, 0.3050537109375, 0.31817626953125, 0.331298828125, 0.34442138671875, 0.3575439453125, 0.37066650390625, 0.3837890625, 0.39691162109375, 0.4100341796875, 0.42315673828125, 0.436279296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 14.0, 17.0, 28.0, 67.0, 74.0, 108.0, 154.0, 162.0, 114.0, 78.0, 62.0, 34.0, 26.0, 22.0, 9.0, 12.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.58984375, -3.48779296875, -3.3857421875, -3.28369140625, -3.181640625, -3.07958984375, -2.9775390625, -2.87548828125, -2.7734375, -2.67138671875, -2.5693359375, -2.46728515625, -2.365234375, -2.26318359375, -2.1611328125, -2.05908203125, -1.95703125, -1.85498046875, -1.7529296875, -1.65087890625, -1.548828125, -1.44677734375, -1.3447265625, -1.24267578125, -1.140625, -1.03857421875, -0.9365234375, -0.83447265625, -0.732421875, -0.63037109375, -0.5283203125, -0.42626953125, -0.32421875, -0.22216796875, -0.1201171875, -0.01806640625, 0.083984375, 0.18603515625, 0.2880859375, 0.39013671875, 0.4921875, 0.59423828125, 0.6962890625, 0.79833984375, 0.900390625, 1.00244140625, 1.1044921875, 1.20654296875, 1.30859375, 1.41064453125, 1.5126953125, 1.61474609375, 1.716796875, 1.81884765625, 1.9208984375, 2.02294921875, 2.125, 2.22705078125, 2.3291015625, 2.43115234375, 2.533203125, 2.63525390625, 2.7373046875, 2.83935546875, 2.94140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 5.0, 9.0, 14.0, 14.0, 20.0, 23.0, 29.0, 25.0, 56.0, 76.0, 130.0, 156.0, 283.0, 553.0, 1157.0, 3415.0, 14137.0, 82656.0, 432652.0, 416252.0, 78068.0, 13127.0, 3254.0, 1107.0, 491.0, 290.0, 156.0, 108.0, 73.0, 55.0, 36.0, 32.0, 21.0, 14.0, 16.0, 10.0, 12.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.291748046875, -0.2823333740234375, -0.272918701171875, -0.2635040283203125, -0.25408935546875, -0.2446746826171875, -0.235260009765625, -0.2258453369140625, -0.2164306640625, -0.2070159912109375, -0.197601318359375, -0.1881866455078125, -0.17877197265625, -0.1693572998046875, -0.159942626953125, -0.1505279541015625, -0.14111328125, -0.1316986083984375, -0.122283935546875, -0.1128692626953125, -0.10345458984375, -0.0940399169921875, -0.084625244140625, -0.0752105712890625, -0.0657958984375, -0.0563812255859375, -0.046966552734375, -0.0375518798828125, -0.02813720703125, -0.0187225341796875, -0.009307861328125, 0.0001068115234375, 0.009521484375, 0.0189361572265625, 0.028350830078125, 0.0377655029296875, 0.04718017578125, 0.0565948486328125, 0.066009521484375, 0.0754241943359375, 0.0848388671875, 0.0942535400390625, 0.103668212890625, 0.1130828857421875, 0.12249755859375, 0.1319122314453125, 0.141326904296875, 0.1507415771484375, 0.16015625, 0.1695709228515625, 0.178985595703125, 0.1884002685546875, 0.19781494140625, 0.2072296142578125, 0.216644287109375, 0.2260589599609375, 0.2354736328125, 0.2448883056640625, 0.254302978515625, 0.2637176513671875, 0.27313232421875, 0.2825469970703125, 0.291961669921875, 0.3013763427734375, 0.310791015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 10.0, 11.0, 6.0, 16.0, 16.0, 22.0, 22.0, 20.0, 34.0, 48.0, 38.0, 43.0, 42.0, 49.0, 53.0, 45.0, 54.0, 37.0, 42.0, 40.0, 40.0, 43.0, 36.0, 23.0, 37.0, 29.0, 28.0, 23.0, 23.0, 19.0, 12.0, 15.0, 5.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8203125, -2.740142822265625, -2.65997314453125, -2.579803466796875, -2.4996337890625, -2.419464111328125, -2.33929443359375, -2.259124755859375, -2.178955078125, -2.098785400390625, -2.01861572265625, -1.938446044921875, -1.8582763671875, -1.778106689453125, -1.69793701171875, -1.617767333984375, -1.53759765625, -1.457427978515625, -1.37725830078125, -1.297088623046875, -1.2169189453125, -1.136749267578125, -1.05657958984375, -0.976409912109375, -0.896240234375, -0.816070556640625, -0.73590087890625, -0.655731201171875, -0.5755615234375, -0.495391845703125, -0.41522216796875, -0.335052490234375, -0.2548828125, -0.174713134765625, -0.09454345703125, -0.014373779296875, 0.0657958984375, 0.145965576171875, 0.22613525390625, 0.306304931640625, 0.386474609375, 0.466644287109375, 0.54681396484375, 0.626983642578125, 0.7071533203125, 0.787322998046875, 0.86749267578125, 0.947662353515625, 1.02783203125, 1.108001708984375, 1.18817138671875, 1.268341064453125, 1.3485107421875, 1.428680419921875, 1.50885009765625, 1.589019775390625, 1.669189453125, 1.749359130859375, 1.82952880859375, 1.909698486328125, 1.9898681640625, 2.070037841796875, 2.15020751953125, 2.230377197265625, 2.310546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 12.0, 19.0, 26.0, 39.0, 53.0, 93.0, 136.0, 262.0, 601.0, 1359.0, 5001.0, 32586.0, 520171.0, 451699.0, 29037.0, 4726.0, 1390.0, 570.0, 305.0, 182.0, 105.0, 71.0, 47.0, 19.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.189208984375, -0.18394851684570312, -0.17868804931640625, -0.17342758178710938, -0.1681671142578125, -0.16290664672851562, -0.15764617919921875, -0.15238571166992188, -0.147125244140625, -0.14186477661132812, -0.13660430908203125, -0.13134384155273438, -0.1260833740234375, -0.12082290649414062, -0.11556243896484375, -0.11030197143554688, -0.10504150390625, -0.09978103637695312, -0.09452056884765625, -0.08926010131835938, -0.0839996337890625, -0.07873916625976562, -0.07347869873046875, -0.06821823120117188, -0.062957763671875, -0.057697296142578125, -0.05243682861328125, -0.047176361083984375, -0.0419158935546875, -0.036655426025390625, -0.03139495849609375, -0.026134490966796875, -0.0208740234375, -0.015613555908203125, -0.01035308837890625, -0.005092620849609375, 0.0001678466796875, 0.005428314208984375, 0.01068878173828125, 0.015949249267578125, 0.021209716796875, 0.026470184326171875, 0.03173065185546875, 0.036991119384765625, 0.0422515869140625, 0.047512054443359375, 0.05277252197265625, 0.058032989501953125, 0.06329345703125, 0.06855392456054688, 0.07381439208984375, 0.07907485961914062, 0.0843353271484375, 0.08959579467773438, 0.09485626220703125, 0.10011672973632812, 0.105377197265625, 0.11063766479492188, 0.11589813232421875, 0.12115859985351562, 0.1264190673828125, 0.13167953491210938, 0.13694000244140625, 0.14220046997070312, 0.1474609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 16.0, 30.0, 28.0, 50.0, 68.0, 91.0, 135.0, 132.0, 102.0, 88.0, 70.0, 46.0, 44.0, 21.0, 9.0, 8.0, 9.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.029273986816406e-05, -3.849528729915619e-05, -3.6697834730148315e-05, -3.490038216114044e-05, -3.310292959213257e-05, -3.1305477023124695e-05, -2.950802445411682e-05, -2.7710571885108948e-05, -2.5913119316101074e-05, -2.41156667470932e-05, -2.2318214178085327e-05, -2.0520761609077454e-05, -1.872330904006958e-05, -1.6925856471061707e-05, -1.5128403902053833e-05, -1.333095133304596e-05, -1.1533498764038086e-05, -9.736046195030212e-06, -7.938593626022339e-06, -6.141141057014465e-06, -4.343688488006592e-06, -2.5462359189987183e-06, -7.487833499908447e-07, 1.0486692190170288e-06, 2.8461217880249023e-06, 4.643574357032776e-06, 6.441026926040649e-06, 8.238479495048523e-06, 1.0035932064056396e-05, 1.183338463306427e-05, 1.3630837202072144e-05, 1.5428289771080017e-05, 1.722574234008789e-05, 1.9023194909095764e-05, 2.0820647478103638e-05, 2.261810004711151e-05, 2.4415552616119385e-05, 2.6213005185127258e-05, 2.8010457754135132e-05, 2.9807910323143005e-05, 3.160536289215088e-05, 3.340281546115875e-05, 3.5200268030166626e-05, 3.69977205991745e-05, 3.879517316818237e-05, 4.0592625737190247e-05, 4.239007830619812e-05, 4.4187530875205994e-05, 4.598498344421387e-05, 4.778243601322174e-05, 4.9579888582229614e-05, 5.137734115123749e-05, 5.317479372024536e-05, 5.4972246289253235e-05, 5.676969885826111e-05, 5.856715142726898e-05, 6.0364603996276855e-05, 6.216205656528473e-05, 6.39595091342926e-05, 6.575696170330048e-05, 6.755441427230835e-05, 6.935186684131622e-05, 7.11493194103241e-05, 7.294677197933197e-05, 7.474422454833984e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 8.0, 8.0, 7.0, 21.0, 20.0, 25.0, 46.0, 77.0, 139.0, 282.0, 836.0, 3433.0, 22105.0, 346061.0, 629232.0, 39181.0, 5142.0, 1173.0, 351.0, 157.0, 93.0, 48.0, 38.0, 21.0, 11.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2027587890625, -0.1971454620361328, -0.19153213500976562, -0.18591880798339844, -0.18030548095703125, -0.17469215393066406, -0.16907882690429688, -0.1634654998779297, -0.1578521728515625, -0.1522388458251953, -0.14662551879882812, -0.14101219177246094, -0.13539886474609375, -0.12978553771972656, -0.12417221069335938, -0.11855888366699219, -0.112945556640625, -0.10733222961425781, -0.10171890258789062, -0.09610557556152344, -0.09049224853515625, -0.08487892150878906, -0.07926559448242188, -0.07365226745605469, -0.0680389404296875, -0.06242561340332031, -0.056812286376953125, -0.05119895935058594, -0.04558563232421875, -0.03997230529785156, -0.034358978271484375, -0.028745651245117188, -0.02313232421875, -0.017518997192382812, -0.011905670166015625, -0.0062923431396484375, -0.00067901611328125, 0.0049343109130859375, 0.010547637939453125, 0.016160964965820312, 0.0217742919921875, 0.027387619018554688, 0.033000946044921875, 0.03861427307128906, 0.04422760009765625, 0.04984092712402344, 0.055454254150390625, 0.06106758117675781, 0.066680908203125, 0.07229423522949219, 0.07790756225585938, 0.08352088928222656, 0.08913421630859375, 0.09474754333496094, 0.10036087036132812, 0.10597419738769531, 0.1115875244140625, 0.11720085144042969, 0.12281417846679688, 0.12842750549316406, 0.13404083251953125, 0.13965415954589844, 0.14526748657226562, 0.1508808135986328, 0.156494140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 11.0, 6.0, 15.0, 23.0, 23.0, 30.0, 37.0, 62.0, 83.0, 120.0, 106.0, 123.0, 100.0, 70.0, 43.0, 34.0, 33.0, 22.0, 17.0, 9.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02740478515625, -0.02633953094482422, -0.025274276733398438, -0.024209022521972656, -0.023143768310546875, -0.022078514099121094, -0.021013259887695312, -0.01994800567626953, -0.01888275146484375, -0.01781749725341797, -0.016752243041992188, -0.015686988830566406, -0.014621734619140625, -0.013556480407714844, -0.012491226196289062, -0.011425971984863281, -0.0103607177734375, -0.009295463562011719, -0.008230209350585938, -0.007164955139160156, -0.006099700927734375, -0.005034446716308594, -0.0039691925048828125, -0.0029039382934570312, -0.00183868408203125, -0.0007734298706054688, 0.0002918243408203125, 0.0013570785522460938, 0.002422332763671875, 0.0034875869750976562, 0.0045528411865234375, 0.005618095397949219, 0.006683349609375, 0.007748603820800781, 0.008813858032226562, 0.009879112243652344, 0.010944366455078125, 0.012009620666503906, 0.013074874877929688, 0.014140129089355469, 0.01520538330078125, 0.01627063751220703, 0.017335891723632812, 0.018401145935058594, 0.019466400146484375, 0.020531654357910156, 0.021596908569335938, 0.02266216278076172, 0.0237274169921875, 0.02479267120361328, 0.025857925415039062, 0.026923179626464844, 0.027988433837890625, 0.029053688049316406, 0.030118942260742188, 0.03118419647216797, 0.03224945068359375, 0.03331470489501953, 0.03437995910644531, 0.035445213317871094, 0.036510467529296875, 0.037575721740722656, 0.03864097595214844, 0.03970623016357422, 0.040771484375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 6.0, 17.0, 32.0, 71.0, 248.0, 368.0, 159.0, 59.0, 15.0, 10.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.687591791152954, -3.5144524574279785, -3.341312885284424, -3.1681735515594482, -2.9950342178344727, -2.821894884109497, -2.6487555503845215, -2.475615978240967, -2.302476644515991, -2.1293373107910156, -1.9561978578567505, -1.7830584049224854, -1.6099190711975098, -1.4367797374725342, -1.263640284538269, -1.090500831604004, -0.9173614978790283, -0.744222104549408, -0.5710827112197876, -0.39794331789016724, -0.22480392456054688, -0.051664531230926514, 0.12147486209869385, 0.294614315032959, 0.46775364875793457, 0.6408930420875549, 0.8140324354171753, 0.9871718287467957, 1.160311222076416, 1.3334505558013916, 1.5065900087356567, 1.6797294616699219, 1.8528690338134766, 2.026008367538452, 2.1991477012634277, 2.3722872734069824, 2.545426607131958, 2.7185659408569336, 2.8917055130004883, 3.064844846725464, 3.2379841804504395, 3.411123514175415, 3.5842628479003906, 3.7574024200439453, 3.930541753768921, 4.1036810874938965, 4.276820659637451, 4.449959754943848, 4.623099327087402, 4.796238899230957, 4.9693779945373535, 5.142517566680908, 5.315656661987305, 5.488796234130859, 5.661935806274414, 5.835075378417969, 6.008214473724365, 6.18135404586792, 6.354493141174316, 6.527632713317871, 6.700772285461426, 6.873911380767822, 7.047050952911377, 7.220190048217773, 7.393329620361328]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 6.0, 13.0, 21.0, 54.0, 71.0, 97.0, 135.0, 162.0, 153.0, 80.0, 76.0, 47.0, 31.0, 18.0, 13.0, 8.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0336809158325195, -3.926571846008301, -3.819462776184082, -3.7123537063598633, -3.6052446365356445, -3.498135566711426, -3.391026496887207, -3.2839174270629883, -3.1768083572387695, -3.069699287414551, -2.962590217590332, -2.8554811477661133, -2.7483720779418945, -2.641263008117676, -2.534153938293457, -2.4270448684692383, -2.3199357986450195, -2.212826728820801, -2.105717658996582, -1.9986085891723633, -1.8914995193481445, -1.7843904495239258, -1.677281379699707, -1.5701723098754883, -1.4630630016326904, -1.3559539318084717, -1.248844861984253, -1.1417357921600342, -1.0346267223358154, -0.9275175929069519, -0.8204085230827332, -0.7132994532585144, -0.6061904430389404, -0.4990813732147217, -0.39197230339050293, -0.2848632037639618, -0.17775413393974304, -0.0706450343132019, 0.036464035511016846, 0.1435731053352356, 0.25068217515945435, 0.3577912449836731, 0.46490031480789185, 0.5720094442367554, 0.6791185140609741, 0.7862275838851929, 0.8933366537094116, 1.0004457235336304, 1.1075547933578491, 1.2146638631820679, 1.3217729330062866, 1.4288820028305054, 1.5359910726547241, 1.6431002616882324, 1.7502093315124512, 1.85731840133667, 1.9644274711608887, 2.0715365409851074, 2.178645610809326, 2.285754680633545, 2.3928637504577637, 2.4999728202819824, 2.607081890106201, 2.71419095993042, 2.8213000297546387]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 11.0, 11.0, 17.0, 44.0, 45.0, 138.0, 293.0, 787.0, 2587.0, 10092.0, 55249.0, 571133.0, 360192.0, 37446.0, 7432.0, 1938.0, 653.0, 243.0, 104.0, 60.0, 29.0, 18.0, 8.0, 7.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.599609375, -2.525115966796875, -2.45062255859375, -2.376129150390625, -2.3016357421875, -2.227142333984375, -2.15264892578125, -2.078155517578125, -2.003662109375, -1.929168701171875, -1.85467529296875, -1.780181884765625, -1.7056884765625, -1.631195068359375, -1.55670166015625, -1.482208251953125, -1.40771484375, -1.333221435546875, -1.25872802734375, -1.184234619140625, -1.1097412109375, -1.035247802734375, -0.96075439453125, -0.886260986328125, -0.811767578125, -0.737274169921875, -0.66278076171875, -0.588287353515625, -0.5137939453125, -0.439300537109375, -0.36480712890625, -0.290313720703125, -0.2158203125, -0.141326904296875, -0.06683349609375, 0.007659912109375, 0.0821533203125, 0.156646728515625, 0.23114013671875, 0.305633544921875, 0.380126953125, 0.454620361328125, 0.52911376953125, 0.603607177734375, 0.6781005859375, 0.752593994140625, 0.82708740234375, 0.901580810546875, 0.97607421875, 1.050567626953125, 1.12506103515625, 1.199554443359375, 1.2740478515625, 1.348541259765625, 1.42303466796875, 1.497528076171875, 1.572021484375, 1.646514892578125, 1.72100830078125, 1.795501708984375, 1.8699951171875, 1.944488525390625, 2.01898193359375, 2.093475341796875, 2.16796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 1.0, 4.0, 9.0, 7.0, 22.0, 37.0, 64.0, 67.0, 87.0, 137.0, 181.0, 108.0, 83.0, 65.0, 39.0, 31.0, 18.0, 12.0, 8.0, 8.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.95391845703125, -8.7203369140625, -8.48675537109375, -8.253173828125, -8.01959228515625, -7.7860107421875, -7.55242919921875, -7.31884765625, -7.08526611328125, -6.8516845703125, -6.61810302734375, -6.384521484375, -6.15093994140625, -5.9173583984375, -5.68377685546875, -5.4501953125, -5.21661376953125, -4.9830322265625, -4.74945068359375, -4.515869140625, -4.28228759765625, -4.0487060546875, -3.81512451171875, -3.58154296875, -3.34796142578125, -3.1143798828125, -2.88079833984375, -2.647216796875, -2.41363525390625, -2.1800537109375, -1.94647216796875, -1.712890625, -1.47930908203125, -1.2457275390625, -1.01214599609375, -0.778564453125, -0.54498291015625, -0.3114013671875, -0.07781982421875, 0.15576171875, 0.38934326171875, 0.6229248046875, 0.85650634765625, 1.090087890625, 1.32366943359375, 1.5572509765625, 1.79083251953125, 2.0244140625, 2.25799560546875, 2.4915771484375, 2.72515869140625, 2.958740234375, 3.19232177734375, 3.4259033203125, 3.65948486328125, 3.89306640625, 4.12664794921875, 4.3602294921875, 4.59381103515625, 4.827392578125, 5.06097412109375, 5.2945556640625, 5.52813720703125, 5.76171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 8.0, 4.0, 6.0, 18.0, 17.0, 27.0, 54.0, 90.0, 144.0, 340.0, 817.0, 2527.0, 11943.0, 118611.0, 807432.0, 92718.0, 10097.0, 2221.0, 713.0, 290.0, 157.0, 110.0, 66.0, 37.0, 32.0, 22.0, 14.0, 13.0, 8.0, 0.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.673828125, -2.6060638427734375, -2.538299560546875, -2.4705352783203125, -2.40277099609375, -2.3350067138671875, -2.267242431640625, -2.1994781494140625, -2.1317138671875, -2.0639495849609375, -1.996185302734375, -1.9284210205078125, -1.86065673828125, -1.7928924560546875, -1.725128173828125, -1.6573638916015625, -1.589599609375, -1.5218353271484375, -1.454071044921875, -1.3863067626953125, -1.31854248046875, -1.2507781982421875, -1.183013916015625, -1.1152496337890625, -1.0474853515625, -0.9797210693359375, -0.911956787109375, -0.8441925048828125, -0.77642822265625, -0.7086639404296875, -0.640899658203125, -0.5731353759765625, -0.50537109375, -0.4376068115234375, -0.369842529296875, -0.3020782470703125, -0.23431396484375, -0.1665496826171875, -0.098785400390625, -0.0310211181640625, 0.0367431640625, 0.1045074462890625, 0.172271728515625, 0.2400360107421875, 0.30780029296875, 0.3755645751953125, 0.443328857421875, 0.5110931396484375, 0.578857421875, 0.6466217041015625, 0.714385986328125, 0.7821502685546875, 0.84991455078125, 0.9176788330078125, 0.985443115234375, 1.0532073974609375, 1.1209716796875, 1.1887359619140625, 1.256500244140625, 1.3242645263671875, 1.39202880859375, 1.4597930908203125, 1.527557373046875, 1.5953216552734375, 1.6630859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 2.0, 10.0, 14.0, 17.0, 11.0, 22.0, 23.0, 30.0, 27.0, 39.0, 39.0, 44.0, 51.0, 43.0, 66.0, 59.0, 33.0, 48.0, 61.0, 48.0, 39.0, 41.0, 33.0, 24.0, 26.0, 24.0, 24.0, 15.0, 17.0, 17.0, 11.0, 6.0, 7.0, 7.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3046875, -5.15875244140625, -5.0128173828125, -4.86688232421875, -4.720947265625, -4.57501220703125, -4.4290771484375, -4.28314208984375, -4.13720703125, -3.99127197265625, -3.8453369140625, -3.69940185546875, -3.553466796875, -3.40753173828125, -3.2615966796875, -3.11566162109375, -2.9697265625, -2.82379150390625, -2.6778564453125, -2.53192138671875, -2.385986328125, -2.24005126953125, -2.0941162109375, -1.94818115234375, -1.80224609375, -1.65631103515625, -1.5103759765625, -1.36444091796875, -1.218505859375, -1.07257080078125, -0.9266357421875, -0.78070068359375, -0.634765625, -0.48883056640625, -0.3428955078125, -0.19696044921875, -0.051025390625, 0.09490966796875, 0.2408447265625, 0.38677978515625, 0.53271484375, 0.67864990234375, 0.8245849609375, 0.97052001953125, 1.116455078125, 1.26239013671875, 1.4083251953125, 1.55426025390625, 1.7001953125, 1.84613037109375, 1.9920654296875, 2.13800048828125, 2.283935546875, 2.42987060546875, 2.5758056640625, 2.72174072265625, 2.86767578125, 3.01361083984375, 3.1595458984375, 3.30548095703125, 3.451416015625, 3.59735107421875, 3.7432861328125, 3.88922119140625, 4.03515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 12.0, 20.0, 18.0, 24.0, 73.0, 136.0, 296.0, 846.0, 3561.0, 35080.0, 851150.0, 146768.0, 8205.0, 1438.0, 439.0, 207.0, 105.0, 54.0, 22.0, 31.0, 23.0, 11.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.859375, -0.8246002197265625, -0.789825439453125, -0.7550506591796875, -0.72027587890625, -0.6855010986328125, -0.650726318359375, -0.6159515380859375, -0.5811767578125, -0.5464019775390625, -0.511627197265625, -0.4768524169921875, -0.44207763671875, -0.4073028564453125, -0.372528076171875, -0.3377532958984375, -0.302978515625, -0.2682037353515625, -0.233428955078125, -0.1986541748046875, -0.16387939453125, -0.1291046142578125, -0.094329833984375, -0.0595550537109375, -0.0247802734375, 0.0099945068359375, 0.044769287109375, 0.0795440673828125, 0.11431884765625, 0.1490936279296875, 0.183868408203125, 0.2186431884765625, 0.25341796875, 0.2881927490234375, 0.322967529296875, 0.3577423095703125, 0.39251708984375, 0.4272918701171875, 0.462066650390625, 0.4968414306640625, 0.5316162109375, 0.5663909912109375, 0.601165771484375, 0.6359405517578125, 0.67071533203125, 0.7054901123046875, 0.740264892578125, 0.7750396728515625, 0.809814453125, 0.8445892333984375, 0.879364013671875, 0.9141387939453125, 0.94891357421875, 0.9836883544921875, 1.018463134765625, 1.0532379150390625, 1.0880126953125, 1.1227874755859375, 1.157562255859375, 1.1923370361328125, 1.22711181640625, 1.2618865966796875, 1.296661376953125, 1.3314361572265625, 1.3662109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 11.0, 9.0, 7.0, 12.0, 13.0, 18.0, 23.0, 28.0, 32.0, 58.0, 67.0, 81.0, 106.0, 116.0, 103.0, 62.0, 59.0, 47.0, 35.0, 21.0, 26.0, 13.0, 13.0, 9.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.745359420776367e-05, -9.450037032365799e-05, -9.154714643955231e-05, -8.859392255544662e-05, -8.564069867134094e-05, -8.268747478723526e-05, -7.973425090312958e-05, -7.67810270190239e-05, -7.382780313491821e-05, -7.087457925081253e-05, -6.792135536670685e-05, -6.496813148260117e-05, -6.201490759849548e-05, -5.90616837143898e-05, -5.610845983028412e-05, -5.3155235946178436e-05, -5.0202012062072754e-05, -4.724878817796707e-05, -4.429556429386139e-05, -4.134234040975571e-05, -3.8389116525650024e-05, -3.543589264154434e-05, -3.248266875743866e-05, -2.9529444873332977e-05, -2.6576220989227295e-05, -2.3622997105121613e-05, -2.066977322101593e-05, -1.7716549336910248e-05, -1.4763325452804565e-05, -1.1810101568698883e-05, -8.8568776845932e-06, -5.903653800487518e-06, -2.950429916381836e-06, 2.7939677238464355e-09, 2.956017851829529e-06, 5.909241735935211e-06, 8.862465620040894e-06, 1.1815689504146576e-05, 1.4768913388252258e-05, 1.772213727235794e-05, 2.0675361156463623e-05, 2.3628585040569305e-05, 2.6581808924674988e-05, 2.953503280878067e-05, 3.248825669288635e-05, 3.5441480576992035e-05, 3.839470446109772e-05, 4.13479283452034e-05, 4.430115222930908e-05, 4.7254376113414764e-05, 5.020759999752045e-05, 5.316082388162613e-05, 5.611404776573181e-05, 5.9067271649837494e-05, 6.202049553394318e-05, 6.497371941804886e-05, 6.792694330215454e-05, 7.088016718626022e-05, 7.38333910703659e-05, 7.678661495447159e-05, 7.973983883857727e-05, 8.269306272268295e-05, 8.564628660678864e-05, 8.859951049089432e-05, 9.1552734375e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 17.0, 24.0, 32.0, 75.0, 195.0, 484.0, 1562.0, 8184.0, 103127.0, 867481.0, 59429.0, 5926.0, 1244.0, 398.0, 179.0, 88.0, 39.0, 17.0, 16.0, 7.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.35546875, -1.321075439453125, -1.28668212890625, -1.252288818359375, -1.2178955078125, -1.183502197265625, -1.14910888671875, -1.114715576171875, -1.080322265625, -1.045928955078125, -1.01153564453125, -0.977142333984375, -0.9427490234375, -0.908355712890625, -0.87396240234375, -0.839569091796875, -0.80517578125, -0.770782470703125, -0.73638916015625, -0.701995849609375, -0.6676025390625, -0.633209228515625, -0.59881591796875, -0.564422607421875, -0.530029296875, -0.495635986328125, -0.46124267578125, -0.426849365234375, -0.3924560546875, -0.358062744140625, -0.32366943359375, -0.289276123046875, -0.2548828125, -0.220489501953125, -0.18609619140625, -0.151702880859375, -0.1173095703125, -0.082916259765625, -0.04852294921875, -0.014129638671875, 0.020263671875, 0.054656982421875, 0.08905029296875, 0.123443603515625, 0.1578369140625, 0.192230224609375, 0.22662353515625, 0.261016845703125, 0.29541015625, 0.329803466796875, 0.36419677734375, 0.398590087890625, 0.4329833984375, 0.467376708984375, 0.50177001953125, 0.536163330078125, 0.570556640625, 0.604949951171875, 0.63934326171875, 0.673736572265625, 0.7081298828125, 0.742523193359375, 0.77691650390625, 0.811309814453125, 0.845703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 8.0, 17.0, 15.0, 32.0, 50.0, 74.0, 114.0, 198.0, 192.0, 139.0, 66.0, 38.0, 31.0, 12.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470703125, -0.45194244384765625, -0.4331817626953125, -0.41442108154296875, -0.395660400390625, -0.37689971923828125, -0.3581390380859375, -0.33937835693359375, -0.32061767578125, -0.30185699462890625, -0.2830963134765625, -0.26433563232421875, -0.245574951171875, -0.22681427001953125, -0.2080535888671875, -0.18929290771484375, -0.1705322265625, -0.15177154541015625, -0.1330108642578125, -0.11425018310546875, -0.095489501953125, -0.07672882080078125, -0.0579681396484375, -0.03920745849609375, -0.02044677734375, -0.00168609619140625, 0.0170745849609375, 0.03583526611328125, 0.054595947265625, 0.07335662841796875, 0.0921173095703125, 0.11087799072265625, 0.129638671875, 0.14839935302734375, 0.1671600341796875, 0.18592071533203125, 0.204681396484375, 0.22344207763671875, 0.2422027587890625, 0.26096343994140625, 0.27972412109375, 0.29848480224609375, 0.3172454833984375, 0.33600616455078125, 0.354766845703125, 0.37352752685546875, 0.3922882080078125, 0.41104888916015625, 0.4298095703125, 0.44857025146484375, 0.4673309326171875, 0.48609161376953125, 0.504852294921875, 0.5236129760742188, 0.5423736572265625, 0.5611343383789062, 0.57989501953125, 0.5986557006835938, 0.6174163818359375, 0.6361770629882812, 0.654937744140625, 0.6736984252929688, 0.6924591064453125, 0.7112197875976562, 0.72998046875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 25.0, 256.0, 670.0, 42.0, 12.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.647586822509766, -5.574344635009766, -4.501102447509766, -3.4278602600097656, -2.3546180725097656, -1.2813758850097656, -0.20813369750976562, 0.8651084899902344, 1.9383506774902344, 3.0115928649902344, 4.084835052490234, 5.158077239990234, 6.231319427490234, 7.304561614990234, 8.377803802490234, 9.451045989990234, 10.524288177490234, 11.597530364990234, 12.670772552490234, 13.744014739990234, 14.817256927490234, 15.890499114990234, 16.963741302490234, 18.036983489990234, 19.110225677490234, 20.183467864990234, 21.256710052490234, 22.329952239990234, 23.403194427490234, 24.476436614990234, 25.549678802490234, 26.622920989990234, 27.69615936279297, 28.76940155029297, 29.84264373779297, 30.91588592529297, 31.98912811279297, 33.06237030029297, 34.13561248779297, 35.20885467529297, 36.28209686279297, 37.35533905029297, 38.42858123779297, 39.50182342529297, 40.57506561279297, 41.64830780029297, 42.72154998779297, 43.79479217529297, 44.86803436279297, 45.94127655029297, 47.01451873779297, 48.08776092529297, 49.16100311279297, 50.23424530029297, 51.30748748779297, 52.38072967529297, 53.45397186279297, 54.52721405029297, 55.60045623779297, 56.67369842529297, 57.74694061279297, 58.82018280029297, 59.89342498779297, 60.96666717529297, 62.03990936279297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 11.0, 11.0, 10.0, 20.0, 23.0, 33.0, 37.0, 46.0, 51.0, 47.0, 62.0, 66.0, 63.0, 74.0, 76.0, 47.0, 52.0, 47.0, 43.0, 44.0, 26.0, 33.0, 17.0, 12.0, 17.0, 14.0, 10.0, 5.0, 6.0, 0.0, 3.0, 2.0, 2.0], "bins": [-16.87106704711914, -16.491321563720703, -16.111576080322266, -15.731831550598145, -15.352087020874023, -14.972341537475586, -14.592596054077148, -14.212850570678711, -13.83310604095459, -13.453360557556152, -13.073616027832031, -12.693870544433594, -12.314125061035156, -11.934380531311035, -11.554635047912598, -11.174890518188477, -10.795145034790039, -10.415399551391602, -10.03565502166748, -9.655909538269043, -9.276165008544922, -8.896419525146484, -8.516674041748047, -8.13692855834961, -7.757184028625488, -7.377439022064209, -6.99769401550293, -6.617948532104492, -6.238203525543213, -5.858458518981934, -5.478713035583496, -5.098968029022217, -4.719223499298096, -4.339478492736816, -3.959733247756958, -3.5799880027770996, -3.2002429962158203, -2.820497989654541, -2.4407527446746826, -2.061007499694824, -1.681262493133545, -1.301517367362976, -0.9217722415924072, -0.5420271158218384, -0.16228199005126953, 0.21746313571929932, 0.5972082614898682, 0.9769535064697266, 1.3566985130310059, 1.7364436388015747, 2.1161887645721436, 2.495934009552002, 2.8756790161132812, 3.2554240226745605, 3.635169267654419, 4.014914512634277, 4.394659519195557, 4.774404525756836, 5.154150009155273, 5.533895015716553, 5.913640022277832, 6.293385028839111, 6.673130035400391, 7.052875518798828, 7.432620525360107]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 11.0, 9.0, 7.0, 23.0, 25.0, 43.0, 79.0, 98.0, 153.0, 264.0, 446.0, 893.0, 1683.0, 3769.0, 10823.0, 40945.0, 346539.0, 3540196.0, 201146.0, 31395.0, 8934.0, 3366.0, 1504.0, 792.0, 451.0, 227.0, 146.0, 99.0, 77.0, 36.0, 33.0, 16.0, 20.0, 12.0, 7.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.919921875, -2.835052490234375, -2.75018310546875, -2.665313720703125, -2.5804443359375, -2.495574951171875, -2.41070556640625, -2.325836181640625, -2.240966796875, -2.156097412109375, -2.07122802734375, -1.986358642578125, -1.9014892578125, -1.816619873046875, -1.73175048828125, -1.646881103515625, -1.56201171875, -1.477142333984375, -1.39227294921875, -1.307403564453125, -1.2225341796875, -1.137664794921875, -1.05279541015625, -0.967926025390625, -0.883056640625, -0.798187255859375, -0.71331787109375, -0.628448486328125, -0.5435791015625, -0.458709716796875, -0.37384033203125, -0.288970947265625, -0.2041015625, -0.119232177734375, -0.03436279296875, 0.050506591796875, 0.1353759765625, 0.220245361328125, 0.30511474609375, 0.389984130859375, 0.474853515625, 0.559722900390625, 0.64459228515625, 0.729461669921875, 0.8143310546875, 0.899200439453125, 0.98406982421875, 1.068939208984375, 1.15380859375, 1.238677978515625, 1.32354736328125, 1.408416748046875, 1.4932861328125, 1.578155517578125, 1.66302490234375, 1.747894287109375, 1.832763671875, 1.917633056640625, 2.00250244140625, 2.087371826171875, 2.1722412109375, 2.257110595703125, 2.34197998046875, 2.426849365234375, 2.51171875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 18.0, 14.0, 47.0, 53.0, 105.0, 155.0, 190.0, 160.0, 104.0, 58.0, 35.0, 20.0, 15.0, 6.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.7147216796875, -4.577880859375, -4.4410400390625, -4.30419921875, -4.1673583984375, -4.030517578125, -3.8936767578125, -3.7568359375, -3.6199951171875, -3.483154296875, -3.3463134765625, -3.20947265625, -3.0726318359375, -2.935791015625, -2.7989501953125, -2.662109375, -2.5252685546875, -2.388427734375, -2.2515869140625, -2.11474609375, -1.9779052734375, -1.841064453125, -1.7042236328125, -1.5673828125, -1.4305419921875, -1.293701171875, -1.1568603515625, -1.02001953125, -0.8831787109375, -0.746337890625, -0.6094970703125, -0.47265625, -0.3358154296875, -0.198974609375, -0.0621337890625, 0.07470703125, 0.2115478515625, 0.348388671875, 0.4852294921875, 0.6220703125, 0.7589111328125, 0.895751953125, 1.0325927734375, 1.16943359375, 1.3062744140625, 1.443115234375, 1.5799560546875, 1.716796875, 1.8536376953125, 1.990478515625, 2.1273193359375, 2.26416015625, 2.4010009765625, 2.537841796875, 2.6746826171875, 2.8115234375, 2.9483642578125, 3.085205078125, 3.2220458984375, 3.35888671875, 3.4957275390625, 3.632568359375, 3.7694091796875, 3.90625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 9.0, 7.0, 11.0, 14.0, 31.0, 35.0, 50.0, 92.0, 147.0, 300.0, 700.0, 2035.0, 8689.0, 71866.0, 3796016.0, 290738.0, 17916.0, 3547.0, 1136.0, 426.0, 213.0, 97.0, 79.0, 34.0, 24.0, 20.0, 14.0, 11.0, 4.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.796875, -4.676055908203125, -4.55523681640625, -4.434417724609375, -4.3135986328125, -4.192779541015625, -4.07196044921875, -3.951141357421875, -3.830322265625, -3.709503173828125, -3.58868408203125, -3.467864990234375, -3.3470458984375, -3.226226806640625, -3.10540771484375, -2.984588623046875, -2.86376953125, -2.742950439453125, -2.62213134765625, -2.501312255859375, -2.3804931640625, -2.259674072265625, -2.13885498046875, -2.018035888671875, -1.897216796875, -1.776397705078125, -1.65557861328125, -1.534759521484375, -1.4139404296875, -1.293121337890625, -1.17230224609375, -1.051483154296875, -0.9306640625, -0.809844970703125, -0.68902587890625, -0.568206787109375, -0.4473876953125, -0.326568603515625, -0.20574951171875, -0.084930419921875, 0.035888671875, 0.156707763671875, 0.27752685546875, 0.398345947265625, 0.5191650390625, 0.639984130859375, 0.76080322265625, 0.881622314453125, 1.00244140625, 1.123260498046875, 1.24407958984375, 1.364898681640625, 1.4857177734375, 1.606536865234375, 1.72735595703125, 1.848175048828125, 1.968994140625, 2.089813232421875, 2.21063232421875, 2.331451416015625, 2.4522705078125, 2.573089599609375, 2.69390869140625, 2.814727783203125, 2.935546875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 6.0, 12.0, 16.0, 23.0, 29.0, 46.0, 78.0, 128.0, 203.0, 395.0, 810.0, 1240.0, 452.0, 224.0, 126.0, 80.0, 63.0, 42.0, 29.0, 16.0, 15.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62841796875, -0.6053237915039062, -0.5822296142578125, -0.5591354370117188, -0.536041259765625, -0.5129470825195312, -0.4898529052734375, -0.46675872802734375, -0.44366455078125, -0.42057037353515625, -0.3974761962890625, -0.37438201904296875, -0.351287841796875, -0.32819366455078125, -0.3050994873046875, -0.28200531005859375, -0.2589111328125, -0.23581695556640625, -0.2127227783203125, -0.18962860107421875, -0.166534423828125, -0.14344024658203125, -0.1203460693359375, -0.09725189208984375, -0.07415771484375, -0.05106353759765625, -0.0279693603515625, -0.00487518310546875, 0.018218994140625, 0.04131317138671875, 0.0644073486328125, 0.08750152587890625, 0.110595703125, 0.13368988037109375, 0.1567840576171875, 0.17987823486328125, 0.202972412109375, 0.22606658935546875, 0.2491607666015625, 0.27225494384765625, 0.29534912109375, 0.31844329833984375, 0.3415374755859375, 0.36463165283203125, 0.387725830078125, 0.41082000732421875, 0.4339141845703125, 0.45700836181640625, 0.4801025390625, 0.5031967163085938, 0.5262908935546875, 0.5493850708007812, 0.572479248046875, 0.5955734252929688, 0.6186676025390625, 0.6417617797851562, 0.66485595703125, 0.6879501342773438, 0.7110443115234375, 0.7341384887695312, 0.757232666015625, 0.7803268432617188, 0.8034210205078125, 0.8265151977539062, 0.849609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 11.0, 15.0, 29.0, 50.0, 116.0, 224.0, 257.0, 147.0, 67.0, 34.0, 12.0, 13.0, 4.0, 3.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.455747604370117, -4.291762351989746, -4.127776622772217, -3.9637913703918457, -3.7998058795928955, -3.6358203887939453, -3.471834897994995, -3.307849407196045, -3.143864154815674, -2.9798786640167236, -2.8158931732177734, -2.6519079208374023, -2.487922430038452, -2.323936939239502, -2.1599514484405518, -1.9959660768508911, -1.8319804668426514, -1.6679949760437012, -1.5040096044540405, -1.3400241136550903, -1.1760387420654297, -1.0120532512664795, -0.8480677604675293, -0.6840823888778687, -0.5200968980789185, -0.35611146688461304, -0.19212600588798523, -0.028140544891357422, 0.135844886302948, 0.2998303174972534, 0.4638158082962036, 0.6278011798858643, 0.7917866706848145, 0.9557721018791199, 1.1197575330734253, 1.2837430238723755, 1.4477283954620361, 1.6117138862609863, 1.7756993770599365, 1.9396847486495972, 2.103670120239258, 2.267655611038208, 2.431641101837158, 2.5956263542175293, 2.7596118450164795, 2.9235973358154297, 3.08758282661438, 3.25156831741333, 3.4155538082122803, 3.5795392990112305, 3.7435247898101807, 3.907510280609131, 4.071495532989502, 4.235481262207031, 4.399466514587402, 4.563451766967773, 4.727437496185303, 4.891422748565674, 5.055408477783203, 5.219393730163574, 5.3833794593811035, 5.547364711761475, 5.711350440979004, 5.875335693359375, 6.039320945739746]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 8.0, 11.0, 22.0, 27.0, 43.0, 54.0, 72.0, 103.0, 114.0, 110.0, 120.0, 86.0, 70.0, 41.0, 43.0, 30.0, 14.0, 10.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.138020038604736, -4.023368835449219, -3.908717393875122, -3.7940659523010254, -3.6794145107269287, -3.564763069152832, -3.4501118659973145, -3.3354604244232178, -3.220808982849121, -3.1061575412750244, -2.991506338119507, -2.87685489654541, -2.7622034549713135, -2.647552013397217, -2.532900810241699, -2.4182493686676025, -2.303598165512085, -2.1889467239379883, -2.0742955207824707, -1.959644079208374, -1.8449926376342773, -1.7303413152694702, -1.615689992904663, -1.5010385513305664, -1.3863872289657593, -1.2717359066009521, -1.1570844650268555, -1.0424331426620483, -0.9277817606925964, -0.8131303787231445, -0.6984790563583374, -0.5838276743888855, -0.4691760540008545, -0.3545246720314026, -0.23987331986427307, -0.12522196769714355, -0.01057058572769165, 0.10408079624176025, 0.21873211860656738, 0.3333835005760193, 0.4480348825454712, 0.5626862645149231, 0.677337646484375, 0.7919889688491821, 0.906640350818634, 1.021291732788086, 1.135943055152893, 1.2505943775177002, 1.3652458190917969, 1.479897141456604, 1.5945485830307007, 1.7091999053955078, 1.8238513469696045, 1.9385026693344116, 2.0531539916992188, 2.1678054332733154, 2.282456874847412, 2.397108316421509, 2.5117595195770264, 2.626410961151123, 2.7410624027252197, 2.8557138442993164, 2.970365047454834, 3.0850164890289307, 3.1996676921844482]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 22.0, 26.0, 41.0, 84.0, 187.0, 366.0, 1066.0, 3856.0, 30071.0, 626803.0, 363542.0, 18151.0, 2893.0, 805.0, 319.0, 120.0, 70.0, 50.0, 28.0, 17.0, 9.0, 6.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62646484375, -0.6085128784179688, -0.5905609130859375, -0.5726089477539062, -0.554656982421875, -0.5367050170898438, -0.5187530517578125, -0.5008010864257812, -0.48284912109375, -0.46489715576171875, -0.4469451904296875, -0.42899322509765625, -0.411041259765625, -0.39308929443359375, -0.3751373291015625, -0.35718536376953125, -0.3392333984375, -0.32128143310546875, -0.3033294677734375, -0.28537750244140625, -0.267425537109375, -0.24947357177734375, -0.2315216064453125, -0.21356964111328125, -0.19561767578125, -0.17766571044921875, -0.1597137451171875, -0.14176177978515625, -0.123809814453125, -0.10585784912109375, -0.0879058837890625, -0.06995391845703125, -0.052001953125, -0.03404998779296875, -0.0160980224609375, 0.00185394287109375, 0.019805908203125, 0.03775787353515625, 0.0557098388671875, 0.07366180419921875, 0.09161376953125, 0.10956573486328125, 0.1275177001953125, 0.14546966552734375, 0.163421630859375, 0.18137359619140625, 0.1993255615234375, 0.21727752685546875, 0.2352294921875, 0.25318145751953125, 0.2711334228515625, 0.28908538818359375, 0.307037353515625, 0.32498931884765625, 0.3429412841796875, 0.36089324951171875, 0.37884521484375, 0.39679718017578125, 0.4147491455078125, 0.43270111083984375, 0.450653076171875, 0.46860504150390625, 0.4865570068359375, 0.5045089721679688, 0.5224609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 11.0, 12.0, 17.0, 17.0, 35.0, 59.0, 82.0, 130.0, 133.0, 143.0, 113.0, 84.0, 63.0, 36.0, 27.0, 11.0, 8.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.080078125, -2.983917236328125, -2.88775634765625, -2.791595458984375, -2.6954345703125, -2.599273681640625, -2.50311279296875, -2.406951904296875, -2.310791015625, -2.214630126953125, -2.11846923828125, -2.022308349609375, -1.9261474609375, -1.829986572265625, -1.73382568359375, -1.637664794921875, -1.54150390625, -1.445343017578125, -1.34918212890625, -1.253021240234375, -1.1568603515625, -1.060699462890625, -0.96453857421875, -0.868377685546875, -0.772216796875, -0.676055908203125, -0.57989501953125, -0.483734130859375, -0.3875732421875, -0.291412353515625, -0.19525146484375, -0.099090576171875, -0.0029296875, 0.093231201171875, 0.18939208984375, 0.285552978515625, 0.3817138671875, 0.477874755859375, 0.57403564453125, 0.670196533203125, 0.766357421875, 0.862518310546875, 0.95867919921875, 1.054840087890625, 1.1510009765625, 1.247161865234375, 1.34332275390625, 1.439483642578125, 1.53564453125, 1.631805419921875, 1.72796630859375, 1.824127197265625, 1.9202880859375, 2.016448974609375, 2.11260986328125, 2.208770751953125, 2.304931640625, 2.401092529296875, 2.49725341796875, 2.593414306640625, 2.6895751953125, 2.785736083984375, 2.88189697265625, 2.978057861328125, 3.07421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 12.0, 29.0, 37.0, 61.0, 88.0, 177.0, 322.0, 704.0, 1978.0, 7857.0, 58314.0, 505944.0, 417046.0, 45997.0, 6790.0, 1817.0, 648.0, 314.0, 150.0, 92.0, 43.0, 36.0, 23.0, 14.0, 14.0, 10.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23681640625, -0.22602081298828125, -0.2152252197265625, -0.20442962646484375, -0.193634033203125, -0.18283843994140625, -0.1720428466796875, -0.16124725341796875, -0.15045166015625, -0.13965606689453125, -0.1288604736328125, -0.11806488037109375, -0.107269287109375, -0.09647369384765625, -0.0856781005859375, -0.07488250732421875, -0.0640869140625, -0.05329132080078125, -0.0424957275390625, -0.03170013427734375, -0.020904541015625, -0.01010894775390625, 0.0006866455078125, 0.01148223876953125, 0.02227783203125, 0.03307342529296875, 0.0438690185546875, 0.05466461181640625, 0.065460205078125, 0.07625579833984375, 0.0870513916015625, 0.09784698486328125, 0.108642578125, 0.11943817138671875, 0.1302337646484375, 0.14102935791015625, 0.151824951171875, 0.16262054443359375, 0.1734161376953125, 0.18421173095703125, 0.19500732421875, 0.20580291748046875, 0.2165985107421875, 0.22739410400390625, 0.238189697265625, 0.24898529052734375, 0.2597808837890625, 0.27057647705078125, 0.2813720703125, 0.29216766357421875, 0.3029632568359375, 0.31375885009765625, 0.324554443359375, 0.33535003662109375, 0.3461456298828125, 0.35694122314453125, 0.36773681640625, 0.37853240966796875, 0.3893280029296875, 0.40012359619140625, 0.410919189453125, 0.42171478271484375, 0.4325103759765625, 0.44330596923828125, 0.4541015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 6.0, 9.0, 13.0, 13.0, 18.0, 33.0, 28.0, 37.0, 60.0, 59.0, 44.0, 56.0, 61.0, 65.0, 70.0, 57.0, 52.0, 68.0, 57.0, 38.0, 24.0, 24.0, 24.0, 24.0, 14.0, 14.0, 6.0, 12.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.19024658203125, -2.0836181640625, -1.97698974609375, -1.870361328125, -1.76373291015625, -1.6571044921875, -1.55047607421875, -1.44384765625, -1.33721923828125, -1.2305908203125, -1.12396240234375, -1.017333984375, -0.91070556640625, -0.8040771484375, -0.69744873046875, -0.5908203125, -0.48419189453125, -0.3775634765625, -0.27093505859375, -0.164306640625, -0.05767822265625, 0.0489501953125, 0.15557861328125, 0.26220703125, 0.36883544921875, 0.4754638671875, 0.58209228515625, 0.688720703125, 0.79534912109375, 0.9019775390625, 1.00860595703125, 1.115234375, 1.22186279296875, 1.3284912109375, 1.43511962890625, 1.541748046875, 1.64837646484375, 1.7550048828125, 1.86163330078125, 1.96826171875, 2.07489013671875, 2.1815185546875, 2.28814697265625, 2.394775390625, 2.50140380859375, 2.6080322265625, 2.71466064453125, 2.8212890625, 2.92791748046875, 3.0345458984375, 3.14117431640625, 3.247802734375, 3.35443115234375, 3.4610595703125, 3.56768798828125, 3.67431640625, 3.78094482421875, 3.8875732421875, 3.99420166015625, 4.100830078125, 4.20745849609375, 4.3140869140625, 4.42071533203125, 4.52734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 11.0, 19.0, 21.0, 50.0, 121.0, 257.0, 953.0, 7524.0, 517951.0, 512735.0, 7546.0, 919.0, 235.0, 111.0, 41.0, 23.0, 15.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1893310546875, -0.1803150177001953, -0.17129898071289062, -0.16228294372558594, -0.15326690673828125, -0.14425086975097656, -0.13523483276367188, -0.1262187957763672, -0.1172027587890625, -0.10818672180175781, -0.09917068481445312, -0.09015464782714844, -0.08113861083984375, -0.07212257385253906, -0.06310653686523438, -0.05409049987792969, -0.045074462890625, -0.03605842590332031, -0.027042388916015625, -0.018026351928710938, -0.00901031494140625, 5.7220458984375e-06, 0.009021759033203125, 0.018037796020507812, 0.0270538330078125, 0.03606986999511719, 0.045085906982421875, 0.05410194396972656, 0.06311798095703125, 0.07213401794433594, 0.08115005493164062, 0.09016609191894531, 0.09918212890625, 0.10819816589355469, 0.11721420288085938, 0.12623023986816406, 0.13524627685546875, 0.14426231384277344, 0.15327835083007812, 0.1622943878173828, 0.1713104248046875, 0.1803264617919922, 0.18934249877929688, 0.19835853576660156, 0.20737457275390625, 0.21639060974121094, 0.22540664672851562, 0.2344226837158203, 0.243438720703125, 0.2524547576904297, 0.2614707946777344, 0.27048683166503906, 0.27950286865234375, 0.28851890563964844, 0.2975349426269531, 0.3065509796142578, 0.3155670166015625, 0.3245830535888672, 0.3335990905761719, 0.34261512756347656, 0.35163116455078125, 0.36064720153808594, 0.3696632385253906, 0.3786792755126953, 0.3876953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 19.0, 28.0, 63.0, 90.0, 159.0, 178.0, 149.0, 133.0, 67.0, 38.0, 23.0, 16.0, 13.0, 9.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010418891906738281, -0.00010157190263271332, -9.895488619804382e-05, -9.633786976337433e-05, -9.372085332870483e-05, -9.110383689403534e-05, -8.848682045936584e-05, -8.586980402469635e-05, -8.325278759002686e-05, -8.063577115535736e-05, -7.801875472068787e-05, -7.540173828601837e-05, -7.278472185134888e-05, -7.016770541667938e-05, -6.755068898200989e-05, -6.493367254734039e-05, -6.23166561126709e-05, -5.9699639678001404e-05, -5.708262324333191e-05, -5.4465606808662415e-05, -5.184859037399292e-05, -4.9231573939323425e-05, -4.661455750465393e-05, -4.3997541069984436e-05, -4.138052463531494e-05, -3.876350820064545e-05, -3.614649176597595e-05, -3.352947533130646e-05, -3.091245889663696e-05, -2.8295442461967468e-05, -2.5678426027297974e-05, -2.306140959262848e-05, -2.0444393157958984e-05, -1.782737672328949e-05, -1.5210360288619995e-05, -1.25933438539505e-05, -9.976327419281006e-06, -7.359310984611511e-06, -4.742294549942017e-06, -2.125278115272522e-06, 4.917383193969727e-07, 3.1087547540664673e-06, 5.725771188735962e-06, 8.342787623405457e-06, 1.0959804058074951e-05, 1.3576820492744446e-05, 1.619383692741394e-05, 1.8810853362083435e-05, 2.142786979675293e-05, 2.4044886231422424e-05, 2.666190266609192e-05, 2.9278919100761414e-05, 3.189593553543091e-05, 3.45129519701004e-05, 3.71299684047699e-05, 3.974698483943939e-05, 4.236400127410889e-05, 4.498101770877838e-05, 4.7598034143447876e-05, 5.021505057811737e-05, 5.2832067012786865e-05, 5.544908344745636e-05, 5.8066099882125854e-05, 6.068311631679535e-05, 6.330013275146484e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 14.0, 22.0, 35.0, 75.0, 162.0, 431.0, 2364.0, 125101.0, 910959.0, 8220.0, 794.0, 199.0, 67.0, 45.0, 19.0, 15.0, 7.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25244140625, -0.2410736083984375, -0.229705810546875, -0.2183380126953125, -0.20697021484375, -0.1956024169921875, -0.184234619140625, -0.1728668212890625, -0.1614990234375, -0.1501312255859375, -0.138763427734375, -0.1273956298828125, -0.11602783203125, -0.1046600341796875, -0.093292236328125, -0.0819244384765625, -0.070556640625, -0.0591888427734375, -0.047821044921875, -0.0364532470703125, -0.02508544921875, -0.0137176513671875, -0.002349853515625, 0.0090179443359375, 0.0203857421875, 0.0317535400390625, 0.043121337890625, 0.0544891357421875, 0.06585693359375, 0.0772247314453125, 0.088592529296875, 0.0999603271484375, 0.111328125, 0.1226959228515625, 0.134063720703125, 0.1454315185546875, 0.15679931640625, 0.1681671142578125, 0.179534912109375, 0.1909027099609375, 0.2022705078125, 0.2136383056640625, 0.225006103515625, 0.2363739013671875, 0.24774169921875, 0.2591094970703125, 0.270477294921875, 0.2818450927734375, 0.293212890625, 0.3045806884765625, 0.315948486328125, 0.3273162841796875, 0.33868408203125, 0.3500518798828125, 0.361419677734375, 0.3727874755859375, 0.3841552734375, 0.3955230712890625, 0.406890869140625, 0.4182586669921875, 0.42962646484375, 0.4409942626953125, 0.452362060546875, 0.4637298583984375, 0.47509765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 21.0, 41.0, 136.0, 290.0, 290.0, 118.0, 46.0, 20.0, 10.0, 8.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11572265625, -0.11296749114990234, -0.11021232604980469, -0.10745716094970703, -0.10470199584960938, -0.10194683074951172, -0.09919166564941406, -0.0964365005493164, -0.09368133544921875, -0.0909261703491211, -0.08817100524902344, -0.08541584014892578, -0.08266067504882812, -0.07990550994873047, -0.07715034484863281, -0.07439517974853516, -0.0716400146484375, -0.06888484954833984, -0.06612968444824219, -0.06337451934814453, -0.060619354248046875, -0.05786418914794922, -0.05510902404785156, -0.052353858947753906, -0.04959869384765625, -0.046843528747558594, -0.04408836364746094, -0.04133319854736328, -0.038578033447265625, -0.03582286834716797, -0.03306770324707031, -0.030312538146972656, -0.027557373046875, -0.024802207946777344, -0.022047042846679688, -0.01929187774658203, -0.016536712646484375, -0.013781547546386719, -0.011026382446289062, -0.008271217346191406, -0.00551605224609375, -0.0027608871459960938, -5.7220458984375e-06, 0.0027494430541992188, 0.005504608154296875, 0.008259773254394531, 0.011014938354492188, 0.013770103454589844, 0.0165252685546875, 0.019280433654785156, 0.022035598754882812, 0.02479076385498047, 0.027545928955078125, 0.03030109405517578, 0.03305625915527344, 0.035811424255371094, 0.03856658935546875, 0.041321754455566406, 0.04407691955566406, 0.04683208465576172, 0.049587249755859375, 0.05234241485595703, 0.05509757995605469, 0.057852745056152344, 0.06060791015625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 13.0, 33.0, 90.0, 304.0, 374.0, 106.0, 39.0, 13.0, 13.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.638274669647217, -3.457681655883789, -3.2770886421203613, -3.0964956283569336, -2.915902614593506, -2.735309600830078, -2.5547165870666504, -2.3741235733032227, -2.193530559539795, -2.012937545776367, -1.8323445320129395, -1.6517515182495117, -1.471158504486084, -1.2905654907226562, -1.109972596168518, -0.9293795824050903, -0.7487866878509521, -0.5681936740875244, -0.38760069012641907, -0.20700770616531372, -0.026414692401885986, 0.15417832136154175, 0.3347712755203247, 0.5153642892837524, 0.6959573030471802, 0.8765503168106079, 1.0571433305740356, 1.2377362251281738, 1.4183292388916016, 1.5989222526550293, 1.779515266418457, 1.9601082801818848, 2.1407012939453125, 2.3212943077087402, 2.501887321472168, 2.6824803352355957, 2.8630733489990234, 3.043666362762451, 3.224259376525879, 3.4048523902893066, 3.5854454040527344, 3.766038417816162, 3.94663143157959, 4.127224445343018, 4.307817459106445, 4.488410472869873, 4.669003486633301, 4.8495965003967285, 5.030189514160156, 5.210782527923584, 5.391375541687012, 5.5719685554504395, 5.752561569213867, 5.933154582977295, 6.113747596740723, 6.29434061050415, 6.47493314743042, 6.655526161193848, 6.836119174957275, 7.016712188720703, 7.197305202484131, 7.377898216247559, 7.558491230010986, 7.739084243774414, 7.919677257537842]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 8.0, 15.0, 16.0, 29.0, 42.0, 68.0, 83.0, 134.0, 160.0, 130.0, 119.0, 58.0, 53.0, 34.0, 18.0, 11.0, 9.0, 2.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.435612916946411, -3.3394315242767334, -3.2432503700256348, -3.147068977355957, -3.0508875846862793, -2.9547061920166016, -2.858525037765503, -2.762343645095825, -2.6661622524261475, -2.5699808597564697, -2.473799705505371, -2.3776183128356934, -2.2814369201660156, -2.185255527496338, -2.0890743732452393, -1.9928929805755615, -1.8967117071151733, -1.8005304336547852, -1.7043490409851074, -1.6081677675247192, -1.5119863748550415, -1.4158051013946533, -1.3196237087249756, -1.2234424352645874, -1.1272611618041992, -1.031079888343811, -0.9348984956741333, -0.8387172222137451, -0.7425358295440674, -0.6463545560836792, -0.5501732230186462, -0.4539918899536133, -0.35781049728393555, -0.2616291642189026, -0.16544784605503082, -0.06926652789115906, 0.0269148051738739, 0.12309613823890686, 0.21927744150161743, 0.3154587745666504, 0.41164010763168335, 0.5078214406967163, 0.6040027737617493, 0.7001841068267822, 0.7963653802871704, 0.8925467729568481, 0.9887280464172363, 1.084909439086914, 1.1810907125473022, 1.2772719860076904, 1.3734533786773682, 1.4696346521377563, 1.565816044807434, 1.6619973182678223, 1.7581787109375, 1.8543599843978882, 1.9505412578582764, 2.046722650527954, 2.1429038047790527, 2.2390851974487305, 2.335266590118408, 2.431447982788086, 2.5276291370391846, 2.6238105297088623, 2.71999192237854]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 7.0, 17.0, 19.0, 28.0, 40.0, 57.0, 91.0, 132.0, 204.0, 401.0, 652.0, 1092.0, 2188.0, 4725.0, 11189.0, 32386.0, 132629.0, 638124.0, 163840.0, 37401.0, 12593.0, 5241.0, 2482.0, 1211.0, 702.0, 430.0, 230.0, 146.0, 88.0, 65.0, 38.0, 32.0, 21.0, 15.0, 10.0, 8.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.224578857421875, -1.18450927734375, -1.144439697265625, -1.1043701171875, -1.064300537109375, -1.02423095703125, -0.984161376953125, -0.944091796875, -0.904022216796875, -0.86395263671875, -0.823883056640625, -0.7838134765625, -0.743743896484375, -0.70367431640625, -0.663604736328125, -0.62353515625, -0.583465576171875, -0.54339599609375, -0.503326416015625, -0.4632568359375, -0.423187255859375, -0.38311767578125, -0.343048095703125, -0.302978515625, -0.262908935546875, -0.22283935546875, -0.182769775390625, -0.1427001953125, -0.102630615234375, -0.06256103515625, -0.022491455078125, 0.017578125, 0.057647705078125, 0.09771728515625, 0.137786865234375, 0.1778564453125, 0.217926025390625, 0.25799560546875, 0.298065185546875, 0.338134765625, 0.378204345703125, 0.41827392578125, 0.458343505859375, 0.4984130859375, 0.538482666015625, 0.57855224609375, 0.618621826171875, 0.65869140625, 0.698760986328125, 0.73883056640625, 0.778900146484375, 0.8189697265625, 0.859039306640625, 0.89910888671875, 0.939178466796875, 0.979248046875, 1.019317626953125, 1.05938720703125, 1.099456787109375, 1.1395263671875, 1.179595947265625, 1.21966552734375, 1.259735107421875, 1.2998046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 8.0, 10.0, 11.0, 19.0, 22.0, 44.0, 56.0, 77.0, 117.0, 149.0, 118.0, 106.0, 90.0, 40.0, 42.0, 37.0, 12.0, 12.0, 12.0, 7.0, 2.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.81451416015625, -6.6251220703125, -6.43572998046875, -6.246337890625, -6.05694580078125, -5.8675537109375, -5.67816162109375, -5.48876953125, -5.29937744140625, -5.1099853515625, -4.92059326171875, -4.731201171875, -4.54180908203125, -4.3524169921875, -4.16302490234375, -3.9736328125, -3.78424072265625, -3.5948486328125, -3.40545654296875, -3.216064453125, -3.02667236328125, -2.8372802734375, -2.64788818359375, -2.45849609375, -2.26910400390625, -2.0797119140625, -1.89031982421875, -1.700927734375, -1.51153564453125, -1.3221435546875, -1.13275146484375, -0.943359375, -0.75396728515625, -0.5645751953125, -0.37518310546875, -0.185791015625, 0.00360107421875, 0.1929931640625, 0.38238525390625, 0.57177734375, 0.76116943359375, 0.9505615234375, 1.13995361328125, 1.329345703125, 1.51873779296875, 1.7081298828125, 1.89752197265625, 2.0869140625, 2.27630615234375, 2.4656982421875, 2.65509033203125, 2.844482421875, 3.03387451171875, 3.2232666015625, 3.41265869140625, 3.60205078125, 3.79144287109375, 3.9808349609375, 4.17022705078125, 4.359619140625, 4.54901123046875, 4.7384033203125, 4.92779541015625, 5.1171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 3.0, 8.0, 14.0, 16.0, 25.0, 29.0, 38.0, 66.0, 77.0, 104.0, 147.0, 260.0, 442.0, 803.0, 1774.0, 4388.0, 14098.0, 66925.0, 633826.0, 274717.0, 36024.0, 8864.0, 3022.0, 1282.0, 624.0, 334.0, 201.0, 121.0, 78.0, 59.0, 37.0, 27.0, 24.0, 13.0, 15.0, 7.0, 14.0, 7.0, 5.0, 9.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4462890625, -1.4022216796875, -1.358154296875, -1.3140869140625, -1.27001953125, -1.2259521484375, -1.181884765625, -1.1378173828125, -1.09375, -1.0496826171875, -1.005615234375, -0.9615478515625, -0.91748046875, -0.8734130859375, -0.829345703125, -0.7852783203125, -0.7412109375, -0.6971435546875, -0.653076171875, -0.6090087890625, -0.56494140625, -0.5208740234375, -0.476806640625, -0.4327392578125, -0.388671875, -0.3446044921875, -0.300537109375, -0.2564697265625, -0.21240234375, -0.1683349609375, -0.124267578125, -0.0802001953125, -0.0361328125, 0.0079345703125, 0.052001953125, 0.0960693359375, 0.14013671875, 0.1842041015625, 0.228271484375, 0.2723388671875, 0.31640625, 0.3604736328125, 0.404541015625, 0.4486083984375, 0.49267578125, 0.5367431640625, 0.580810546875, 0.6248779296875, 0.6689453125, 0.7130126953125, 0.757080078125, 0.8011474609375, 0.84521484375, 0.8892822265625, 0.933349609375, 0.9774169921875, 1.021484375, 1.0655517578125, 1.109619140625, 1.1536865234375, 1.19775390625, 1.2418212890625, 1.285888671875, 1.3299560546875, 1.3740234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 8.0, 17.0, 17.0, 16.0, 26.0, 24.0, 32.0, 19.0, 42.0, 36.0, 39.0, 37.0, 47.0, 45.0, 50.0, 51.0, 38.0, 39.0, 51.0, 45.0, 44.0, 29.0, 32.0, 32.0, 29.0, 21.0, 24.0, 17.0, 20.0, 10.0, 11.0, 9.0, 10.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.304229736328125, -3.18463134765625, -3.065032958984375, -2.9454345703125, -2.825836181640625, -2.70623779296875, -2.586639404296875, -2.467041015625, -2.347442626953125, -2.22784423828125, -2.108245849609375, -1.9886474609375, -1.869049072265625, -1.74945068359375, -1.629852294921875, -1.51025390625, -1.390655517578125, -1.27105712890625, -1.151458740234375, -1.0318603515625, -0.912261962890625, -0.79266357421875, -0.673065185546875, -0.553466796875, -0.433868408203125, -0.31427001953125, -0.194671630859375, -0.0750732421875, 0.044525146484375, 0.16412353515625, 0.283721923828125, 0.4033203125, 0.522918701171875, 0.64251708984375, 0.762115478515625, 0.8817138671875, 1.001312255859375, 1.12091064453125, 1.240509033203125, 1.360107421875, 1.479705810546875, 1.59930419921875, 1.718902587890625, 1.8385009765625, 1.958099365234375, 2.07769775390625, 2.197296142578125, 2.31689453125, 2.436492919921875, 2.55609130859375, 2.675689697265625, 2.7952880859375, 2.914886474609375, 3.03448486328125, 3.154083251953125, 3.273681640625, 3.393280029296875, 3.51287841796875, 3.632476806640625, 3.7520751953125, 3.871673583984375, 3.99127197265625, 4.110870361328125, 4.23046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 15.0, 12.0, 15.0, 24.0, 43.0, 47.0, 78.0, 140.0, 227.0, 459.0, 1040.0, 2463.0, 9229.0, 52995.0, 681335.0, 264107.0, 27186.0, 5605.0, 1811.0, 726.0, 369.0, 191.0, 131.0, 77.0, 54.0, 40.0, 29.0, 24.0, 15.0, 9.0, 2.0, 10.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.82861328125, -0.8072738647460938, -0.7859344482421875, -0.7645950317382812, -0.743255615234375, -0.7219161987304688, -0.7005767822265625, -0.6792373657226562, -0.65789794921875, -0.6365585327148438, -0.6152191162109375, -0.5938796997070312, -0.572540283203125, -0.5512008666992188, -0.5298614501953125, -0.5085220336914062, -0.4871826171875, -0.46584320068359375, -0.4445037841796875, -0.42316436767578125, -0.401824951171875, -0.38048553466796875, -0.3591461181640625, -0.33780670166015625, -0.31646728515625, -0.29512786865234375, -0.2737884521484375, -0.25244903564453125, -0.231109619140625, -0.20977020263671875, -0.1884307861328125, -0.16709136962890625, -0.145751953125, -0.12441253662109375, -0.1030731201171875, -0.08173370361328125, -0.060394287109375, -0.03905487060546875, -0.0177154541015625, 0.00362396240234375, 0.02496337890625, 0.04630279541015625, 0.0676422119140625, 0.08898162841796875, 0.110321044921875, 0.13166046142578125, 0.1529998779296875, 0.17433929443359375, 0.1956787109375, 0.21701812744140625, 0.2383575439453125, 0.25969696044921875, 0.281036376953125, 0.30237579345703125, 0.3237152099609375, 0.34505462646484375, 0.36639404296875, 0.38773345947265625, 0.4090728759765625, 0.43041229248046875, 0.451751708984375, 0.47309112548828125, 0.4944305419921875, 0.5157699584960938, 0.537109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 9.0, 13.0, 29.0, 25.0, 39.0, 46.0, 82.0, 128.0, 220.0, 131.0, 83.0, 61.0, 47.0, 29.0, 12.0, 8.0, 15.0, 8.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.857250213623047e-05, -8.464045822620392e-05, -8.070841431617737e-05, -7.677637040615082e-05, -7.284432649612427e-05, -6.891228258609772e-05, -6.498023867607117e-05, -6.104819476604462e-05, -5.7116150856018066e-05, -5.3184106945991516e-05, -4.9252063035964966e-05, -4.5320019125938416e-05, -4.1387975215911865e-05, -3.7455931305885315e-05, -3.3523887395858765e-05, -2.9591843485832214e-05, -2.5659799575805664e-05, -2.1727755665779114e-05, -1.7795711755752563e-05, -1.3863667845726013e-05, -9.931623935699463e-06, -5.999580025672913e-06, -2.0675361156463623e-06, 1.864507794380188e-06, 5.796551704406738e-06, 9.728595614433289e-06, 1.3660639524459839e-05, 1.759268343448639e-05, 2.152472734451294e-05, 2.545677125453949e-05, 2.938881516456604e-05, 3.332085907459259e-05, 3.725290298461914e-05, 4.118494689464569e-05, 4.511699080467224e-05, 4.904903471469879e-05, 5.298107862472534e-05, 5.691312253475189e-05, 6.084516644477844e-05, 6.477721035480499e-05, 6.870925426483154e-05, 7.26412981748581e-05, 7.657334208488464e-05, 8.05053859949112e-05, 8.443742990493774e-05, 8.83694738149643e-05, 9.230151772499084e-05, 9.62335616350174e-05, 0.00010016560554504395, 0.0001040976494550705, 0.00010802969336509705, 0.0001119617372751236, 0.00011589378118515015, 0.0001198258250951767, 0.00012375786900520325, 0.0001276899129152298, 0.00013162195682525635, 0.0001355540007352829, 0.00013948604464530945, 0.000143418088555336, 0.00014735013246536255, 0.0001512821763753891, 0.00015521422028541565, 0.0001591462641954422, 0.00016307830810546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 9.0, 6.0, 8.0, 21.0, 22.0, 34.0, 59.0, 107.0, 214.0, 443.0, 1174.0, 4482.0, 27572.0, 637744.0, 350451.0, 20660.0, 3678.0, 1027.0, 400.0, 178.0, 87.0, 64.0, 32.0, 31.0, 14.0, 9.0, 13.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.72119140625, -0.6933822631835938, -0.6655731201171875, -0.6377639770507812, -0.609954833984375, -0.5821456909179688, -0.5543365478515625, -0.5265274047851562, -0.49871826171875, -0.47090911865234375, -0.4430999755859375, -0.41529083251953125, -0.387481689453125, -0.35967254638671875, -0.3318634033203125, -0.30405426025390625, -0.2762451171875, -0.24843597412109375, -0.2206268310546875, -0.19281768798828125, -0.165008544921875, -0.13719940185546875, -0.1093902587890625, -0.08158111572265625, -0.05377197265625, -0.02596282958984375, 0.0018463134765625, 0.02965545654296875, 0.057464599609375, 0.08527374267578125, 0.1130828857421875, 0.14089202880859375, 0.168701171875, 0.19651031494140625, 0.2243194580078125, 0.25212860107421875, 0.279937744140625, 0.30774688720703125, 0.3355560302734375, 0.36336517333984375, 0.39117431640625, 0.41898345947265625, 0.4467926025390625, 0.47460174560546875, 0.502410888671875, 0.5302200317382812, 0.5580291748046875, 0.5858383178710938, 0.6136474609375, 0.6414566040039062, 0.6692657470703125, 0.6970748901367188, 0.724884033203125, 0.7526931762695312, 0.7805023193359375, 0.8083114624023438, 0.83612060546875, 0.8639297485351562, 0.8917388916015625, 0.9195480346679688, 0.947357177734375, 0.9751663208007812, 1.0029754638671875, 1.0307846069335938, 1.05859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 10.0, 9.0, 12.0, 6.0, 20.0, 17.0, 34.0, 47.0, 55.0, 91.0, 156.0, 183.0, 134.0, 63.0, 40.0, 30.0, 23.0, 15.0, 16.0, 12.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.465576171875, -0.4539756774902344, -0.44237518310546875, -0.4307746887207031, -0.4191741943359375, -0.4075736999511719, -0.39597320556640625, -0.3843727111816406, -0.372772216796875, -0.3611717224121094, -0.34957122802734375, -0.3379707336425781, -0.3263702392578125, -0.3147697448730469, -0.30316925048828125, -0.2915687561035156, -0.27996826171875, -0.2683677673339844, -0.25676727294921875, -0.24516677856445312, -0.2335662841796875, -0.22196578979492188, -0.21036529541015625, -0.19876480102539062, -0.187164306640625, -0.17556381225585938, -0.16396331787109375, -0.15236282348632812, -0.1407623291015625, -0.12916183471679688, -0.11756134033203125, -0.10596084594726562, -0.0943603515625, -0.08275985717773438, -0.07115936279296875, -0.059558868408203125, -0.0479583740234375, -0.036357879638671875, -0.02475738525390625, -0.013156890869140625, -0.001556396484375, 0.010044097900390625, 0.02164459228515625, 0.033245086669921875, 0.0448455810546875, 0.056446075439453125, 0.06804656982421875, 0.07964706420898438, 0.09124755859375, 0.10284805297851562, 0.11444854736328125, 0.12604904174804688, 0.1376495361328125, 0.14925003051757812, 0.16085052490234375, 0.17245101928710938, 0.184051513671875, 0.19565200805664062, 0.20725250244140625, 0.21885299682617188, 0.2304534912109375, 0.24205398559570312, 0.25365447998046875, 0.2652549743652344, 0.27685546875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 22.0, 125.0, 531.0, 246.0, 45.0, 11.0, 7.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.655729293823242, -7.096137523651123, -6.536545753479004, -5.976953506469727, -5.417361736297607, -4.857769966125488, -4.298177719116211, -3.738585948944092, -3.1789941787719727, -2.6194024085998535, -2.0598104000091553, -1.5002185106277466, -0.9406266212463379, -0.38103485107421875, 0.1785571575164795, 0.7381491661071777, 1.2977409362792969, 1.8573328256607056, 2.4169247150421143, 2.9765167236328125, 3.5361084938049316, 4.095700263977051, 4.655292510986328, 5.214884281158447, 5.774476051330566, 6.3340678215026855, 6.893659591674805, 7.453251838684082, 8.01284408569336, 8.57243537902832, 9.132027626037598, 9.691619873046875, 10.251213073730469, 10.810805320739746, 11.370396614074707, 11.929988861083984, 12.489580154418945, 13.049172401428223, 13.6087646484375, 14.168355941772461, 14.727948188781738, 15.287540435791016, 15.847131729125977, 16.406723022460938, 16.96631622314453, 17.525907516479492, 18.085498809814453, 18.645092010498047, 19.204683303833008, 19.76427459716797, 20.323867797851562, 20.883459091186523, 21.443050384521484, 22.002643585205078, 22.56223487854004, 23.121826171875, 23.681419372558594, 24.241010665893555, 24.80060386657715, 25.36019515991211, 25.91978645324707, 26.47937774658203, 27.038970947265625, 27.598562240600586, 28.158153533935547]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 7.0, 27.0, 23.0, 26.0, 27.0, 33.0, 46.0, 47.0, 61.0, 68.0, 70.0, 73.0, 83.0, 71.0, 52.0, 52.0, 49.0, 37.0, 41.0, 34.0, 26.0, 18.0, 12.0, 9.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.112689018249512, -12.791339874267578, -12.469990730285645, -12.148641586303711, -11.827292442321777, -11.505943298339844, -11.184595108032227, -10.863245964050293, -10.54189682006836, -10.220547676086426, -9.899198532104492, -9.577849388122559, -9.256500244140625, -8.935152053833008, -8.613801956176758, -8.29245376586914, -7.971104145050049, -7.649755001068115, -7.328405857086182, -7.007057189941406, -6.685708045959473, -6.364358901977539, -6.0430097579956055, -5.721660614013672, -5.400311470031738, -5.078962326049805, -4.757613182067871, -4.4362640380859375, -4.114915370941162, -3.7935662269592285, -3.472217082977295, -3.1508681774139404, -2.829519748687744, -2.5081706047058105, -2.186821699142456, -1.8654725551605225, -1.5441235303878784, -1.2227745056152344, -0.9014253616333008, -0.5800764560699463, -0.2587273120880127, 0.06262174248695374, 0.38397079706192017, 0.705319881439209, 1.026668906211853, 1.348017930984497, 1.6693670749664307, 1.9907159805297852, 2.3120651245117188, 2.6334142684936523, 2.954763174057007, 3.2761123180389404, 3.597461223602295, 3.9188103675842285, 4.240159511566162, 4.5615081787109375, 4.882857322692871, 5.204206466674805, 5.525555610656738, 5.846904754638672, 6.168253421783447, 6.489602565765381, 6.8109517097473145, 7.13230037689209, 7.453649997711182]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 23.0, 40.0, 63.0, 99.0, 189.0, 301.0, 629.0, 1319.0, 3547.0, 13367.0, 95683.0, 3647336.0, 391902.0, 29403.0, 6400.0, 2098.0, 884.0, 421.0, 215.0, 118.0, 83.0, 55.0, 35.0, 18.0, 8.0, 13.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.385467529296875, -3.27874755859375, -3.172027587890625, -3.0653076171875, -2.958587646484375, -2.85186767578125, -2.745147705078125, -2.638427734375, -2.531707763671875, -2.42498779296875, -2.318267822265625, -2.2115478515625, -2.104827880859375, -1.99810791015625, -1.891387939453125, -1.78466796875, -1.677947998046875, -1.57122802734375, -1.464508056640625, -1.3577880859375, -1.251068115234375, -1.14434814453125, -1.037628173828125, -0.930908203125, -0.824188232421875, -0.71746826171875, -0.610748291015625, -0.5040283203125, -0.397308349609375, -0.29058837890625, -0.183868408203125, -0.0771484375, 0.029571533203125, 0.13629150390625, 0.243011474609375, 0.3497314453125, 0.456451416015625, 0.56317138671875, 0.669891357421875, 0.776611328125, 0.883331298828125, 0.99005126953125, 1.096771240234375, 1.2034912109375, 1.310211181640625, 1.41693115234375, 1.523651123046875, 1.63037109375, 1.737091064453125, 1.84381103515625, 1.950531005859375, 2.0572509765625, 2.163970947265625, 2.27069091796875, 2.377410888671875, 2.484130859375, 2.590850830078125, 2.69757080078125, 2.804290771484375, 2.9110107421875, 3.017730712890625, 3.12445068359375, 3.231170654296875, 3.337890625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 0.0, 11.0, 20.0, 23.0, 45.0, 75.0, 104.0, 151.0, 157.0, 168.0, 77.0, 55.0, 32.0, 29.0, 16.0, 13.0, 8.0, 5.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.295928955078125, -4.17779541015625, -4.059661865234375, -3.9415283203125, -3.823394775390625, -3.70526123046875, -3.587127685546875, -3.468994140625, -3.350860595703125, -3.23272705078125, -3.114593505859375, -2.9964599609375, -2.878326416015625, -2.76019287109375, -2.642059326171875, -2.52392578125, -2.405792236328125, -2.28765869140625, -2.169525146484375, -2.0513916015625, -1.933258056640625, -1.81512451171875, -1.696990966796875, -1.578857421875, -1.460723876953125, -1.34259033203125, -1.224456787109375, -1.1063232421875, -0.988189697265625, -0.87005615234375, -0.751922607421875, -0.6337890625, -0.515655517578125, -0.39752197265625, -0.279388427734375, -0.1612548828125, -0.043121337890625, 0.07501220703125, 0.193145751953125, 0.311279296875, 0.429412841796875, 0.54754638671875, 0.665679931640625, 0.7838134765625, 0.901947021484375, 1.02008056640625, 1.138214111328125, 1.25634765625, 1.374481201171875, 1.49261474609375, 1.610748291015625, 1.7288818359375, 1.847015380859375, 1.96514892578125, 2.083282470703125, 2.201416015625, 2.319549560546875, 2.43768310546875, 2.555816650390625, 2.6739501953125, 2.792083740234375, 2.91021728515625, 3.028350830078125, 3.146484375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 4.0, 5.0, 9.0, 16.0, 16.0, 22.0, 45.0, 65.0, 111.0, 244.0, 601.0, 1902.0, 9925.0, 165404.0, 3949488.0, 58562.0, 5634.0, 1290.0, 487.0, 172.0, 106.0, 61.0, 26.0, 24.0, 20.0, 8.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.55859375, -5.40570068359375, -5.2528076171875, -5.09991455078125, -4.947021484375, -4.79412841796875, -4.6412353515625, -4.48834228515625, -4.33544921875, -4.18255615234375, -4.0296630859375, -3.87677001953125, -3.723876953125, -3.57098388671875, -3.4180908203125, -3.26519775390625, -3.1123046875, -2.95941162109375, -2.8065185546875, -2.65362548828125, -2.500732421875, -2.34783935546875, -2.1949462890625, -2.04205322265625, -1.88916015625, -1.73626708984375, -1.5833740234375, -1.43048095703125, -1.277587890625, -1.12469482421875, -0.9718017578125, -0.81890869140625, -0.666015625, -0.51312255859375, -0.3602294921875, -0.20733642578125, -0.054443359375, 0.09844970703125, 0.2513427734375, 0.40423583984375, 0.55712890625, 0.71002197265625, 0.8629150390625, 1.01580810546875, 1.168701171875, 1.32159423828125, 1.4744873046875, 1.62738037109375, 1.7802734375, 1.93316650390625, 2.0860595703125, 2.23895263671875, 2.391845703125, 2.54473876953125, 2.6976318359375, 2.85052490234375, 3.00341796875, 3.15631103515625, 3.3092041015625, 3.46209716796875, 3.614990234375, 3.76788330078125, 3.9207763671875, 4.07366943359375, 4.2265625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 11.0, 23.0, 22.0, 20.0, 28.0, 47.0, 60.0, 96.0, 182.0, 299.0, 653.0, 1306.0, 571.0, 266.0, 160.0, 98.0, 54.0, 46.0, 32.0, 33.0, 12.0, 7.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.544921875, -0.5226516723632812, -0.5003814697265625, -0.47811126708984375, -0.455841064453125, -0.43357086181640625, -0.4113006591796875, -0.38903045654296875, -0.36676025390625, -0.34449005126953125, -0.3222198486328125, -0.29994964599609375, -0.277679443359375, -0.25540924072265625, -0.2331390380859375, -0.21086883544921875, -0.1885986328125, -0.16632843017578125, -0.1440582275390625, -0.12178802490234375, -0.099517822265625, -0.07724761962890625, -0.0549774169921875, -0.03270721435546875, -0.01043701171875, 0.01183319091796875, 0.0341033935546875, 0.05637359619140625, 0.078643798828125, 0.10091400146484375, 0.1231842041015625, 0.14545440673828125, 0.167724609375, 0.18999481201171875, 0.2122650146484375, 0.23453521728515625, 0.256805419921875, 0.27907562255859375, 0.3013458251953125, 0.32361602783203125, 0.34588623046875, 0.36815643310546875, 0.3904266357421875, 0.41269683837890625, 0.434967041015625, 0.45723724365234375, 0.4795074462890625, 0.5017776489257812, 0.5240478515625, 0.5463180541992188, 0.5685882568359375, 0.5908584594726562, 0.613128662109375, 0.6353988647460938, 0.6576690673828125, 0.6799392700195312, 0.70220947265625, 0.7244796752929688, 0.7467498779296875, 0.7690200805664062, 0.791290283203125, 0.8135604858398438, 0.8358306884765625, 0.8581008911132812, 0.88037109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 11.0, 22.0, 59.0, 132.0, 248.0, 269.0, 141.0, 57.0, 18.0, 16.0, 6.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.420680046081543, -7.220265865325928, -7.0198516845703125, -6.819437026977539, -6.619022846221924, -6.418608665466309, -6.218194007873535, -6.01777982711792, -5.817365646362305, -5.6169514656066895, -5.416537284851074, -5.216122627258301, -5.0157084465026855, -4.81529426574707, -4.614879608154297, -4.414465427398682, -4.214051246643066, -4.013637065887451, -3.813222646713257, -3.6128082275390625, -3.4123940467834473, -3.211979866027832, -3.0115654468536377, -2.8111510276794434, -2.610736846923828, -2.410322666168213, -2.2099082469940186, -2.009493827819824, -1.809079647064209, -1.6086653470993042, -1.4082510471343994, -1.2078367471694946, -1.007422924041748, -0.8070086240768433, -0.6065943241119385, -0.4061800241470337, -0.2057657241821289, -0.005351424217224121, 0.19506287574768066, 0.39547717571258545, 0.5958914756774902, 0.796305775642395, 0.9967200756072998, 1.1971343755722046, 1.3975486755371094, 1.5979629755020142, 1.798377275466919, 1.9987915754318237, 2.1992058753967285, 2.3996200561523438, 2.600034475326538, 2.8004488945007324, 3.0008630752563477, 3.201277256011963, 3.4016916751861572, 3.6021060943603516, 3.802520275115967, 4.002934455871582, 4.2033491134643555, 4.403763294219971, 4.604177474975586, 4.804591655731201, 5.005005836486816, 5.20542049407959, 5.405834674835205]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 17.0, 27.0, 40.0, 54.0, 66.0, 91.0, 97.0, 126.0, 91.0, 91.0, 75.0, 57.0, 49.0, 26.0, 37.0, 11.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.294147968292236, -4.184197902679443, -4.074248313903809, -3.9642982482910156, -3.8543481826782227, -3.744398355484009, -3.634448528289795, -3.524498462677002, -3.414548635482788, -3.304598808288574, -3.1946487426757812, -3.0846989154815674, -2.9747490882873535, -2.8647990226745605, -2.7548491954803467, -2.644899368286133, -2.53494930267334, -2.424999475479126, -2.315049409866333, -2.205099582672119, -2.095149517059326, -1.9851996898651123, -1.8752498626708984, -1.765299916267395, -1.6553499698638916, -1.5454000234603882, -1.4354500770568848, -1.325500249862671, -1.2155503034591675, -1.105600357055664, -0.9956504702568054, -0.8857005834579468, -0.7757508754730225, -0.665800929069519, -0.5558510422706604, -0.44590112566947937, -0.33595120906829834, -0.22600126266479492, -0.11605137586593628, -0.006101489067077637, 0.10384845733642578, 0.2137983739376068, 0.32374829053878784, 0.43369820713996887, 0.5436481237411499, 0.6535980701446533, 0.763547956943512, 0.8734978437423706, 0.983447790145874, 1.0933977365493774, 1.2033476829528809, 1.3132975101470947, 1.4232474565505981, 1.5331974029541016, 1.6431472301483154, 1.7530971765518188, 1.8630471229553223, 1.9729970693588257, 2.082947015762329, 2.192896842956543, 2.302846908569336, 2.41279673576355, 2.5227465629577637, 2.6326966285705566, 2.7426464557647705]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 10.0, 19.0, 27.0, 51.0, 66.0, 104.0, 194.0, 320.0, 546.0, 1071.0, 2634.0, 7911.0, 34188.0, 319810.0, 593023.0, 69371.0, 12327.0, 3721.0, 1459.0, 738.0, 401.0, 192.0, 118.0, 69.0, 54.0, 29.0, 29.0, 18.0, 9.0, 13.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.3099365234375, -0.298095703125, -0.2862548828125, -0.2744140625, -0.2625732421875, -0.250732421875, -0.2388916015625, -0.22705078125, -0.2152099609375, -0.203369140625, -0.1915283203125, -0.1796875, -0.1678466796875, -0.156005859375, -0.1441650390625, -0.13232421875, -0.1204833984375, -0.108642578125, -0.0968017578125, -0.0849609375, -0.0731201171875, -0.061279296875, -0.0494384765625, -0.03759765625, -0.0257568359375, -0.013916015625, -0.0020751953125, 0.009765625, 0.0216064453125, 0.033447265625, 0.0452880859375, 0.05712890625, 0.0689697265625, 0.080810546875, 0.0926513671875, 0.1044921875, 0.1163330078125, 0.128173828125, 0.1400146484375, 0.15185546875, 0.1636962890625, 0.175537109375, 0.1873779296875, 0.19921875, 0.2110595703125, 0.222900390625, 0.2347412109375, 0.24658203125, 0.2584228515625, 0.270263671875, 0.2821044921875, 0.2939453125, 0.3057861328125, 0.317626953125, 0.3294677734375, 0.34130859375, 0.3531494140625, 0.364990234375, 0.3768310546875, 0.388671875, 0.4005126953125, 0.412353515625, 0.4241943359375, 0.43603515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 8.0, 12.0, 14.0, 38.0, 44.0, 73.0, 77.0, 126.0, 120.0, 146.0, 105.0, 76.0, 41.0, 37.0, 26.0, 15.0, 17.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.327850341796875, -3.23968505859375, -3.151519775390625, -3.0633544921875, -2.975189208984375, -2.88702392578125, -2.798858642578125, -2.710693359375, -2.622528076171875, -2.53436279296875, -2.446197509765625, -2.3580322265625, -2.269866943359375, -2.18170166015625, -2.093536376953125, -2.00537109375, -1.917205810546875, -1.82904052734375, -1.740875244140625, -1.6527099609375, -1.564544677734375, -1.47637939453125, -1.388214111328125, -1.300048828125, -1.211883544921875, -1.12371826171875, -1.035552978515625, -0.9473876953125, -0.859222412109375, -0.77105712890625, -0.682891845703125, -0.5947265625, -0.506561279296875, -0.41839599609375, -0.330230712890625, -0.2420654296875, -0.153900146484375, -0.06573486328125, 0.022430419921875, 0.110595703125, 0.198760986328125, 0.28692626953125, 0.375091552734375, 0.4632568359375, 0.551422119140625, 0.63958740234375, 0.727752685546875, 0.81591796875, 0.904083251953125, 0.99224853515625, 1.080413818359375, 1.1685791015625, 1.256744384765625, 1.34490966796875, 1.433074951171875, 1.521240234375, 1.609405517578125, 1.69757080078125, 1.785736083984375, 1.8739013671875, 1.962066650390625, 2.05023193359375, 2.138397216796875, 2.2265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 9.0, 14.0, 13.0, 19.0, 33.0, 43.0, 74.0, 88.0, 137.0, 291.0, 476.0, 1138.0, 3110.0, 12882.0, 172599.0, 787871.0, 58479.0, 7391.0, 2176.0, 791.0, 349.0, 204.0, 112.0, 77.0, 44.0, 32.0, 30.0, 17.0, 11.0, 10.0, 9.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5129432678222656, -0.49707794189453125, -0.4812126159667969, -0.4653472900390625, -0.4494819641113281, -0.43361663818359375, -0.4177513122558594, -0.401885986328125, -0.3860206604003906, -0.37015533447265625, -0.3542900085449219, -0.3384246826171875, -0.3225593566894531, -0.30669403076171875, -0.2908287048339844, -0.27496337890625, -0.2590980529785156, -0.24323272705078125, -0.22736740112304688, -0.2115020751953125, -0.19563674926757812, -0.17977142333984375, -0.16390609741210938, -0.148040771484375, -0.13217544555664062, -0.11631011962890625, -0.10044479370117188, -0.0845794677734375, -0.06871414184570312, -0.05284881591796875, -0.036983489990234375, -0.0211181640625, -0.005252838134765625, 0.01061248779296875, 0.026477813720703125, 0.0423431396484375, 0.058208465576171875, 0.07407379150390625, 0.08993911743164062, 0.105804443359375, 0.12166976928710938, 0.13753509521484375, 0.15340042114257812, 0.1692657470703125, 0.18513107299804688, 0.20099639892578125, 0.21686172485351562, 0.23272705078125, 0.24859237670898438, 0.26445770263671875, 0.2803230285644531, 0.2961883544921875, 0.3120536804199219, 0.32791900634765625, 0.3437843322753906, 0.359649658203125, 0.3755149841308594, 0.39138031005859375, 0.4072456359863281, 0.4231109619140625, 0.4389762878417969, 0.45484161376953125, 0.4707069396972656, 0.486572265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 14.0, 7.0, 16.0, 22.0, 17.0, 16.0, 32.0, 27.0, 37.0, 34.0, 43.0, 56.0, 65.0, 58.0, 52.0, 63.0, 74.0, 52.0, 43.0, 35.0, 42.0, 33.0, 29.0, 20.0, 20.0, 15.0, 16.0, 7.0, 11.0, 5.0, 10.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.607421875, -3.51708984375, -3.4267578125, -3.33642578125, -3.24609375, -3.15576171875, -3.0654296875, -2.97509765625, -2.884765625, -2.79443359375, -2.7041015625, -2.61376953125, -2.5234375, -2.43310546875, -2.3427734375, -2.25244140625, -2.162109375, -2.07177734375, -1.9814453125, -1.89111328125, -1.80078125, -1.71044921875, -1.6201171875, -1.52978515625, -1.439453125, -1.34912109375, -1.2587890625, -1.16845703125, -1.078125, -0.98779296875, -0.8974609375, -0.80712890625, -0.716796875, -0.62646484375, -0.5361328125, -0.44580078125, -0.35546875, -0.26513671875, -0.1748046875, -0.08447265625, 0.005859375, 0.09619140625, 0.1865234375, 0.27685546875, 0.3671875, 0.45751953125, 0.5478515625, 0.63818359375, 0.728515625, 0.81884765625, 0.9091796875, 0.99951171875, 1.08984375, 1.18017578125, 1.2705078125, 1.36083984375, 1.451171875, 1.54150390625, 1.6318359375, 1.72216796875, 1.8125, 1.90283203125, 1.9931640625, 2.08349609375, 2.173828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 10.0, 12.0, 22.0, 45.0, 102.0, 263.0, 846.0, 6100.0, 621757.0, 413143.0, 5173.0, 689.0, 194.0, 96.0, 41.0, 16.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259521484375, -0.24714279174804688, -0.23476409912109375, -0.22238540649414062, -0.2100067138671875, -0.19762802124023438, -0.18524932861328125, -0.17287063598632812, -0.160491943359375, -0.14811325073242188, -0.13573455810546875, -0.12335586547851562, -0.1109771728515625, -0.09859848022460938, -0.08621978759765625, -0.07384109497070312, -0.06146240234375, -0.049083709716796875, -0.03670501708984375, -0.024326324462890625, -0.0119476318359375, 0.000431060791015625, 0.01280975341796875, 0.025188446044921875, 0.037567138671875, 0.049945831298828125, 0.06232452392578125, 0.07470321655273438, 0.0870819091796875, 0.09946060180664062, 0.11183929443359375, 0.12421798706054688, 0.1365966796875, 0.14897537231445312, 0.16135406494140625, 0.17373275756835938, 0.1861114501953125, 0.19849014282226562, 0.21086883544921875, 0.22324752807617188, 0.235626220703125, 0.24800491333007812, 0.26038360595703125, 0.2727622985839844, 0.2851409912109375, 0.2975196838378906, 0.30989837646484375, 0.3222770690917969, 0.33465576171875, 0.3470344543457031, 0.35941314697265625, 0.3717918395996094, 0.3841705322265625, 0.3965492248535156, 0.40892791748046875, 0.4213066101074219, 0.433685302734375, 0.4460639953613281, 0.45844268798828125, 0.4708213806152344, 0.4832000732421875, 0.4955787658691406, 0.5079574584960938, 0.5203361511230469, 0.53271484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 9.0, 8.0, 14.0, 18.0, 19.0, 19.0, 36.0, 37.0, 56.0, 79.0, 100.0, 97.0, 99.0, 94.0, 72.0, 40.0, 42.0, 34.0, 30.0, 12.0, 14.0, 9.0, 10.0, 9.0, 8.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.309415817260742e-05, -4.172883927822113e-05, -4.036352038383484e-05, -3.899820148944855e-05, -3.7632882595062256e-05, -3.6267563700675964e-05, -3.490224480628967e-05, -3.353692591190338e-05, -3.217160701751709e-05, -3.08062881231308e-05, -2.9440969228744507e-05, -2.8075650334358215e-05, -2.6710331439971924e-05, -2.5345012545585632e-05, -2.397969365119934e-05, -2.261437475681305e-05, -2.1249055862426758e-05, -1.9883736968040466e-05, -1.8518418073654175e-05, -1.7153099179267883e-05, -1.5787780284881592e-05, -1.44224613904953e-05, -1.3057142496109009e-05, -1.1691823601722717e-05, -1.0326504707336426e-05, -8.961185812950134e-06, -7.595866918563843e-06, -6.230548024177551e-06, -4.86522912979126e-06, -3.4999102354049683e-06, -2.1345913410186768e-06, -7.692724466323853e-07, 5.960464477539062e-07, 1.9613653421401978e-06, 3.3266842365264893e-06, 4.692003130912781e-06, 6.057322025299072e-06, 7.422640919685364e-06, 8.787959814071655e-06, 1.0153278708457947e-05, 1.1518597602844238e-05, 1.288391649723053e-05, 1.4249235391616821e-05, 1.5614554286003113e-05, 1.6979873180389404e-05, 1.8345192074775696e-05, 1.9710510969161987e-05, 2.107582986354828e-05, 2.244114875793457e-05, 2.3806467652320862e-05, 2.5171786546707153e-05, 2.6537105441093445e-05, 2.7902424335479736e-05, 2.9267743229866028e-05, 3.063306212425232e-05, 3.199838101863861e-05, 3.33636999130249e-05, 3.4729018807411194e-05, 3.6094337701797485e-05, 3.745965659618378e-05, 3.882497549057007e-05, 4.019029438495636e-05, 4.155561327934265e-05, 4.292093217372894e-05, 4.4286251068115234e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 6.0, 10.0, 21.0, 31.0, 27.0, 67.0, 150.0, 302.0, 704.0, 2208.0, 12885.0, 390715.0, 620314.0, 16919.0, 2739.0, 767.0, 298.0, 161.0, 92.0, 36.0, 24.0, 19.0, 6.0, 9.0, 8.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2315673828125, -0.2230091094970703, -0.21445083618164062, -0.20589256286621094, -0.19733428955078125, -0.18877601623535156, -0.18021774291992188, -0.1716594696044922, -0.1631011962890625, -0.1545429229736328, -0.14598464965820312, -0.13742637634277344, -0.12886810302734375, -0.12030982971191406, -0.11175155639648438, -0.10319328308105469, -0.094635009765625, -0.08607673645019531, -0.07751846313476562, -0.06896018981933594, -0.06040191650390625, -0.05184364318847656, -0.043285369873046875, -0.03472709655761719, -0.0261688232421875, -0.017610549926757812, -0.009052276611328125, -0.0004940032958984375, 0.00806427001953125, 0.016622543334960938, 0.025180816650390625, 0.03373908996582031, 0.04229736328125, 0.05085563659667969, 0.059413909912109375, 0.06797218322753906, 0.07653045654296875, 0.08508872985839844, 0.09364700317382812, 0.10220527648925781, 0.1107635498046875, 0.11932182312011719, 0.12788009643554688, 0.13643836975097656, 0.14499664306640625, 0.15355491638183594, 0.16211318969726562, 0.1706714630126953, 0.179229736328125, 0.1877880096435547, 0.19634628295898438, 0.20490455627441406, 0.21346282958984375, 0.22202110290527344, 0.23057937622070312, 0.2391376495361328, 0.2476959228515625, 0.2562541961669922, 0.2648124694824219, 0.27337074279785156, 0.28192901611328125, 0.29048728942871094, 0.2990455627441406, 0.3076038360595703, 0.316162109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 7.0, 9.0, 7.0, 29.0, 42.0, 98.0, 180.0, 296.0, 171.0, 72.0, 44.0, 15.0, 12.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.10980224609375, -0.10721826553344727, -0.10463428497314453, -0.1020503044128418, -0.09946632385253906, -0.09688234329223633, -0.0942983627319336, -0.09171438217163086, -0.08913040161132812, -0.08654642105102539, -0.08396244049072266, -0.08137845993041992, -0.07879447937011719, -0.07621049880981445, -0.07362651824951172, -0.07104253768920898, -0.06845855712890625, -0.06587457656860352, -0.06329059600830078, -0.06070661544799805, -0.05812263488769531, -0.05553865432739258, -0.052954673767089844, -0.05037069320678711, -0.047786712646484375, -0.04520273208618164, -0.042618751525878906, -0.04003477096557617, -0.03745079040527344, -0.0348668098449707, -0.03228282928466797, -0.029698848724365234, -0.0271148681640625, -0.024530887603759766, -0.02194690704345703, -0.019362926483154297, -0.016778945922851562, -0.014194965362548828, -0.011610984802246094, -0.00902700424194336, -0.006443023681640625, -0.0038590431213378906, -0.0012750625610351562, 0.0013089179992675781, 0.0038928985595703125, 0.006476879119873047, 0.009060859680175781, 0.011644840240478516, 0.01422882080078125, 0.016812801361083984, 0.01939678192138672, 0.021980762481689453, 0.024564743041992188, 0.027148723602294922, 0.029732704162597656, 0.03231668472290039, 0.034900665283203125, 0.03748464584350586, 0.040068626403808594, 0.04265260696411133, 0.04523658752441406, 0.0478205680847168, 0.05040454864501953, 0.052988529205322266, 0.055572509765625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 12.0, 25.0, 80.0, 281.0, 394.0, 140.0, 32.0, 20.0, 4.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.639793872833252, -5.44675350189209, -5.2537126541137695, -5.060672283172607, -4.867631912231445, -4.674591541290283, -4.481551170349121, -4.288510322570801, -4.095469951629639, -3.9024295806884766, -3.7093889713287354, -3.516348361968994, -3.323307991027832, -3.13026762008667, -2.9372270107269287, -2.7441864013671875, -2.5511460304260254, -2.3581056594848633, -2.165065050125122, -1.9720245599746704, -1.7789840698242188, -1.585943579673767, -1.3929030895233154, -1.1998625993728638, -1.006822109222412, -0.8137816190719604, -0.6207411289215088, -0.42770063877105713, -0.23466014862060547, -0.04161965847015381, 0.15142083168029785, 0.3444613218307495, 0.5375018119812012, 0.7305423021316528, 0.9235827922821045, 1.1166232824325562, 1.3096637725830078, 1.5027042627334595, 1.6957447528839111, 1.8887852430343628, 2.0818257331848145, 2.2748661041259766, 2.4679067134857178, 2.660947322845459, 2.853987693786621, 3.047028064727783, 3.2400686740875244, 3.4331092834472656, 3.6261496543884277, 3.81919002532959, 4.01223087310791, 4.205271244049072, 4.398311614990234, 4.5913519859313965, 4.784392356872559, 4.977433204650879, 5.170473575592041, 5.363513946533203, 5.556554794311523, 5.7495951652526855, 5.942635536193848, 6.13567590713501, 6.328716278076172, 6.521757125854492, 6.714797496795654]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 21.0, 29.0, 36.0, 73.0, 79.0, 124.0, 131.0, 121.0, 105.0, 86.0, 56.0, 39.0, 32.0, 19.0, 5.0, 10.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.274353265762329, -3.1882786750793457, -3.1022040843963623, -3.016129493713379, -2.9300546646118164, -2.843980073928833, -2.7579054832458496, -2.671830892562866, -2.585756301879883, -2.4996817111968994, -2.413607120513916, -2.3275322914123535, -2.24145770072937, -2.1553831100463867, -2.0693085193634033, -1.98323392868042, -1.8971590995788574, -1.811084508895874, -1.725009799003601, -1.6389352083206177, -1.5528604984283447, -1.4667859077453613, -1.380711317062378, -1.2946367263793945, -1.2085620164871216, -1.1224874258041382, -1.0364127159118652, -0.9503381252288818, -0.8642634749412537, -0.7781888246536255, -0.6921142339706421, -0.6060395836830139, -0.5199651718139648, -0.43389052152633667, -0.3478159010410309, -0.2617412805557251, -0.17566663026809692, -0.08959197998046875, -0.0035173892974853516, 0.08255726099014282, 0.168631911277771, 0.25470656156539917, 0.34078118205070496, 0.42685580253601074, 0.5129304528236389, 0.5990051031112671, 0.6850796937942505, 0.7711543440818787, 0.8572289943695068, 0.943303644657135, 1.0293782949447632, 1.1154528856277466, 1.2015275955200195, 1.287602186203003, 1.3736767768859863, 1.4597513675689697, 1.5458260774612427, 1.631900668144226, 1.717975378036499, 1.8040499687194824, 1.8901245594024658, 1.9761992692947388, 2.0622739791870117, 2.148348569869995, 2.2344231605529785]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 6.0, 4.0, 11.0, 14.0, 22.0, 27.0, 31.0, 49.0, 80.0, 120.0, 160.0, 296.0, 484.0, 861.0, 1476.0, 2651.0, 5820.0, 13427.0, 37707.0, 195346.0, 675917.0, 74697.0, 21890.0, 8642.0, 3933.0, 1980.0, 1146.0, 658.0, 360.0, 245.0, 148.0, 93.0, 68.0, 44.0, 37.0, 22.0, 16.0, 11.0, 11.0, 11.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.3974609375, -1.355438232421875, -1.31341552734375, -1.271392822265625, -1.2293701171875, -1.187347412109375, -1.14532470703125, -1.103302001953125, -1.061279296875, -1.019256591796875, -0.97723388671875, -0.935211181640625, -0.8931884765625, -0.851165771484375, -0.80914306640625, -0.767120361328125, -0.72509765625, -0.683074951171875, -0.64105224609375, -0.599029541015625, -0.5570068359375, -0.514984130859375, -0.47296142578125, -0.430938720703125, -0.388916015625, -0.346893310546875, -0.30487060546875, -0.262847900390625, -0.2208251953125, -0.178802490234375, -0.13677978515625, -0.094757080078125, -0.052734375, -0.010711669921875, 0.03131103515625, 0.073333740234375, 0.1153564453125, 0.157379150390625, 0.19940185546875, 0.241424560546875, 0.283447265625, 0.325469970703125, 0.36749267578125, 0.409515380859375, 0.4515380859375, 0.493560791015625, 0.53558349609375, 0.577606201171875, 0.61962890625, 0.661651611328125, 0.70367431640625, 0.745697021484375, 0.7877197265625, 0.829742431640625, 0.87176513671875, 0.913787841796875, 0.955810546875, 0.997833251953125, 1.03985595703125, 1.081878662109375, 1.1239013671875, 1.165924072265625, 1.20794677734375, 1.249969482421875, 1.2919921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 16.0, 23.0, 34.0, 45.0, 54.0, 74.0, 115.0, 116.0, 107.0, 105.0, 72.0, 57.0, 48.0, 34.0, 23.0, 20.0, 11.0, 6.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.72442626953125, -5.5699462890625, -5.41546630859375, -5.260986328125, -5.10650634765625, -4.9520263671875, -4.79754638671875, -4.64306640625, -4.48858642578125, -4.3341064453125, -4.17962646484375, -4.025146484375, -3.87066650390625, -3.7161865234375, -3.56170654296875, -3.4072265625, -3.25274658203125, -3.0982666015625, -2.94378662109375, -2.789306640625, -2.63482666015625, -2.4803466796875, -2.32586669921875, -2.17138671875, -2.01690673828125, -1.8624267578125, -1.70794677734375, -1.553466796875, -1.39898681640625, -1.2445068359375, -1.09002685546875, -0.935546875, -0.78106689453125, -0.6265869140625, -0.47210693359375, -0.317626953125, -0.16314697265625, -0.0086669921875, 0.14581298828125, 0.30029296875, 0.45477294921875, 0.6092529296875, 0.76373291015625, 0.918212890625, 1.07269287109375, 1.2271728515625, 1.38165283203125, 1.5361328125, 1.69061279296875, 1.8450927734375, 1.99957275390625, 2.154052734375, 2.30853271484375, 2.4630126953125, 2.61749267578125, 2.77197265625, 2.92645263671875, 3.0809326171875, 3.23541259765625, 3.389892578125, 3.54437255859375, 3.6988525390625, 3.85333251953125, 4.0078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 13.0, 17.0, 30.0, 41.0, 63.0, 96.0, 133.0, 337.0, 968.0, 4970.0, 56579.0, 937173.0, 42232.0, 4267.0, 900.0, 327.0, 144.0, 85.0, 40.0, 32.0, 22.0, 17.0, 14.0, 9.0, 5.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.861328125, -2.770355224609375, -2.67938232421875, -2.588409423828125, -2.4974365234375, -2.406463623046875, -2.31549072265625, -2.224517822265625, -2.133544921875, -2.042572021484375, -1.95159912109375, -1.860626220703125, -1.7696533203125, -1.678680419921875, -1.58770751953125, -1.496734619140625, -1.40576171875, -1.314788818359375, -1.22381591796875, -1.132843017578125, -1.0418701171875, -0.950897216796875, -0.85992431640625, -0.768951416015625, -0.677978515625, -0.587005615234375, -0.49603271484375, -0.405059814453125, -0.3140869140625, -0.223114013671875, -0.13214111328125, -0.041168212890625, 0.0498046875, 0.140777587890625, 0.23175048828125, 0.322723388671875, 0.4136962890625, 0.504669189453125, 0.59564208984375, 0.686614990234375, 0.777587890625, 0.868560791015625, 0.95953369140625, 1.050506591796875, 1.1414794921875, 1.232452392578125, 1.32342529296875, 1.414398193359375, 1.50537109375, 1.596343994140625, 1.68731689453125, 1.778289794921875, 1.8692626953125, 1.960235595703125, 2.05120849609375, 2.142181396484375, 2.233154296875, 2.324127197265625, 2.41510009765625, 2.506072998046875, 2.5970458984375, 2.688018798828125, 2.77899169921875, 2.869964599609375, 2.9609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 12.0, 11.0, 25.0, 30.0, 40.0, 34.0, 52.0, 58.0, 66.0, 52.0, 73.0, 74.0, 78.0, 62.0, 63.0, 52.0, 39.0, 23.0, 29.0, 20.0, 19.0, 16.0, 12.0, 10.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.57012939453125, -4.4136962890625, -4.25726318359375, -4.100830078125, -3.94439697265625, -3.7879638671875, -3.63153076171875, -3.47509765625, -3.31866455078125, -3.1622314453125, -3.00579833984375, -2.849365234375, -2.69293212890625, -2.5364990234375, -2.38006591796875, -2.2236328125, -2.06719970703125, -1.9107666015625, -1.75433349609375, -1.597900390625, -1.44146728515625, -1.2850341796875, -1.12860107421875, -0.97216796875, -0.81573486328125, -0.6593017578125, -0.50286865234375, -0.346435546875, -0.19000244140625, -0.0335693359375, 0.12286376953125, 0.279296875, 0.43572998046875, 0.5921630859375, 0.74859619140625, 0.905029296875, 1.06146240234375, 1.2178955078125, 1.37432861328125, 1.53076171875, 1.68719482421875, 1.8436279296875, 2.00006103515625, 2.156494140625, 2.31292724609375, 2.4693603515625, 2.62579345703125, 2.7822265625, 2.93865966796875, 3.0950927734375, 3.25152587890625, 3.407958984375, 3.56439208984375, 3.7208251953125, 3.87725830078125, 4.03369140625, 4.19012451171875, 4.3465576171875, 4.50299072265625, 4.659423828125, 4.81585693359375, 4.9722900390625, 5.12872314453125, 5.28515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 12.0, 22.0, 39.0, 63.0, 119.0, 316.0, 886.0, 3337.0, 26538.0, 951498.0, 58563.0, 5263.0, 1214.0, 386.0, 141.0, 69.0, 35.0, 14.0, 8.0, 12.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66796875, -1.627899169921875, -1.58782958984375, -1.547760009765625, -1.5076904296875, -1.467620849609375, -1.42755126953125, -1.387481689453125, -1.347412109375, -1.307342529296875, -1.26727294921875, -1.227203369140625, -1.1871337890625, -1.147064208984375, -1.10699462890625, -1.066925048828125, -1.02685546875, -0.986785888671875, -0.94671630859375, -0.906646728515625, -0.8665771484375, -0.826507568359375, -0.78643798828125, -0.746368408203125, -0.706298828125, -0.666229248046875, -0.62615966796875, -0.586090087890625, -0.5460205078125, -0.505950927734375, -0.46588134765625, -0.425811767578125, -0.3857421875, -0.345672607421875, -0.30560302734375, -0.265533447265625, -0.2254638671875, -0.185394287109375, -0.14532470703125, -0.105255126953125, -0.065185546875, -0.025115966796875, 0.01495361328125, 0.055023193359375, 0.0950927734375, 0.135162353515625, 0.17523193359375, 0.215301513671875, 0.25537109375, 0.295440673828125, 0.33551025390625, 0.375579833984375, 0.4156494140625, 0.455718994140625, 0.49578857421875, 0.535858154296875, 0.575927734375, 0.615997314453125, 0.65606689453125, 0.696136474609375, 0.7362060546875, 0.776275634765625, 0.81634521484375, 0.856414794921875, 0.896484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 9.0, 8.0, 7.0, 19.0, 18.0, 28.0, 25.0, 38.0, 94.0, 226.0, 250.0, 100.0, 54.0, 39.0, 23.0, 17.0, 10.0, 7.0, 6.0, 1.0, 6.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011259317398071289, -0.00010937545448541641, -0.00010615773499011993, -0.00010294001549482346, -9.972229599952698e-05, -9.65045765042305e-05, -9.328685700893402e-05, -9.006913751363754e-05, -8.685141801834106e-05, -8.363369852304459e-05, -8.041597902774811e-05, -7.719825953245163e-05, -7.398054003715515e-05, -7.076282054185867e-05, -6.75451010465622e-05, -6.432738155126572e-05, -6.110966205596924e-05, -5.789194256067276e-05, -5.467422306537628e-05, -5.1456503570079803e-05, -4.8238784074783325e-05, -4.502106457948685e-05, -4.180334508419037e-05, -3.858562558889389e-05, -3.536790609359741e-05, -3.2150186598300934e-05, -2.8932467103004456e-05, -2.5714747607707977e-05, -2.24970281124115e-05, -1.927930861711502e-05, -1.6061589121818542e-05, -1.2843869626522064e-05, -9.626150131225586e-06, -6.408430635929108e-06, -3.1907111406326294e-06, 2.7008354663848877e-08, 3.244727849960327e-06, 6.462447345256805e-06, 9.680166840553284e-06, 1.2897886335849762e-05, 1.611560583114624e-05, 1.933332532644272e-05, 2.2551044821739197e-05, 2.5768764317035675e-05, 2.8986483812332153e-05, 3.220420330762863e-05, 3.542192280292511e-05, 3.863964229822159e-05, 4.1857361793518066e-05, 4.5075081288814545e-05, 4.829280078411102e-05, 5.15105202794075e-05, 5.472823977470398e-05, 5.794595927000046e-05, 6.116367876529694e-05, 6.438139826059341e-05, 6.759911775588989e-05, 7.081683725118637e-05, 7.403455674648285e-05, 7.725227624177933e-05, 8.04699957370758e-05, 8.368771523237228e-05, 8.690543472766876e-05, 9.012315422296524e-05, 9.334087371826172e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 9.0, 13.0, 26.0, 38.0, 57.0, 81.0, 124.0, 198.0, 356.0, 698.0, 1353.0, 3533.0, 12874.0, 92092.0, 874671.0, 48634.0, 8675.0, 2578.0, 1121.0, 563.0, 299.0, 179.0, 125.0, 67.0, 48.0, 34.0, 23.0, 17.0, 5.0, 8.0, 9.0, 8.0, 8.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.88232421875, -0.8558807373046875, -0.829437255859375, -0.8029937744140625, -0.77655029296875, -0.7501068115234375, -0.723663330078125, -0.6972198486328125, -0.6707763671875, -0.6443328857421875, -0.617889404296875, -0.5914459228515625, -0.56500244140625, -0.5385589599609375, -0.512115478515625, -0.4856719970703125, -0.459228515625, -0.4327850341796875, -0.406341552734375, -0.3798980712890625, -0.35345458984375, -0.3270111083984375, -0.300567626953125, -0.2741241455078125, -0.2476806640625, -0.2212371826171875, -0.194793701171875, -0.1683502197265625, -0.14190673828125, -0.1154632568359375, -0.089019775390625, -0.0625762939453125, -0.0361328125, -0.0096893310546875, 0.016754150390625, 0.0431976318359375, 0.06964111328125, 0.0960845947265625, 0.122528076171875, 0.1489715576171875, 0.1754150390625, 0.2018585205078125, 0.228302001953125, 0.2547454833984375, 0.28118896484375, 0.3076324462890625, 0.334075927734375, 0.3605194091796875, 0.386962890625, 0.4134063720703125, 0.439849853515625, 0.4662933349609375, 0.49273681640625, 0.5191802978515625, 0.545623779296875, 0.5720672607421875, 0.5985107421875, 0.6249542236328125, 0.651397705078125, 0.6778411865234375, 0.70428466796875, 0.7307281494140625, 0.757171630859375, 0.7836151123046875, 0.81005859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 8.0, 8.0, 10.0, 22.0, 20.0, 22.0, 60.0, 193.0, 435.0, 75.0, 35.0, 29.0, 14.0, 18.0, 5.0, 8.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.4096221923828125, -0.396881103515625, -0.3841400146484375, -0.37139892578125, -0.3586578369140625, -0.345916748046875, -0.3331756591796875, -0.3204345703125, -0.3076934814453125, -0.294952392578125, -0.2822113037109375, -0.26947021484375, -0.2567291259765625, -0.243988037109375, -0.2312469482421875, -0.218505859375, -0.2057647705078125, -0.193023681640625, -0.1802825927734375, -0.16754150390625, -0.1548004150390625, -0.142059326171875, -0.1293182373046875, -0.1165771484375, -0.1038360595703125, -0.091094970703125, -0.0783538818359375, -0.06561279296875, -0.0528717041015625, -0.040130615234375, -0.0273895263671875, -0.0146484375, -0.0019073486328125, 0.010833740234375, 0.0235748291015625, 0.03631591796875, 0.0490570068359375, 0.061798095703125, 0.0745391845703125, 0.0872802734375, 0.1000213623046875, 0.112762451171875, 0.1255035400390625, 0.13824462890625, 0.1509857177734375, 0.163726806640625, 0.1764678955078125, 0.189208984375, 0.2019500732421875, 0.214691162109375, 0.2274322509765625, 0.24017333984375, 0.2529144287109375, 0.265655517578125, 0.2783966064453125, 0.2911376953125, 0.3038787841796875, 0.316619873046875, 0.3293609619140625, 0.34210205078125, 0.3548431396484375, 0.367584228515625, 0.3803253173828125, 0.39306640625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 26.0, 144.0, 625.0, 165.0, 29.0, 10.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.917280197143555, -8.207528114318848, -7.497775077819824, -6.788022994995117, -6.078270435333252, -5.368517875671387, -4.65876579284668, -3.9490132331848145, -3.239260673522949, -2.529508113861084, -1.8197557926177979, -1.1100034713745117, -0.4002509117126465, 0.30950164794921875, 1.0192537307739258, 1.729006290435791, 2.4387588500976562, 3.1485114097595215, 3.8582637310028076, 4.568016052246094, 5.277768611907959, 5.987521171569824, 6.697273254394531, 7.4070258140563965, 8.116778373718262, 8.826530456542969, 9.536283493041992, 10.2460355758667, 10.955787658691406, 11.66554069519043, 12.375292778015137, 13.085044860839844, 13.7947998046875, 14.504551887512207, 15.21430492401123, 15.924057006835938, 16.63381004333496, 17.343563079833984, 18.053314208984375, 18.7630672454834, 19.472820281982422, 20.182573318481445, 20.892324447631836, 21.60207748413086, 22.311830520629883, 23.021583557128906, 23.731334686279297, 24.44108772277832, 25.15083885192871, 25.860591888427734, 26.570343017578125, 27.28009605407715, 27.989849090576172, 28.699600219726562, 29.409353256225586, 30.11910629272461, 30.828857421875, 31.538610458374023, 32.24836349487305, 32.95811462402344, 33.66786575317383, 34.377620697021484, 35.087371826171875, 35.797122955322266, 36.50687789916992]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 6.0, 8.0, 15.0, 15.0, 26.0, 14.0, 16.0, 23.0, 22.0, 29.0, 35.0, 34.0, 41.0, 38.0, 42.0, 42.0, 45.0, 45.0, 53.0, 46.0, 36.0, 33.0, 49.0, 35.0, 23.0, 28.0, 30.0, 36.0, 25.0, 13.0, 13.0, 13.0, 14.0, 9.0, 11.0, 6.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 3.0], "bins": [-6.623342990875244, -6.435157299041748, -6.24697208404541, -6.058786392211914, -5.870601177215576, -5.68241548538208, -5.494230270385742, -5.306044578552246, -5.11785888671875, -4.929673194885254, -4.741487979888916, -4.55330228805542, -4.365117073059082, -4.176931381225586, -3.988745927810669, -3.800560474395752, -3.612375020980835, -3.424189567565918, -3.236004114151001, -3.047818660736084, -2.859632968902588, -2.671447515487671, -2.483262062072754, -2.295076370239258, -2.10689115524292, -1.918705701828003, -1.7305201292037964, -1.5423346757888794, -1.3541491031646729, -1.1659636497497559, -0.9777781963348389, -0.7895926237106323, -0.6014070510864258, -0.413221538066864, -0.22503605484962463, -0.036850571632385254, 0.1513349413871765, 0.3395204544067383, 0.5277059078216553, 0.7158914804458618, 0.9040769338607788, 1.0922623872756958, 1.2804479598999023, 1.4686334133148193, 1.6568188667297363, 1.8450044393539429, 2.0331897735595703, 2.2213754653930664, 2.4095609188079834, 2.5977463722229004, 2.7859318256378174, 2.9741172790527344, 3.1623029708862305, 3.3504884243011475, 3.5386738777160645, 3.7268595695495605, 3.9150447845458984, 4.1032304763793945, 4.291415691375732, 4.4796013832092285, 4.667786598205566, 4.8559722900390625, 5.044157981872559, 5.2323431968688965, 5.420528888702393]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 9.0, 15.0, 10.0, 6.0, 17.0, 24.0, 19.0, 30.0, 32.0, 43.0, 94.0, 144.0, 230.0, 387.0, 824.0, 2023.0, 6121.0, 30250.0, 633577.0, 3441917.0, 62694.0, 10261.0, 3036.0, 1161.0, 553.0, 271.0, 160.0, 103.0, 63.0, 45.0, 37.0, 30.0, 19.0, 12.0, 11.0, 9.0, 10.0, 8.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-3.71875, -3.613006591796875, -3.50726318359375, -3.401519775390625, -3.2957763671875, -3.190032958984375, -3.08428955078125, -2.978546142578125, -2.872802734375, -2.767059326171875, -2.66131591796875, -2.555572509765625, -2.4498291015625, -2.344085693359375, -2.23834228515625, -2.132598876953125, -2.02685546875, -1.921112060546875, -1.81536865234375, -1.709625244140625, -1.6038818359375, -1.498138427734375, -1.39239501953125, -1.286651611328125, -1.180908203125, -1.075164794921875, -0.96942138671875, -0.863677978515625, -0.7579345703125, -0.652191162109375, -0.54644775390625, -0.440704345703125, -0.3349609375, -0.229217529296875, -0.12347412109375, -0.017730712890625, 0.0880126953125, 0.193756103515625, 0.29949951171875, 0.405242919921875, 0.510986328125, 0.616729736328125, 0.72247314453125, 0.828216552734375, 0.9339599609375, 1.039703369140625, 1.14544677734375, 1.251190185546875, 1.35693359375, 1.462677001953125, 1.56842041015625, 1.674163818359375, 1.7799072265625, 1.885650634765625, 1.99139404296875, 2.097137451171875, 2.202880859375, 2.308624267578125, 2.41436767578125, 2.520111083984375, 2.6258544921875, 2.731597900390625, 2.83734130859375, 2.943084716796875, 3.048828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 12.0, 4.0, 19.0, 29.0, 43.0, 52.0, 88.0, 125.0, 128.0, 137.0, 95.0, 95.0, 67.0, 20.0, 31.0, 17.0, 11.0, 8.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.5833740234375, -3.489013671875, -3.3946533203125, -3.30029296875, -3.2059326171875, -3.111572265625, -3.0172119140625, -2.9228515625, -2.8284912109375, -2.734130859375, -2.6397705078125, -2.54541015625, -2.4510498046875, -2.356689453125, -2.2623291015625, -2.16796875, -2.0736083984375, -1.979248046875, -1.8848876953125, -1.79052734375, -1.6961669921875, -1.601806640625, -1.5074462890625, -1.4130859375, -1.3187255859375, -1.224365234375, -1.1300048828125, -1.03564453125, -0.9412841796875, -0.846923828125, -0.7525634765625, -0.658203125, -0.5638427734375, -0.469482421875, -0.3751220703125, -0.28076171875, -0.1864013671875, -0.092041015625, 0.0023193359375, 0.0966796875, 0.1910400390625, 0.285400390625, 0.3797607421875, 0.47412109375, 0.5684814453125, 0.662841796875, 0.7572021484375, 0.8515625, 0.9459228515625, 1.040283203125, 1.1346435546875, 1.22900390625, 1.3233642578125, 1.417724609375, 1.5120849609375, 1.6064453125, 1.7008056640625, 1.795166015625, 1.8895263671875, 1.98388671875, 2.0782470703125, 2.172607421875, 2.2669677734375, 2.361328125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 5.0, 13.0, 19.0, 26.0, 46.0, 82.0, 175.0, 405.0, 1436.0, 9565.0, 362946.0, 3792909.0, 23052.0, 2487.0, 571.0, 251.0, 112.0, 61.0, 36.0, 17.0, 19.0, 14.0, 6.0, 6.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.90625, -6.70989990234375, -6.5135498046875, -6.31719970703125, -6.120849609375, -5.92449951171875, -5.7281494140625, -5.53179931640625, -5.33544921875, -5.13909912109375, -4.9427490234375, -4.74639892578125, -4.550048828125, -4.35369873046875, -4.1573486328125, -3.96099853515625, -3.7646484375, -3.56829833984375, -3.3719482421875, -3.17559814453125, -2.979248046875, -2.78289794921875, -2.5865478515625, -2.39019775390625, -2.19384765625, -1.99749755859375, -1.8011474609375, -1.60479736328125, -1.408447265625, -1.21209716796875, -1.0157470703125, -0.81939697265625, -0.623046875, -0.42669677734375, -0.2303466796875, -0.03399658203125, 0.162353515625, 0.35870361328125, 0.5550537109375, 0.75140380859375, 0.94775390625, 1.14410400390625, 1.3404541015625, 1.53680419921875, 1.733154296875, 1.92950439453125, 2.1258544921875, 2.32220458984375, 2.5185546875, 2.71490478515625, 2.9112548828125, 3.10760498046875, 3.303955078125, 3.50030517578125, 3.6966552734375, 3.89300537109375, 4.08935546875, 4.28570556640625, 4.4820556640625, 4.67840576171875, 4.874755859375, 5.07110595703125, 5.2674560546875, 5.46380615234375, 5.66015625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 16.0, 12.0, 25.0, 38.0, 53.0, 71.0, 142.0, 236.0, 488.0, 1155.0, 897.0, 392.0, 194.0, 113.0, 59.0, 56.0, 32.0, 32.0, 14.0, 11.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7880859375, -0.76165771484375, -0.7352294921875, -0.70880126953125, -0.682373046875, -0.65594482421875, -0.6295166015625, -0.60308837890625, -0.57666015625, -0.55023193359375, -0.5238037109375, -0.49737548828125, -0.470947265625, -0.44451904296875, -0.4180908203125, -0.39166259765625, -0.365234375, -0.33880615234375, -0.3123779296875, -0.28594970703125, -0.259521484375, -0.23309326171875, -0.2066650390625, -0.18023681640625, -0.15380859375, -0.12738037109375, -0.1009521484375, -0.07452392578125, -0.048095703125, -0.02166748046875, 0.0047607421875, 0.03118896484375, 0.0576171875, 0.08404541015625, 0.1104736328125, 0.13690185546875, 0.163330078125, 0.18975830078125, 0.2161865234375, 0.24261474609375, 0.26904296875, 0.29547119140625, 0.3218994140625, 0.34832763671875, 0.374755859375, 0.40118408203125, 0.4276123046875, 0.45404052734375, 0.48046875, 0.50689697265625, 0.5333251953125, 0.55975341796875, 0.586181640625, 0.61260986328125, 0.6390380859375, 0.66546630859375, 0.69189453125, 0.71832275390625, 0.7447509765625, 0.77117919921875, 0.797607421875, 0.82403564453125, 0.8504638671875, 0.87689208984375, 0.9033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 12.0, 34.0, 71.0, 151.0, 245.0, 238.0, 128.0, 54.0, 34.0, 13.0, 6.0, 8.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.747260093688965, -9.551276206970215, -9.355291366577148, -9.159307479858398, -8.963323593139648, -8.767338752746582, -8.571354866027832, -8.375370979309082, -8.179386138916016, -7.983401775360107, -7.787417888641357, -7.591433525085449, -7.395449161529541, -7.199465274810791, -7.003480911254883, -6.807497024536133, -6.611513137817383, -6.415528774261475, -6.219544887542725, -6.023560523986816, -5.827576160430908, -5.631592273712158, -5.43560791015625, -5.2396240234375, -5.043639183044434, -4.847654819488525, -4.651670932769775, -4.455686569213867, -4.259702205657959, -4.063718318939209, -3.867733955383301, -3.6717498302459717, -3.4757654666900635, -3.2797813415527344, -3.083796977996826, -2.887812852859497, -2.691828727722168, -2.4958443641662598, -2.2998602390289307, -2.1038761138916016, -1.907891869544983, -1.7119076251983643, -1.5159235000610352, -1.3199392557144165, -1.1239550113677979, -0.9279708862304688, -0.7319866418838501, -0.536002516746521, -0.34001827239990234, -0.14403407275676727, 0.0519501268863678, 0.24793434143066406, 0.44391852617263794, 0.6399027109146118, 0.8358869552612305, 1.0318710803985596, 1.2278553247451782, 1.4238395690917969, 1.619823694229126, 1.8158079385757446, 2.0117921829223633, 2.2077763080596924, 2.4037604331970215, 2.5997447967529297, 2.795728921890259]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 13.0, 12.0, 25.0, 37.0, 48.0, 54.0, 64.0, 78.0, 86.0, 77.0, 83.0, 88.0, 71.0, 57.0, 57.0, 41.0, 29.0, 21.0, 18.0, 15.0, 8.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.07607889175415, -3.9823105335235596, -3.8885421752929688, -3.794773817062378, -3.701005458831787, -3.6072371006011963, -3.5134687423706055, -3.4197001457214355, -3.325932025909424, -3.232163667678833, -3.138395309448242, -3.0446269512176514, -2.9508585929870605, -2.8570902347564697, -2.763321876525879, -2.669553279876709, -2.575784921646118, -2.4820165634155273, -2.3882482051849365, -2.2944798469543457, -2.200711488723755, -2.106943130493164, -2.013174533843994, -1.9194062948226929, -1.825637936592102, -1.7318695783615112, -1.6381012201309204, -1.54433274269104, -1.4505643844604492, -1.3567960262298584, -1.2630276679992676, -1.1692593097686768, -1.075490951538086, -0.9817225933074951, -0.8879542350769043, -0.7941858172416687, -0.7004174590110779, -0.6066491007804871, -0.5128806829452515, -0.41911232471466064, -0.3253439664840698, -0.2315755933523178, -0.1378072202205658, -0.04403883218765259, 0.04972952604293823, 0.14349788427352905, 0.23726630210876465, 0.33103466033935547, 0.4248030185699463, 0.5185713768005371, 0.6123397350311279, 0.7061081528663635, 0.7998765110969543, 0.8936448693275452, 0.9874132871627808, 1.0811816453933716, 1.1749500036239624, 1.2687183618545532, 1.362486720085144, 1.4562551975250244, 1.5500235557556152, 1.643791913986206, 1.7375602722167969, 1.8313286304473877, 1.9250969886779785]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 8.0, 9.0, 16.0, 26.0, 39.0, 46.0, 100.0, 177.0, 285.0, 518.0, 1059.0, 2077.0, 5144.0, 15289.0, 111414.0, 808350.0, 82021.0, 13259.0, 4635.0, 1963.0, 874.0, 481.0, 300.0, 155.0, 91.0, 61.0, 50.0, 24.0, 23.0, 11.0, 14.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.76513671875, -0.7447052001953125, -0.724273681640625, -0.7038421630859375, -0.68341064453125, -0.6629791259765625, -0.642547607421875, -0.6221160888671875, -0.6016845703125, -0.5812530517578125, -0.560821533203125, -0.5403900146484375, -0.51995849609375, -0.4995269775390625, -0.479095458984375, -0.4586639404296875, -0.438232421875, -0.4178009033203125, -0.397369384765625, -0.3769378662109375, -0.35650634765625, -0.3360748291015625, -0.315643310546875, -0.2952117919921875, -0.2747802734375, -0.2543487548828125, -0.233917236328125, -0.2134857177734375, -0.19305419921875, -0.1726226806640625, -0.152191162109375, -0.1317596435546875, -0.111328125, -0.0908966064453125, -0.070465087890625, -0.0500335693359375, -0.02960205078125, -0.0091705322265625, 0.011260986328125, 0.0316925048828125, 0.0521240234375, 0.0725555419921875, 0.092987060546875, 0.1134185791015625, 0.13385009765625, 0.1542816162109375, 0.174713134765625, 0.1951446533203125, 0.215576171875, 0.2360076904296875, 0.256439208984375, 0.2768707275390625, 0.29730224609375, 0.3177337646484375, 0.338165283203125, 0.3585968017578125, 0.3790283203125, 0.3994598388671875, 0.419891357421875, 0.4403228759765625, 0.46075439453125, 0.4811859130859375, 0.501617431640625, 0.5220489501953125, 0.54248046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 10.0, 8.0, 17.0, 30.0, 33.0, 51.0, 66.0, 82.0, 76.0, 91.0, 97.0, 85.0, 67.0, 67.0, 50.0, 37.0, 34.0, 27.0, 19.0, 13.0, 13.0, 8.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.939453125, -2.8662872314453125, -2.793121337890625, -2.7199554443359375, -2.64678955078125, -2.5736236572265625, -2.500457763671875, -2.4272918701171875, -2.3541259765625, -2.2809600830078125, -2.207794189453125, -2.1346282958984375, -2.06146240234375, -1.9882965087890625, -1.915130615234375, -1.8419647216796875, -1.768798828125, -1.6956329345703125, -1.622467041015625, -1.5493011474609375, -1.47613525390625, -1.4029693603515625, -1.329803466796875, -1.2566375732421875, -1.1834716796875, -1.1103057861328125, -1.037139892578125, -0.9639739990234375, -0.89080810546875, -0.8176422119140625, -0.744476318359375, -0.6713104248046875, -0.59814453125, -0.5249786376953125, -0.451812744140625, -0.3786468505859375, -0.30548095703125, -0.2323150634765625, -0.159149169921875, -0.0859832763671875, -0.0128173828125, 0.0603485107421875, 0.133514404296875, 0.2066802978515625, 0.27984619140625, 0.3530120849609375, 0.426177978515625, 0.4993438720703125, 0.572509765625, 0.6456756591796875, 0.718841552734375, 0.7920074462890625, 0.86517333984375, 0.9383392333984375, 1.011505126953125, 1.0846710205078125, 1.1578369140625, 1.2310028076171875, 1.304168701171875, 1.3773345947265625, 1.45050048828125, 1.5236663818359375, 1.596832275390625, 1.6699981689453125, 1.7431640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 3.0, 5.0, 8.0, 18.0, 23.0, 24.0, 40.0, 47.0, 81.0, 119.0, 149.0, 276.0, 439.0, 845.0, 1818.0, 4352.0, 12944.0, 80106.0, 696076.0, 217865.0, 22064.0, 6160.0, 2520.0, 1079.0, 575.0, 314.0, 206.0, 109.0, 70.0, 60.0, 44.0, 32.0, 18.0, 17.0, 14.0, 7.0, 10.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45654296875, -0.441162109375, -0.42578125, -0.410400390625, -0.39501953125, -0.379638671875, -0.3642578125, -0.348876953125, -0.33349609375, -0.318115234375, -0.302734375, -0.287353515625, -0.27197265625, -0.256591796875, -0.2412109375, -0.225830078125, -0.21044921875, -0.195068359375, -0.1796875, -0.164306640625, -0.14892578125, -0.133544921875, -0.1181640625, -0.102783203125, -0.08740234375, -0.072021484375, -0.056640625, -0.041259765625, -0.02587890625, -0.010498046875, 0.0048828125, 0.020263671875, 0.03564453125, 0.051025390625, 0.06640625, 0.081787109375, 0.09716796875, 0.112548828125, 0.1279296875, 0.143310546875, 0.15869140625, 0.174072265625, 0.189453125, 0.204833984375, 0.22021484375, 0.235595703125, 0.2509765625, 0.266357421875, 0.28173828125, 0.297119140625, 0.3125, 0.327880859375, 0.34326171875, 0.358642578125, 0.3740234375, 0.389404296875, 0.40478515625, 0.420166015625, 0.435546875, 0.450927734375, 0.46630859375, 0.481689453125, 0.4970703125, 0.512451171875, 0.52783203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 8.0, 7.0, 12.0, 12.0, 8.0, 17.0, 13.0, 18.0, 25.0, 28.0, 28.0, 28.0, 33.0, 38.0, 40.0, 52.0, 36.0, 48.0, 50.0, 44.0, 44.0, 44.0, 47.0, 36.0, 40.0, 36.0, 23.0, 32.0, 29.0, 12.0, 23.0, 18.0, 15.0, 16.0, 10.0, 5.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.540069580078125, -2.44927978515625, -2.358489990234375, -2.2677001953125, -2.176910400390625, -2.08612060546875, -1.995330810546875, -1.904541015625, -1.813751220703125, -1.72296142578125, -1.632171630859375, -1.5413818359375, -1.450592041015625, -1.35980224609375, -1.269012451171875, -1.17822265625, -1.087432861328125, -0.99664306640625, -0.905853271484375, -0.8150634765625, -0.724273681640625, -0.63348388671875, -0.542694091796875, -0.451904296875, -0.361114501953125, -0.27032470703125, -0.179534912109375, -0.0887451171875, 0.002044677734375, 0.09283447265625, 0.183624267578125, 0.2744140625, 0.365203857421875, 0.45599365234375, 0.546783447265625, 0.6375732421875, 0.728363037109375, 0.81915283203125, 0.909942626953125, 1.000732421875, 1.091522216796875, 1.18231201171875, 1.273101806640625, 1.3638916015625, 1.454681396484375, 1.54547119140625, 1.636260986328125, 1.72705078125, 1.817840576171875, 1.90863037109375, 1.999420166015625, 2.0902099609375, 2.180999755859375, 2.27178955078125, 2.362579345703125, 2.453369140625, 2.544158935546875, 2.63494873046875, 2.725738525390625, 2.8165283203125, 2.907318115234375, 2.99810791015625, 3.088897705078125, 3.1796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 24.0, 22.0, 22.0, 68.0, 100.0, 139.0, 260.0, 490.0, 1061.0, 2693.0, 8363.0, 40042.0, 577600.0, 378191.0, 28499.0, 6751.0, 2271.0, 922.0, 426.0, 234.0, 120.0, 74.0, 57.0, 34.0, 27.0, 14.0, 9.0, 8.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2109375, -0.20537376403808594, -0.19981002807617188, -0.1942462921142578, -0.18868255615234375, -0.1831188201904297, -0.17755508422851562, -0.17199134826660156, -0.1664276123046875, -0.16086387634277344, -0.15530014038085938, -0.1497364044189453, -0.14417266845703125, -0.1386089324951172, -0.13304519653320312, -0.12748146057128906, -0.121917724609375, -0.11635398864746094, -0.11079025268554688, -0.10522651672363281, -0.09966278076171875, -0.09409904479980469, -0.08853530883789062, -0.08297157287597656, -0.0774078369140625, -0.07184410095214844, -0.06628036499023438, -0.06071662902832031, -0.05515289306640625, -0.04958915710449219, -0.044025421142578125, -0.03846168518066406, -0.03289794921875, -0.027334213256835938, -0.021770477294921875, -0.016206741333007812, -0.01064300537109375, -0.0050792694091796875, 0.000484466552734375, 0.0060482025146484375, 0.0116119384765625, 0.017175674438476562, 0.022739410400390625, 0.028303146362304688, 0.03386688232421875, 0.03943061828613281, 0.044994354248046875, 0.05055809020996094, 0.056121826171875, 0.06168556213378906, 0.06724929809570312, 0.07281303405761719, 0.07837677001953125, 0.08394050598144531, 0.08950424194335938, 0.09506797790527344, 0.1006317138671875, 0.10619544982910156, 0.11175918579101562, 0.11732292175292969, 0.12288665771484375, 0.1284503936767578, 0.13401412963867188, 0.13957786560058594, 0.1451416015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 9.0, 4.0, 12.0, 17.0, 32.0, 35.0, 54.0, 76.0, 113.0, 114.0, 141.0, 119.0, 79.0, 66.0, 47.0, 25.0, 20.0, 12.0, 16.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2034854888916016e-05, -4.969164729118347e-05, -4.734843969345093e-05, -4.5005232095718384e-05, -4.266202449798584e-05, -4.0318816900253296e-05, -3.797560930252075e-05, -3.563240170478821e-05, -3.3289194107055664e-05, -3.094598650932312e-05, -2.8602778911590576e-05, -2.6259571313858032e-05, -2.3916363716125488e-05, -2.1573156118392944e-05, -1.92299485206604e-05, -1.6886740922927856e-05, -1.4543533325195312e-05, -1.2200325727462769e-05, -9.857118129730225e-06, -7.513910531997681e-06, -5.170702934265137e-06, -2.8274953365325928e-06, -4.842877388000488e-07, 1.8589198589324951e-06, 4.202127456665039e-06, 6.545335054397583e-06, 8.888542652130127e-06, 1.1231750249862671e-05, 1.3574957847595215e-05, 1.591816544532776e-05, 1.8261373043060303e-05, 2.0604580640792847e-05, 2.294778823852539e-05, 2.5290995836257935e-05, 2.763420343399048e-05, 2.9977411031723022e-05, 3.2320618629455566e-05, 3.466382622718811e-05, 3.7007033824920654e-05, 3.93502414226532e-05, 4.169344902038574e-05, 4.4036656618118286e-05, 4.637986421585083e-05, 4.8723071813583374e-05, 5.106627941131592e-05, 5.340948700904846e-05, 5.5752694606781006e-05, 5.809590220451355e-05, 6.0439109802246094e-05, 6.278231739997864e-05, 6.512552499771118e-05, 6.746873259544373e-05, 6.981194019317627e-05, 7.215514779090881e-05, 7.449835538864136e-05, 7.68415629863739e-05, 7.918477058410645e-05, 8.152797818183899e-05, 8.387118577957153e-05, 8.621439337730408e-05, 8.855760097503662e-05, 9.090080857276917e-05, 9.324401617050171e-05, 9.558722376823425e-05, 9.79304313659668e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 6.0, 9.0, 18.0, 24.0, 18.0, 33.0, 56.0, 114.0, 228.0, 456.0, 907.0, 2420.0, 7069.0, 26998.0, 228429.0, 685443.0, 74810.0, 14243.0, 4329.0, 1532.0, 616.0, 337.0, 176.0, 98.0, 58.0, 43.0, 25.0, 21.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.13104629516601562, -0.12586212158203125, -0.12067794799804688, -0.1154937744140625, -0.11030960083007812, -0.10512542724609375, -0.09994125366210938, -0.094757080078125, -0.08957290649414062, -0.08438873291015625, -0.07920455932617188, -0.0740203857421875, -0.06883621215820312, -0.06365203857421875, -0.058467864990234375, -0.05328369140625, -0.048099517822265625, -0.04291534423828125, -0.037731170654296875, -0.0325469970703125, -0.027362823486328125, -0.02217864990234375, -0.016994476318359375, -0.011810302734375, -0.006626129150390625, -0.00144195556640625, 0.003742218017578125, 0.0089263916015625, 0.014110565185546875, 0.01929473876953125, 0.024478912353515625, 0.0296630859375, 0.034847259521484375, 0.04003143310546875, 0.045215606689453125, 0.0503997802734375, 0.055583953857421875, 0.06076812744140625, 0.06595230102539062, 0.071136474609375, 0.07632064819335938, 0.08150482177734375, 0.08668899536132812, 0.0918731689453125, 0.09705734252929688, 0.10224151611328125, 0.10742568969726562, 0.11260986328125, 0.11779403686523438, 0.12297821044921875, 0.12816238403320312, 0.1333465576171875, 0.13853073120117188, 0.14371490478515625, 0.14889907836914062, 0.154083251953125, 0.15926742553710938, 0.16445159912109375, 0.16963577270507812, 0.1748199462890625, 0.18000411987304688, 0.18518829345703125, 0.19037246704101562, 0.195556640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 10.0, 13.0, 16.0, 19.0, 26.0, 56.0, 66.0, 121.0, 139.0, 143.0, 142.0, 83.0, 50.0, 26.0, 24.0, 17.0, 9.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0535888671875, -0.052019596099853516, -0.05045032501220703, -0.04888105392456055, -0.04731178283691406, -0.04574251174926758, -0.044173240661621094, -0.04260396957397461, -0.041034698486328125, -0.03946542739868164, -0.037896156311035156, -0.03632688522338867, -0.03475761413574219, -0.0331883430480957, -0.03161907196044922, -0.030049800872802734, -0.02848052978515625, -0.026911258697509766, -0.02534198760986328, -0.023772716522216797, -0.022203445434570312, -0.020634174346923828, -0.019064903259277344, -0.01749563217163086, -0.015926361083984375, -0.01435708999633789, -0.012787818908691406, -0.011218547821044922, -0.009649276733398438, -0.008080005645751953, -0.006510734558105469, -0.004941463470458984, -0.0033721923828125, -0.0018029212951660156, -0.00023365020751953125, 0.0013356208801269531, 0.0029048919677734375, 0.004474163055419922, 0.006043434143066406, 0.007612705230712891, 0.009181976318359375, 0.01075124740600586, 0.012320518493652344, 0.013889789581298828, 0.015459060668945312, 0.017028331756591797, 0.01859760284423828, 0.020166873931884766, 0.02173614501953125, 0.023305416107177734, 0.02487468719482422, 0.026443958282470703, 0.028013229370117188, 0.029582500457763672, 0.031151771545410156, 0.03272104263305664, 0.034290313720703125, 0.03585958480834961, 0.037428855895996094, 0.03899812698364258, 0.04056739807128906, 0.04213666915893555, 0.04370594024658203, 0.045275211334228516, 0.046844482421875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 11.0, 14.0, 46.0, 98.0, 233.0, 260.0, 189.0, 82.0, 34.0, 16.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.687336444854736, -5.530674457550049, -5.3740129470825195, -5.217350959777832, -5.060689449310303, -4.904027462005615, -4.747365951538086, -4.590703964233398, -4.434041976928711, -4.277379989624023, -4.120718479156494, -3.9640567302703857, -3.8073949813842773, -3.65073299407959, -3.4940712451934814, -3.337409496307373, -3.1807479858398438, -3.0240862369537354, -2.867424488067627, -2.7107627391815186, -2.55410099029541, -2.3974390029907227, -2.2407772541046143, -2.084115505218506, -1.9274537563323975, -1.770792007446289, -1.6141302585601807, -1.4574683904647827, -1.3008066415786743, -1.144144892692566, -0.9874830842018127, -0.8308212757110596, -0.674159049987793, -0.5174973011016846, -0.3608354926109314, -0.2041737139225006, -0.047511935234069824, 0.10914981365203857, 0.26581162214279175, 0.4224734306335449, 0.5791351795196533, 0.7357969284057617, 0.8924587368965149, 1.049120545387268, 1.2057822942733765, 1.3624440431594849, 1.5191059112548828, 1.6757676601409912, 1.8324294090270996, 1.989091157913208, 2.1457529067993164, 2.302414655685425, 2.459076404571533, 2.6157383918762207, 2.772400140762329, 2.9290618896484375, 3.085723638534546, 3.2423853874206543, 3.3990471363067627, 3.555708885192871, 3.7123708724975586, 3.869032382965088, 4.025694370269775, 4.182355880737305, 4.339017868041992]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 8.0, 17.0, 27.0, 41.0, 47.0, 70.0, 73.0, 89.0, 76.0, 87.0, 101.0, 65.0, 62.0, 54.0, 46.0, 30.0, 27.0, 22.0, 13.0, 6.0, 8.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.9074008464813232, -2.8369288444519043, -2.7664568424224854, -2.6959846019744873, -2.6255125999450684, -2.5550405979156494, -2.4845685958862305, -2.4140963554382324, -2.3436243534088135, -2.2731523513793945, -2.2026803493499756, -2.1322081089019775, -2.0617361068725586, -1.9912641048431396, -1.9207921028137207, -1.8503199815750122, -1.7798479795455933, -1.7093759775161743, -1.6389038562774658, -1.5684318542480469, -1.4979597330093384, -1.4274877309799194, -1.357015609741211, -1.286543607711792, -1.216071605682373, -1.145599603652954, -1.0751274824142456, -1.0046554803848267, -0.9341833591461182, -0.8637113571166992, -0.7932392954826355, -0.7227672338485718, -0.6522952318191528, -0.5818231701850891, -0.5113511085510254, -0.44087907671928406, -0.37040701508522034, -0.2999349534511566, -0.22946292161941528, -0.15899085998535156, -0.08851879835128784, -0.018046744167804718, 0.052425310015678406, 0.12289735674858093, 0.19336941838264465, 0.2638414800167084, 0.3343135118484497, 0.4047855734825134, 0.47525763511657715, 0.5457296967506409, 0.6162017583847046, 0.6866737604141235, 0.757145881652832, 0.827617883682251, 0.8980899453163147, 0.9685620069503784, 1.039034128189087, 1.1095061302185059, 1.1799782514572144, 1.2504502534866333, 1.3209223747253418, 1.3913943767547607, 1.4618663787841797, 1.5323385000228882, 1.6028105020523071]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 20.0, 26.0, 41.0, 37.0, 63.0, 85.0, 141.0, 260.0, 405.0, 616.0, 1129.0, 1995.0, 3901.0, 7995.0, 18344.0, 47623.0, 161438.0, 603603.0, 128821.0, 40756.0, 16080.0, 7117.0, 3503.0, 1847.0, 1056.0, 617.0, 369.0, 224.0, 143.0, 76.0, 58.0, 33.0, 25.0, 33.0, 16.0, 12.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.306640625, -1.267547607421875, -1.22845458984375, -1.189361572265625, -1.1502685546875, -1.111175537109375, -1.07208251953125, -1.032989501953125, -0.993896484375, -0.954803466796875, -0.91571044921875, -0.876617431640625, -0.8375244140625, -0.798431396484375, -0.75933837890625, -0.720245361328125, -0.68115234375, -0.642059326171875, -0.60296630859375, -0.563873291015625, -0.5247802734375, -0.485687255859375, -0.44659423828125, -0.407501220703125, -0.368408203125, -0.329315185546875, -0.29022216796875, -0.251129150390625, -0.2120361328125, -0.172943115234375, -0.13385009765625, -0.094757080078125, -0.0556640625, -0.016571044921875, 0.02252197265625, 0.061614990234375, 0.1007080078125, 0.139801025390625, 0.17889404296875, 0.217987060546875, 0.257080078125, 0.296173095703125, 0.33526611328125, 0.374359130859375, 0.4134521484375, 0.452545166015625, 0.49163818359375, 0.530731201171875, 0.56982421875, 0.608917236328125, 0.64801025390625, 0.687103271484375, 0.7261962890625, 0.765289306640625, 0.80438232421875, 0.843475341796875, 0.882568359375, 0.921661376953125, 0.96075439453125, 0.999847412109375, 1.0389404296875, 1.078033447265625, 1.11712646484375, 1.156219482421875, 1.1953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 11.0, 19.0, 30.0, 44.0, 60.0, 71.0, 96.0, 83.0, 104.0, 93.0, 89.0, 66.0, 50.0, 50.0, 29.0, 27.0, 20.0, 11.0, 7.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.59375, -6.4422607421875, -6.290771484375, -6.1392822265625, -5.98779296875, -5.8363037109375, -5.684814453125, -5.5333251953125, -5.3818359375, -5.2303466796875, -5.078857421875, -4.9273681640625, -4.77587890625, -4.6243896484375, -4.472900390625, -4.3214111328125, -4.169921875, -4.0184326171875, -3.866943359375, -3.7154541015625, -3.56396484375, -3.4124755859375, -3.260986328125, -3.1094970703125, -2.9580078125, -2.8065185546875, -2.655029296875, -2.5035400390625, -2.35205078125, -2.2005615234375, -2.049072265625, -1.8975830078125, -1.74609375, -1.5946044921875, -1.443115234375, -1.2916259765625, -1.14013671875, -0.9886474609375, -0.837158203125, -0.6856689453125, -0.5341796875, -0.3826904296875, -0.231201171875, -0.0797119140625, 0.07177734375, 0.2232666015625, 0.374755859375, 0.5262451171875, 0.677734375, 0.8292236328125, 0.980712890625, 1.1322021484375, 1.28369140625, 1.4351806640625, 1.586669921875, 1.7381591796875, 1.8896484375, 2.0411376953125, 2.192626953125, 2.3441162109375, 2.49560546875, 2.6470947265625, 2.798583984375, 2.9500732421875, 3.1015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 8.0, 14.0, 6.0, 13.0, 8.0, 16.0, 32.0, 28.0, 37.0, 52.0, 69.0, 112.0, 139.0, 259.0, 519.0, 1656.0, 8803.0, 141007.0, 865494.0, 25174.0, 3168.0, 853.0, 312.0, 202.0, 144.0, 111.0, 81.0, 56.0, 41.0, 34.0, 24.0, 23.0, 11.0, 10.0, 6.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-4.5859375, -4.4593505859375, -4.332763671875, -4.2061767578125, -4.07958984375, -3.9530029296875, -3.826416015625, -3.6998291015625, -3.5732421875, -3.4466552734375, -3.320068359375, -3.1934814453125, -3.06689453125, -2.9403076171875, -2.813720703125, -2.6871337890625, -2.560546875, -2.4339599609375, -2.307373046875, -2.1807861328125, -2.05419921875, -1.9276123046875, -1.801025390625, -1.6744384765625, -1.5478515625, -1.4212646484375, -1.294677734375, -1.1680908203125, -1.04150390625, -0.9149169921875, -0.788330078125, -0.6617431640625, -0.53515625, -0.4085693359375, -0.281982421875, -0.1553955078125, -0.02880859375, 0.0977783203125, 0.224365234375, 0.3509521484375, 0.4775390625, 0.6041259765625, 0.730712890625, 0.8572998046875, 0.98388671875, 1.1104736328125, 1.237060546875, 1.3636474609375, 1.490234375, 1.6168212890625, 1.743408203125, 1.8699951171875, 1.99658203125, 2.1231689453125, 2.249755859375, 2.3763427734375, 2.5029296875, 2.6295166015625, 2.756103515625, 2.8826904296875, 3.00927734375, 3.1358642578125, 3.262451171875, 3.3890380859375, 3.515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 10.0, 5.0, 4.0, 5.0, 11.0, 9.0, 15.0, 16.0, 20.0, 19.0, 22.0, 31.0, 29.0, 28.0, 36.0, 39.0, 55.0, 39.0, 45.0, 38.0, 45.0, 54.0, 50.0, 37.0, 46.0, 38.0, 31.0, 26.0, 31.0, 26.0, 20.0, 27.0, 17.0, 12.0, 16.0, 9.0, 6.0, 11.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.400146484375, -3.28662109375, -3.173095703125, -3.0595703125, -2.946044921875, -2.83251953125, -2.718994140625, -2.60546875, -2.491943359375, -2.37841796875, -2.264892578125, -2.1513671875, -2.037841796875, -1.92431640625, -1.810791015625, -1.697265625, -1.583740234375, -1.47021484375, -1.356689453125, -1.2431640625, -1.129638671875, -1.01611328125, -0.902587890625, -0.7890625, -0.675537109375, -0.56201171875, -0.448486328125, -0.3349609375, -0.221435546875, -0.10791015625, 0.005615234375, 0.119140625, 0.232666015625, 0.34619140625, 0.459716796875, 0.5732421875, 0.686767578125, 0.80029296875, 0.913818359375, 1.02734375, 1.140869140625, 1.25439453125, 1.367919921875, 1.4814453125, 1.594970703125, 1.70849609375, 1.822021484375, 1.935546875, 2.049072265625, 2.16259765625, 2.276123046875, 2.3896484375, 2.503173828125, 2.61669921875, 2.730224609375, 2.84375, 2.957275390625, 3.07080078125, 3.184326171875, 3.2978515625, 3.411376953125, 3.52490234375, 3.638427734375, 3.751953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 10.0, 12.0, 11.0, 18.0, 23.0, 34.0, 55.0, 99.0, 198.0, 374.0, 815.0, 2294.0, 7091.0, 42080.0, 872065.0, 106879.0, 11098.0, 3179.0, 1146.0, 469.0, 249.0, 126.0, 69.0, 54.0, 34.0, 20.0, 11.0, 7.0, 9.0, 4.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9421157836914062, -0.9022979736328125, -0.8624801635742188, -0.822662353515625, -0.7828445434570312, -0.7430267333984375, -0.7032089233398438, -0.66339111328125, -0.6235733032226562, -0.5837554931640625, -0.5439376831054688, -0.504119873046875, -0.46430206298828125, -0.4244842529296875, -0.38466644287109375, -0.3448486328125, -0.30503082275390625, -0.2652130126953125, -0.22539520263671875, -0.185577392578125, -0.14575958251953125, -0.1059417724609375, -0.06612396240234375, -0.02630615234375, 0.01351165771484375, 0.0533294677734375, 0.09314727783203125, 0.132965087890625, 0.17278289794921875, 0.2126007080078125, 0.25241851806640625, 0.292236328125, 0.33205413818359375, 0.3718719482421875, 0.41168975830078125, 0.451507568359375, 0.49132537841796875, 0.5311431884765625, 0.5709609985351562, 0.61077880859375, 0.6505966186523438, 0.6904144287109375, 0.7302322387695312, 0.770050048828125, 0.8098678588867188, 0.8496856689453125, 0.8895034790039062, 0.9293212890625, 0.9691390991210938, 1.0089569091796875, 1.0487747192382812, 1.088592529296875, 1.1284103393554688, 1.1682281494140625, 1.2080459594726562, 1.24786376953125, 1.2876815795898438, 1.3274993896484375, 1.3673171997070312, 1.407135009765625, 1.4469528198242188, 1.4867706298828125, 1.5265884399414062, 1.56640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 13.0, 17.0, 25.0, 25.0, 32.0, 48.0, 88.0, 126.0, 259.0, 132.0, 65.0, 55.0, 35.0, 19.0, 13.0, 13.0, 6.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00015878677368164062, -0.0001542959362268448, -0.00014980509877204895, -0.0001453142613172531, -0.00014082342386245728, -0.00013633258640766144, -0.0001318417489528656, -0.00012735091149806976, -0.00012286007404327393, -0.00011836923658847809, -0.00011387839913368225, -0.00010938756167888641, -0.00010489672422409058, -0.00010040588676929474, -9.59150493144989e-05, -9.142421185970306e-05, -8.693337440490723e-05, -8.244253695011139e-05, -7.795169949531555e-05, -7.346086204051971e-05, -6.897002458572388e-05, -6.447918713092804e-05, -5.99883496761322e-05, -5.5497512221336365e-05, -5.100667476654053e-05, -4.651583731174469e-05, -4.202499985694885e-05, -3.7534162402153015e-05, -3.304332494735718e-05, -2.855248749256134e-05, -2.4061650037765503e-05, -1.9570812582969666e-05, -1.5079975128173828e-05, -1.058913767337799e-05, -6.098300218582153e-06, -1.607462763786316e-06, 2.8833746910095215e-06, 7.374212145805359e-06, 1.1865049600601196e-05, 1.6355887055397034e-05, 2.084672451019287e-05, 2.533756196498871e-05, 2.9828399419784546e-05, 3.431923687458038e-05, 3.881007432937622e-05, 4.330091178417206e-05, 4.7791749238967896e-05, 5.228258669376373e-05, 5.677342414855957e-05, 6.126426160335541e-05, 6.575509905815125e-05, 7.024593651294708e-05, 7.473677396774292e-05, 7.922761142253876e-05, 8.37184488773346e-05, 8.820928633213043e-05, 9.270012378692627e-05, 9.719096124172211e-05, 0.00010168179869651794, 0.00010617263615131378, 0.00011066347360610962, 0.00011515431106090546, 0.0001196451485157013, 0.00012413598597049713, 0.00012862682342529297]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 11.0, 20.0, 38.0, 93.0, 190.0, 538.0, 2349.0, 30665.0, 977129.0, 34033.0, 2522.0, 556.0, 202.0, 91.0, 38.0, 23.0, 9.0, 12.0, 7.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.113922119140625, -2.04229736328125, -1.970672607421875, -1.8990478515625, -1.827423095703125, -1.75579833984375, -1.684173583984375, -1.612548828125, -1.540924072265625, -1.46929931640625, -1.397674560546875, -1.3260498046875, -1.254425048828125, -1.18280029296875, -1.111175537109375, -1.03955078125, -0.967926025390625, -0.89630126953125, -0.824676513671875, -0.7530517578125, -0.681427001953125, -0.60980224609375, -0.538177490234375, -0.466552734375, -0.394927978515625, -0.32330322265625, -0.251678466796875, -0.1800537109375, -0.108428955078125, -0.03680419921875, 0.034820556640625, 0.1064453125, 0.178070068359375, 0.24969482421875, 0.321319580078125, 0.3929443359375, 0.464569091796875, 0.53619384765625, 0.607818603515625, 0.679443359375, 0.751068115234375, 0.82269287109375, 0.894317626953125, 0.9659423828125, 1.037567138671875, 1.10919189453125, 1.180816650390625, 1.25244140625, 1.324066162109375, 1.39569091796875, 1.467315673828125, 1.5389404296875, 1.610565185546875, 1.68218994140625, 1.753814697265625, 1.825439453125, 1.897064208984375, 1.96868896484375, 2.040313720703125, 2.1119384765625, 2.183563232421875, 2.25518798828125, 2.326812744140625, 2.3984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 6.0, 6.0, 17.0, 25.0, 30.0, 46.0, 75.0, 166.0, 324.0, 107.0, 76.0, 37.0, 23.0, 10.0, 8.0, 8.0, 11.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57080078125, -0.5525131225585938, -0.5342254638671875, -0.5159378051757812, -0.497650146484375, -0.47936248779296875, -0.4610748291015625, -0.44278717041015625, -0.42449951171875, -0.40621185302734375, -0.3879241943359375, -0.36963653564453125, -0.351348876953125, -0.33306121826171875, -0.3147735595703125, -0.29648590087890625, -0.2781982421875, -0.25991058349609375, -0.2416229248046875, -0.22333526611328125, -0.205047607421875, -0.18675994873046875, -0.1684722900390625, -0.15018463134765625, -0.13189697265625, -0.11360931396484375, -0.0953216552734375, -0.07703399658203125, -0.058746337890625, -0.04045867919921875, -0.0221710205078125, -0.00388336181640625, 0.014404296875, 0.03269195556640625, 0.0509796142578125, 0.06926727294921875, 0.087554931640625, 0.10584259033203125, 0.1241302490234375, 0.14241790771484375, 0.16070556640625, 0.17899322509765625, 0.1972808837890625, 0.21556854248046875, 0.233856201171875, 0.25214385986328125, 0.2704315185546875, 0.28871917724609375, 0.3070068359375, 0.32529449462890625, 0.3435821533203125, 0.36186981201171875, 0.380157470703125, 0.39844512939453125, 0.4167327880859375, 0.43502044677734375, 0.45330810546875, 0.47159576416015625, 0.4898834228515625, 0.5081710815429688, 0.526458740234375, 0.5447463989257812, 0.5630340576171875, 0.5813217163085938, 0.599609375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 13.0, 51.0, 249.0, 450.0, 187.0, 39.0, 8.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.730124473571777, -10.112868309020996, -9.495611190795898, -8.878355026245117, -8.261098861694336, -7.643842697143555, -7.026586055755615, -6.409329414367676, -5.7920732498168945, -5.174817085266113, -4.557560443878174, -3.9403040409088135, -3.323047637939453, -2.7057912349700928, -2.0885348320007324, -1.471278190612793, -0.8540220260620117, -0.23676562309265137, 0.380490779876709, 0.9977471828460693, 1.6150035858154297, 2.23225998878479, 2.8495163917541504, 3.46677303314209, 4.084029197692871, 4.701285362243652, 5.318542003631592, 5.935798645019531, 6.5530548095703125, 7.170310974121094, 7.787567615509033, 8.404824256896973, 9.022079467773438, 9.639335632324219, 10.256591796875, 10.873848915100098, 11.491105079650879, 12.10836124420166, 12.725618362426758, 13.342874526977539, 13.96013069152832, 14.577386856079102, 15.194643020629883, 15.81190013885498, 16.429157257080078, 17.04641342163086, 17.66366958618164, 18.280925750732422, 18.898181915283203, 19.515438079833984, 20.132694244384766, 20.749950408935547, 21.367206573486328, 21.984464645385742, 22.601720809936523, 23.218976974487305, 23.836233139038086, 24.453489303588867, 25.07074546813965, 25.68800163269043, 26.305259704589844, 26.922515869140625, 27.539772033691406, 28.157028198242188, 28.77428436279297]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 9.0, 5.0, 9.0, 19.0, 17.0, 26.0, 17.0, 19.0, 36.0, 32.0, 19.0, 45.0, 44.0, 44.0, 54.0, 57.0, 56.0, 64.0, 51.0, 49.0, 62.0, 55.0, 39.0, 30.0, 26.0, 29.0, 14.0, 19.0, 17.0, 16.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.717110633850098, -8.478372573852539, -8.239635467529297, -8.000897407531738, -7.762159824371338, -7.5234222412109375, -7.284684181213379, -7.0459465980529785, -6.807209014892578, -6.568471431732178, -6.329733848571777, -6.090995788574219, -5.852258205413818, -5.613520622253418, -5.374782562255859, -5.136044979095459, -4.897307395935059, -4.658569812774658, -4.419832229614258, -4.181094169616699, -3.942356586456299, -3.7036190032958984, -3.464881181716919, -3.2261433601379395, -2.987405776977539, -2.7486681938171387, -2.509930372238159, -2.2711925506591797, -2.0324549674987793, -1.7937172651290894, -1.5549795627593994, -1.3162418603897095, -1.0775041580200195, -0.8387664556503296, -0.6000287532806396, -0.3612910509109497, -0.12255334854125977, 0.11618435382843018, 0.3549220561981201, 0.5936597585678101, 0.8323974609375, 1.07113516330719, 1.3098728656768799, 1.5486105680465698, 1.7873482704162598, 2.02608585357666, 2.2648236751556396, 2.503561496734619, 2.7422990798950195, 2.98103666305542, 3.2197744846343994, 3.458512306213379, 3.6972498893737793, 3.9359874725341797, 4.174725532531738, 4.413463115692139, 4.652200698852539, 4.8909382820129395, 5.12967586517334, 5.368413925170898, 5.607151508331299, 5.845889091491699, 6.084627151489258, 6.323364734649658, 6.562102317810059]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 9.0, 13.0, 14.0, 20.0, 13.0, 34.0, 33.0, 42.0, 46.0, 75.0, 68.0, 104.0, 147.0, 232.0, 371.0, 636.0, 1369.0, 3525.0, 11593.0, 62466.0, 1759141.0, 2263664.0, 69827.0, 13382.0, 4053.0, 1531.0, 703.0, 376.0, 225.0, 129.0, 100.0, 84.0, 61.0, 44.0, 25.0, 23.0, 24.0, 17.0, 12.0, 18.0, 6.0, 6.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.107421875, -3.00726318359375, -2.9071044921875, -2.80694580078125, -2.706787109375, -2.60662841796875, -2.5064697265625, -2.40631103515625, -2.30615234375, -2.20599365234375, -2.1058349609375, -2.00567626953125, -1.905517578125, -1.80535888671875, -1.7052001953125, -1.60504150390625, -1.5048828125, -1.40472412109375, -1.3045654296875, -1.20440673828125, -1.104248046875, -1.00408935546875, -0.9039306640625, -0.80377197265625, -0.70361328125, -0.60345458984375, -0.5032958984375, -0.40313720703125, -0.302978515625, -0.20281982421875, -0.1026611328125, -0.00250244140625, 0.09765625, 0.19781494140625, 0.2979736328125, 0.39813232421875, 0.498291015625, 0.59844970703125, 0.6986083984375, 0.79876708984375, 0.89892578125, 0.99908447265625, 1.0992431640625, 1.19940185546875, 1.299560546875, 1.39971923828125, 1.4998779296875, 1.60003662109375, 1.7001953125, 1.80035400390625, 1.9005126953125, 2.00067138671875, 2.100830078125, 2.20098876953125, 2.3011474609375, 2.40130615234375, 2.50146484375, 2.60162353515625, 2.7017822265625, 2.80194091796875, 2.902099609375, 3.00225830078125, 3.1024169921875, 3.20257568359375, 3.302734375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 18.0, 20.0, 20.0, 32.0, 49.0, 70.0, 98.0, 123.0, 105.0, 98.0, 77.0, 66.0, 59.0, 43.0, 32.0, 20.0, 16.0, 8.0, 10.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-3.373046875, -3.2975311279296875, -3.222015380859375, -3.1464996337890625, -3.07098388671875, -2.9954681396484375, -2.919952392578125, -2.8444366455078125, -2.7689208984375, -2.6934051513671875, -2.617889404296875, -2.5423736572265625, -2.46685791015625, -2.3913421630859375, -2.315826416015625, -2.2403106689453125, -2.164794921875, -2.0892791748046875, -2.013763427734375, -1.9382476806640625, -1.86273193359375, -1.7872161865234375, -1.711700439453125, -1.6361846923828125, -1.5606689453125, -1.4851531982421875, -1.409637451171875, -1.3341217041015625, -1.25860595703125, -1.1830902099609375, -1.107574462890625, -1.0320587158203125, -0.95654296875, -0.8810272216796875, -0.805511474609375, -0.7299957275390625, -0.65447998046875, -0.5789642333984375, -0.503448486328125, -0.4279327392578125, -0.3524169921875, -0.2769012451171875, -0.201385498046875, -0.1258697509765625, -0.05035400390625, 0.0251617431640625, 0.100677490234375, 0.1761932373046875, 0.251708984375, 0.3272247314453125, 0.402740478515625, 0.4782562255859375, 0.55377197265625, 0.6292877197265625, 0.704803466796875, 0.7803192138671875, 0.8558349609375, 0.9313507080078125, 1.006866455078125, 1.0823822021484375, 1.15789794921875, 1.2334136962890625, 1.308929443359375, 1.3844451904296875, 1.4599609375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 9.0, 2.0, 5.0, 11.0, 17.0, 22.0, 37.0, 45.0, 109.0, 257.0, 746.0, 5086.0, 237678.0, 3928852.0, 19064.0, 1611.0, 384.0, 180.0, 57.0, 38.0, 19.0, 17.0, 17.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.89471435546875, -6.6214599609375, -6.34820556640625, -6.074951171875, -5.80169677734375, -5.5284423828125, -5.25518798828125, -4.98193359375, -4.70867919921875, -4.4354248046875, -4.16217041015625, -3.888916015625, -3.61566162109375, -3.3424072265625, -3.06915283203125, -2.7958984375, -2.52264404296875, -2.2493896484375, -1.97613525390625, -1.702880859375, -1.42962646484375, -1.1563720703125, -0.88311767578125, -0.60986328125, -0.33660888671875, -0.0633544921875, 0.20989990234375, 0.483154296875, 0.75640869140625, 1.0296630859375, 1.30291748046875, 1.576171875, 1.84942626953125, 2.1226806640625, 2.39593505859375, 2.669189453125, 2.94244384765625, 3.2156982421875, 3.48895263671875, 3.76220703125, 4.03546142578125, 4.3087158203125, 4.58197021484375, 4.855224609375, 5.12847900390625, 5.4017333984375, 5.67498779296875, 5.9482421875, 6.22149658203125, 6.4947509765625, 6.76800537109375, 7.041259765625, 7.31451416015625, 7.5877685546875, 7.86102294921875, 8.13427734375, 8.40753173828125, 8.6807861328125, 8.95404052734375, 9.227294921875, 9.50054931640625, 9.7738037109375, 10.04705810546875, 10.3203125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 12.0, 9.0, 11.0, 16.0, 13.0, 32.0, 24.0, 39.0, 65.0, 72.0, 144.0, 216.0, 335.0, 452.0, 756.0, 623.0, 403.0, 249.0, 150.0, 117.0, 77.0, 78.0, 49.0, 25.0, 21.0, 13.0, 12.0, 12.0, 7.0, 9.0, 5.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.70947265625, -0.6871566772460938, -0.6648406982421875, -0.6425247192382812, -0.620208740234375, -0.5978927612304688, -0.5755767822265625, -0.5532608032226562, -0.53094482421875, -0.5086288452148438, -0.4863128662109375, -0.46399688720703125, -0.441680908203125, -0.41936492919921875, -0.3970489501953125, -0.37473297119140625, -0.3524169921875, -0.33010101318359375, -0.3077850341796875, -0.28546905517578125, -0.263153076171875, -0.24083709716796875, -0.2185211181640625, -0.19620513916015625, -0.17388916015625, -0.15157318115234375, -0.1292572021484375, -0.10694122314453125, -0.084625244140625, -0.06230926513671875, -0.0399932861328125, -0.01767730712890625, 0.004638671875, 0.02695465087890625, 0.0492706298828125, 0.07158660888671875, 0.093902587890625, 0.11621856689453125, 0.1385345458984375, 0.16085052490234375, 0.18316650390625, 0.20548248291015625, 0.2277984619140625, 0.25011444091796875, 0.272430419921875, 0.29474639892578125, 0.3170623779296875, 0.33937835693359375, 0.3616943359375, 0.38401031494140625, 0.4063262939453125, 0.42864227294921875, 0.450958251953125, 0.47327423095703125, 0.4955902099609375, 0.5179061889648438, 0.54022216796875, 0.5625381469726562, 0.5848541259765625, 0.6071701049804688, 0.629486083984375, 0.6518020629882812, 0.6741180419921875, 0.6964340209960938, 0.71875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 12.0, 25.0, 52.0, 84.0, 156.0, 162.0, 187.0, 142.0, 91.0, 47.0, 20.0, 16.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.17395305633545, -7.999426364898682, -7.824900150299072, -7.650373458862305, -7.475846767425537, -7.3013200759887695, -7.12679386138916, -6.952267169952393, -6.777740478515625, -6.603213787078857, -6.428687572479248, -6.2541608810424805, -6.079634189605713, -5.905107498168945, -5.730581283569336, -5.556054592132568, -5.381527900695801, -5.207001209259033, -5.032474994659424, -4.857948303222656, -4.683421611785889, -4.508894920349121, -4.334368705749512, -4.159842014312744, -3.9853157997131348, -3.8107893466949463, -3.6362626552581787, -3.4617362022399902, -3.2872095108032227, -3.112683057785034, -2.9381566047668457, -2.763629913330078, -2.5891029834747314, -2.414576530456543, -2.2400498390197754, -2.065523386001587, -1.8909966945648193, -1.7164702415466309, -1.5419436693191528, -1.3674170970916748, -1.1928905248641968, -1.0183639526367188, -0.8438373804092407, -0.6693108677864075, -0.49478429555892944, -0.3202577233314514, -0.14573121070861816, 0.028795361518859863, 0.2033219337463379, 0.3778485059738159, 0.552375078201294, 0.7269015908241272, 0.9014281630516052, 1.0759546756744385, 1.2504812479019165, 1.4250078201293945, 1.5995343923568726, 1.7740609645843506, 1.9485875368118286, 2.1231141090393066, 2.297640562057495, 2.4721672534942627, 2.646693706512451, 2.8212203979492188, 2.9957468509674072]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 13.0, 18.0, 19.0, 29.0, 31.0, 35.0, 29.0, 44.0, 53.0, 52.0, 64.0, 70.0, 90.0, 78.0, 59.0, 48.0, 48.0, 48.0, 40.0, 39.0, 21.0, 18.0, 18.0, 9.0, 8.0, 6.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.55065655708313, -3.4656519889831543, -3.3806471824645996, -3.295642614364624, -3.2106380462646484, -3.1256332397460938, -3.040628671646118, -2.9556241035461426, -2.870619297027588, -2.7856147289276123, -2.7006099224090576, -2.615605354309082, -2.5306007862091064, -2.4455959796905518, -2.360591411590576, -2.2755866050720215, -2.190582275390625, -2.1055777072906494, -2.0205729007720947, -1.9355683326721191, -1.850563645362854, -1.7655589580535889, -1.6805543899536133, -1.5955497026443481, -1.510545015335083, -1.4255403280258179, -1.3405357599258423, -1.2555310726165771, -1.170526385307312, -1.0855216979980469, -1.0005171298980713, -0.9155124425888062, -0.830507755279541, -0.7455031275749207, -0.6604984402656555, -0.5754938125610352, -0.4904891550540924, -0.40548449754714966, -0.3204798698425293, -0.23547518253326416, -0.1504705548286438, -0.06546590477228165, 0.019538745284080505, 0.10454338788986206, 0.1895480453968048, 0.27455270290374756, 0.3595573306083679, 0.44456201791763306, 0.5295666456222534, 0.6145712733268738, 0.6995759606361389, 0.7845805883407593, 0.8695852756500244, 0.9545899033546448, 1.0395945310592651, 1.1245992183685303, 1.2096037864685059, 1.294608473777771, 1.3796130418777466, 1.4646177291870117, 1.5496224164962769, 1.634627103805542, 1.7196316719055176, 1.8046363592147827, 1.8896410465240479]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 10.0, 9.0, 12.0, 10.0, 24.0, 44.0, 43.0, 85.0, 147.0, 280.0, 557.0, 1272.0, 3212.0, 10647.0, 44247.0, 289099.0, 573305.0, 96850.0, 19699.0, 5464.0, 1837.0, 809.0, 363.0, 214.0, 121.0, 76.0, 43.0, 23.0, 21.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.61474609375, -0.5998344421386719, -0.5849227905273438, -0.5700111389160156, -0.5550994873046875, -0.5401878356933594, -0.5252761840820312, -0.5103645324707031, -0.495452880859375, -0.4805412292480469, -0.46562957763671875, -0.4507179260253906, -0.4358062744140625, -0.4208946228027344, -0.40598297119140625, -0.3910713195800781, -0.37615966796875, -0.3612480163574219, -0.34633636474609375, -0.3314247131347656, -0.3165130615234375, -0.3016014099121094, -0.28668975830078125, -0.2717781066894531, -0.256866455078125, -0.24195480346679688, -0.22704315185546875, -0.21213150024414062, -0.1972198486328125, -0.18230819702148438, -0.16739654541015625, -0.15248489379882812, -0.1375732421875, -0.12266159057617188, -0.10774993896484375, -0.09283828735351562, -0.0779266357421875, -0.06301498413085938, -0.04810333251953125, -0.033191680908203125, -0.018280029296875, -0.003368377685546875, 0.01154327392578125, 0.026454925537109375, 0.0413665771484375, 0.056278228759765625, 0.07118988037109375, 0.08610153198242188, 0.10101318359375, 0.11592483520507812, 0.13083648681640625, 0.14574813842773438, 0.1606597900390625, 0.17557144165039062, 0.19048309326171875, 0.20539474487304688, 0.220306396484375, 0.23521804809570312, 0.25012969970703125, 0.2650413513183594, 0.2799530029296875, 0.2948646545410156, 0.30977630615234375, 0.3246879577636719, 0.339599609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 11.0, 14.0, 13.0, 26.0, 28.0, 42.0, 52.0, 54.0, 66.0, 66.0, 89.0, 75.0, 80.0, 79.0, 59.0, 63.0, 46.0, 37.0, 29.0, 27.0, 12.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.68359375, -2.6199188232421875, -2.556243896484375, -2.4925689697265625, -2.42889404296875, -2.3652191162109375, -2.301544189453125, -2.2378692626953125, -2.1741943359375, -2.1105194091796875, -2.046844482421875, -1.9831695556640625, -1.91949462890625, -1.8558197021484375, -1.792144775390625, -1.7284698486328125, -1.664794921875, -1.6011199951171875, -1.537445068359375, -1.4737701416015625, -1.41009521484375, -1.3464202880859375, -1.282745361328125, -1.2190704345703125, -1.1553955078125, -1.0917205810546875, -1.028045654296875, -0.9643707275390625, -0.90069580078125, -0.8370208740234375, -0.773345947265625, -0.7096710205078125, -0.64599609375, -0.5823211669921875, -0.518646240234375, -0.4549713134765625, -0.39129638671875, -0.3276214599609375, -0.263946533203125, -0.2002716064453125, -0.1365966796875, -0.0729217529296875, -0.009246826171875, 0.0544281005859375, 0.11810302734375, 0.1817779541015625, 0.245452880859375, 0.3091278076171875, 0.372802734375, 0.4364776611328125, 0.500152587890625, 0.5638275146484375, 0.62750244140625, 0.6911773681640625, 0.754852294921875, 0.8185272216796875, 0.8822021484375, 0.9458770751953125, 1.009552001953125, 1.0732269287109375, 1.13690185546875, 1.2005767822265625, 1.264251708984375, 1.3279266357421875, 1.3916015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 9.0, 4.0, 3.0, 17.0, 17.0, 30.0, 38.0, 35.0, 58.0, 102.0, 140.0, 229.0, 420.0, 859.0, 1960.0, 5612.0, 21429.0, 116050.0, 544220.0, 294044.0, 47139.0, 10187.0, 3165.0, 1242.0, 618.0, 315.0, 198.0, 118.0, 74.0, 60.0, 40.0, 29.0, 29.0, 10.0, 11.0, 7.0, 6.0, 12.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.3720703125, -0.3603515625, -0.3486328125, -0.3369140625, -0.3251953125, -0.3134765625, -0.3017578125, -0.2900390625, -0.2783203125, -0.2666015625, -0.2548828125, -0.2431640625, -0.2314453125, -0.2197265625, -0.2080078125, -0.1962890625, -0.1845703125, -0.1728515625, -0.1611328125, -0.1494140625, -0.1376953125, -0.1259765625, -0.1142578125, -0.1025390625, -0.0908203125, -0.0791015625, -0.0673828125, -0.0556640625, -0.0439453125, -0.0322265625, -0.0205078125, -0.0087890625, 0.0029296875, 0.0146484375, 0.0263671875, 0.0380859375, 0.0498046875, 0.0615234375, 0.0732421875, 0.0849609375, 0.0966796875, 0.1083984375, 0.1201171875, 0.1318359375, 0.1435546875, 0.1552734375, 0.1669921875, 0.1787109375, 0.1904296875, 0.2021484375, 0.2138671875, 0.2255859375, 0.2373046875, 0.2490234375, 0.2607421875, 0.2724609375, 0.2841796875, 0.2958984375, 0.3076171875, 0.3193359375, 0.3310546875, 0.3427734375, 0.3544921875, 0.3662109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 4.0, 6.0, 5.0, 11.0, 13.0, 17.0, 17.0, 18.0, 19.0, 28.0, 26.0, 41.0, 44.0, 54.0, 51.0, 54.0, 58.0, 58.0, 55.0, 55.0, 38.0, 54.0, 21.0, 44.0, 43.0, 20.0, 22.0, 25.0, 16.0, 13.0, 18.0, 7.0, 8.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.57568359375, -2.4853515625, -2.39501953125, -2.3046875, -2.21435546875, -2.1240234375, -2.03369140625, -1.943359375, -1.85302734375, -1.7626953125, -1.67236328125, -1.58203125, -1.49169921875, -1.4013671875, -1.31103515625, -1.220703125, -1.13037109375, -1.0400390625, -0.94970703125, -0.859375, -0.76904296875, -0.6787109375, -0.58837890625, -0.498046875, -0.40771484375, -0.3173828125, -0.22705078125, -0.13671875, -0.04638671875, 0.0439453125, 0.13427734375, 0.224609375, 0.31494140625, 0.4052734375, 0.49560546875, 0.5859375, 0.67626953125, 0.7666015625, 0.85693359375, 0.947265625, 1.03759765625, 1.1279296875, 1.21826171875, 1.30859375, 1.39892578125, 1.4892578125, 1.57958984375, 1.669921875, 1.76025390625, 1.8505859375, 1.94091796875, 2.03125, 2.12158203125, 2.2119140625, 2.30224609375, 2.392578125, 2.48291015625, 2.5732421875, 2.66357421875, 2.75390625, 2.84423828125, 2.9345703125, 3.02490234375, 3.115234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 9.0, 14.0, 15.0, 15.0, 24.0, 31.0, 31.0, 63.0, 82.0, 128.0, 182.0, 306.0, 571.0, 1152.0, 2838.0, 8312.0, 39825.0, 611513.0, 345106.0, 27335.0, 6327.0, 2301.0, 1000.0, 506.0, 285.0, 176.0, 109.0, 71.0, 51.0, 48.0, 42.0, 19.0, 15.0, 10.0, 9.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.299560546875, -0.2904548645019531, -0.28134918212890625, -0.2722434997558594, -0.2631378173828125, -0.2540321350097656, -0.24492645263671875, -0.23582077026367188, -0.226715087890625, -0.21760940551757812, -0.20850372314453125, -0.19939804077148438, -0.1902923583984375, -0.18118667602539062, -0.17208099365234375, -0.16297531127929688, -0.15386962890625, -0.14476394653320312, -0.13565826416015625, -0.12655258178710938, -0.1174468994140625, -0.10834121704101562, -0.09923553466796875, -0.09012985229492188, -0.081024169921875, -0.07191848754882812, -0.06281280517578125, -0.053707122802734375, -0.0446014404296875, -0.035495758056640625, -0.02639007568359375, -0.017284393310546875, -0.0081787109375, 0.000926971435546875, 0.01003265380859375, 0.019138336181640625, 0.0282440185546875, 0.037349700927734375, 0.04645538330078125, 0.055561065673828125, 0.064666748046875, 0.07377243041992188, 0.08287811279296875, 0.09198379516601562, 0.1010894775390625, 0.11019515991210938, 0.11930084228515625, 0.12840652465820312, 0.13751220703125, 0.14661788940429688, 0.15572357177734375, 0.16482925415039062, 0.1739349365234375, 0.18304061889648438, 0.19214630126953125, 0.20125198364257812, 0.210357666015625, 0.21946334838867188, 0.22856903076171875, 0.23767471313476562, 0.2467803955078125, 0.2558860778808594, 0.26499176025390625, 0.2740974426269531, 0.283203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 12.0, 16.0, 22.0, 24.0, 30.0, 30.0, 67.0, 79.0, 108.0, 124.0, 95.0, 94.0, 67.0, 37.0, 47.0, 30.0, 19.0, 16.0, 14.0, 9.0, 9.0, 6.0, 11.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.146596908569336e-05, -6.889272481203079e-05, -6.631948053836823e-05, -6.374623626470566e-05, -6.117299199104309e-05, -5.8599747717380524e-05, -5.6026503443717957e-05, -5.345325917005539e-05, -5.088001489639282e-05, -4.8306770622730255e-05, -4.573352634906769e-05, -4.316028207540512e-05, -4.0587037801742554e-05, -3.8013793528079987e-05, -3.544054925441742e-05, -3.286730498075485e-05, -3.0294060707092285e-05, -2.7720816433429718e-05, -2.514757215976715e-05, -2.2574327886104584e-05, -2.0001083612442017e-05, -1.742783933877945e-05, -1.4854595065116882e-05, -1.2281350791454315e-05, -9.708106517791748e-06, -7.134862244129181e-06, -4.561617970466614e-06, -1.9883736968040466e-06, 5.848705768585205e-07, 3.1581148505210876e-06, 5.731359124183655e-06, 8.304603397846222e-06, 1.0877847671508789e-05, 1.3451091945171356e-05, 1.6024336218833923e-05, 1.859758049249649e-05, 2.1170824766159058e-05, 2.3744069039821625e-05, 2.6317313313484192e-05, 2.889055758714676e-05, 3.1463801860809326e-05, 3.403704613447189e-05, 3.661029040813446e-05, 3.918353468179703e-05, 4.1756778955459595e-05, 4.433002322912216e-05, 4.690326750278473e-05, 4.9476511776447296e-05, 5.204975605010986e-05, 5.462300032377243e-05, 5.7196244597435e-05, 5.9769488871097565e-05, 6.234273314476013e-05, 6.49159774184227e-05, 6.748922169208527e-05, 7.006246596574783e-05, 7.26357102394104e-05, 7.520895451307297e-05, 7.778219878673553e-05, 8.03554430603981e-05, 8.292868733406067e-05, 8.550193160772324e-05, 8.80751758813858e-05, 9.064842015504837e-05, 9.322166442871094e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 3.0, 7.0, 13.0, 20.0, 14.0, 48.0, 70.0, 90.0, 178.0, 287.0, 503.0, 938.0, 2317.0, 6459.0, 25835.0, 208484.0, 711286.0, 71791.0, 13190.0, 3818.0, 1515.0, 702.0, 412.0, 216.0, 116.0, 94.0, 51.0, 31.0, 17.0, 15.0, 7.0, 5.0, 4.0, 3.0, 2.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.329498291015625, -0.31988525390625, -0.310272216796875, -0.3006591796875, -0.291046142578125, -0.28143310546875, -0.271820068359375, -0.26220703125, -0.252593994140625, -0.24298095703125, -0.233367919921875, -0.2237548828125, -0.214141845703125, -0.20452880859375, -0.194915771484375, -0.185302734375, -0.175689697265625, -0.16607666015625, -0.156463623046875, -0.1468505859375, -0.137237548828125, -0.12762451171875, -0.118011474609375, -0.1083984375, -0.098785400390625, -0.08917236328125, -0.079559326171875, -0.0699462890625, -0.060333251953125, -0.05072021484375, -0.041107177734375, -0.031494140625, -0.021881103515625, -0.01226806640625, -0.002655029296875, 0.0069580078125, 0.016571044921875, 0.02618408203125, 0.035797119140625, 0.04541015625, 0.055023193359375, 0.06463623046875, 0.074249267578125, 0.0838623046875, 0.093475341796875, 0.10308837890625, 0.112701416015625, 0.122314453125, 0.131927490234375, 0.14154052734375, 0.151153564453125, 0.1607666015625, 0.170379638671875, 0.17999267578125, 0.189605712890625, 0.19921875, 0.208831787109375, 0.21844482421875, 0.228057861328125, 0.2376708984375, 0.247283935546875, 0.25689697265625, 0.266510009765625, 0.276123046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 15.0, 22.0, 22.0, 40.0, 60.0, 102.0, 195.0, 190.0, 111.0, 64.0, 45.0, 32.0, 21.0, 18.0, 12.0, 9.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.071044921875, -0.06841754913330078, -0.06579017639160156, -0.06316280364990234, -0.060535430908203125, -0.057908058166503906, -0.05528068542480469, -0.05265331268310547, -0.05002593994140625, -0.04739856719970703, -0.04477119445800781, -0.042143821716308594, -0.039516448974609375, -0.036889076232910156, -0.03426170349121094, -0.03163433074951172, -0.0290069580078125, -0.02637958526611328, -0.023752212524414062, -0.021124839782714844, -0.018497467041015625, -0.015870094299316406, -0.013242721557617188, -0.010615348815917969, -0.00798797607421875, -0.005360603332519531, -0.0027332305908203125, -0.00010585784912109375, 0.002521514892578125, 0.005148887634277344, 0.0077762603759765625, 0.010403633117675781, 0.013031005859375, 0.01565837860107422, 0.018285751342773438, 0.020913124084472656, 0.023540496826171875, 0.026167869567871094, 0.028795242309570312, 0.03142261505126953, 0.03404998779296875, 0.03667736053466797, 0.03930473327636719, 0.041932106018066406, 0.044559478759765625, 0.047186851501464844, 0.04981422424316406, 0.05244159698486328, 0.0550689697265625, 0.05769634246826172, 0.06032371520996094, 0.06295108795166016, 0.06557846069335938, 0.0682058334350586, 0.07083320617675781, 0.07346057891845703, 0.07608795166015625, 0.07871532440185547, 0.08134269714355469, 0.0839700698852539, 0.08659744262695312, 0.08922481536865234, 0.09185218811035156, 0.09447956085205078, 0.09710693359375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 22.0, 29.0, 52.0, 91.0, 102.0, 151.0, 140.0, 130.0, 114.0, 62.0, 40.0, 18.0, 14.0, 12.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.765005588531494, -3.6798713207244873, -3.5947368144989014, -3.5096025466918945, -3.4244680404663086, -3.3393337726593018, -3.254199266433716, -3.169064998626709, -3.083930492401123, -2.998796224594116, -2.9136617183685303, -2.8285274505615234, -2.7433929443359375, -2.6582586765289307, -2.5731241703033447, -2.487989902496338, -2.402855396270752, -2.317721128463745, -2.232586622238159, -2.1474523544311523, -2.0623178482055664, -1.97718346118927, -1.8920490741729736, -1.8069148063659668, -1.72178053855896, -1.6366461515426636, -1.5515117645263672, -1.4663773775100708, -1.3812429904937744, -1.296108603477478, -1.2109742164611816, -1.1258399486541748, -1.0407054424285889, -0.9555710554122925, -0.8704366683959961, -0.7853022813796997, -0.7001678943634033, -0.6150335073471069, -0.5298991799354553, -0.44476479291915894, -0.35963040590286255, -0.27449601888656616, -0.18936164677143097, -0.10422727465629578, -0.01909288763999939, 0.066041499376297, 0.151175856590271, 0.23631024360656738, 0.32144463062286377, 0.40657901763916016, 0.49171340465545654, 0.5768477916717529, 0.6619821786880493, 0.7471165657043457, 0.8322508931159973, 0.9173852801322937, 1.0025196075439453, 1.0876539945602417, 1.172788381576538, 1.2579227685928345, 1.3430571556091309, 1.4281915426254272, 1.5133259296417236, 1.5984601974487305, 1.6835947036743164]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 6.0, 18.0, 22.0, 26.0, 29.0, 48.0, 40.0, 58.0, 59.0, 77.0, 89.0, 87.0, 93.0, 61.0, 56.0, 54.0, 47.0, 30.0, 35.0, 13.0, 12.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.5910773277282715, -2.528998374938965, -2.466919422149658, -2.4048404693603516, -2.342761754989624, -2.2806828022003174, -2.2186038494110107, -2.156524896621704, -2.0944459438323975, -2.032366991043091, -1.9702881574630737, -1.908209204673767, -1.8461302518844604, -1.7840514183044434, -1.7219724655151367, -1.65989351272583, -1.5978147983551025, -1.535735845565796, -1.4736570119857788, -1.4115780591964722, -1.3494991064071655, -1.2874202728271484, -1.2253413200378418, -1.1632623672485352, -1.1011834144592285, -1.0391044616699219, -0.97702556848526, -0.9149466753005981, -0.8528677821159363, -0.7907888889312744, -0.7287099361419678, -0.6666310429573059, -0.604552149772644, -0.5424732565879822, -0.4803943336009979, -0.41831541061401367, -0.3562365174293518, -0.29415759444236755, -0.2320786714553833, -0.16999977827072144, -0.10792085528373718, -0.045841943472623825, 0.016236968338489532, 0.07831588387489319, 0.14039479196071625, 0.2024737000465393, 0.26455262303352356, 0.3266315162181854, 0.3887104392051697, 0.45078936219215393, 0.5128682851791382, 0.5749471783638, 0.6370260715484619, 0.6991050243377686, 0.7611839175224304, 0.8232628107070923, 0.8853417634963989, 0.9474206566810608, 1.0094995498657227, 1.0715785026550293, 1.133657455444336, 1.195736289024353, 1.2578152418136597, 1.3198940753936768, 1.3819730281829834]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 9.0, 9.0, 9.0, 12.0, 20.0, 30.0, 61.0, 87.0, 181.0, 318.0, 602.0, 1233.0, 2656.0, 6090.0, 15882.0, 51437.0, 237489.0, 551123.0, 129598.0, 32460.0, 10976.0, 4368.0, 1972.0, 908.0, 440.0, 228.0, 132.0, 75.0, 47.0, 24.0, 29.0, 14.0, 5.0, 10.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.275390625, -2.21441650390625, -2.1534423828125, -2.09246826171875, -2.031494140625, -1.97052001953125, -1.9095458984375, -1.84857177734375, -1.78759765625, -1.72662353515625, -1.6656494140625, -1.60467529296875, -1.543701171875, -1.48272705078125, -1.4217529296875, -1.36077880859375, -1.2998046875, -1.23883056640625, -1.1778564453125, -1.11688232421875, -1.055908203125, -0.99493408203125, -0.9339599609375, -0.87298583984375, -0.81201171875, -0.75103759765625, -0.6900634765625, -0.62908935546875, -0.568115234375, -0.50714111328125, -0.4461669921875, -0.38519287109375, -0.32421875, -0.26324462890625, -0.2022705078125, -0.14129638671875, -0.080322265625, -0.01934814453125, 0.0416259765625, 0.10260009765625, 0.16357421875, 0.22454833984375, 0.2855224609375, 0.34649658203125, 0.407470703125, 0.46844482421875, 0.5294189453125, 0.59039306640625, 0.6513671875, 0.71234130859375, 0.7733154296875, 0.83428955078125, 0.895263671875, 0.95623779296875, 1.0172119140625, 1.07818603515625, 1.13916015625, 1.20013427734375, 1.2611083984375, 1.32208251953125, 1.383056640625, 1.44403076171875, 1.5050048828125, 1.56597900390625, 1.626953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 7.0, 12.0, 15.0, 25.0, 26.0, 27.0, 45.0, 42.0, 69.0, 87.0, 85.0, 96.0, 98.0, 88.0, 62.0, 57.0, 40.0, 35.0, 20.0, 22.0, 16.0, 12.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-7.1171875, -6.96014404296875, -6.8031005859375, -6.64605712890625, -6.489013671875, -6.33197021484375, -6.1749267578125, -6.01788330078125, -5.86083984375, -5.70379638671875, -5.5467529296875, -5.38970947265625, -5.232666015625, -5.07562255859375, -4.9185791015625, -4.76153564453125, -4.6044921875, -4.44744873046875, -4.2904052734375, -4.13336181640625, -3.976318359375, -3.81927490234375, -3.6622314453125, -3.50518798828125, -3.34814453125, -3.19110107421875, -3.0340576171875, -2.87701416015625, -2.719970703125, -2.56292724609375, -2.4058837890625, -2.24884033203125, -2.091796875, -1.93475341796875, -1.7777099609375, -1.62066650390625, -1.463623046875, -1.30657958984375, -1.1495361328125, -0.99249267578125, -0.83544921875, -0.67840576171875, -0.5213623046875, -0.36431884765625, -0.207275390625, -0.05023193359375, 0.1068115234375, 0.26385498046875, 0.4208984375, 0.57794189453125, 0.7349853515625, 0.89202880859375, 1.049072265625, 1.20611572265625, 1.3631591796875, 1.52020263671875, 1.67724609375, 1.83428955078125, 1.9913330078125, 2.14837646484375, 2.305419921875, 2.46246337890625, 2.6195068359375, 2.77655029296875, 2.93359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 9.0, 13.0, 19.0, 47.0, 63.0, 148.0, 327.0, 977.0, 4648.0, 41653.0, 861376.0, 127971.0, 8825.0, 1566.0, 478.0, 201.0, 91.0, 53.0, 24.0, 14.0, 6.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.874267578125, -3.72900390625, -3.583740234375, -3.4384765625, -3.293212890625, -3.14794921875, -3.002685546875, -2.857421875, -2.712158203125, -2.56689453125, -2.421630859375, -2.2763671875, -2.131103515625, -1.98583984375, -1.840576171875, -1.6953125, -1.550048828125, -1.40478515625, -1.259521484375, -1.1142578125, -0.968994140625, -0.82373046875, -0.678466796875, -0.533203125, -0.387939453125, -0.24267578125, -0.097412109375, 0.0478515625, 0.193115234375, 0.33837890625, 0.483642578125, 0.62890625, 0.774169921875, 0.91943359375, 1.064697265625, 1.2099609375, 1.355224609375, 1.50048828125, 1.645751953125, 1.791015625, 1.936279296875, 2.08154296875, 2.226806640625, 2.3720703125, 2.517333984375, 2.66259765625, 2.807861328125, 2.953125, 3.098388671875, 3.24365234375, 3.388916015625, 3.5341796875, 3.679443359375, 3.82470703125, 3.969970703125, 4.115234375, 4.260498046875, 4.40576171875, 4.551025390625, 4.6962890625, 4.841552734375, 4.98681640625, 5.132080078125, 5.27734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 9.0, 10.0, 15.0, 21.0, 18.0, 24.0, 29.0, 28.0, 31.0, 35.0, 37.0, 35.0, 48.0, 61.0, 41.0, 58.0, 49.0, 54.0, 37.0, 56.0, 54.0, 45.0, 37.0, 25.0, 33.0, 12.0, 14.0, 15.0, 15.0, 8.0, 5.0, 13.0, 5.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.03350830078125, -3.8951416015625, -3.75677490234375, -3.618408203125, -3.48004150390625, -3.3416748046875, -3.20330810546875, -3.06494140625, -2.92657470703125, -2.7882080078125, -2.64984130859375, -2.511474609375, -2.37310791015625, -2.2347412109375, -2.09637451171875, -1.9580078125, -1.81964111328125, -1.6812744140625, -1.54290771484375, -1.404541015625, -1.26617431640625, -1.1278076171875, -0.98944091796875, -0.85107421875, -0.71270751953125, -0.5743408203125, -0.43597412109375, -0.297607421875, -0.15924072265625, -0.0208740234375, 0.11749267578125, 0.255859375, 0.39422607421875, 0.5325927734375, 0.67095947265625, 0.809326171875, 0.94769287109375, 1.0860595703125, 1.22442626953125, 1.36279296875, 1.50115966796875, 1.6395263671875, 1.77789306640625, 1.916259765625, 2.05462646484375, 2.1929931640625, 2.33135986328125, 2.4697265625, 2.60809326171875, 2.7464599609375, 2.88482666015625, 3.023193359375, 3.16156005859375, 3.2999267578125, 3.43829345703125, 3.57666015625, 3.71502685546875, 3.8533935546875, 3.99176025390625, 4.130126953125, 4.26849365234375, 4.4068603515625, 4.54522705078125, 4.68359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 8.0, 16.0, 17.0, 16.0, 46.0, 78.0, 117.0, 226.0, 613.0, 1743.0, 6207.0, 32146.0, 229399.0, 646604.0, 108618.0, 16959.0, 3700.0, 1094.0, 452.0, 196.0, 98.0, 55.0, 38.0, 21.0, 18.0, 15.0, 8.0, 6.0, 10.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6552658081054688, -0.6293792724609375, -0.6034927368164062, -0.577606201171875, -0.5517196655273438, -0.5258331298828125, -0.49994659423828125, -0.47406005859375, -0.44817352294921875, -0.4222869873046875, -0.39640045166015625, -0.370513916015625, -0.34462738037109375, -0.3187408447265625, -0.29285430908203125, -0.2669677734375, -0.24108123779296875, -0.2151947021484375, -0.18930816650390625, -0.163421630859375, -0.13753509521484375, -0.1116485595703125, -0.08576202392578125, -0.05987548828125, -0.03398895263671875, -0.0081024169921875, 0.01778411865234375, 0.043670654296875, 0.06955718994140625, 0.0954437255859375, 0.12133026123046875, 0.147216796875, 0.17310333251953125, 0.1989898681640625, 0.22487640380859375, 0.250762939453125, 0.27664947509765625, 0.3025360107421875, 0.32842254638671875, 0.35430908203125, 0.38019561767578125, 0.4060821533203125, 0.43196868896484375, 0.457855224609375, 0.48374176025390625, 0.5096282958984375, 0.5355148315429688, 0.5614013671875, 0.5872879028320312, 0.6131744384765625, 0.6390609741210938, 0.664947509765625, 0.6908340454101562, 0.7167205810546875, 0.7426071166992188, 0.76849365234375, 0.7943801879882812, 0.8202667236328125, 0.8461532592773438, 0.872039794921875, 0.8979263305664062, 0.9238128662109375, 0.9496994018554688, 0.9755859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 3.0, 5.0, 6.0, 6.0, 7.0, 16.0, 15.0, 23.0, 27.0, 49.0, 42.0, 44.0, 73.0, 100.0, 125.0, 104.0, 87.0, 58.0, 48.0, 31.0, 23.0, 16.0, 21.0, 8.0, 17.0, 7.0, 6.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011140108108520508, -0.00010807439684867859, -0.0001047477126121521, -0.00010142102837562561, -9.809434413909912e-05, -9.476765990257263e-05, -9.144097566604614e-05, -8.811429142951965e-05, -8.478760719299316e-05, -8.146092295646667e-05, -7.813423871994019e-05, -7.48075544834137e-05, -7.148087024688721e-05, -6.815418601036072e-05, -6.482750177383423e-05, -6.150081753730774e-05, -5.817413330078125e-05, -5.484744906425476e-05, -5.152076482772827e-05, -4.819408059120178e-05, -4.486739635467529e-05, -4.1540712118148804e-05, -3.8214027881622314e-05, -3.4887343645095825e-05, -3.1560659408569336e-05, -2.8233975172042847e-05, -2.4907290935516357e-05, -2.1580606698989868e-05, -1.825392246246338e-05, -1.492723822593689e-05, -1.16005539894104e-05, -8.273869752883911e-06, -4.947185516357422e-06, -1.6205012798309326e-06, 1.7061829566955566e-06, 5.032867193222046e-06, 8.359551429748535e-06, 1.1686235666275024e-05, 1.5012919902801514e-05, 1.8339604139328003e-05, 2.1666288375854492e-05, 2.499297261238098e-05, 2.831965684890747e-05, 3.164634108543396e-05, 3.497302532196045e-05, 3.829970955848694e-05, 4.162639379501343e-05, 4.495307803153992e-05, 4.8279762268066406e-05, 5.1606446504592896e-05, 5.4933130741119385e-05, 5.8259814977645874e-05, 6.158649921417236e-05, 6.491318345069885e-05, 6.823986768722534e-05, 7.156655192375183e-05, 7.489323616027832e-05, 7.821992039680481e-05, 8.15466046333313e-05, 8.487328886985779e-05, 8.819997310638428e-05, 9.152665734291077e-05, 9.485334157943726e-05, 9.818002581596375e-05, 0.00010150671005249023]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 12.0, 31.0, 48.0, 90.0, 268.0, 882.0, 8073.0, 216314.0, 790728.0, 29293.0, 2106.0, 416.0, 132.0, 63.0, 36.0, 24.0, 14.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8154296875, -1.7653045654296875, -1.715179443359375, -1.6650543212890625, -1.61492919921875, -1.5648040771484375, -1.514678955078125, -1.4645538330078125, -1.4144287109375, -1.3643035888671875, -1.314178466796875, -1.2640533447265625, -1.21392822265625, -1.1638031005859375, -1.113677978515625, -1.0635528564453125, -1.013427734375, -0.9633026123046875, -0.913177490234375, -0.8630523681640625, -0.81292724609375, -0.7628021240234375, -0.712677001953125, -0.6625518798828125, -0.6124267578125, -0.5623016357421875, -0.512176513671875, -0.4620513916015625, -0.41192626953125, -0.3618011474609375, -0.311676025390625, -0.2615509033203125, -0.21142578125, -0.1613006591796875, -0.111175537109375, -0.0610504150390625, -0.01092529296875, 0.0391998291015625, 0.089324951171875, 0.1394500732421875, 0.1895751953125, 0.2397003173828125, 0.289825439453125, 0.3399505615234375, 0.39007568359375, 0.4402008056640625, 0.490325927734375, 0.5404510498046875, 0.590576171875, 0.6407012939453125, 0.690826416015625, 0.7409515380859375, 0.79107666015625, 0.8412017822265625, 0.891326904296875, 0.9414520263671875, 0.9915771484375, 1.0417022705078125, 1.091827392578125, 1.1419525146484375, 1.19207763671875, 1.2422027587890625, 1.292327880859375, 1.3424530029296875, 1.392578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 10.0, 9.0, 9.0, 8.0, 17.0, 15.0, 18.0, 35.0, 36.0, 48.0, 52.0, 61.0, 74.0, 74.0, 100.0, 59.0, 72.0, 53.0, 42.0, 37.0, 31.0, 24.0, 23.0, 16.0, 14.0, 10.0, 7.0, 10.0, 5.0, 7.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.32080078125, -0.3105354309082031, -0.30027008056640625, -0.2900047302246094, -0.2797393798828125, -0.2694740295410156, -0.25920867919921875, -0.24894332885742188, -0.238677978515625, -0.22841262817382812, -0.21814727783203125, -0.20788192749023438, -0.1976165771484375, -0.18735122680664062, -0.17708587646484375, -0.16682052612304688, -0.15655517578125, -0.14628982543945312, -0.13602447509765625, -0.12575912475585938, -0.1154937744140625, -0.10522842407226562, -0.09496307373046875, -0.08469772338867188, -0.074432373046875, -0.06416702270507812, -0.05390167236328125, -0.043636322021484375, -0.0333709716796875, -0.023105621337890625, -0.01284027099609375, -0.002574920654296875, 0.0076904296875, 0.017955780029296875, 0.02822113037109375, 0.038486480712890625, 0.0487518310546875, 0.059017181396484375, 0.06928253173828125, 0.07954788208007812, 0.089813232421875, 0.10007858276367188, 0.11034393310546875, 0.12060928344726562, 0.1308746337890625, 0.14113998413085938, 0.15140533447265625, 0.16167068481445312, 0.17193603515625, 0.18220138549804688, 0.19246673583984375, 0.20273208618164062, 0.2129974365234375, 0.22326278686523438, 0.23352813720703125, 0.24379348754882812, 0.254058837890625, 0.2643241882324219, 0.27458953857421875, 0.2848548889160156, 0.2951202392578125, 0.3053855895996094, 0.31565093994140625, 0.3259162902832031, 0.336181640625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 96.0, 382.0, 427.0, 85.0, 13.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.743201732635498, -6.973764896392822, -6.204327583312988, -5.4348907470703125, -4.665453910827637, -3.896017074584961, -3.126579761505127, -2.357142925262451, -1.5877060890197754, -0.8182691335678101, -0.04883217811584473, 0.7206048965454102, 1.490041732788086, 2.2594785690307617, 3.0289158821105957, 3.7983527183532715, 4.567789554595947, 5.337226390838623, 6.106663703918457, 6.876100540161133, 7.645537376403809, 8.414974212646484, 9.184412002563477, 9.953847885131836, 10.723285675048828, 11.492722511291504, 12.26215934753418, 13.031597137451172, 13.801033020019531, 14.570470809936523, 15.3399076461792, 16.109344482421875, 16.878780364990234, 17.648218154907227, 18.417654037475586, 19.187091827392578, 19.956527709960938, 20.72596549987793, 21.495403289794922, 22.26483917236328, 23.03427505493164, 23.803712844848633, 24.573148727416992, 25.342586517333984, 26.112022399902344, 26.881460189819336, 27.650897979736328, 28.420333862304688, 29.18977165222168, 29.959209442138672, 30.72864532470703, 31.498083114624023, 32.267520904541016, 33.036956787109375, 33.806392669677734, 34.575828552246094, 35.34526824951172, 36.11470413208008, 36.8841438293457, 37.65357971191406, 38.42301559448242, 39.19245147705078, 39.961891174316406, 40.731327056884766, 41.500762939453125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 11.0, 18.0, 19.0, 20.0, 23.0, 23.0, 26.0, 38.0, 47.0, 51.0, 55.0, 57.0, 47.0, 54.0, 63.0, 54.0, 50.0, 44.0, 46.0, 35.0, 46.0, 27.0, 33.0, 18.0, 19.0, 12.0, 14.0, 5.0, 10.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.816752433776855, -9.54080581665039, -9.26485824584961, -8.988911628723145, -8.712964057922363, -8.437017440795898, -8.161069869995117, -7.885123252868652, -7.609175682067871, -7.333228588104248, -7.057281494140625, -6.781334400177002, -6.505387306213379, -6.229440212249756, -5.953493118286133, -5.677546501159668, -5.401599407196045, -5.125652313232422, -4.849705219268799, -4.573758125305176, -4.297811031341553, -4.02186393737793, -3.7459170818328857, -3.4699699878692627, -3.1940228939056396, -2.9180757999420166, -2.6421287059783936, -2.3661818504333496, -2.0902347564697266, -1.814287543296814, -1.5383405685424805, -1.2623934745788574, -0.9864459037780762, -0.7104988098144531, -0.43455177545547485, -0.15860474109649658, 0.11734235286712646, 0.3932894468307495, 0.669236421585083, 0.945183515548706, 1.221130609512329, 1.4970777034759521, 1.7730247974395752, 2.048971652984619, 2.324918746948242, 2.6008658409118652, 2.8768129348754883, 3.1527600288391113, 3.4287071228027344, 3.7046542167663574, 3.9806013107299805, 4.2565484046936035, 4.532495498657227, 4.80844259262085, 5.084389686584473, 5.3603363037109375, 5.636283874511719, 5.912230968475342, 6.188178062438965, 6.464125156402588, 6.740072250366211, 7.016019344329834, 7.291966438293457, 7.567913055419922, 7.843860149383545]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 9.0, 10.0, 8.0, 14.0, 16.0, 26.0, 32.0, 44.0, 50.0, 73.0, 123.0, 201.0, 389.0, 1069.0, 3210.0, 16355.0, 343926.0, 3731639.0, 85210.0, 8592.0, 1934.0, 635.0, 242.0, 138.0, 99.0, 54.0, 37.0, 28.0, 20.0, 23.0, 14.0, 11.0, 5.0, 10.0, 4.0, 7.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.15234375, -4.00030517578125, -3.8482666015625, -3.69622802734375, -3.544189453125, -3.39215087890625, -3.2401123046875, -3.08807373046875, -2.93603515625, -2.78399658203125, -2.6319580078125, -2.47991943359375, -2.327880859375, -2.17584228515625, -2.0238037109375, -1.87176513671875, -1.7197265625, -1.56768798828125, -1.4156494140625, -1.26361083984375, -1.111572265625, -0.95953369140625, -0.8074951171875, -0.65545654296875, -0.50341796875, -0.35137939453125, -0.1993408203125, -0.04730224609375, 0.104736328125, 0.25677490234375, 0.4088134765625, 0.56085205078125, 0.712890625, 0.86492919921875, 1.0169677734375, 1.16900634765625, 1.321044921875, 1.47308349609375, 1.6251220703125, 1.77716064453125, 1.92919921875, 2.08123779296875, 2.2332763671875, 2.38531494140625, 2.537353515625, 2.68939208984375, 2.8414306640625, 2.99346923828125, 3.1455078125, 3.29754638671875, 3.4495849609375, 3.60162353515625, 3.753662109375, 3.90570068359375, 4.0577392578125, 4.20977783203125, 4.36181640625, 4.51385498046875, 4.6658935546875, 4.81793212890625, 4.969970703125, 5.12200927734375, 5.2740478515625, 5.42608642578125, 5.578125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 15.0, 24.0, 22.0, 31.0, 45.0, 72.0, 83.0, 86.0, 104.0, 88.0, 97.0, 70.0, 73.0, 69.0, 38.0, 23.0, 10.0, 12.0, 13.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.7777252197265625, -2.709747314453125, -2.6417694091796875, -2.57379150390625, -2.5058135986328125, -2.437835693359375, -2.3698577880859375, -2.3018798828125, -2.2339019775390625, -2.165924072265625, -2.0979461669921875, -2.02996826171875, -1.9619903564453125, -1.894012451171875, -1.8260345458984375, -1.758056640625, -1.6900787353515625, -1.622100830078125, -1.5541229248046875, -1.48614501953125, -1.4181671142578125, -1.350189208984375, -1.2822113037109375, -1.2142333984375, -1.1462554931640625, -1.078277587890625, -1.0102996826171875, -0.94232177734375, -0.8743438720703125, -0.806365966796875, -0.7383880615234375, -0.67041015625, -0.6024322509765625, -0.534454345703125, -0.4664764404296875, -0.39849853515625, -0.3305206298828125, -0.262542724609375, -0.1945648193359375, -0.1265869140625, -0.0586090087890625, 0.009368896484375, 0.0773468017578125, 0.14532470703125, 0.2133026123046875, 0.281280517578125, 0.3492584228515625, 0.417236328125, 0.4852142333984375, 0.553192138671875, 0.6211700439453125, 0.68914794921875, 0.7571258544921875, 0.825103759765625, 0.8930816650390625, 0.9610595703125, 1.0290374755859375, 1.097015380859375, 1.1649932861328125, 1.23297119140625, 1.3009490966796875, 1.368927001953125, 1.4369049072265625, 1.5048828125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 10.0, 11.0, 5.0, 15.0, 11.0, 25.0, 29.0, 38.0, 72.0, 125.0, 238.0, 534.0, 1986.0, 13663.0, 284727.0, 3771363.0, 111426.0, 7687.0, 1334.0, 434.0, 202.0, 122.0, 85.0, 39.0, 25.0, 23.0, 15.0, 12.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0], "bins": [-6.88671875, -6.72027587890625, -6.5538330078125, -6.38739013671875, -6.220947265625, -6.05450439453125, -5.8880615234375, -5.72161865234375, -5.55517578125, -5.38873291015625, -5.2222900390625, -5.05584716796875, -4.889404296875, -4.72296142578125, -4.5565185546875, -4.39007568359375, -4.2236328125, -4.05718994140625, -3.8907470703125, -3.72430419921875, -3.557861328125, -3.39141845703125, -3.2249755859375, -3.05853271484375, -2.89208984375, -2.72564697265625, -2.5592041015625, -2.39276123046875, -2.226318359375, -2.05987548828125, -1.8934326171875, -1.72698974609375, -1.560546875, -1.39410400390625, -1.2276611328125, -1.06121826171875, -0.894775390625, -0.72833251953125, -0.5618896484375, -0.39544677734375, -0.22900390625, -0.06256103515625, 0.1038818359375, 0.27032470703125, 0.436767578125, 0.60321044921875, 0.7696533203125, 0.93609619140625, 1.1025390625, 1.26898193359375, 1.4354248046875, 1.60186767578125, 1.768310546875, 1.93475341796875, 2.1011962890625, 2.26763916015625, 2.43408203125, 2.60052490234375, 2.7669677734375, 2.93341064453125, 3.099853515625, 3.26629638671875, 3.4327392578125, 3.59918212890625, 3.765625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 7.0, 13.0, 17.0, 17.0, 21.0, 50.0, 58.0, 67.0, 104.0, 161.0, 255.0, 338.0, 498.0, 664.0, 548.0, 409.0, 278.0, 183.0, 113.0, 79.0, 49.0, 41.0, 20.0, 20.0, 15.0, 10.0, 10.0, 3.0, 6.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6716232299804688, -0.6454925537109375, -0.6193618774414062, -0.593231201171875, -0.5671005249023438, -0.5409698486328125, -0.5148391723632812, -0.48870849609375, -0.46257781982421875, -0.4364471435546875, -0.41031646728515625, -0.384185791015625, -0.35805511474609375, -0.3319244384765625, -0.30579376220703125, -0.2796630859375, -0.25353240966796875, -0.2274017333984375, -0.20127105712890625, -0.175140380859375, -0.14900970458984375, -0.1228790283203125, -0.09674835205078125, -0.07061767578125, -0.04448699951171875, -0.0183563232421875, 0.00777435302734375, 0.033905029296875, 0.06003570556640625, 0.0861663818359375, 0.11229705810546875, 0.138427734375, 0.16455841064453125, 0.1906890869140625, 0.21681976318359375, 0.242950439453125, 0.26908111572265625, 0.2952117919921875, 0.32134246826171875, 0.34747314453125, 0.37360382080078125, 0.3997344970703125, 0.42586517333984375, 0.451995849609375, 0.47812652587890625, 0.5042572021484375, 0.5303878784179688, 0.5565185546875, 0.5826492309570312, 0.6087799072265625, 0.6349105834960938, 0.661041259765625, 0.6871719360351562, 0.7133026123046875, 0.7394332885742188, 0.76556396484375, 0.7916946411132812, 0.8178253173828125, 0.8439559936523438, 0.870086669921875, 0.8962173461914062, 0.9223480224609375, 0.9484786987304688, 0.974609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 9.0, 15.0, 15.0, 44.0, 44.0, 61.0, 86.0, 92.0, 112.0, 114.0, 120.0, 88.0, 69.0, 38.0, 40.0, 25.0, 17.0, 9.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4264166355133057, -2.307070732116699, -2.1877248287200928, -2.0683789253234863, -1.949033260345459, -1.8296873569488525, -1.710341453552246, -1.5909955501556396, -1.4716497659683228, -1.3523038625717163, -1.2329580783843994, -1.113612174987793, -0.9942663311958313, -0.8749204874038696, -0.7555745840072632, -0.6362287402153015, -0.5168828964233398, -0.3975370526313782, -0.2781911790370941, -0.15884530544281006, -0.03949946165084839, 0.07984638214111328, 0.19919228553771973, 0.3185381293296814, 0.43788397312164307, 0.5572298169136047, 0.6765756607055664, 0.7959215641021729, 0.9152674078941345, 1.0346132516860962, 1.1539591550827026, 1.2733049392700195, 1.3926506042480469, 1.5119965076446533, 1.6313422918319702, 1.7506881952285767, 1.8700339794158936, 1.9893798828125, 2.1087257862091064, 2.228071689605713, 2.3474173545837402, 2.4667632579803467, 2.586109161376953, 2.7054548263549805, 2.824800729751587, 2.9441466331481934, 3.0634925365448, 3.1828384399414062, 3.3021843433380127, 3.421530246734619, 3.5408761501312256, 3.660222053527832, 3.7795677185058594, 3.898913621902466, 4.018259525299072, 4.1376051902771, 4.256951332092285, 4.3762969970703125, 4.495643138885498, 4.614988803863525, 4.734334945678711, 4.853680610656738, 4.973026275634766, 5.092372417449951, 5.2117180824279785]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 10.0, 12.0, 19.0, 13.0, 17.0, 23.0, 24.0, 23.0, 25.0, 30.0, 28.0, 39.0, 42.0, 50.0, 54.0, 41.0, 42.0, 44.0, 46.0, 47.0, 48.0, 38.0, 37.0, 32.0, 26.0, 30.0, 18.0, 23.0, 20.0, 16.0, 15.0, 10.0, 15.0, 6.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.160945177078247, -2.1008870601654053, -2.0408289432525635, -1.9807708263397217, -1.9207125902175903, -1.8606544733047485, -1.8005963563919067, -1.740538239479065, -1.6804800033569336, -1.6204218864440918, -1.56036376953125, -1.5003056526184082, -1.4402474164962769, -1.380189299583435, -1.3201311826705933, -1.2600730657577515, -1.2000149488449097, -1.1399568319320679, -1.079898715019226, -1.0198404788970947, -0.9597823619842529, -0.8997242450714111, -0.8396661281585693, -0.7796080112457275, -0.719549834728241, -0.6594917178153992, -0.5994335412979126, -0.5393754243850708, -0.4793172776699066, -0.41925913095474243, -0.35920101404190063, -0.29914286732673645, -0.23908460140228271, -0.17902645468711853, -0.11896832287311554, -0.05891019105911255, 0.0011479556560516357, 0.06120610237121582, 0.12126421928405762, 0.1813223659992218, 0.241380512714386, 0.30143865942955017, 0.36149680614471436, 0.42155492305755615, 0.48161306977272034, 0.5416712164878845, 0.6017293334007263, 0.6617875099182129, 0.7218456268310547, 0.7819037437438965, 0.8419619202613831, 0.9020200371742249, 0.9620782136917114, 1.0221363306045532, 1.082194447517395, 1.1422525644302368, 1.2023108005523682, 1.26236891746521, 1.3224270343780518, 1.3824851512908936, 1.442543387413025, 1.5026015043258667, 1.5626596212387085, 1.6227177381515503, 1.682775855064392]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 11.0, 5.0, 21.0, 14.0, 20.0, 37.0, 43.0, 77.0, 119.0, 187.0, 403.0, 823.0, 2132.0, 6952.0, 32890.0, 662153.0, 314877.0, 19604.0, 5073.0, 1648.0, 655.0, 312.0, 166.0, 104.0, 59.0, 41.0, 30.0, 24.0, 23.0, 13.0, 14.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.5970535278320312, -0.5720367431640625, -0.5470199584960938, -0.522003173828125, -0.49698638916015625, -0.4719696044921875, -0.44695281982421875, -0.42193603515625, -0.39691925048828125, -0.3719024658203125, -0.34688568115234375, -0.321868896484375, -0.29685211181640625, -0.2718353271484375, -0.24681854248046875, -0.2218017578125, -0.19678497314453125, -0.1717681884765625, -0.14675140380859375, -0.121734619140625, -0.09671783447265625, -0.0717010498046875, -0.04668426513671875, -0.02166748046875, 0.00334930419921875, 0.0283660888671875, 0.05338287353515625, 0.078399658203125, 0.10341644287109375, 0.1284332275390625, 0.15345001220703125, 0.178466796875, 0.20348358154296875, 0.2285003662109375, 0.25351715087890625, 0.278533935546875, 0.30355072021484375, 0.3285675048828125, 0.35358428955078125, 0.37860107421875, 0.40361785888671875, 0.4286346435546875, 0.45365142822265625, 0.478668212890625, 0.5036849975585938, 0.5287017822265625, 0.5537185668945312, 0.5787353515625, 0.6037521362304688, 0.6287689208984375, 0.6537857055664062, 0.678802490234375, 0.7038192749023438, 0.7288360595703125, 0.7538528442382812, 0.77886962890625, 0.8038864135742188, 0.8289031982421875, 0.8539199829101562, 0.878936767578125, 0.9039535522460938, 0.9289703369140625, 0.9539871215820312, 0.97900390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 16.0, 21.0, 20.0, 26.0, 21.0, 26.0, 39.0, 37.0, 48.0, 51.0, 52.0, 61.0, 59.0, 51.0, 48.0, 53.0, 58.0, 42.0, 51.0, 32.0, 34.0, 31.0, 27.0, 17.0, 10.0, 13.0, 12.0, 4.0, 9.0, 9.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.013671875, -1.9622039794921875, -1.910736083984375, -1.8592681884765625, -1.80780029296875, -1.7563323974609375, -1.704864501953125, -1.6533966064453125, -1.6019287109375, -1.5504608154296875, -1.498992919921875, -1.4475250244140625, -1.39605712890625, -1.3445892333984375, -1.293121337890625, -1.2416534423828125, -1.190185546875, -1.1387176513671875, -1.087249755859375, -1.0357818603515625, -0.98431396484375, -0.9328460693359375, -0.881378173828125, -0.8299102783203125, -0.7784423828125, -0.7269744873046875, -0.675506591796875, -0.6240386962890625, -0.57257080078125, -0.5211029052734375, -0.469635009765625, -0.4181671142578125, -0.36669921875, -0.3152313232421875, -0.263763427734375, -0.2122955322265625, -0.16082763671875, -0.1093597412109375, -0.057891845703125, -0.0064239501953125, 0.0450439453125, 0.0965118408203125, 0.147979736328125, 0.1994476318359375, 0.25091552734375, 0.3023834228515625, 0.353851318359375, 0.4053192138671875, 0.456787109375, 0.5082550048828125, 0.559722900390625, 0.6111907958984375, 0.66265869140625, 0.7141265869140625, 0.765594482421875, 0.8170623779296875, 0.8685302734375, 0.9199981689453125, 0.971466064453125, 1.0229339599609375, 1.07440185546875, 1.1258697509765625, 1.177337646484375, 1.2288055419921875, 1.2802734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 9.0, 13.0, 7.0, 15.0, 21.0, 39.0, 49.0, 60.0, 116.0, 195.0, 319.0, 557.0, 1152.0, 2765.0, 7856.0, 36410.0, 401139.0, 532638.0, 49854.0, 9455.0, 3058.0, 1311.0, 625.0, 305.0, 175.0, 109.0, 85.0, 51.0, 40.0, 38.0, 22.0, 14.0, 13.0, 8.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57177734375, -0.5544891357421875, -0.537200927734375, -0.5199127197265625, -0.50262451171875, -0.4853363037109375, -0.468048095703125, -0.4507598876953125, -0.4334716796875, -0.4161834716796875, -0.398895263671875, -0.3816070556640625, -0.36431884765625, -0.3470306396484375, -0.329742431640625, -0.3124542236328125, -0.295166015625, -0.2778778076171875, -0.260589599609375, -0.2433013916015625, -0.22601318359375, -0.2087249755859375, -0.191436767578125, -0.1741485595703125, -0.1568603515625, -0.1395721435546875, -0.122283935546875, -0.1049957275390625, -0.08770751953125, -0.0704193115234375, -0.053131103515625, -0.0358428955078125, -0.0185546875, -0.0012664794921875, 0.016021728515625, 0.0333099365234375, 0.05059814453125, 0.0678863525390625, 0.085174560546875, 0.1024627685546875, 0.1197509765625, 0.1370391845703125, 0.154327392578125, 0.1716156005859375, 0.18890380859375, 0.2061920166015625, 0.223480224609375, 0.2407684326171875, 0.258056640625, 0.2753448486328125, 0.292633056640625, 0.3099212646484375, 0.32720947265625, 0.3444976806640625, 0.361785888671875, 0.3790740966796875, 0.3963623046875, 0.4136505126953125, 0.430938720703125, 0.4482269287109375, 0.46551513671875, 0.4828033447265625, 0.500091552734375, 0.5173797607421875, 0.53466796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 11.0, 16.0, 15.0, 10.0, 19.0, 24.0, 29.0, 30.0, 41.0, 31.0, 40.0, 60.0, 42.0, 41.0, 52.0, 46.0, 60.0, 49.0, 52.0, 35.0, 40.0, 31.0, 33.0, 25.0, 31.0, 24.0, 17.0, 15.0, 10.0, 13.0, 6.0, 9.0, 4.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.236328125, -3.117523193359375, -2.99871826171875, -2.879913330078125, -2.7611083984375, -2.642303466796875, -2.52349853515625, -2.404693603515625, -2.285888671875, -2.167083740234375, -2.04827880859375, -1.929473876953125, -1.8106689453125, -1.691864013671875, -1.57305908203125, -1.454254150390625, -1.33544921875, -1.216644287109375, -1.09783935546875, -0.979034423828125, -0.8602294921875, -0.741424560546875, -0.62261962890625, -0.503814697265625, -0.385009765625, -0.266204833984375, -0.14739990234375, -0.028594970703125, 0.0902099609375, 0.209014892578125, 0.32781982421875, 0.446624755859375, 0.5654296875, 0.684234619140625, 0.80303955078125, 0.921844482421875, 1.0406494140625, 1.159454345703125, 1.27825927734375, 1.397064208984375, 1.515869140625, 1.634674072265625, 1.75347900390625, 1.872283935546875, 1.9910888671875, 2.109893798828125, 2.22869873046875, 2.347503662109375, 2.46630859375, 2.585113525390625, 2.70391845703125, 2.822723388671875, 2.9415283203125, 3.060333251953125, 3.17913818359375, 3.297943115234375, 3.416748046875, 3.535552978515625, 3.65435791015625, 3.773162841796875, 3.8919677734375, 4.010772705078125, 4.12957763671875, 4.248382568359375, 4.3671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 14.0, 12.0, 13.0, 25.0, 39.0, 65.0, 78.0, 116.0, 165.0, 256.0, 370.0, 723.0, 1207.0, 2481.0, 5119.0, 12198.0, 36889.0, 221136.0, 635224.0, 93294.0, 22706.0, 8427.0, 3706.0, 1811.0, 974.0, 522.0, 320.0, 202.0, 127.0, 96.0, 52.0, 46.0, 24.0, 21.0, 28.0, 18.0, 7.0, 13.0, 9.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1861572265625, -0.18039321899414062, -0.17462921142578125, -0.16886520385742188, -0.1631011962890625, -0.15733718872070312, -0.15157318115234375, -0.14580917358398438, -0.140045166015625, -0.13428115844726562, -0.12851715087890625, -0.12275314331054688, -0.1169891357421875, -0.11122512817382812, -0.10546112060546875, -0.09969711303710938, -0.09393310546875, -0.08816909790039062, -0.08240509033203125, -0.07664108276367188, -0.0708770751953125, -0.06511306762695312, -0.05934906005859375, -0.053585052490234375, -0.047821044921875, -0.042057037353515625, -0.03629302978515625, -0.030529022216796875, -0.0247650146484375, -0.019001007080078125, -0.01323699951171875, -0.007472991943359375, -0.001708984375, 0.004055023193359375, 0.00981903076171875, 0.015583038330078125, 0.0213470458984375, 0.027111053466796875, 0.03287506103515625, 0.038639068603515625, 0.044403076171875, 0.050167083740234375, 0.05593109130859375, 0.061695098876953125, 0.0674591064453125, 0.07322311401367188, 0.07898712158203125, 0.08475112915039062, 0.09051513671875, 0.09627914428710938, 0.10204315185546875, 0.10780715942382812, 0.1135711669921875, 0.11933517456054688, 0.12509918212890625, 0.13086318969726562, 0.136627197265625, 0.14239120483398438, 0.14815521240234375, 0.15391921997070312, 0.1596832275390625, 0.16544723510742188, 0.17121124267578125, 0.17697525024414062, 0.1827392578125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 9.0, 10.0, 13.0, 20.0, 30.0, 42.0, 74.0, 96.0, 120.0, 111.0, 101.0, 101.0, 70.0, 64.0, 39.0, 27.0, 17.0, 5.0, 9.0, 9.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00010865926742553711, -0.00010544620454311371, -0.00010223314166069031, -9.90200787782669e-05, -9.58070158958435e-05, -9.25939530134201e-05, -8.93808901309967e-05, -8.61678272485733e-05, -8.29547643661499e-05, -7.97417014837265e-05, -7.65286386013031e-05, -7.33155757188797e-05, -7.01025128364563e-05, -6.68894499540329e-05, -6.36763870716095e-05, -6.0463324189186096e-05, -5.7250261306762695e-05, -5.4037198424339294e-05, -5.0824135541915894e-05, -4.761107265949249e-05, -4.439800977706909e-05, -4.118494689464569e-05, -3.797188401222229e-05, -3.475882112979889e-05, -3.154575824737549e-05, -2.8332695364952087e-05, -2.5119632482528687e-05, -2.1906569600105286e-05, -1.8693506717681885e-05, -1.5480443835258484e-05, -1.2267380952835083e-05, -9.054318070411682e-06, -5.841255187988281e-06, -2.6281923055648804e-06, 5.848705768585205e-07, 3.7979334592819214e-06, 7.010996341705322e-06, 1.0224059224128723e-05, 1.3437122106552124e-05, 1.6650184988975525e-05, 1.9863247871398926e-05, 2.3076310753822327e-05, 2.6289373636245728e-05, 2.950243651866913e-05, 3.271549940109253e-05, 3.592856228351593e-05, 3.914162516593933e-05, 4.235468804836273e-05, 4.556775093078613e-05, 4.8780813813209534e-05, 5.1993876695632935e-05, 5.5206939578056335e-05, 5.8420002460479736e-05, 6.163306534290314e-05, 6.484612822532654e-05, 6.805919110774994e-05, 7.127225399017334e-05, 7.448531687259674e-05, 7.769837975502014e-05, 8.091144263744354e-05, 8.412450551986694e-05, 8.733756840229034e-05, 9.055063128471375e-05, 9.376369416713715e-05, 9.697675704956055e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 8.0, 14.0, 13.0, 21.0, 45.0, 62.0, 91.0, 142.0, 220.0, 281.0, 537.0, 802.0, 1250.0, 1846.0, 2833.0, 4395.0, 7096.0, 12276.0, 21965.0, 46037.0, 120408.0, 364387.0, 288518.0, 90879.0, 37849.0, 18761.0, 10444.0, 6402.0, 3945.0, 2512.0, 1620.0, 975.0, 677.0, 439.0, 280.0, 198.0, 126.0, 63.0, 31.0, 29.0, 28.0, 25.0, 8.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.10162353515625, -0.09862327575683594, -0.09562301635742188, -0.09262275695800781, -0.08962249755859375, -0.08662223815917969, -0.08362197875976562, -0.08062171936035156, -0.0776214599609375, -0.07462120056152344, -0.07162094116210938, -0.06862068176269531, -0.06562042236328125, -0.06262016296386719, -0.059619903564453125, -0.05661964416503906, -0.053619384765625, -0.05061912536621094, -0.047618865966796875, -0.04461860656738281, -0.04161834716796875, -0.03861808776855469, -0.035617828369140625, -0.03261756896972656, -0.0296173095703125, -0.026617050170898438, -0.023616790771484375, -0.020616531372070312, -0.01761627197265625, -0.014616012573242188, -0.011615753173828125, -0.008615493774414062, -0.005615234375, -0.0026149749755859375, 0.000385284423828125, 0.0033855438232421875, 0.00638580322265625, 0.009386062622070312, 0.012386322021484375, 0.015386581420898438, 0.0183868408203125, 0.021387100219726562, 0.024387359619140625, 0.027387619018554688, 0.03038787841796875, 0.03338813781738281, 0.036388397216796875, 0.03938865661621094, 0.042388916015625, 0.04538917541503906, 0.048389434814453125, 0.05138969421386719, 0.05438995361328125, 0.05739021301269531, 0.060390472412109375, 0.06339073181152344, 0.0663909912109375, 0.06939125061035156, 0.07239151000976562, 0.07539176940917969, 0.07839202880859375, 0.08139228820800781, 0.08439254760742188, 0.08739280700683594, 0.09039306640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 1.0, 6.0, 5.0, 8.0, 8.0, 6.0, 13.0, 17.0, 11.0, 14.0, 22.0, 34.0, 29.0, 49.0, 81.0, 112.0, 117.0, 117.0, 80.0, 70.0, 45.0, 25.0, 17.0, 25.0, 8.0, 7.0, 10.0, 4.0, 8.0, 9.0, 8.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.039398193359375, -0.038146018981933594, -0.03689384460449219, -0.03564167022705078, -0.034389495849609375, -0.03313732147216797, -0.03188514709472656, -0.030632972717285156, -0.02938079833984375, -0.028128623962402344, -0.026876449584960938, -0.02562427520751953, -0.024372100830078125, -0.02311992645263672, -0.021867752075195312, -0.020615577697753906, -0.0193634033203125, -0.018111228942871094, -0.016859054565429688, -0.015606880187988281, -0.014354705810546875, -0.013102531433105469, -0.011850357055664062, -0.010598182678222656, -0.00934600830078125, -0.008093833923339844, -0.0068416595458984375, -0.005589485168457031, -0.004337310791015625, -0.0030851364135742188, -0.0018329620361328125, -0.0005807876586914062, 0.00067138671875, 0.0019235610961914062, 0.0031757354736328125, 0.004427909851074219, 0.005680084228515625, 0.006932258605957031, 0.008184432983398438, 0.009436607360839844, 0.01068878173828125, 0.011940956115722656, 0.013193130493164062, 0.014445304870605469, 0.015697479248046875, 0.01694965362548828, 0.018201828002929688, 0.019454002380371094, 0.0207061767578125, 0.021958351135253906, 0.023210525512695312, 0.02446269989013672, 0.025714874267578125, 0.02696704864501953, 0.028219223022460938, 0.029471397399902344, 0.03072357177734375, 0.031975746154785156, 0.03322792053222656, 0.03448009490966797, 0.035732269287109375, 0.03698444366455078, 0.03823661804199219, 0.039488792419433594, 0.040740966796875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 8.0, 17.0, 11.0, 20.0, 24.0, 30.0, 30.0, 48.0, 49.0, 61.0, 78.0, 61.0, 82.0, 84.0, 66.0, 74.0, 65.0, 41.0, 45.0, 26.0, 23.0, 12.0, 18.0, 6.0, 8.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5260614156723022, -1.4730002880096436, -1.4199392795562744, -1.3668781518936157, -1.313817024230957, -1.260756015777588, -1.2076948881149292, -1.1546337604522705, -1.1015727519989014, -1.0485116243362427, -0.9954505562782288, -0.9423894882202148, -0.8893283605575562, -0.8362672924995422, -0.7832062244415283, -0.7301450967788696, -0.6770839691162109, -0.624022901058197, -0.5709617733955383, -0.5179007053375244, -0.4648396074771881, -0.4117785096168518, -0.3587174415588379, -0.3056563436985016, -0.2525952458381653, -0.19953414797782898, -0.14647306501865387, -0.09341198205947876, -0.040350884199142456, 0.012710213661193848, 0.06577128171920776, 0.11883237957954407, 0.17189347743988037, 0.22495457530021667, 0.278015673160553, 0.3310767412185669, 0.3841378390789032, 0.4371989369392395, 0.4902600049972534, 0.5433211326599121, 0.596382200717926, 0.6494432687759399, 0.7025043964385986, 0.7555654644966125, 0.8086265325546265, 0.8616876602172852, 0.9147487282752991, 0.967809796333313, 1.0208709239959717, 1.0739320516586304, 1.1269930601119995, 1.1800541877746582, 1.233115315437317, 1.2861764430999756, 1.3392374515533447, 1.3922985792160034, 1.445359706878662, 1.4984208345413208, 1.55148184299469, 1.6045429706573486, 1.6576040983200073, 1.710665225982666, 1.7637262344360352, 1.8167873620986938, 1.869848370552063]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 7.0, 15.0, 17.0, 17.0, 21.0, 21.0, 32.0, 29.0, 30.0, 40.0, 34.0, 44.0, 58.0, 53.0, 48.0, 42.0, 51.0, 50.0, 47.0, 40.0, 48.0, 36.0, 39.0, 25.0, 23.0, 20.0, 15.0, 11.0, 20.0, 13.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.5488474369049072, -1.5048059225082397, -1.4607644081115723, -1.4167228937149048, -1.3726813793182373, -1.3286398649215698, -1.2845983505249023, -1.2405568361282349, -1.1965153217315674, -1.1524738073349, -1.1084322929382324, -1.064390778541565, -1.0203492641448975, -0.97630774974823, -0.9322662353515625, -0.888224720954895, -0.8441831469535828, -0.8001416325569153, -0.7561001181602478, -0.7120586037635803, -0.6680170893669128, -0.6239755749702454, -0.5799340009689331, -0.5358924865722656, -0.49185100197792053, -0.44780948758125305, -0.40376797318458557, -0.3597264289855957, -0.3156849145889282, -0.27164340019226074, -0.22760188579559326, -0.18356037139892578, -0.1395188570022583, -0.09547734260559082, -0.05143582075834274, -0.0073942989110946655, 0.036647215485572815, 0.0806887298822403, 0.12473025918006897, 0.16877177357673645, 0.21281328797340393, 0.2568548023700714, 0.3008963167667389, 0.34493786096572876, 0.38897937536239624, 0.4330208897590637, 0.4770624041557312, 0.5211039185523987, 0.5651454329490662, 0.6091869473457336, 0.6532284617424011, 0.6972699761390686, 0.7413114905357361, 0.7853530049324036, 0.8293945789337158, 0.8734360933303833, 0.9174776077270508, 0.9615191221237183, 1.0055606365203857, 1.0496021509170532, 1.0936436653137207, 1.1376851797103882, 1.1817266941070557, 1.2257682085037231, 1.2698097229003906]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 10.0, 22.0, 38.0, 45.0, 65.0, 116.0, 224.0, 333.0, 753.0, 2128.0, 6224.0, 22003.0, 93487.0, 470078.0, 359064.0, 68861.0, 17052.0, 5001.0, 1649.0, 675.0, 278.0, 181.0, 106.0, 60.0, 33.0, 21.0, 22.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.90533447265625, -2.8048095703125, -2.70428466796875, -2.603759765625, -2.50323486328125, -2.4027099609375, -2.30218505859375, -2.20166015625, -2.10113525390625, -2.0006103515625, -1.90008544921875, -1.799560546875, -1.69903564453125, -1.5985107421875, -1.49798583984375, -1.3974609375, -1.29693603515625, -1.1964111328125, -1.09588623046875, -0.995361328125, -0.89483642578125, -0.7943115234375, -0.69378662109375, -0.59326171875, -0.49273681640625, -0.3922119140625, -0.29168701171875, -0.191162109375, -0.09063720703125, 0.0098876953125, 0.11041259765625, 0.2109375, 0.31146240234375, 0.4119873046875, 0.51251220703125, 0.613037109375, 0.71356201171875, 0.8140869140625, 0.91461181640625, 1.01513671875, 1.11566162109375, 1.2161865234375, 1.31671142578125, 1.417236328125, 1.51776123046875, 1.6182861328125, 1.71881103515625, 1.8193359375, 1.91986083984375, 2.0203857421875, 2.12091064453125, 2.221435546875, 2.32196044921875, 2.4224853515625, 2.52301025390625, 2.62353515625, 2.72406005859375, 2.8245849609375, 2.92510986328125, 3.025634765625, 3.12615966796875, 3.2266845703125, 3.32720947265625, 3.427734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 19.0, 10.0, 16.0, 24.0, 17.0, 41.0, 33.0, 47.0, 43.0, 67.0, 68.0, 66.0, 73.0, 76.0, 68.0, 68.0, 35.0, 48.0, 38.0, 26.0, 27.0, 19.0, 14.0, 10.0, 9.0, 12.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.04296875, -2.94268798828125, -2.8424072265625, -2.74212646484375, -2.641845703125, -2.54156494140625, -2.4412841796875, -2.34100341796875, -2.24072265625, -2.14044189453125, -2.0401611328125, -1.93988037109375, -1.839599609375, -1.73931884765625, -1.6390380859375, -1.53875732421875, -1.4384765625, -1.33819580078125, -1.2379150390625, -1.13763427734375, -1.037353515625, -0.93707275390625, -0.8367919921875, -0.73651123046875, -0.63623046875, -0.53594970703125, -0.4356689453125, -0.33538818359375, -0.235107421875, -0.13482666015625, -0.0345458984375, 0.06573486328125, 0.166015625, 0.26629638671875, 0.3665771484375, 0.46685791015625, 0.567138671875, 0.66741943359375, 0.7677001953125, 0.86798095703125, 0.96826171875, 1.06854248046875, 1.1688232421875, 1.26910400390625, 1.369384765625, 1.46966552734375, 1.5699462890625, 1.67022705078125, 1.7705078125, 1.87078857421875, 1.9710693359375, 2.07135009765625, 2.171630859375, 2.27191162109375, 2.3721923828125, 2.47247314453125, 2.57275390625, 2.67303466796875, 2.7733154296875, 2.87359619140625, 2.973876953125, 3.07415771484375, 3.1744384765625, 3.27471923828125, 3.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 12.0, 11.0, 16.0, 17.0, 36.0, 40.0, 62.0, 90.0, 125.0, 223.0, 334.0, 557.0, 935.0, 1640.0, 2882.0, 5579.0, 10926.0, 22448.0, 49352.0, 119346.0, 296056.0, 309597.0, 127865.0, 51959.0, 23702.0, 11424.0, 5838.0, 3160.0, 1708.0, 997.0, 575.0, 373.0, 253.0, 137.0, 97.0, 61.0, 49.0, 26.0, 18.0, 10.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.3645782470703125, -1.312164306640625, -1.2597503662109375, -1.20733642578125, -1.1549224853515625, -1.102508544921875, -1.0500946044921875, -0.9976806640625, -0.9452667236328125, -0.892852783203125, -0.8404388427734375, -0.78802490234375, -0.7356109619140625, -0.683197021484375, -0.6307830810546875, -0.578369140625, -0.5259552001953125, -0.473541259765625, -0.4211273193359375, -0.36871337890625, -0.3162994384765625, -0.263885498046875, -0.2114715576171875, -0.1590576171875, -0.1066436767578125, -0.054229736328125, -0.0018157958984375, 0.05059814453125, 0.1030120849609375, 0.155426025390625, 0.2078399658203125, 0.26025390625, 0.3126678466796875, 0.365081787109375, 0.4174957275390625, 0.46990966796875, 0.5223236083984375, 0.574737548828125, 0.6271514892578125, 0.6795654296875, 0.7319793701171875, 0.784393310546875, 0.8368072509765625, 0.88922119140625, 0.9416351318359375, 0.994049072265625, 1.0464630126953125, 1.098876953125, 1.1512908935546875, 1.203704833984375, 1.2561187744140625, 1.30853271484375, 1.3609466552734375, 1.413360595703125, 1.4657745361328125, 1.5181884765625, 1.5706024169921875, 1.623016357421875, 1.6754302978515625, 1.72784423828125, 1.7802581787109375, 1.832672119140625, 1.8850860595703125, 1.9375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 17.0, 23.0, 17.0, 19.0, 21.0, 27.0, 35.0, 44.0, 44.0, 52.0, 64.0, 52.0, 49.0, 68.0, 46.0, 49.0, 49.0, 47.0, 44.0, 28.0, 39.0, 40.0, 16.0, 21.0, 14.0, 18.0, 5.0, 8.0, 6.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.56640625, -4.4505615234375, -4.334716796875, -4.2188720703125, -4.10302734375, -3.9871826171875, -3.871337890625, -3.7554931640625, -3.6396484375, -3.5238037109375, -3.407958984375, -3.2921142578125, -3.17626953125, -3.0604248046875, -2.944580078125, -2.8287353515625, -2.712890625, -2.5970458984375, -2.481201171875, -2.3653564453125, -2.24951171875, -2.1336669921875, -2.017822265625, -1.9019775390625, -1.7861328125, -1.6702880859375, -1.554443359375, -1.4385986328125, -1.32275390625, -1.2069091796875, -1.091064453125, -0.9752197265625, -0.859375, -0.7435302734375, -0.627685546875, -0.5118408203125, -0.39599609375, -0.2801513671875, -0.164306640625, -0.0484619140625, 0.0673828125, 0.1832275390625, 0.299072265625, 0.4149169921875, 0.53076171875, 0.6466064453125, 0.762451171875, 0.8782958984375, 0.994140625, 1.1099853515625, 1.225830078125, 1.3416748046875, 1.45751953125, 1.5733642578125, 1.689208984375, 1.8050537109375, 1.9208984375, 2.0367431640625, 2.152587890625, 2.2684326171875, 2.38427734375, 2.5001220703125, 2.615966796875, 2.7318115234375, 2.84765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 5.0, 3.0, 10.0, 17.0, 15.0, 10.0, 24.0, 34.0, 36.0, 56.0, 72.0, 101.0, 160.0, 215.0, 299.0, 495.0, 765.0, 1192.0, 1889.0, 3187.0, 5212.0, 8747.0, 15271.0, 27514.0, 50932.0, 100190.0, 200022.0, 285099.0, 165962.0, 82465.0, 42548.0, 23514.0, 13014.0, 7534.0, 4376.0, 2745.0, 1663.0, 1067.0, 676.0, 425.0, 284.0, 212.0, 137.0, 111.0, 71.0, 59.0, 33.0, 30.0, 21.0, 11.0, 11.0, 11.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.389892578125, -0.3774604797363281, -0.36502838134765625, -0.3525962829589844, -0.3401641845703125, -0.3277320861816406, -0.31529998779296875, -0.3028678894042969, -0.290435791015625, -0.2780036926269531, -0.26557159423828125, -0.2531394958496094, -0.2407073974609375, -0.22827529907226562, -0.21584320068359375, -0.20341110229492188, -0.19097900390625, -0.17854690551757812, -0.16611480712890625, -0.15368270874023438, -0.1412506103515625, -0.12881851196289062, -0.11638641357421875, -0.10395431518554688, -0.091522216796875, -0.07909011840820312, -0.06665802001953125, -0.054225921630859375, -0.0417938232421875, -0.029361724853515625, -0.01692962646484375, -0.004497528076171875, 0.0079345703125, 0.020366668701171875, 0.03279876708984375, 0.045230865478515625, 0.0576629638671875, 0.07009506225585938, 0.08252716064453125, 0.09495925903320312, 0.107391357421875, 0.11982345581054688, 0.13225555419921875, 0.14468765258789062, 0.1571197509765625, 0.16955184936523438, 0.18198394775390625, 0.19441604614257812, 0.20684814453125, 0.21928024291992188, 0.23171234130859375, 0.24414443969726562, 0.2565765380859375, 0.2690086364746094, 0.28144073486328125, 0.2938728332519531, 0.306304931640625, 0.3187370300292969, 0.33116912841796875, 0.3436012268066406, 0.3560333251953125, 0.3684654235839844, 0.38089752197265625, 0.3933296203613281, 0.40576171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 9.0, 7.0, 7.0, 9.0, 11.0, 24.0, 31.0, 36.0, 48.0, 55.0, 82.0, 102.0, 106.0, 113.0, 86.0, 59.0, 65.0, 37.0, 29.0, 23.0, 20.0, 9.0, 7.0, 3.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019466876983642578, -0.0001892540603876114, -0.000183839350938797, -0.0001784246414899826, -0.0001730099320411682, -0.00016759522259235382, -0.00016218051314353943, -0.00015676580369472504, -0.00015135109424591064, -0.00014593638479709625, -0.00014052167534828186, -0.00013510696589946747, -0.00012969225645065308, -0.00012427754700183868, -0.00011886283755302429, -0.0001134481281042099, -0.00010803341865539551, -0.00010261870920658112, -9.720399975776672e-05, -9.178929030895233e-05, -8.637458086013794e-05, -8.095987141132355e-05, -7.554516196250916e-05, -7.013045251369476e-05, -6.471574306488037e-05, -5.930103361606598e-05, -5.388632416725159e-05, -4.8471614718437195e-05, -4.30569052696228e-05, -3.764219582080841e-05, -3.222748637199402e-05, -2.6812776923179626e-05, -2.1398067474365234e-05, -1.5983358025550842e-05, -1.056864857673645e-05, -5.153939127922058e-06, 2.60770320892334e-07, 5.675479769706726e-06, 1.1090189218521118e-05, 1.650489866733551e-05, 2.1919608116149902e-05, 2.7334317564964294e-05, 3.2749027013778687e-05, 3.816373646259308e-05, 4.357844591140747e-05, 4.899315536022186e-05, 5.4407864809036255e-05, 5.982257425785065e-05, 6.523728370666504e-05, 7.065199315547943e-05, 7.606670260429382e-05, 8.148141205310822e-05, 8.689612150192261e-05, 9.2310830950737e-05, 9.772554039955139e-05, 0.00010314024984836578, 0.00010855495929718018, 0.00011396966874599457, 0.00011938437819480896, 0.00012479908764362335, 0.00013021379709243774, 0.00013562850654125214, 0.00014104321599006653, 0.00014645792543888092, 0.0001518726348876953]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 10.0, 19.0, 15.0, 27.0, 32.0, 46.0, 66.0, 106.0, 176.0, 226.0, 332.0, 428.0, 717.0, 1072.0, 1630.0, 2611.0, 4331.0, 7186.0, 12325.0, 21793.0, 39257.0, 73473.0, 144960.0, 284989.0, 216901.0, 107037.0, 56202.0, 30364.0, 17146.0, 9720.0, 5775.0, 3454.0, 2092.0, 1400.0, 857.0, 564.0, 395.0, 249.0, 164.0, 109.0, 87.0, 77.0, 38.0, 29.0, 18.0, 12.0, 8.0, 10.0, 10.0, 5.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.430419921875, -0.4176788330078125, -0.404937744140625, -0.3921966552734375, -0.37945556640625, -0.3667144775390625, -0.353973388671875, -0.3412322998046875, -0.3284912109375, -0.3157501220703125, -0.303009033203125, -0.2902679443359375, -0.27752685546875, -0.2647857666015625, -0.252044677734375, -0.2393035888671875, -0.2265625, -0.2138214111328125, -0.201080322265625, -0.1883392333984375, -0.17559814453125, -0.1628570556640625, -0.150115966796875, -0.1373748779296875, -0.1246337890625, -0.1118927001953125, -0.099151611328125, -0.0864105224609375, -0.07366943359375, -0.0609283447265625, -0.048187255859375, -0.0354461669921875, -0.022705078125, -0.0099639892578125, 0.002777099609375, 0.0155181884765625, 0.02825927734375, 0.0410003662109375, 0.053741455078125, 0.0664825439453125, 0.0792236328125, 0.0919647216796875, 0.104705810546875, 0.1174468994140625, 0.13018798828125, 0.1429290771484375, 0.155670166015625, 0.1684112548828125, 0.18115234375, 0.1938934326171875, 0.206634521484375, 0.2193756103515625, 0.23211669921875, 0.2448577880859375, 0.257598876953125, 0.2703399658203125, 0.2830810546875, 0.2958221435546875, 0.308563232421875, 0.3213043212890625, 0.33404541015625, 0.3467864990234375, 0.359527587890625, 0.3722686767578125, 0.385009765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 7.0, 1.0, 5.0, 2.0, 9.0, 11.0, 12.0, 19.0, 25.0, 16.0, 34.0, 42.0, 45.0, 53.0, 74.0, 79.0, 105.0, 85.0, 62.0, 59.0, 61.0, 41.0, 38.0, 28.0, 17.0, 15.0, 10.0, 7.0, 8.0, 6.0, 6.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.50146484375, -0.48769378662109375, -0.4739227294921875, -0.46015167236328125, -0.446380615234375, -0.43260955810546875, -0.4188385009765625, -0.40506744384765625, -0.39129638671875, -0.37752532958984375, -0.3637542724609375, -0.34998321533203125, -0.336212158203125, -0.32244110107421875, -0.3086700439453125, -0.29489898681640625, -0.2811279296875, -0.26735687255859375, -0.2535858154296875, -0.23981475830078125, -0.226043701171875, -0.21227264404296875, -0.1985015869140625, -0.18473052978515625, -0.17095947265625, -0.15718841552734375, -0.1434173583984375, -0.12964630126953125, -0.115875244140625, -0.10210418701171875, -0.0883331298828125, -0.07456207275390625, -0.060791015625, -0.04701995849609375, -0.0332489013671875, -0.01947784423828125, -0.005706787109375, 0.00806427001953125, 0.0218353271484375, 0.03560638427734375, 0.04937744140625, 0.06314849853515625, 0.0769195556640625, 0.09069061279296875, 0.104461669921875, 0.11823272705078125, 0.1320037841796875, 0.14577484130859375, 0.1595458984375, 0.17331695556640625, 0.1870880126953125, 0.20085906982421875, 0.214630126953125, 0.22840118408203125, 0.2421722412109375, 0.25594329833984375, 0.26971435546875, 0.28348541259765625, 0.2972564697265625, 0.31102752685546875, 0.324798583984375, 0.33856964111328125, 0.3523406982421875, 0.36611175537109375, 0.3798828125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 15.0, 57.0, 159.0, 242.0, 253.0, 153.0, 64.0, 31.0, 12.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.058757781982422, -11.642096519470215, -11.225436210632324, -10.808774948120117, -10.39211368560791, -9.97545337677002, -9.558792114257812, -9.142131805419922, -8.725470542907715, -8.308809280395508, -7.892148494720459, -7.47548770904541, -7.058826923370361, -6.6421661376953125, -6.2255048751831055, -5.808844089508057, -5.39218282699585, -4.975522041320801, -4.558860778808594, -4.142199993133545, -3.725539207458496, -3.308878183364868, -2.8922171592712402, -2.4755563735961914, -2.0588953495025635, -1.642234444618225, -1.2255735397338867, -0.8089125156402588, -0.3922516107559204, 0.02440929412841797, 0.4410703182220459, 0.8577311038970947, 1.2743921279907227, 1.691053032875061, 2.1077139377593994, 2.5243749618530273, 2.941035747528076, 3.357696771621704, 3.774357795715332, 4.191018581390381, 4.60767936706543, 5.0243401527404785, 5.4410014152526855, 5.857662200927734, 6.274322986602783, 6.690983772277832, 7.107645034790039, 7.524305820465088, 7.940967082977295, 8.357627868652344, 8.77428913116455, 9.190950393676758, 9.607610702514648, 10.024271965026855, 10.440933227539062, 10.857593536376953, 11.27425479888916, 11.690916061401367, 12.107576370239258, 12.524237632751465, 12.940898895263672, 13.357559204101562, 13.77422046661377, 14.190881729125977, 14.607542037963867]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 9.0, 2.0, 19.0, 13.0, 21.0, 11.0, 17.0, 21.0, 23.0, 33.0, 28.0, 40.0, 41.0, 48.0, 50.0, 66.0, 50.0, 55.0, 54.0, 54.0, 47.0, 43.0, 48.0, 39.0, 37.0, 37.0, 18.0, 18.0, 21.0, 6.0, 12.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.15048885345459, -8.914582252502441, -8.67867660522461, -8.442770004272461, -8.206864356994629, -7.9709577560424805, -7.73505163192749, -7.4991455078125, -7.26323938369751, -7.0273332595825195, -6.791427135467529, -6.555521011352539, -6.319614410400391, -6.0837082862854, -5.84780216217041, -5.61189603805542, -5.37598991394043, -5.1400837898254395, -4.904177665710449, -4.668271064758301, -4.4323649406433105, -4.19645881652832, -3.96055269241333, -3.72464656829834, -3.4887399673461914, -3.252833843231201, -3.016927480697632, -2.7810213565826416, -2.5451152324676514, -2.309208869934082, -2.073302745819092, -1.8373966217041016, -1.6014904975891113, -1.3655842542648315, -1.1296781301498413, -0.8937718868255615, -0.6578657031059265, -0.4219595193862915, -0.18605327606201172, 0.049852848052978516, 0.2857590913772583, 0.5216652750968933, 0.7575714588165283, 0.9934777021408081, 1.229383945465088, 1.4652900695800781, 1.701196312904358, 1.9371024370193481, 2.173008680343628, 2.408914804458618, 2.6448211669921875, 2.8807272911071777, 3.116633415222168, 3.352539539337158, 3.5884459018707275, 3.8243520259857178, 4.060258388519287, 4.296164512634277, 4.532070636749268, 4.767976760864258, 5.003883361816406, 5.2397894859313965, 5.475695610046387, 5.711601734161377, 5.947507858276367]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 12.0, 9.0, 14.0, 17.0, 23.0, 28.0, 43.0, 65.0, 87.0, 109.0, 162.0, 201.0, 298.0, 352.0, 526.0, 790.0, 1085.0, 1696.0, 2720.0, 1033277.0, 2964.0, 1873.0, 1278.0, 793.0, 585.0, 422.0, 321.0, 234.0, 161.0, 136.0, 84.0, 72.0, 35.0, 35.0, 24.0, 15.0, 17.0, 5.0, 7.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.565166473388672, -6.363887786865234, -6.162609100341797, -5.961330413818359, -5.76005220413208, -5.558773517608643, -5.357494831085205, -5.156216144561768, -4.95493745803833, -4.753658771514893, -4.552380084991455, -4.351101875305176, -4.149823188781738, -3.948544502258301, -3.7472658157348633, -3.545987129211426, -3.3447086811065674, -3.14342999458313, -2.9421515464782715, -2.740872859954834, -2.5395941734313965, -2.338315486907959, -2.1370370388031006, -1.935758352279663, -1.7344797849655151, -1.5332012176513672, -1.3319225311279297, -1.1306439638137817, -0.929365336894989, -0.7280867099761963, -0.5268081426620483, -0.32552945613861084, -0.12425088882446289, 0.07702772319316864, 0.27830633521080017, 0.4795849323272705, 0.6808635592460632, 0.882142186164856, 1.083420753479004, 1.2846994400024414, 1.4859780073165894, 1.6872565746307373, 1.8885352611541748, 2.089813709259033, 2.2910923957824707, 2.492371082305908, 2.6936497688293457, 2.894928455352783, 3.0962069034576416, 3.297485589981079, 3.4987640380859375, 3.700042724609375, 3.9013214111328125, 4.10260009765625, 4.3038787841796875, 4.505157470703125, 4.706435680389404, 4.907714366912842, 5.108993053436279, 5.310271263122559, 5.511549949645996, 5.712828636169434, 5.914107322692871, 6.115386009216309, 6.316664695739746]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 7.0, 4.0, 11.0, 13.0, 28.0, 42.0, 106.0, 178.0, 316.0, 663.0, 1559.0, 3910.0, 9307.0, 30957.0, 51393388.0, 18055.0, 7257.0, 3100.0, 1298.0, 540.0, 263.0, 133.0, 70.0, 44.0, 22.0, 15.0, 13.0, 9.0, 7.0, 6.0, 2.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.174680709838867, -8.744375228881836, -8.314070701599121, -7.88376522064209, -7.453460693359375, -7.023155212402344, -6.592850208282471, -6.162545204162598, -5.732240200042725, -5.301935195922852, -4.8716301918029785, -4.4413251876831055, -4.011019706726074, -3.5807149410247803, -3.150409698486328, -2.720104694366455, -2.289799690246582, -1.859494686126709, -1.4291895627975464, -0.9988844394683838, -0.5685794353485107, -0.1382744312286377, 0.29203081130981445, 0.7223358154296875, 1.1526408195495605, 1.5829458236694336, 2.0132508277893066, 2.443556070327759, 2.873861074447632, 3.304166078567505, 3.734471321105957, 4.16477632522583, 4.595081329345703, 5.025386333465576, 5.455691337585449, 5.8859968185424805, 6.316301345825195, 6.746606826782227, 7.1769118309021, 7.607216835021973, 8.037521362304688, 8.467826843261719, 8.898131370544434, 9.328436851501465, 9.75874137878418, 10.189046859741211, 10.619352340698242, 11.049656867980957, 11.479962348937988, 11.91026782989502, 12.340572357177734, 12.770877838134766, 13.20118236541748, 13.631487846374512, 14.061792373657227, 14.492097854614258, 14.922403335571289, 15.35270881652832, 15.783013343811035, 16.21331787109375, 16.64362335205078, 17.073928833007812, 17.504234313964844, 17.934539794921875, 18.364843368530273]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 5.0, 12.0, 12.0, 29.0, 36.0, 54.0, 75.0, 101.0, 171.0, 239.0, 369.0, 514.0, 751.0, 1250.0, 2251.0, 5461.0, 19506.0, 93547.0, 470505.0, 4251676.0, 1131727.0, 246934.0, 47148.0, 10785.0, 3615.0, 1661.0, 1029.0, 648.0, 427.0, 293.0, 201.0, 142.0, 82.0, 55.0, 36.0, 27.0, 16.0, 10.0, 8.0, 7.0, 9.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.385894775390625, -2.30303955078125, -2.220184326171875, -2.1373291015625, -2.054473876953125, -1.97161865234375, -1.888763427734375, -1.805908203125, -1.723052978515625, -1.64019775390625, -1.557342529296875, -1.4744873046875, -1.391632080078125, -1.30877685546875, -1.225921630859375, -1.14306640625, -1.060211181640625, -0.97735595703125, -0.894500732421875, -0.8116455078125, -0.728790283203125, -0.64593505859375, -0.563079833984375, -0.480224609375, -0.397369384765625, -0.31451416015625, -0.231658935546875, -0.1488037109375, -0.065948486328125, 0.01690673828125, 0.099761962890625, 0.1826171875, 0.265472412109375, 0.34832763671875, 0.431182861328125, 0.5140380859375, 0.596893310546875, 0.67974853515625, 0.762603759765625, 0.845458984375, 0.928314208984375, 1.01116943359375, 1.094024658203125, 1.1768798828125, 1.259735107421875, 1.34259033203125, 1.425445556640625, 1.50830078125, 1.591156005859375, 1.67401123046875, 1.756866455078125, 1.8397216796875, 1.922576904296875, 2.00543212890625, 2.088287353515625, 2.171142578125, 2.253997802734375, 2.33685302734375, 2.419708251953125, 2.5025634765625, 2.585418701171875, 2.66827392578125, 2.751129150390625, 2.833984375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 10.0, 20.0, 37.0, 42.0, 65.0, 81.0, 90.0, 89.0, 793.0, 453.0, 97.0, 67.0, 64.0, 50.0, 25.0, 14.0, 11.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.14892578125, -27.1416015625, -26.13427734375, -25.126953125, -24.11962890625, -23.1123046875, -22.10498046875, -21.09765625, -20.09033203125, -19.0830078125, -18.07568359375, -17.068359375, -16.06103515625, -15.0537109375, -14.04638671875, -13.0390625, -12.03173828125, -11.0244140625, -10.01708984375, -9.009765625, -8.00244140625, -6.9951171875, -5.98779296875, -4.98046875, -3.97314453125, -2.9658203125, -1.95849609375, -0.951171875, 0.05615234375, 1.0634765625, 2.07080078125, 3.078125, 4.08544921875, 5.0927734375, 6.10009765625, 7.107421875, 8.11474609375, 9.1220703125, 10.12939453125, 11.13671875, 12.14404296875, 13.1513671875, 14.15869140625, 15.166015625, 16.17333984375, 17.1806640625, 18.18798828125, 19.1953125, 20.20263671875, 21.2099609375, 22.21728515625, 23.224609375, 24.23193359375, 25.2392578125, 26.24658203125, 27.25390625, 28.26123046875, 29.2685546875, 30.27587890625, 31.283203125, 32.29052734375, 33.2978515625, 34.30517578125, 35.3125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 18.0, 8.0, 19.0, 31.0, 46.0, 57.0, 79.0, 130.0, 198.0, 297.0, 455.0, 771.0, 1550.0, 3309.0, 7090.0, 17322.0, 44455.0, 115105.0, 283833.0, 588469.0, 3894776.0, 724964.0, 359726.0, 150035.0, 58034.0, 22761.0, 9346.0, 4092.0, 1918.0, 989.0, 539.0, 312.0, 204.0, 131.0, 84.0, 67.0, 48.0, 43.0, 32.0, 22.0, 14.0, 15.0, 10.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.24609375, -1.2040557861328125, -1.162017822265625, -1.1199798583984375, -1.07794189453125, -1.0359039306640625, -0.993865966796875, -0.9518280029296875, -0.9097900390625, -0.8677520751953125, -0.825714111328125, -0.7836761474609375, -0.74163818359375, -0.6996002197265625, -0.657562255859375, -0.6155242919921875, -0.573486328125, -0.5314483642578125, -0.489410400390625, -0.4473724365234375, -0.40533447265625, -0.3632965087890625, -0.321258544921875, -0.2792205810546875, -0.2371826171875, -0.1951446533203125, -0.153106689453125, -0.1110687255859375, -0.06903076171875, -0.0269927978515625, 0.015045166015625, 0.0570831298828125, 0.09912109375, 0.1411590576171875, 0.183197021484375, 0.2252349853515625, 0.26727294921875, 0.3093109130859375, 0.351348876953125, 0.3933868408203125, 0.4354248046875, 0.4774627685546875, 0.519500732421875, 0.5615386962890625, 0.60357666015625, 0.6456146240234375, 0.687652587890625, 0.7296905517578125, 0.771728515625, 0.8137664794921875, 0.855804443359375, 0.8978424072265625, 0.93988037109375, 0.9819183349609375, 1.023956298828125, 1.0659942626953125, 1.1080322265625, 1.1500701904296875, 1.192108154296875, 1.2341461181640625, 1.27618408203125, 1.3182220458984375, 1.360260009765625, 1.4022979736328125, 1.4443359375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 11.0, 4.0, 24.0, 39.0, 75.0, 93.0, 128.0, 1079.0, 223.0, 112.0, 84.0, 54.0, 37.0, 24.0, 18.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.65625, -47.43603515625, -46.2158203125, -44.99560546875, -43.775390625, -42.55517578125, -41.3349609375, -40.11474609375, -38.89453125, -37.67431640625, -36.4541015625, -35.23388671875, -34.013671875, -32.79345703125, -31.5732421875, -30.35302734375, -29.1328125, -27.91259765625, -26.6923828125, -25.47216796875, -24.251953125, -23.03173828125, -21.8115234375, -20.59130859375, -19.37109375, -18.15087890625, -16.9306640625, -15.71044921875, -14.490234375, -13.27001953125, -12.0498046875, -10.82958984375, -9.609375, -8.38916015625, -7.1689453125, -5.94873046875, -4.728515625, -3.50830078125, -2.2880859375, -1.06787109375, 0.15234375, 1.37255859375, 2.5927734375, 3.81298828125, 5.033203125, 6.25341796875, 7.4736328125, 8.69384765625, 9.9140625, 11.13427734375, 12.3544921875, 13.57470703125, 14.794921875, 16.01513671875, 17.2353515625, 18.45556640625, 19.67578125, 20.89599609375, 22.1162109375, 23.33642578125, 24.556640625, 25.77685546875, 26.9970703125, 28.21728515625, 29.4375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 2.0, 5.0, 10.0, 7.0, 14.0, 12.0, 23.0, 40.0, 34.0, 61.0, 111.0, 181.0, 346.0, 857.0, 1864.0, 5411.0, 26580.0, 482276.0, 5663396.0, 92740.0, 11424.0, 3256.0, 1423.0, 653.0, 269.0, 139.0, 75.0, 69.0, 43.0, 31.0, 23.0, 17.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-4.26953125, -4.1129150390625, -3.956298828125, -3.7996826171875, -3.64306640625, -3.4864501953125, -3.329833984375, -3.1732177734375, -3.0166015625, -2.8599853515625, -2.703369140625, -2.5467529296875, -2.39013671875, -2.2335205078125, -2.076904296875, -1.9202880859375, -1.763671875, -1.6070556640625, -1.450439453125, -1.2938232421875, -1.13720703125, -0.9805908203125, -0.823974609375, -0.6673583984375, -0.5107421875, -0.3541259765625, -0.197509765625, -0.0408935546875, 0.11572265625, 0.2723388671875, 0.428955078125, 0.5855712890625, 0.7421875, 0.8988037109375, 1.055419921875, 1.2120361328125, 1.36865234375, 1.5252685546875, 1.681884765625, 1.8385009765625, 1.9951171875, 2.1517333984375, 2.308349609375, 2.4649658203125, 2.62158203125, 2.7781982421875, 2.934814453125, 3.0914306640625, 3.248046875, 3.4046630859375, 3.561279296875, 3.7178955078125, 3.87451171875, 4.0311279296875, 4.187744140625, 4.3443603515625, 4.5009765625, 4.6575927734375, 4.814208984375, 4.9708251953125, 5.12744140625, 5.2840576171875, 5.440673828125, 5.5972900390625, 5.75390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 26.0, 45.0, 65.0, 97.0, 134.0, 1186.0, 140.0, 104.0, 79.0, 51.0, 44.0, 14.0, 10.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8203125, -13.7474365234375, -12.674560546875, -11.6016845703125, -10.52880859375, -9.4559326171875, -8.383056640625, -7.3101806640625, -6.2373046875, -5.1644287109375, -4.091552734375, -3.0186767578125, -1.94580078125, -0.8729248046875, 0.199951171875, 1.2728271484375, 2.345703125, 3.4185791015625, 4.491455078125, 5.5643310546875, 6.63720703125, 7.7100830078125, 8.782958984375, 9.8558349609375, 10.9287109375, 12.0015869140625, 13.074462890625, 14.1473388671875, 15.22021484375, 16.2930908203125, 17.365966796875, 18.4388427734375, 19.51171875, 20.5845947265625, 21.657470703125, 22.7303466796875, 23.80322265625, 24.8760986328125, 25.948974609375, 27.0218505859375, 28.0947265625, 29.1676025390625, 30.240478515625, 31.3133544921875, 32.38623046875, 33.4591064453125, 34.531982421875, 35.6048583984375, 36.677734375, 37.7506103515625, 38.823486328125, 39.8963623046875, 40.96923828125, 42.0421142578125, 43.114990234375, 44.1878662109375, 45.2607421875, 46.3336181640625, 47.406494140625, 48.4793701171875, 49.55224609375, 50.6251220703125, 51.697998046875, 52.7708740234375, 53.84375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 324.0, 650.0, 17.0, 10.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.091644287109375, -48.72985076904297, -44.36805725097656, -40.006263732910156, -35.64447021484375, -31.28267478942871, -26.920879364013672, -22.559085845947266, -18.19729232788086, -13.835498809814453, -9.47370433807373, -5.111909866333008, -0.7501163482666016, 3.6116771697998047, 7.973472595214844, 12.33526611328125, 16.697059631347656, 21.058853149414062, 25.42064666748047, 29.782442092895508, 34.14423370361328, 38.50602722167969, 42.86782455444336, 47.229618072509766, 51.59141159057617, 55.95320510864258, 60.314998626708984, 64.67679595947266, 69.03858947753906, 73.40038299560547, 77.76217651367188, 82.12397003173828, 86.48576354980469, 90.8475570678711, 95.2093505859375, 99.5711441040039, 103.93293762207031, 108.29473114013672, 112.65652465820312, 117.01832580566406, 121.38011169433594, 125.74190521240234, 130.10369873046875, 134.4654998779297, 138.82728576660156, 143.1890869140625, 147.55087280273438, 151.9126739501953, 156.27447509765625, 160.6362762451172, 164.99806213378906, 169.35986328125, 173.72164916992188, 178.0834503173828, 182.4452362060547, 186.80703735351562, 191.1688232421875, 195.53062438964844, 199.8924102783203, 204.25421142578125, 208.61599731445312, 212.97779846191406, 217.33958435058594, 221.70138549804688, 226.06317138671875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 14.0, 30.0, 63.0, 120.0, 192.0, 206.0, 175.0, 92.0, 61.0, 26.0, 12.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.50111389160156, -105.81207275390625, -103.1230239868164, -100.4339828491211, -97.74494171142578, -95.05589294433594, -92.36685180664062, -89.67781066894531, -86.98876953125, -84.29972839355469, -81.61067962646484, -78.92163848876953, -76.23259735107422, -73.54354858398438, -70.85450744628906, -68.16546630859375, -65.4764175415039, -62.78737258911133, -60.098331451416016, -57.40928649902344, -54.720245361328125, -52.03120040893555, -49.34215545654297, -46.653114318847656, -43.96406936645508, -41.2750244140625, -38.58598327636719, -35.89693832397461, -33.20789337158203, -30.51885223388672, -27.82980728149414, -25.140764236450195, -22.45172882080078, -19.762685775756836, -17.07364273071289, -14.384597778320312, -11.695554733276367, -9.006511688232422, -6.317466735839844, -3.6284236907958984, -0.9393806457519531, 1.7496628761291504, 4.438706398010254, 7.127750396728516, 9.816793441772461, 12.505836486816406, 15.194881439208984, 17.88392448425293, 20.572967529296875, 23.26201057434082, 25.951053619384766, 28.640098571777344, 31.32914161682129, 34.018184661865234, 36.70722961425781, 39.396270751953125, 42.0853157043457, 44.77436065673828, 47.463401794433594, 50.15244674682617, 52.84149169921875, 55.53053283691406, 58.21957778930664, 60.90862274169922, 63.59766387939453]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 23.0, 606.0, 986.0, 3725.0, 363157.0, 3809356.0, 12980.0, 1687.0, 521.0, 593.0, 622.0, 14.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5126190185546875, -0.499847412109375, -0.4870758056640625, -0.47430419921875, -0.4615325927734375, -0.448760986328125, -0.4359893798828125, -0.4232177734375, -0.4104461669921875, -0.397674560546875, -0.3849029541015625, -0.37213134765625, -0.3593597412109375, -0.346588134765625, -0.3338165283203125, -0.321044921875, -0.3082733154296875, -0.295501708984375, -0.2827301025390625, -0.26995849609375, -0.2571868896484375, -0.244415283203125, -0.2316436767578125, -0.2188720703125, -0.2061004638671875, -0.193328857421875, -0.1805572509765625, -0.16778564453125, -0.1550140380859375, -0.142242431640625, -0.1294708251953125, -0.11669921875, -0.1039276123046875, -0.091156005859375, -0.0783843994140625, -0.06561279296875, -0.0528411865234375, -0.040069580078125, -0.0272979736328125, -0.0145263671875, -0.0017547607421875, 0.011016845703125, 0.0237884521484375, 0.03656005859375, 0.0493316650390625, 0.062103271484375, 0.0748748779296875, 0.087646484375, 0.1004180908203125, 0.113189697265625, 0.1259613037109375, 0.13873291015625, 0.1515045166015625, 0.164276123046875, 0.1770477294921875, 0.1898193359375, 0.2025909423828125, 0.215362548828125, 0.2281341552734375, 0.24090576171875, 0.2536773681640625, 0.266448974609375, 0.2792205810546875, 0.2919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 17.0, 39.0, 110.0, 416.0, 257.0, 87.0, 41.0, 18.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431884765625, -0.4207611083984375, -0.409637451171875, -0.3985137939453125, -0.38739013671875, -0.3762664794921875, -0.365142822265625, -0.3540191650390625, -0.3428955078125, -0.3317718505859375, -0.320648193359375, -0.3095245361328125, -0.29840087890625, -0.2872772216796875, -0.276153564453125, -0.2650299072265625, -0.25390625, -0.2427825927734375, -0.231658935546875, -0.2205352783203125, -0.20941162109375, -0.1982879638671875, -0.187164306640625, -0.1760406494140625, -0.1649169921875, -0.1537933349609375, -0.142669677734375, -0.1315460205078125, -0.12042236328125, -0.1092987060546875, -0.098175048828125, -0.0870513916015625, -0.075927734375, -0.0648040771484375, -0.053680419921875, -0.0425567626953125, -0.03143310546875, -0.0203094482421875, -0.009185791015625, 0.0019378662109375, 0.0130615234375, 0.0241851806640625, 0.035308837890625, 0.0464324951171875, 0.05755615234375, 0.0686798095703125, 0.079803466796875, 0.0909271240234375, 0.10205078125, 0.1131744384765625, 0.124298095703125, 0.1354217529296875, 0.14654541015625, 0.1576690673828125, 0.168792724609375, 0.1799163818359375, 0.1910400390625, 0.2021636962890625, 0.213287353515625, 0.2244110107421875, 0.23553466796875, 0.2466583251953125, 0.257781982421875, 0.2689056396484375, 0.280029296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 10.0, 9.0, 7.0, 11.0, 14.0, 14.0, 23.0, 31.0, 50.0, 74.0, 116.0, 211.0, 457.0, 1663.0, 53636.0, 4117936.0, 18085.0, 1120.0, 344.0, 148.0, 91.0, 50.0, 48.0, 31.0, 18.0, 16.0, 9.0, 13.0, 10.0, 3.0, 0.0, 7.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2783203125, -0.2691612243652344, -0.26000213623046875, -0.2508430480957031, -0.2416839599609375, -0.23252487182617188, -0.22336578369140625, -0.21420669555664062, -0.205047607421875, -0.19588851928710938, -0.18672943115234375, -0.17757034301757812, -0.1684112548828125, -0.15925216674804688, -0.15009307861328125, -0.14093399047851562, -0.13177490234375, -0.12261581420898438, -0.11345672607421875, -0.10429763793945312, -0.0951385498046875, -0.08597946166992188, -0.07682037353515625, -0.06766128540039062, -0.058502197265625, -0.049343109130859375, -0.04018402099609375, -0.031024932861328125, -0.0218658447265625, -0.012706756591796875, -0.00354766845703125, 0.005611419677734375, 0.0147705078125, 0.023929595947265625, 0.03308868408203125, 0.042247772216796875, 0.0514068603515625, 0.060565948486328125, 0.06972503662109375, 0.07888412475585938, 0.088043212890625, 0.09720230102539062, 0.10636138916015625, 0.11552047729492188, 0.1246795654296875, 0.13383865356445312, 0.14299774169921875, 0.15215682983398438, 0.16131591796875, 0.17047500610351562, 0.17963409423828125, 0.18879318237304688, 0.1979522705078125, 0.20711135864257812, 0.21627044677734375, 0.22542953491210938, 0.234588623046875, 0.24374771118164062, 0.25290679931640625, 0.2620658874511719, 0.2712249755859375, 0.2803840637207031, 0.28954315185546875, 0.2987022399902344, 0.307861328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 9.0, 2.0, 8.0, 5.0, 7.0, 15.0, 9.0, 16.0, 21.0, 31.0, 41.0, 64.0, 97.0, 156.0, 234.0, 406.0, 499.0, 710.0, 580.0, 406.0, 231.0, 166.0, 85.0, 63.0, 54.0, 25.0, 30.0, 18.0, 18.0, 17.0, 9.0, 6.0, 5.0, 6.0, 6.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.061798095703125, -0.059916019439697266, -0.05803394317626953, -0.0561518669128418, -0.05426979064941406, -0.05238771438598633, -0.050505638122558594, -0.04862356185913086, -0.046741485595703125, -0.04485940933227539, -0.042977333068847656, -0.04109525680541992, -0.03921318054199219, -0.03733110427856445, -0.03544902801513672, -0.033566951751708984, -0.03168487548828125, -0.029802799224853516, -0.02792072296142578, -0.026038646697998047, -0.024156570434570312, -0.022274494171142578, -0.020392417907714844, -0.01851034164428711, -0.016628265380859375, -0.01474618911743164, -0.012864112854003906, -0.010982036590576172, -0.009099960327148438, -0.007217884063720703, -0.005335807800292969, -0.0034537315368652344, -0.0015716552734375, 0.0003104209899902344, 0.0021924972534179688, 0.004074573516845703, 0.0059566497802734375, 0.007838726043701172, 0.009720802307128906, 0.01160287857055664, 0.013484954833984375, 0.01536703109741211, 0.017249107360839844, 0.019131183624267578, 0.021013259887695312, 0.022895336151123047, 0.02477741241455078, 0.026659488677978516, 0.02854156494140625, 0.030423641204833984, 0.03230571746826172, 0.03418779373168945, 0.03606986999511719, 0.03795194625854492, 0.039834022521972656, 0.04171609878540039, 0.043598175048828125, 0.04548025131225586, 0.047362327575683594, 0.04924440383911133, 0.05112648010253906, 0.0530085563659668, 0.05489063262939453, 0.056772708892822266, 0.05865478515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 19.0, 60.0, 190.0, 461.0, 204.0, 44.0, 21.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.401622474193573, -0.373960018157959, -0.34629756212234497, -0.31863510608673096, -0.29097265005111694, -0.26331019401550293, -0.2356477677822113, -0.2079853117465973, -0.18032285571098328, -0.15266039967536926, -0.12499795109033585, -0.09733550250530243, -0.06967304646968842, -0.0420105904340744, -0.014348149299621582, 0.013314306735992432, 0.040976762771606445, 0.06863921880722046, 0.09630166739225388, 0.12396411597728729, 0.1516265720129013, 0.17928902804851532, 0.20695146918296814, 0.23461392521858215, 0.26227638125419617, 0.2899388372898102, 0.3176012933254242, 0.3452637195587158, 0.37292617559432983, 0.40058863162994385, 0.42825108766555786, 0.4559135437011719, 0.48357605934143066, 0.5112385153770447, 0.5389009714126587, 0.5665634274482727, 0.5942258834838867, 0.6218883395195007, 0.6495507955551147, 0.677213191986084, 0.7048757076263428, 0.7325381636619568, 0.7602006196975708, 0.7878630757331848, 0.8155255317687988, 0.8431879878044128, 0.8708504438400269, 0.8985128402709961, 0.9261752963066101, 0.9538377523422241, 0.9815002083778381, 1.0091626644134521, 1.0368250608444214, 1.0644875764846802, 1.0921499729156494, 1.1198124885559082, 1.1474748849868774, 1.1751372814178467, 1.2027997970581055, 1.2304621934890747, 1.2581247091293335, 1.2857871055603027, 1.3134496212005615, 1.3411120176315308, 1.3687745332717896]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 3.0, 10.0, 14.0, 11.0, 9.0, 36.0, 27.0, 27.0, 35.0, 37.0, 27.0, 44.0, 48.0, 40.0, 57.0, 47.0, 57.0, 39.0, 58.0, 45.0, 43.0, 32.0, 42.0, 39.0, 35.0, 28.0, 23.0, 22.0, 17.0, 13.0, 5.0, 4.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16263657808303833, -0.15611372888088226, -0.1495908945798874, -0.14306804537773132, -0.13654519617557526, -0.1300223469734192, -0.12349951267242432, -0.11697666347026825, -0.11045382171869278, -0.10393097996711731, -0.09740813076496124, -0.09088528901338577, -0.0843624472618103, -0.07783959805965424, -0.07131675630807877, -0.0647939145565033, -0.05827106535434723, -0.05174821987748146, -0.04522537440061569, -0.03870253264904022, -0.032179687172174454, -0.025656841695308685, -0.019133999943733215, -0.012611154466867447, -0.0060883089900016785, 0.00043453555554151535, 0.006957380101084709, 0.013480223715305328, 0.020003069192171097, 0.026525914669036865, 0.033048756420612335, 0.039571601897478104, 0.04609444737434387, 0.05261729285120964, 0.05914013832807541, 0.06566298007965088, 0.07218582928180695, 0.07870867103338242, 0.08523151278495789, 0.09175436198711395, 0.09827720373868942, 0.10480004549026489, 0.11132289469242096, 0.11784573644399643, 0.1243685781955719, 0.13089142739772797, 0.13741427659988403, 0.1439371109008789, 0.15045996010303497, 0.15698280930519104, 0.1635056436061859, 0.17002849280834198, 0.17655134201049805, 0.18307417631149292, 0.189597025513649, 0.19611987471580505, 0.20264270901679993, 0.209165558218956, 0.21568839251995087, 0.22221124172210693, 0.228734090924263, 0.23525694012641907, 0.24177977442741394, 0.24830262362957, 0.2548254728317261]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 11.0, 22.0, 27.0, 40.0, 58.0, 79.0, 137.0, 262.0, 700.0, 2998.0, 61539.0, 973224.0, 7297.0, 1210.0, 427.0, 177.0, 100.0, 65.0, 36.0, 19.0, 19.0, 15.0, 13.0, 7.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 3.0], "bins": [-2.923828125, -2.851104736328125, -2.77838134765625, -2.705657958984375, -2.6329345703125, -2.560211181640625, -2.48748779296875, -2.414764404296875, -2.342041015625, -2.269317626953125, -2.19659423828125, -2.123870849609375, -2.0511474609375, -1.978424072265625, -1.90570068359375, -1.832977294921875, -1.76025390625, -1.687530517578125, -1.61480712890625, -1.542083740234375, -1.4693603515625, -1.396636962890625, -1.32391357421875, -1.251190185546875, -1.178466796875, -1.105743408203125, -1.03302001953125, -0.960296630859375, -0.8875732421875, -0.814849853515625, -0.74212646484375, -0.669403076171875, -0.5966796875, -0.523956298828125, -0.45123291015625, -0.378509521484375, -0.3057861328125, -0.233062744140625, -0.16033935546875, -0.087615966796875, -0.014892578125, 0.057830810546875, 0.13055419921875, 0.203277587890625, 0.2760009765625, 0.348724365234375, 0.42144775390625, 0.494171142578125, 0.56689453125, 0.639617919921875, 0.71234130859375, 0.785064697265625, 0.8577880859375, 0.930511474609375, 1.00323486328125, 1.075958251953125, 1.148681640625, 1.221405029296875, 1.29412841796875, 1.366851806640625, 1.4395751953125, 1.512298583984375, 1.58502197265625, 1.657745361328125, 1.73046875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 6.0, 7.0, 9.0, 20.0, 57.0, 152.0, 473.0, 167.0, 66.0, 31.0, 14.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41259765625, -0.40187835693359375, -0.3911590576171875, -0.38043975830078125, -0.369720458984375, -0.35900115966796875, -0.3482818603515625, -0.33756256103515625, -0.32684326171875, -0.31612396240234375, -0.3054046630859375, -0.29468536376953125, -0.283966064453125, -0.27324676513671875, -0.2625274658203125, -0.25180816650390625, -0.2410888671875, -0.23036956787109375, -0.2196502685546875, -0.20893096923828125, -0.198211669921875, -0.18749237060546875, -0.1767730712890625, -0.16605377197265625, -0.15533447265625, -0.14461517333984375, -0.1338958740234375, -0.12317657470703125, -0.112457275390625, -0.10173797607421875, -0.0910186767578125, -0.08029937744140625, -0.069580078125, -0.05886077880859375, -0.0481414794921875, -0.03742218017578125, -0.026702880859375, -0.01598358154296875, -0.0052642822265625, 0.00545501708984375, 0.01617431640625, 0.02689361572265625, 0.0376129150390625, 0.04833221435546875, 0.059051513671875, 0.06977081298828125, 0.0804901123046875, 0.09120941162109375, 0.1019287109375, 0.11264801025390625, 0.1233673095703125, 0.13408660888671875, 0.144805908203125, 0.15552520751953125, 0.1662445068359375, 0.17696380615234375, 0.18768310546875, 0.19840240478515625, 0.2091217041015625, 0.21984100341796875, 0.230560302734375, 0.24127960205078125, 0.2519989013671875, 0.26271820068359375, 0.2734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 9.0, 7.0, 7.0, 18.0, 14.0, 22.0, 23.0, 29.0, 48.0, 55.0, 91.0, 113.0, 157.0, 221.0, 439.0, 950.0, 3043.0, 12235.0, 68368.0, 481526.0, 409369.0, 56325.0, 10533.0, 2816.0, 940.0, 382.0, 246.0, 135.0, 114.0, 78.0, 62.0, 33.0, 26.0, 21.0, 26.0, 11.0, 11.0, 7.0, 12.0, 9.0, 8.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.29443359375, -0.2860088348388672, -0.2775840759277344, -0.26915931701660156, -0.26073455810546875, -0.25230979919433594, -0.24388504028320312, -0.2354602813720703, -0.2270355224609375, -0.2186107635498047, -0.21018600463867188, -0.20176124572753906, -0.19333648681640625, -0.18491172790527344, -0.17648696899414062, -0.1680622100830078, -0.159637451171875, -0.1512126922607422, -0.14278793334960938, -0.13436317443847656, -0.12593841552734375, -0.11751365661621094, -0.10908889770507812, -0.10066413879394531, -0.0922393798828125, -0.08381462097167969, -0.07538986206054688, -0.06696510314941406, -0.05854034423828125, -0.05011558532714844, -0.041690826416015625, -0.03326606750488281, -0.02484130859375, -0.016416549682617188, -0.007991790771484375, 0.0004329681396484375, 0.00885772705078125, 0.017282485961914062, 0.025707244873046875, 0.03413200378417969, 0.0425567626953125, 0.05098152160644531, 0.059406280517578125, 0.06783103942871094, 0.07625579833984375, 0.08468055725097656, 0.09310531616210938, 0.10153007507324219, 0.109954833984375, 0.11837959289550781, 0.12680435180664062, 0.13522911071777344, 0.14365386962890625, 0.15207862854003906, 0.16050338745117188, 0.1689281463623047, 0.1773529052734375, 0.1857776641845703, 0.19420242309570312, 0.20262718200683594, 0.21105194091796875, 0.21947669982910156, 0.22790145874023438, 0.2363262176513672, 0.2447509765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 0.0, 6.0, 6.0, 4.0, 9.0, 9.0, 8.0, 11.0, 15.0, 10.0, 12.0, 21.0, 21.0, 27.0, 23.0, 31.0, 35.0, 38.0, 30.0, 40.0, 30.0, 38.0, 35.0, 48.0, 40.0, 40.0, 32.0, 39.0, 45.0, 33.0, 24.0, 25.0, 31.0, 26.0, 17.0, 16.0, 17.0, 15.0, 15.0, 16.0, 14.0, 9.0, 6.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1639404296875, -0.158477783203125, -0.15301513671875, -0.147552490234375, -0.14208984375, -0.136627197265625, -0.13116455078125, -0.125701904296875, -0.1202392578125, -0.114776611328125, -0.10931396484375, -0.103851318359375, -0.098388671875, -0.092926025390625, -0.08746337890625, -0.082000732421875, -0.0765380859375, -0.071075439453125, -0.06561279296875, -0.060150146484375, -0.0546875, -0.049224853515625, -0.04376220703125, -0.038299560546875, -0.0328369140625, -0.027374267578125, -0.02191162109375, -0.016448974609375, -0.010986328125, -0.005523681640625, -6.103515625e-05, 0.005401611328125, 0.0108642578125, 0.016326904296875, 0.02178955078125, 0.027252197265625, 0.03271484375, 0.038177490234375, 0.04364013671875, 0.049102783203125, 0.0545654296875, 0.060028076171875, 0.06549072265625, 0.070953369140625, 0.076416015625, 0.081878662109375, 0.08734130859375, 0.092803955078125, 0.0982666015625, 0.103729248046875, 0.10919189453125, 0.114654541015625, 0.1201171875, 0.125579833984375, 0.13104248046875, 0.136505126953125, 0.1419677734375, 0.147430419921875, 0.15289306640625, 0.158355712890625, 0.163818359375, 0.169281005859375, 0.17474365234375, 0.180206298828125, 0.1856689453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 5.0, 8.0, 20.0, 17.0, 30.0, 42.0, 64.0, 103.0, 172.0, 303.0, 593.0, 1181.0, 2576.0, 6024.0, 17043.0, 59943.0, 296138.0, 512084.0, 109270.0, 27272.0, 8947.0, 3476.0, 1565.0, 728.0, 353.0, 222.0, 124.0, 81.0, 47.0, 42.0, 21.0, 18.0, 7.0, 4.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1497802734375, -0.1457538604736328, -0.14172744750976562, -0.13770103454589844, -0.13367462158203125, -0.12964820861816406, -0.12562179565429688, -0.12159538269042969, -0.1175689697265625, -0.11354255676269531, -0.10951614379882812, -0.10548973083496094, -0.10146331787109375, -0.09743690490722656, -0.09341049194335938, -0.08938407897949219, -0.085357666015625, -0.08133125305175781, -0.07730484008789062, -0.07327842712402344, -0.06925201416015625, -0.06522560119628906, -0.061199188232421875, -0.05717277526855469, -0.0531463623046875, -0.04911994934082031, -0.045093536376953125, -0.04106712341308594, -0.03704071044921875, -0.03301429748535156, -0.028987884521484375, -0.024961471557617188, -0.02093505859375, -0.016908645629882812, -0.012882232666015625, -0.008855819702148438, -0.00482940673828125, -0.0008029937744140625, 0.003223419189453125, 0.0072498321533203125, 0.0112762451171875, 0.015302658081054688, 0.019329071044921875, 0.023355484008789062, 0.02738189697265625, 0.03140830993652344, 0.035434722900390625, 0.03946113586425781, 0.043487548828125, 0.04751396179199219, 0.051540374755859375, 0.05556678771972656, 0.05959320068359375, 0.06361961364746094, 0.06764602661132812, 0.07167243957519531, 0.0756988525390625, 0.07972526550292969, 0.08375167846679688, 0.08777809143066406, 0.09180450439453125, 0.09583091735839844, 0.09985733032226562, 0.10388374328613281, 0.10791015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 1.0, 4.0, 14.0, 11.0, 21.0, 25.0, 33.0, 40.0, 92.0, 108.0, 128.0, 118.0, 105.0, 101.0, 52.0, 44.0, 24.0, 23.0, 22.0, 12.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2590160369873047e-05, -2.198200672864914e-05, -2.1373853087425232e-05, -2.0765699446201324e-05, -2.0157545804977417e-05, -1.954939216375351e-05, -1.8941238522529602e-05, -1.8333084881305695e-05, -1.7724931240081787e-05, -1.711677759885788e-05, -1.6508623957633972e-05, -1.5900470316410065e-05, -1.5292316675186157e-05, -1.468416303396225e-05, -1.4076009392738342e-05, -1.3467855751514435e-05, -1.2859702110290527e-05, -1.225154846906662e-05, -1.1643394827842712e-05, -1.1035241186618805e-05, -1.0427087545394897e-05, -9.81893390417099e-06, -9.210780262947083e-06, -8.602626621723175e-06, -7.994472980499268e-06, -7.38631933927536e-06, -6.778165698051453e-06, -6.170012056827545e-06, -5.561858415603638e-06, -4.95370477437973e-06, -4.345551133155823e-06, -3.7373974919319153e-06, -3.129243850708008e-06, -2.5210902094841003e-06, -1.912936568260193e-06, -1.3047829270362854e-06, -6.966292858123779e-07, -8.847564458847046e-08, 5.19677996635437e-07, 1.1278316378593445e-06, 1.735985279083252e-06, 2.3441389203071594e-06, 2.952292561531067e-06, 3.5604462027549744e-06, 4.168599843978882e-06, 4.776753485202789e-06, 5.384907126426697e-06, 5.993060767650604e-06, 6.601214408874512e-06, 7.209368050098419e-06, 7.817521691322327e-06, 8.425675332546234e-06, 9.033828973770142e-06, 9.641982614994049e-06, 1.0250136256217957e-05, 1.0858289897441864e-05, 1.1466443538665771e-05, 1.2074597179889679e-05, 1.2682750821113586e-05, 1.3290904462337494e-05, 1.3899058103561401e-05, 1.4507211744785309e-05, 1.5115365386009216e-05, 1.5723519027233124e-05, 1.633167266845703e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 5.0, 10.0, 6.0, 12.0, 21.0, 53.0, 65.0, 115.0, 217.0, 356.0, 713.0, 1411.0, 3333.0, 8956.0, 31279.0, 203431.0, 650754.0, 114573.0, 21265.0, 6697.0, 2694.0, 1241.0, 595.0, 280.0, 156.0, 92.0, 80.0, 42.0, 28.0, 12.0, 16.0, 8.0, 10.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1490478515625, -0.14397239685058594, -0.13889694213867188, -0.1338214874267578, -0.12874603271484375, -0.12367057800292969, -0.11859512329101562, -0.11351966857910156, -0.1084442138671875, -0.10336875915527344, -0.09829330444335938, -0.09321784973144531, -0.08814239501953125, -0.08306694030761719, -0.07799148559570312, -0.07291603088378906, -0.067840576171875, -0.06276512145996094, -0.057689666748046875, -0.05261421203613281, -0.04753875732421875, -0.04246330261230469, -0.037387847900390625, -0.03231239318847656, -0.0272369384765625, -0.022161483764648438, -0.017086029052734375, -0.012010574340820312, -0.00693511962890625, -0.0018596649169921875, 0.003215789794921875, 0.008291244506835938, 0.01336669921875, 0.018442153930664062, 0.023517608642578125, 0.028593063354492188, 0.03366851806640625, 0.03874397277832031, 0.043819427490234375, 0.04889488220214844, 0.0539703369140625, 0.05904579162597656, 0.06412124633789062, 0.06919670104980469, 0.07427215576171875, 0.07934761047363281, 0.08442306518554688, 0.08949851989746094, 0.094573974609375, 0.09964942932128906, 0.10472488403320312, 0.10980033874511719, 0.11487579345703125, 0.11995124816894531, 0.12502670288085938, 0.13010215759277344, 0.1351776123046875, 0.14025306701660156, 0.14532852172851562, 0.1504039764404297, 0.15547943115234375, 0.1605548858642578, 0.16563034057617188, 0.17070579528808594, 0.17578125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 6.0, 9.0, 14.0, 16.0, 29.0, 40.0, 40.0, 64.0, 70.0, 78.0, 111.0, 105.0, 95.0, 67.0, 65.0, 38.0, 40.0, 30.0, 19.0, 18.0, 12.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.1251363754272461, -0.12173271179199219, -0.11832904815673828, -0.11492538452148438, -0.11152172088623047, -0.10811805725097656, -0.10471439361572266, -0.10131072998046875, -0.09790706634521484, -0.09450340270996094, -0.09109973907470703, -0.08769607543945312, -0.08429241180419922, -0.08088874816894531, -0.0774850845336914, -0.0740814208984375, -0.0706777572631836, -0.06727409362792969, -0.06387042999267578, -0.060466766357421875, -0.05706310272216797, -0.05365943908691406, -0.050255775451660156, -0.04685211181640625, -0.043448448181152344, -0.04004478454589844, -0.03664112091064453, -0.033237457275390625, -0.02983379364013672, -0.026430130004882812, -0.023026466369628906, -0.019622802734375, -0.016219139099121094, -0.012815475463867188, -0.009411811828613281, -0.006008148193359375, -0.0026044845581054688, 0.0007991790771484375, 0.004202842712402344, 0.00760650634765625, 0.011010169982910156, 0.014413833618164062, 0.01781749725341797, 0.021221160888671875, 0.02462482452392578, 0.028028488159179688, 0.031432151794433594, 0.0348358154296875, 0.038239479064941406, 0.04164314270019531, 0.04504680633544922, 0.048450469970703125, 0.05185413360595703, 0.05525779724121094, 0.058661460876464844, 0.06206512451171875, 0.06546878814697266, 0.06887245178222656, 0.07227611541748047, 0.07567977905273438, 0.07908344268798828, 0.08248710632324219, 0.0858907699584961, 0.08929443359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 4.0, 9.0, 25.0, 152.0, 385.0, 265.0, 108.0, 28.0, 21.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6946492195129395, -0.5722276568412781, -0.4498060643672943, -0.32738447189331055, -0.20496290922164917, -0.08254134654998779, 0.03988027572631836, 0.16230183839797974, 0.2847234010696411, 0.4071449637413025, 0.5295665264129639, 0.65198814868927, 0.7744097113609314, 0.8968312740325928, 1.019252896308899, 1.141674518585205, 1.2640960216522217, 1.3865176439285278, 1.5089391469955444, 1.6313607692718506, 1.7537822723388672, 1.8762038946151733, 1.9986255168914795, 2.121047019958496, 2.243468761444092, 2.3658902645111084, 2.488312005996704, 2.6107335090637207, 2.7331550121307373, 2.855576515197754, 2.9779982566833496, 3.100419759750366, 3.222841262817383, 3.3452627658843994, 3.467684507369995, 3.5901060104370117, 3.7125275135040283, 3.834949016571045, 3.9573707580566406, 4.079792499542236, 4.202213764190674, 4.3246355056762695, 4.447056770324707, 4.569478511810303, 4.691900253295898, 4.814321517944336, 4.936743259429932, 5.059165000915527, 5.181586265563965, 5.3040080070495605, 5.426429271697998, 5.548851013183594, 5.6712727546691895, 5.793694019317627, 5.916115760803223, 6.038537502288818, 6.160959243774414, 6.28338098526001, 6.405802249908447, 6.528223991394043, 6.650645732879639, 6.773066997528076, 6.895488739013672, 7.017910480499268, 7.140331745147705]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 15.0, 21.0, 23.0, 39.0, 59.0, 60.0, 60.0, 83.0, 71.0, 94.0, 93.0, 76.0, 75.0, 59.0, 41.0, 37.0, 32.0, 21.0, 10.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9646556377410889, -1.8933935165405273, -1.8221312761306763, -1.7508691549301147, -1.6796069145202637, -1.6083447933197021, -1.5370826721191406, -1.465820550918579, -1.394558310508728, -1.3232961893081665, -1.2520339488983154, -1.180771827697754, -1.1095097064971924, -1.0382474660873413, -0.9669853448867798, -0.8957231640815735, -0.8244609832763672, -0.7531988024711609, -0.6819366216659546, -0.6106745004653931, -0.5394123196601868, -0.46815013885498047, -0.39688798785209656, -0.32562583684921265, -0.25436365604400635, -0.18310149013996124, -0.11183932423591614, -0.04057715833187103, 0.030685007572174072, 0.10194718837738037, 0.17320933938026428, 0.2444714903831482, 0.3157339096069336, 0.3869960904121399, 0.4582582414150238, 0.5295203924179077, 0.600782573223114, 0.6720447540283203, 0.7433068752288818, 0.8145690560340881, 0.8858312368392944, 0.9570934176445007, 1.028355598449707, 1.0996177196502686, 1.17087984085083, 1.2421420812606812, 1.3134042024612427, 1.3846664428710938, 1.4559285640716553, 1.5271906852722168, 1.5984529256820679, 1.6697150468826294, 1.7409772872924805, 1.812239408493042, 1.8835015296936035, 1.954763650894165, 2.0260257720947266, 2.097287893295288, 2.1685500144958496, 2.2398123741149902, 2.3110744953155518, 2.3823366165161133, 2.453598737716675, 2.5248608589172363, 2.596123218536377]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 9.0, 16.0, 37.0, 43.0, 93.0, 208.0, 1290.0, 3908218.0, 282865.0, 1178.0, 154.0, 57.0, 42.0, 20.0, 13.0, 9.0, 2.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.603515625, -1.5576171875, -1.51171875, -1.4658203125, -1.419921875, -1.3740234375, -1.328125, -1.2822265625, -1.236328125, -1.1904296875, -1.14453125, -1.0986328125, -1.052734375, -1.0068359375, -0.9609375, -0.9150390625, -0.869140625, -0.8232421875, -0.77734375, -0.7314453125, -0.685546875, -0.6396484375, -0.59375, -0.5478515625, -0.501953125, -0.4560546875, -0.41015625, -0.3642578125, -0.318359375, -0.2724609375, -0.2265625, -0.1806640625, -0.134765625, -0.0888671875, -0.04296875, 0.0029296875, 0.048828125, 0.0947265625, 0.140625, 0.1865234375, 0.232421875, 0.2783203125, 0.32421875, 0.3701171875, 0.416015625, 0.4619140625, 0.5078125, 0.5537109375, 0.599609375, 0.6455078125, 0.69140625, 0.7373046875, 0.783203125, 0.8291015625, 0.875, 0.9208984375, 0.966796875, 1.0126953125, 1.05859375, 1.1044921875, 1.150390625, 1.1962890625, 1.2421875, 1.2880859375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 28.0, 62.0, 154.0, 367.0, 227.0, 83.0, 37.0, 25.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37744903564453125, -0.3676910400390625, -0.35793304443359375, -0.348175048828125, -0.33841705322265625, -0.3286590576171875, -0.31890106201171875, -0.30914306640625, -0.29938507080078125, -0.2896270751953125, -0.27986907958984375, -0.270111083984375, -0.26035308837890625, -0.2505950927734375, -0.24083709716796875, -0.2310791015625, -0.22132110595703125, -0.2115631103515625, -0.20180511474609375, -0.192047119140625, -0.18228912353515625, -0.1725311279296875, -0.16277313232421875, -0.15301513671875, -0.14325714111328125, -0.1334991455078125, -0.12374114990234375, -0.113983154296875, -0.10422515869140625, -0.0944671630859375, -0.08470916748046875, -0.074951171875, -0.06519317626953125, -0.0554351806640625, -0.04567718505859375, -0.035919189453125, -0.02616119384765625, -0.0164031982421875, -0.00664520263671875, 0.00311279296875, 0.01287078857421875, 0.0226287841796875, 0.03238677978515625, 0.042144775390625, 0.05190277099609375, 0.0616607666015625, 0.07141876220703125, 0.0811767578125, 0.09093475341796875, 0.1006927490234375, 0.11045074462890625, 0.120208740234375, 0.12996673583984375, 0.1397247314453125, 0.14948272705078125, 0.15924072265625, 0.16899871826171875, 0.1787567138671875, 0.18851470947265625, 0.198272705078125, 0.20803070068359375, 0.2177886962890625, 0.22754669189453125, 0.2373046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 22.0, 23.0, 41.0, 80.0, 136.0, 274.0, 666.0, 2112.0, 9115.0, 61824.0, 1378747.0, 2641926.0, 83981.0, 11277.0, 2539.0, 841.0, 296.0, 135.0, 62.0, 40.0, 27.0, 18.0, 18.0, 12.0, 10.0, 12.0, 5.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24560546875, -0.23495864868164062, -0.22431182861328125, -0.21366500854492188, -0.2030181884765625, -0.19237136840820312, -0.18172454833984375, -0.17107772827148438, -0.160430908203125, -0.14978408813476562, -0.13913726806640625, -0.12849044799804688, -0.1178436279296875, -0.10719680786132812, -0.09654998779296875, -0.08590316772460938, -0.07525634765625, -0.06460952758789062, -0.05396270751953125, -0.043315887451171875, -0.0326690673828125, -0.022022247314453125, -0.01137542724609375, -0.000728607177734375, 0.009918212890625, 0.020565032958984375, 0.03121185302734375, 0.041858673095703125, 0.0525054931640625, 0.06315231323242188, 0.07379913330078125, 0.08444595336914062, 0.0950927734375, 0.10573959350585938, 0.11638641357421875, 0.12703323364257812, 0.1376800537109375, 0.14832687377929688, 0.15897369384765625, 0.16962051391601562, 0.180267333984375, 0.19091415405273438, 0.20156097412109375, 0.21220779418945312, 0.2228546142578125, 0.23350143432617188, 0.24414825439453125, 0.2547950744628906, 0.26544189453125, 0.2760887145996094, 0.28673553466796875, 0.2973823547363281, 0.3080291748046875, 0.3186759948730469, 0.32932281494140625, 0.3399696350097656, 0.350616455078125, 0.3612632751464844, 0.37191009521484375, 0.3825569152832031, 0.3932037353515625, 0.4038505554199219, 0.41449737548828125, 0.4251441955566406, 0.435791015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 2.0, 8.0, 13.0, 20.0, 31.0, 35.0, 83.0, 114.0, 168.0, 299.0, 514.0, 1014.0, 646.0, 376.0, 204.0, 154.0, 100.0, 89.0, 36.0, 41.0, 17.0, 20.0, 18.0, 16.0, 8.0, 8.0, 10.0, 6.0, 4.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11370849609375, -0.10986804962158203, -0.10602760314941406, -0.1021871566772461, -0.09834671020507812, -0.09450626373291016, -0.09066581726074219, -0.08682537078857422, -0.08298492431640625, -0.07914447784423828, -0.07530403137207031, -0.07146358489990234, -0.06762313842773438, -0.0637826919555664, -0.05994224548339844, -0.05610179901123047, -0.0522613525390625, -0.04842090606689453, -0.04458045959472656, -0.040740013122558594, -0.036899566650390625, -0.033059120178222656, -0.029218673706054688, -0.02537822723388672, -0.02153778076171875, -0.01769733428955078, -0.013856887817382812, -0.010016441345214844, -0.006175994873046875, -0.0023355484008789062, 0.0015048980712890625, 0.005345344543457031, 0.009185791015625, 0.013026237487792969, 0.016866683959960938, 0.020707130432128906, 0.024547576904296875, 0.028388023376464844, 0.03222846984863281, 0.03606891632080078, 0.03990936279296875, 0.04374980926513672, 0.04759025573730469, 0.051430702209472656, 0.055271148681640625, 0.059111595153808594, 0.06295204162597656, 0.06679248809814453, 0.0706329345703125, 0.07447338104248047, 0.07831382751464844, 0.0821542739868164, 0.08599472045898438, 0.08983516693115234, 0.09367561340332031, 0.09751605987548828, 0.10135650634765625, 0.10519695281982422, 0.10903739929199219, 0.11287784576416016, 0.11671829223632812, 0.1205587387084961, 0.12439918518066406, 0.12823963165283203, 0.132080078125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 685.0, 327.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.852409362792969, -11.604998588562012, -11.357587814331055, -11.110177040100098, -10.86276626586914, -10.615355491638184, -10.367944717407227, -10.12053394317627, -9.873123168945312, -9.625712394714355, -9.378301620483398, -9.130890846252441, -8.883480072021484, -8.636069297790527, -8.38865852355957, -8.141247749328613, -7.893836975097656, -7.646426200866699, -7.399015426635742, -7.151604652404785, -6.904193878173828, -6.656783103942871, -6.409372329711914, -6.161961555480957, -5.91455078125, -5.667140007019043, -5.419729232788086, -5.172318458557129, -4.924907684326172, -4.677496910095215, -4.430086135864258, -4.182675361633301, -3.935265064239502, -3.687854290008545, -3.440443515777588, -3.193032741546631, -2.945621967315674, -2.698211193084717, -2.4508004188537598, -2.2033896446228027, -1.9559788703918457, -1.7085680961608887, -1.4611573219299316, -1.2137465476989746, -0.9663357734680176, -0.7189249992370605, -0.4715142250061035, -0.22410345077514648, 0.023307323455810547, 0.2707180976867676, 0.5181288719177246, 0.7655396461486816, 1.0129504203796387, 1.2603611946105957, 1.5077719688415527, 1.7551827430725098, 2.002593517303467, 2.250004291534424, 2.497415065765381, 2.744825839996338, 2.992236614227295, 3.239647388458252, 3.487058162689209, 3.734468936920166, 3.981879711151123]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 9.0, 9.0, 4.0, 9.0, 9.0, 11.0, 16.0, 20.0, 23.0, 34.0, 20.0, 23.0, 41.0, 33.0, 23.0, 36.0, 49.0, 37.0, 48.0, 50.0, 32.0, 46.0, 56.0, 47.0, 40.0, 30.0, 36.0, 26.0, 34.0, 34.0, 27.0, 19.0, 12.0, 12.0, 8.0, 14.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47381067276000977, -0.4591594636440277, -0.44450825452804565, -0.4298570454120636, -0.41520583629608154, -0.4005545973777771, -0.38590338826179504, -0.371252179145813, -0.35660097002983093, -0.3419497609138489, -0.3272985517978668, -0.31264734268188477, -0.2979961037635803, -0.28334492444992065, -0.2686936855316162, -0.25404247641563416, -0.2393912672996521, -0.22474005818367004, -0.210088849067688, -0.19543762505054474, -0.18078641593456268, -0.16613520681858063, -0.15148398280143738, -0.13683277368545532, -0.12218156456947327, -0.10753035545349121, -0.09287913888692856, -0.0782279223203659, -0.06357671320438385, -0.048925504088401794, -0.03427428752183914, -0.01962307095527649, -0.004971861839294434, 0.00967935100197792, 0.024330563843250275, 0.03898177668452263, 0.05363298952579498, 0.06828419864177704, 0.08293541520833969, 0.09758663177490234, 0.1122378408908844, 0.12688905000686646, 0.1415402591228485, 0.15619148313999176, 0.17084269225597382, 0.18549390137195587, 0.20014512538909912, 0.21479633450508118, 0.22944754362106323, 0.2440987527370453, 0.25874996185302734, 0.2734011709690094, 0.28805238008499146, 0.3027036190032959, 0.31735482811927795, 0.33200603723526, 0.34665724635124207, 0.3613084554672241, 0.3759596645832062, 0.39061087369918823, 0.4052621126174927, 0.41991329193115234, 0.4345645308494568, 0.44921573996543884, 0.4638669490814209]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 12.0, 9.0, 6.0, 14.0, 18.0, 18.0, 34.0, 42.0, 55.0, 90.0, 175.0, 285.0, 748.0, 2233.0, 12194.0, 187215.0, 802875.0, 35511.0, 4719.0, 1178.0, 476.0, 218.0, 125.0, 72.0, 60.0, 50.0, 29.0, 24.0, 14.0, 12.0, 9.0, 9.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.48193359375, -0.4669837951660156, -0.45203399658203125, -0.4370841979980469, -0.4221343994140625, -0.4071846008300781, -0.39223480224609375, -0.3772850036621094, -0.362335205078125, -0.3473854064941406, -0.33243560791015625, -0.3174858093261719, -0.3025360107421875, -0.2875862121582031, -0.27263641357421875, -0.2576866149902344, -0.24273681640625, -0.22778701782226562, -0.21283721923828125, -0.19788742065429688, -0.1829376220703125, -0.16798782348632812, -0.15303802490234375, -0.13808822631835938, -0.123138427734375, -0.10818862915039062, -0.09323883056640625, -0.07828903198242188, -0.0633392333984375, -0.048389434814453125, -0.03343963623046875, -0.018489837646484375, -0.0035400390625, 0.011409759521484375, 0.02635955810546875, 0.041309356689453125, 0.0562591552734375, 0.07120895385742188, 0.08615875244140625, 0.10110855102539062, 0.116058349609375, 0.13100814819335938, 0.14595794677734375, 0.16090774536132812, 0.1758575439453125, 0.19080734252929688, 0.20575714111328125, 0.22070693969726562, 0.23565673828125, 0.2506065368652344, 0.26555633544921875, 0.2805061340332031, 0.2954559326171875, 0.3104057312011719, 0.32535552978515625, 0.3403053283691406, 0.355255126953125, 0.3702049255371094, 0.38515472412109375, 0.4001045227050781, 0.4150543212890625, 0.4300041198730469, 0.44495391845703125, 0.4599037170410156, 0.474853515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 9.0, 23.0, 53.0, 117.0, 303.0, 280.0, 112.0, 50.0, 35.0, 13.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.36942291259765625, -0.3596954345703125, -0.34996795654296875, -0.340240478515625, -0.33051300048828125, -0.3207855224609375, -0.31105804443359375, -0.30133056640625, -0.29160308837890625, -0.2818756103515625, -0.27214813232421875, -0.262420654296875, -0.25269317626953125, -0.2429656982421875, -0.23323822021484375, -0.2235107421875, -0.21378326416015625, -0.2040557861328125, -0.19432830810546875, -0.184600830078125, -0.17487335205078125, -0.1651458740234375, -0.15541839599609375, -0.14569091796875, -0.13596343994140625, -0.1262359619140625, -0.11650848388671875, -0.106781005859375, -0.09705352783203125, -0.0873260498046875, -0.07759857177734375, -0.06787109375, -0.05814361572265625, -0.0484161376953125, -0.03868865966796875, -0.028961181640625, -0.01923370361328125, -0.0095062255859375, 0.00022125244140625, 0.00994873046875, 0.01967620849609375, 0.0294036865234375, 0.03913116455078125, 0.048858642578125, 0.05858612060546875, 0.0683135986328125, 0.07804107666015625, 0.0877685546875, 0.09749603271484375, 0.1072235107421875, 0.11695098876953125, 0.126678466796875, 0.13640594482421875, 0.1461334228515625, 0.15586090087890625, 0.16558837890625, 0.17531585693359375, 0.1850433349609375, 0.19477081298828125, 0.204498291015625, 0.21422576904296875, 0.2239532470703125, 0.23368072509765625, 0.243408203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 3.0, 6.0, 6.0, 15.0, 9.0, 14.0, 17.0, 21.0, 18.0, 23.0, 22.0, 22.0, 39.0, 47.0, 57.0, 89.0, 223.0, 1198.0, 73768.0, 962900.0, 8982.0, 488.0, 156.0, 60.0, 49.0, 47.0, 31.0, 31.0, 32.0, 28.0, 19.0, 21.0, 18.0, 20.0, 18.0, 11.0, 9.0, 8.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9269332885742188, -0.8963470458984375, -0.8657608032226562, -0.835174560546875, -0.8045883178710938, -0.7740020751953125, -0.7434158325195312, -0.71282958984375, -0.6822433471679688, -0.6516571044921875, -0.6210708618164062, -0.590484619140625, -0.5598983764648438, -0.5293121337890625, -0.49872589111328125, -0.4681396484375, -0.43755340576171875, -0.4069671630859375, -0.37638092041015625, -0.345794677734375, -0.31520843505859375, -0.2846221923828125, -0.25403594970703125, -0.22344970703125, -0.19286346435546875, -0.1622772216796875, -0.13169097900390625, -0.101104736328125, -0.07051849365234375, -0.0399322509765625, -0.00934600830078125, 0.021240234375, 0.05182647705078125, 0.0824127197265625, 0.11299896240234375, 0.143585205078125, 0.17417144775390625, 0.2047576904296875, 0.23534393310546875, 0.26593017578125, 0.29651641845703125, 0.3271026611328125, 0.35768890380859375, 0.388275146484375, 0.41886138916015625, 0.4494476318359375, 0.48003387451171875, 0.5106201171875, 0.5412063598632812, 0.5717926025390625, 0.6023788452148438, 0.632965087890625, 0.6635513305664062, 0.6941375732421875, 0.7247238159179688, 0.75531005859375, 0.7858963012695312, 0.8164825439453125, 0.8470687866210938, 0.877655029296875, 0.9082412719726562, 0.9388275146484375, 0.9694137573242188, 1.0]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 9.0, 4.0, 9.0, 12.0, 14.0, 21.0, 15.0, 20.0, 24.0, 20.0, 26.0, 29.0, 41.0, 45.0, 44.0, 33.0, 42.0, 45.0, 32.0, 46.0, 43.0, 43.0, 38.0, 40.0, 43.0, 25.0, 31.0, 28.0, 29.0, 23.0, 20.0, 19.0, 15.0, 22.0, 9.0, 8.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17333984375, -0.16781234741210938, -0.16228485107421875, -0.15675735473632812, -0.1512298583984375, -0.14570236206054688, -0.14017486572265625, -0.13464736938476562, -0.129119873046875, -0.12359237670898438, -0.11806488037109375, -0.11253738403320312, -0.1070098876953125, -0.10148239135742188, -0.09595489501953125, -0.09042739868164062, -0.08489990234375, -0.07937240600585938, -0.07384490966796875, -0.06831741333007812, -0.0627899169921875, -0.057262420654296875, -0.05173492431640625, -0.046207427978515625, -0.040679931640625, -0.035152435302734375, -0.02962493896484375, -0.024097442626953125, -0.0185699462890625, -0.013042449951171875, -0.00751495361328125, -0.001987457275390625, 0.0035400390625, 0.009067535400390625, 0.01459503173828125, 0.020122528076171875, 0.0256500244140625, 0.031177520751953125, 0.03670501708984375, 0.042232513427734375, 0.047760009765625, 0.053287506103515625, 0.05881500244140625, 0.06434249877929688, 0.0698699951171875, 0.07539749145507812, 0.08092498779296875, 0.08645248413085938, 0.09197998046875, 0.09750747680664062, 0.10303497314453125, 0.10856246948242188, 0.1140899658203125, 0.11961746215820312, 0.12514495849609375, 0.13067245483398438, 0.136199951171875, 0.14172744750976562, 0.14725494384765625, 0.15278244018554688, 0.1583099365234375, 0.16383743286132812, 0.16936492919921875, 0.17489242553710938, 0.180419921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 5.0, 14.0, 10.0, 27.0, 36.0, 53.0, 113.0, 212.0, 580.0, 1927.0, 8049.0, 52256.0, 606520.0, 340007.0, 30970.0, 5515.0, 1352.0, 429.0, 205.0, 85.0, 51.0, 39.0, 18.0, 21.0, 9.0, 15.0, 6.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1829833984375, -0.17815208435058594, -0.17332077026367188, -0.1684894561767578, -0.16365814208984375, -0.1588268280029297, -0.15399551391601562, -0.14916419982910156, -0.1443328857421875, -0.13950157165527344, -0.13467025756835938, -0.1298389434814453, -0.12500762939453125, -0.12017631530761719, -0.11534500122070312, -0.11051368713378906, -0.105682373046875, -0.10085105895996094, -0.09601974487304688, -0.09118843078613281, -0.08635711669921875, -0.08152580261230469, -0.07669448852539062, -0.07186317443847656, -0.0670318603515625, -0.06220054626464844, -0.057369232177734375, -0.05253791809082031, -0.04770660400390625, -0.04287528991699219, -0.038043975830078125, -0.03321266174316406, -0.02838134765625, -0.023550033569335938, -0.018718719482421875, -0.013887405395507812, -0.00905609130859375, -0.0042247772216796875, 0.000606536865234375, 0.0054378509521484375, 0.0102691650390625, 0.015100479125976562, 0.019931793212890625, 0.024763107299804688, 0.02959442138671875, 0.03442573547363281, 0.039257049560546875, 0.04408836364746094, 0.048919677734375, 0.05375099182128906, 0.058582305908203125, 0.06341361999511719, 0.06824493408203125, 0.07307624816894531, 0.07790756225585938, 0.08273887634277344, 0.0875701904296875, 0.09240150451660156, 0.09723281860351562, 0.10206413269042969, 0.10689544677734375, 0.11172676086425781, 0.11655807495117188, 0.12138938903808594, 0.126220703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 7.0, 5.0, 8.0, 9.0, 8.0, 18.0, 14.0, 20.0, 22.0, 40.0, 31.0, 58.0, 46.0, 69.0, 90.0, 75.0, 71.0, 62.0, 59.0, 48.0, 43.0, 25.0, 24.0, 29.0, 18.0, 16.0, 11.0, 21.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.2040138244628906e-05, -1.1661089956760406e-05, -1.1282041668891907e-05, -1.0902993381023407e-05, -1.0523945093154907e-05, -1.0144896805286407e-05, -9.765848517417908e-06, -9.386800229549408e-06, -9.007751941680908e-06, -8.628703653812408e-06, -8.249655365943909e-06, -7.870607078075409e-06, -7.491558790206909e-06, -7.1125105023384094e-06, -6.73346221446991e-06, -6.35441392660141e-06, -5.97536563873291e-06, -5.59631735086441e-06, -5.217269062995911e-06, -4.838220775127411e-06, -4.459172487258911e-06, -4.080124199390411e-06, -3.7010759115219116e-06, -3.322027623653412e-06, -2.942979335784912e-06, -2.5639310479164124e-06, -2.1848827600479126e-06, -1.8058344721794128e-06, -1.426786184310913e-06, -1.0477378964424133e-06, -6.686896085739136e-07, -2.896413207054138e-07, 8.940696716308594e-08, 4.684552550315857e-07, 8.475035429000854e-07, 1.2265518307685852e-06, 1.605600118637085e-06, 1.9846484065055847e-06, 2.3636966943740845e-06, 2.7427449822425842e-06, 3.121793270111084e-06, 3.5008415579795837e-06, 3.8798898458480835e-06, 4.258938133716583e-06, 4.637986421585083e-06, 5.017034709453583e-06, 5.3960829973220825e-06, 5.775131285190582e-06, 6.154179573059082e-06, 6.533227860927582e-06, 6.9122761487960815e-06, 7.291324436664581e-06, 7.670372724533081e-06, 8.04942101240158e-06, 8.42846930027008e-06, 8.80751758813858e-06, 9.18656587600708e-06, 9.56561416387558e-06, 9.94466245174408e-06, 1.032371073961258e-05, 1.0702759027481079e-05, 1.1081807315349579e-05, 1.1460855603218079e-05, 1.1839903891086578e-05, 1.2218952178955078e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 3.0, 6.0, 9.0, 20.0, 15.0, 26.0, 25.0, 28.0, 53.0, 47.0, 108.0, 286.0, 2106.0, 79487.0, 948444.0, 16503.0, 863.0, 181.0, 89.0, 61.0, 43.0, 23.0, 26.0, 16.0, 12.0, 16.0, 8.0, 6.0, 6.0, 5.0, 4.0, 5.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.26859283447265625, -0.2591094970703125, -0.24962615966796875, -0.240142822265625, -0.23065948486328125, -0.2211761474609375, -0.21169281005859375, -0.20220947265625, -0.19272613525390625, -0.1832427978515625, -0.17375946044921875, -0.164276123046875, -0.15479278564453125, -0.1453094482421875, -0.13582611083984375, -0.1263427734375, -0.11685943603515625, -0.1073760986328125, -0.09789276123046875, -0.088409423828125, -0.07892608642578125, -0.0694427490234375, -0.05995941162109375, -0.05047607421875, -0.04099273681640625, -0.0315093994140625, -0.02202606201171875, -0.012542724609375, -0.00305938720703125, 0.0064239501953125, 0.01590728759765625, 0.025390625, 0.03487396240234375, 0.0443572998046875, 0.05384063720703125, 0.063323974609375, 0.07280731201171875, 0.0822906494140625, 0.09177398681640625, 0.10125732421875, 0.11074066162109375, 0.1202239990234375, 0.12970733642578125, 0.139190673828125, 0.14867401123046875, 0.1581573486328125, 0.16764068603515625, 0.1771240234375, 0.18660736083984375, 0.1960906982421875, 0.20557403564453125, 0.215057373046875, 0.22454071044921875, 0.2340240478515625, 0.24350738525390625, 0.25299072265625, 0.26247406005859375, 0.2719573974609375, 0.28144073486328125, 0.290924072265625, 0.30040740966796875, 0.3098907470703125, 0.31937408447265625, 0.328857421875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 15.0, 19.0, 19.0, 22.0, 34.0, 31.0, 37.0, 42.0, 57.0, 64.0, 76.0, 76.0, 79.0, 74.0, 55.0, 42.0, 46.0, 45.0, 24.0, 24.0, 20.0, 13.0, 11.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046875, -0.045241355895996094, -0.04360771179199219, -0.04197406768798828, -0.040340423583984375, -0.03870677947998047, -0.03707313537597656, -0.035439491271972656, -0.03380584716796875, -0.032172203063964844, -0.030538558959960938, -0.02890491485595703, -0.027271270751953125, -0.02563762664794922, -0.024003982543945312, -0.022370338439941406, -0.0207366943359375, -0.019103050231933594, -0.017469406127929688, -0.01583576202392578, -0.014202117919921875, -0.012568473815917969, -0.010934829711914062, -0.009301185607910156, -0.00766754150390625, -0.006033897399902344, -0.0044002532958984375, -0.0027666091918945312, -0.001132965087890625, 0.0005006790161132812, 0.0021343231201171875, 0.0037679672241210938, 0.005401611328125, 0.007035255432128906, 0.008668899536132812, 0.010302543640136719, 0.011936187744140625, 0.013569831848144531, 0.015203475952148438, 0.016837120056152344, 0.01847076416015625, 0.020104408264160156, 0.021738052368164062, 0.02337169647216797, 0.025005340576171875, 0.02663898468017578, 0.028272628784179688, 0.029906272888183594, 0.0315399169921875, 0.033173561096191406, 0.03480720520019531, 0.03644084930419922, 0.038074493408203125, 0.03970813751220703, 0.04134178161621094, 0.042975425720214844, 0.04460906982421875, 0.046242713928222656, 0.04787635803222656, 0.04951000213623047, 0.051143646240234375, 0.05277729034423828, 0.05441093444824219, 0.056044578552246094, 0.05767822265625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 26.0, 573.0, 396.0, 20.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0077080726623535, -2.8395791053771973, -2.67145037651062, -2.503321409225464, -2.3351926803588867, -2.1670637130737305, -1.9989348649978638, -1.830806016921997, -1.6626771688461304, -1.4945483207702637, -1.326419472694397, -1.1582906246185303, -0.9901617169380188, -0.8220328688621521, -0.6539039611816406, -0.4857751131057739, -0.3176462650299072, -0.14951740205287933, 0.01861146092414856, 0.18674033880233765, 0.35486918687820435, 0.522998034954071, 0.6911269426345825, 0.8592557907104492, 1.027384638786316, 1.1955134868621826, 1.3636423349380493, 1.531771183013916, 1.6999001502990723, 1.8680288791656494, 2.0361578464508057, 2.204286575317383, 2.372415542602539, 2.5405445098876953, 2.7086732387542725, 2.8768022060394287, 3.044930934906006, 3.213059902191162, 3.3811888694763184, 3.5493175983428955, 3.7174463272094727, 3.885575294494629, 4.053704261779785, 4.221832752227783, 4.3899617195129395, 4.558090686798096, 4.726219654083252, 4.89434814453125, 5.062477111816406, 5.2306060791015625, 5.398735046386719, 5.566863536834717, 5.734992504119873, 5.903121471405029, 6.0712504386901855, 6.239378929138184, 6.407508373260498, 6.575637340545654, 6.7437663078308105, 6.911894798278809, 7.080023765563965, 7.248152732849121, 7.416281700134277, 7.584410667419434, 7.752539157867432]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 11.0, 10.0, 21.0, 19.0, 22.0, 33.0, 47.0, 40.0, 47.0, 46.0, 51.0, 60.0, 73.0, 56.0, 65.0, 61.0, 62.0, 54.0, 40.0, 49.0, 21.0, 25.0, 17.0, 15.0, 13.0, 10.0, 10.0, 10.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0104056596755981, -0.977755069732666, -0.9451044797897339, -0.9124538898468018, -0.8798032999038696, -0.8471527099609375, -0.8145021200180054, -0.7818515300750732, -0.7492009401321411, -0.716550350189209, -0.6838997602462769, -0.6512491703033447, -0.6185985803604126, -0.5859479904174805, -0.5532974004745483, -0.5206468105316162, -0.4879962205886841, -0.45534563064575195, -0.4226950407028198, -0.3900444507598877, -0.35739386081695557, -0.32474327087402344, -0.2920926809310913, -0.2594420909881592, -0.22679150104522705, -0.19414091110229492, -0.1614903211593628, -0.12883973121643066, -0.09618914127349854, -0.0635385513305664, -0.030887961387634277, 0.0017626285552978516, 0.03441333770751953, 0.06706392765045166, 0.09971451759338379, 0.13236510753631592, 0.16501569747924805, 0.19766628742218018, 0.2303168773651123, 0.26296746730804443, 0.29561805725097656, 0.3282686471939087, 0.3609192371368408, 0.39356982707977295, 0.4262204170227051, 0.4588710069656372, 0.49152159690856934, 0.5241721868515015, 0.5568227767944336, 0.5894733667373657, 0.6221239566802979, 0.65477454662323, 0.6874251365661621, 0.7200757265090942, 0.7527263164520264, 0.7853769063949585, 0.8180274963378906, 0.8506780862808228, 0.8833286762237549, 0.915979266166687, 0.9486298561096191, 0.9812804460525513, 1.0139310359954834, 1.0465816259384155, 1.0792322158813477]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 10.0, 16.0, 17.0, 27.0, 54.0, 122.0, 299.0, 1191.0, 15303.0, 4149841.0, 25242.0, 1641.0, 311.0, 105.0, 57.0, 19.0, 11.0, 9.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16796875, -1.1384353637695312, -1.1089019775390625, -1.0793685913085938, -1.049835205078125, -1.0203018188476562, -0.9907684326171875, -0.9612350463867188, -0.93170166015625, -0.9021682739257812, -0.8726348876953125, -0.8431015014648438, -0.813568115234375, -0.7840347290039062, -0.7545013427734375, -0.7249679565429688, -0.6954345703125, -0.6659011840820312, -0.6363677978515625, -0.6068344116210938, -0.577301025390625, -0.5477676391601562, -0.5182342529296875, -0.48870086669921875, -0.45916748046875, -0.42963409423828125, -0.4001007080078125, -0.37056732177734375, -0.341033935546875, -0.31150054931640625, -0.2819671630859375, -0.25243377685546875, -0.222900390625, -0.19336700439453125, -0.1638336181640625, -0.13430023193359375, -0.104766845703125, -0.07523345947265625, -0.0457000732421875, -0.01616668701171875, 0.01336669921875, 0.04290008544921875, 0.0724334716796875, 0.10196685791015625, 0.131500244140625, 0.16103363037109375, 0.1905670166015625, 0.22010040283203125, 0.2496337890625, 0.27916717529296875, 0.3087005615234375, 0.33823394775390625, 0.367767333984375, 0.39730072021484375, 0.4268341064453125, 0.45636749267578125, 0.48590087890625, 0.5154342651367188, 0.5449676513671875, 0.5745010375976562, 0.604034423828125, 0.6335678100585938, 0.6631011962890625, 0.6926345825195312, 0.72216796875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 6.0, 16.0, 53.0, 96.0, 267.0, 306.0, 150.0, 67.0, 25.0, 11.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36083984375, -0.3513832092285156, -0.34192657470703125, -0.3324699401855469, -0.3230133056640625, -0.3135566711425781, -0.30410003662109375, -0.2946434020996094, -0.285186767578125, -0.2757301330566406, -0.26627349853515625, -0.2568168640136719, -0.2473602294921875, -0.23790359497070312, -0.22844696044921875, -0.21899032592773438, -0.20953369140625, -0.20007705688476562, -0.19062042236328125, -0.18116378784179688, -0.1717071533203125, -0.16225051879882812, -0.15279388427734375, -0.14333724975585938, -0.133880615234375, -0.12442398071289062, -0.11496734619140625, -0.10551071166992188, -0.0960540771484375, -0.08659744262695312, -0.07714080810546875, -0.06768417358398438, -0.0582275390625, -0.048770904541015625, -0.03931427001953125, -0.029857635498046875, -0.0204010009765625, -0.010944366455078125, -0.00148773193359375, 0.007968902587890625, 0.017425537109375, 0.026882171630859375, 0.03633880615234375, 0.045795440673828125, 0.0552520751953125, 0.06470870971679688, 0.07416534423828125, 0.08362197875976562, 0.09307861328125, 0.10253524780273438, 0.11199188232421875, 0.12144851684570312, 0.1309051513671875, 0.14036178588867188, 0.14981842041015625, 0.15927505493164062, 0.168731689453125, 0.17818832397460938, 0.18764495849609375, 0.19710159301757812, 0.2065582275390625, 0.21601486206054688, 0.22547149658203125, 0.23492813110351562, 0.244384765625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 16.0, 22.0, 36.0, 86.0, 259.0, 730.0, 5430.0, 728800.0, 3445849.0, 11482.0, 1040.0, 300.0, 127.0, 53.0, 24.0, 11.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7396011352539062, -0.7150421142578125, -0.6904830932617188, -0.665924072265625, -0.6413650512695312, -0.6168060302734375, -0.5922470092773438, -0.56768798828125, -0.5431289672851562, -0.5185699462890625, -0.49401092529296875, -0.469451904296875, -0.44489288330078125, -0.4203338623046875, -0.39577484130859375, -0.3712158203125, -0.34665679931640625, -0.3220977783203125, -0.29753875732421875, -0.272979736328125, -0.24842071533203125, -0.2238616943359375, -0.19930267333984375, -0.17474365234375, -0.15018463134765625, -0.1256256103515625, -0.10106658935546875, -0.076507568359375, -0.05194854736328125, -0.0273895263671875, -0.00283050537109375, 0.021728515625, 0.04628753662109375, 0.0708465576171875, 0.09540557861328125, 0.119964599609375, 0.14452362060546875, 0.1690826416015625, 0.19364166259765625, 0.21820068359375, 0.24275970458984375, 0.2673187255859375, 0.29187774658203125, 0.316436767578125, 0.34099578857421875, 0.3655548095703125, 0.39011383056640625, 0.4146728515625, 0.43923187255859375, 0.4637908935546875, 0.48834991455078125, 0.512908935546875, 0.5374679565429688, 0.5620269775390625, 0.5865859985351562, 0.61114501953125, 0.6357040405273438, 0.6602630615234375, 0.6848220825195312, 0.709381103515625, 0.7339401245117188, 0.7584991455078125, 0.7830581665039062, 0.8076171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 16.0, 27.0, 44.0, 85.0, 230.0, 583.0, 1395.0, 1073.0, 366.0, 155.0, 50.0, 29.0, 12.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.229248046875, -0.22003173828125, -0.2108154296875, -0.20159912109375, -0.1923828125, -0.18316650390625, -0.1739501953125, -0.16473388671875, -0.155517578125, -0.14630126953125, -0.1370849609375, -0.12786865234375, -0.11865234375, -0.10943603515625, -0.1002197265625, -0.09100341796875, -0.081787109375, -0.07257080078125, -0.0633544921875, -0.05413818359375, -0.044921875, -0.03570556640625, -0.0264892578125, -0.01727294921875, -0.008056640625, 0.00115966796875, 0.0103759765625, 0.01959228515625, 0.02880859375, 0.03802490234375, 0.0472412109375, 0.05645751953125, 0.065673828125, 0.07489013671875, 0.0841064453125, 0.09332275390625, 0.1025390625, 0.11175537109375, 0.1209716796875, 0.13018798828125, 0.139404296875, 0.14862060546875, 0.1578369140625, 0.16705322265625, 0.17626953125, 0.18548583984375, 0.1947021484375, 0.20391845703125, 0.213134765625, 0.22235107421875, 0.2315673828125, 0.24078369140625, 0.25, 0.25921630859375, 0.2684326171875, 0.27764892578125, 0.286865234375, 0.29608154296875, 0.3052978515625, 0.31451416015625, 0.32373046875, 0.33294677734375, 0.3421630859375, 0.35137939453125, 0.360595703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [6.0, 143.0, 856.0, 15.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4515846371650696, -0.2590559124946594, -0.06652718782424927, 0.1260015368461609, 0.31853026151657104, 0.5110589861869812, 0.7035877108573914, 0.8961164355278015, 1.0886452198028564, 1.2811739444732666, 1.4737026691436768, 1.666231393814087, 1.858760118484497, 2.0512888431549072, 2.2438175678253174, 2.4363462924957275, 2.6288750171661377, 2.821403741836548, 3.013932466506958, 3.206461191177368, 3.3989899158477783, 3.5915186405181885, 3.7840473651885986, 3.976576089859009, 4.16910457611084, 4.36163330078125, 4.55416202545166, 4.74669075012207, 4.9392194747924805, 5.131748199462891, 5.324276924133301, 5.516805648803711, 5.709334373474121, 5.901863098144531, 6.094391822814941, 6.286920547485352, 6.479449272155762, 6.671977996826172, 6.864506721496582, 7.057035446166992, 7.249564170837402, 7.4420928955078125, 7.634621620178223, 7.827150344848633, 8.019679069519043, 8.212207794189453, 8.404736518859863, 8.597265243530273, 8.789793968200684, 8.982322692871094, 9.174851417541504, 9.367380142211914, 9.559908866882324, 9.752437591552734, 9.944966316223145, 10.137495040893555, 10.330023765563965, 10.522552490234375, 10.715081214904785, 10.907609939575195, 11.100138664245605, 11.292667388916016, 11.485196113586426, 11.677724838256836, 11.870253562927246]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 3.0, 11.0, 11.0, 14.0, 12.0, 35.0, 21.0, 24.0, 37.0, 36.0, 48.0, 46.0, 45.0, 47.0, 52.0, 69.0, 78.0, 51.0, 52.0, 41.0, 51.0, 33.0, 33.0, 36.0, 27.0, 19.0, 16.0, 13.0, 9.0, 4.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4525716304779053, -0.4351097047328949, -0.4176477789878845, -0.40018582344055176, -0.3827238976955414, -0.365261971950531, -0.34780001640319824, -0.33033809065818787, -0.3128761649131775, -0.2954142391681671, -0.27795231342315674, -0.260490357875824, -0.2430284321308136, -0.22556650638580322, -0.20810456573963165, -0.19064262509346008, -0.1731806993484497, -0.15571877360343933, -0.13825683295726776, -0.12079489976167679, -0.10333296656608582, -0.08587103337049484, -0.06840910017490387, -0.0509471669793129, -0.033485233783721924, -0.01602330058813095, 0.001438632607460022, 0.018900565803050995, 0.03636249899864197, 0.05382443219423294, 0.07128636538982391, 0.08874829858541489, 0.10621023178100586, 0.12367216497659683, 0.1411340981721878, 0.15859603881835938, 0.17605796456336975, 0.19351989030838013, 0.2109818309545517, 0.22844377160072327, 0.24590569734573364, 0.263367623090744, 0.2808295488357544, 0.29829150438308716, 0.31575343012809753, 0.3332153558731079, 0.3506773114204407, 0.36813923716545105, 0.3856011629104614, 0.4030630886554718, 0.4205250144004822, 0.43798696994781494, 0.4554488956928253, 0.4729108214378357, 0.49037277698516846, 0.5078346729278564, 0.5252966284751892, 0.542758584022522, 0.56022047996521, 0.5776824355125427, 0.5951443910598755, 0.6126062870025635, 0.6300682425498962, 0.6475301384925842, 0.664992094039917]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 7.0, 16.0, 19.0, 26.0, 48.0, 56.0, 81.0, 121.0, 199.0, 336.0, 813.0, 2519.0, 12125.0, 177774.0, 810694.0, 35980.0, 5116.0, 1395.0, 528.0, 226.0, 148.0, 81.0, 59.0, 36.0, 33.0, 23.0, 21.0, 15.0, 9.0, 7.0, 7.0, 2.0, 9.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.86669921875, -0.8434295654296875, -0.820159912109375, -0.7968902587890625, -0.77362060546875, -0.7503509521484375, -0.727081298828125, -0.7038116455078125, -0.6805419921875, -0.6572723388671875, -0.634002685546875, -0.6107330322265625, -0.58746337890625, -0.5641937255859375, -0.540924072265625, -0.5176544189453125, -0.494384765625, -0.4711151123046875, -0.447845458984375, -0.4245758056640625, -0.40130615234375, -0.3780364990234375, -0.354766845703125, -0.3314971923828125, -0.3082275390625, -0.2849578857421875, -0.261688232421875, -0.2384185791015625, -0.21514892578125, -0.1918792724609375, -0.168609619140625, -0.1453399658203125, -0.1220703125, -0.0988006591796875, -0.075531005859375, -0.0522613525390625, -0.02899169921875, -0.0057220458984375, 0.017547607421875, 0.0408172607421875, 0.0640869140625, 0.0873565673828125, 0.110626220703125, 0.1338958740234375, 0.15716552734375, 0.1804351806640625, 0.203704833984375, 0.2269744873046875, 0.250244140625, 0.2735137939453125, 0.296783447265625, 0.3200531005859375, 0.34332275390625, 0.3665924072265625, 0.389862060546875, 0.4131317138671875, 0.4364013671875, 0.4596710205078125, 0.482940673828125, 0.5062103271484375, 0.52947998046875, 0.5527496337890625, 0.576019287109375, 0.5992889404296875, 0.62255859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 11.0, 34.0, 76.0, 187.0, 337.0, 215.0, 80.0, 37.0, 18.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3607444763183594, -0.35112762451171875, -0.3415107727050781, -0.3318939208984375, -0.3222770690917969, -0.31266021728515625, -0.3030433654785156, -0.293426513671875, -0.2838096618652344, -0.27419281005859375, -0.2645759582519531, -0.2549591064453125, -0.24534225463867188, -0.23572540283203125, -0.22610855102539062, -0.21649169921875, -0.20687484741210938, -0.19725799560546875, -0.18764114379882812, -0.1780242919921875, -0.16840744018554688, -0.15879058837890625, -0.14917373657226562, -0.139556884765625, -0.12994003295898438, -0.12032318115234375, -0.11070632934570312, -0.1010894775390625, -0.09147262573242188, -0.08185577392578125, -0.07223892211914062, -0.0626220703125, -0.053005218505859375, -0.04338836669921875, -0.033771514892578125, -0.0241546630859375, -0.014537811279296875, -0.00492095947265625, 0.004695892333984375, 0.014312744140625, 0.023929595947265625, 0.03354644775390625, 0.043163299560546875, 0.0527801513671875, 0.062397003173828125, 0.07201385498046875, 0.08163070678710938, 0.09124755859375, 0.10086441040039062, 0.11048126220703125, 0.12009811401367188, 0.1297149658203125, 0.13933181762695312, 0.14894866943359375, 0.15856552124023438, 0.168182373046875, 0.17779922485351562, 0.18741607666015625, 0.19703292846679688, 0.2066497802734375, 0.21626663208007812, 0.22588348388671875, 0.23550033569335938, 0.2451171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 11.0, 9.0, 4.0, 14.0, 23.0, 20.0, 26.0, 34.0, 54.0, 62.0, 94.0, 122.0, 209.0, 355.0, 732.0, 2108.0, 8145.0, 47550.0, 510915.0, 427343.0, 40000.0, 7124.0, 1957.0, 692.0, 319.0, 174.0, 121.0, 87.0, 51.0, 55.0, 37.0, 25.0, 22.0, 16.0, 11.0, 7.0, 9.0, 8.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.58349609375, -0.5672683715820312, -0.5510406494140625, -0.5348129272460938, -0.518585205078125, -0.5023574829101562, -0.4861297607421875, -0.46990203857421875, -0.45367431640625, -0.43744659423828125, -0.4212188720703125, -0.40499114990234375, -0.388763427734375, -0.37253570556640625, -0.3563079833984375, -0.34008026123046875, -0.3238525390625, -0.30762481689453125, -0.2913970947265625, -0.27516937255859375, -0.258941650390625, -0.24271392822265625, -0.2264862060546875, -0.21025848388671875, -0.19403076171875, -0.17780303955078125, -0.1615753173828125, -0.14534759521484375, -0.129119873046875, -0.11289215087890625, -0.0966644287109375, -0.08043670654296875, -0.064208984375, -0.04798126220703125, -0.0317535400390625, -0.01552581787109375, 0.000701904296875, 0.01692962646484375, 0.0331573486328125, 0.04938507080078125, 0.06561279296875, 0.08184051513671875, 0.0980682373046875, 0.11429595947265625, 0.130523681640625, 0.14675140380859375, 0.1629791259765625, 0.17920684814453125, 0.1954345703125, 0.21166229248046875, 0.2278900146484375, 0.24411773681640625, 0.260345458984375, 0.27657318115234375, 0.2928009033203125, 0.30902862548828125, 0.32525634765625, 0.34148406982421875, 0.3577117919921875, 0.37393951416015625, 0.390167236328125, 0.40639495849609375, 0.4226226806640625, 0.43885040283203125, 0.455078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 11.0, 17.0, 21.0, 27.0, 33.0, 43.0, 45.0, 54.0, 61.0, 54.0, 71.0, 64.0, 53.0, 78.0, 55.0, 71.0, 33.0, 28.0, 36.0, 24.0, 23.0, 15.0, 14.0, 15.0, 1.0, 6.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2479248046875, -0.2407073974609375, -0.233489990234375, -0.2262725830078125, -0.21905517578125, -0.2118377685546875, -0.204620361328125, -0.1974029541015625, -0.190185546875, -0.1829681396484375, -0.175750732421875, -0.1685333251953125, -0.16131591796875, -0.1540985107421875, -0.146881103515625, -0.1396636962890625, -0.1324462890625, -0.1252288818359375, -0.118011474609375, -0.1107940673828125, -0.10357666015625, -0.0963592529296875, -0.089141845703125, -0.0819244384765625, -0.07470703125, -0.0674896240234375, -0.060272216796875, -0.0530548095703125, -0.04583740234375, -0.0386199951171875, -0.031402587890625, -0.0241851806640625, -0.0169677734375, -0.0097503662109375, -0.002532958984375, 0.0046844482421875, 0.01190185546875, 0.0191192626953125, 0.026336669921875, 0.0335540771484375, 0.040771484375, 0.0479888916015625, 0.055206298828125, 0.0624237060546875, 0.06964111328125, 0.0768585205078125, 0.084075927734375, 0.0912933349609375, 0.0985107421875, 0.1057281494140625, 0.112945556640625, 0.1201629638671875, 0.12738037109375, 0.1345977783203125, 0.141815185546875, 0.1490325927734375, 0.15625, 0.1634674072265625, 0.170684814453125, 0.1779022216796875, 0.18511962890625, 0.1923370361328125, 0.199554443359375, 0.2067718505859375, 0.2139892578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 13.0, 14.0, 12.0, 26.0, 29.0, 47.0, 81.0, 94.0, 145.0, 206.0, 334.0, 500.0, 711.0, 1293.0, 2260.0, 4998.0, 12703.0, 46798.0, 276981.0, 543918.0, 117458.0, 24068.0, 7919.0, 3304.0, 1760.0, 973.0, 628.0, 382.0, 281.0, 168.0, 134.0, 83.0, 63.0, 43.0, 36.0, 20.0, 17.0, 15.0, 5.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.211181640625, -0.2050189971923828, -0.19885635375976562, -0.19269371032714844, -0.18653106689453125, -0.18036842346191406, -0.17420578002929688, -0.1680431365966797, -0.1618804931640625, -0.1557178497314453, -0.14955520629882812, -0.14339256286621094, -0.13722991943359375, -0.13106727600097656, -0.12490463256835938, -0.11874198913574219, -0.112579345703125, -0.10641670227050781, -0.10025405883789062, -0.09409141540527344, -0.08792877197265625, -0.08176612854003906, -0.07560348510742188, -0.06944084167480469, -0.0632781982421875, -0.05711555480957031, -0.050952911376953125, -0.04479026794433594, -0.03862762451171875, -0.03246498107910156, -0.026302337646484375, -0.020139694213867188, -0.01397705078125, -0.007814407348632812, -0.001651763916015625, 0.0045108795166015625, 0.01067352294921875, 0.016836166381835938, 0.022998809814453125, 0.029161453247070312, 0.0353240966796875, 0.04148674011230469, 0.047649383544921875, 0.05381202697753906, 0.05997467041015625, 0.06613731384277344, 0.07229995727539062, 0.07846260070800781, 0.084625244140625, 0.09078788757324219, 0.09695053100585938, 0.10311317443847656, 0.10927581787109375, 0.11543846130371094, 0.12160110473632812, 0.1277637481689453, 0.1339263916015625, 0.1400890350341797, 0.14625167846679688, 0.15241432189941406, 0.15857696533203125, 0.16473960876464844, 0.17090225219726562, 0.1770648956298828, 0.1832275390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 3.0, 10.0, 5.0, 10.0, 23.0, 33.0, 66.0, 143.0, 196.0, 213.0, 126.0, 73.0, 38.0, 15.0, 9.0, 8.0, 10.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.159046173095703e-05, -3.0415132641792297e-05, -2.9239803552627563e-05, -2.806447446346283e-05, -2.6889145374298096e-05, -2.5713816285133362e-05, -2.4538487195968628e-05, -2.3363158106803894e-05, -2.218782901763916e-05, -2.1012499928474426e-05, -1.9837170839309692e-05, -1.866184175014496e-05, -1.7486512660980225e-05, -1.631118357181549e-05, -1.5135854482650757e-05, -1.3960525393486023e-05, -1.2785196304321289e-05, -1.1609867215156555e-05, -1.0434538125991821e-05, -9.259209036827087e-06, -8.083879947662354e-06, -6.90855085849762e-06, -5.733221769332886e-06, -4.557892680168152e-06, -3.382563591003418e-06, -2.207234501838684e-06, -1.0319054126739502e-06, 1.434236764907837e-07, 1.3187527656555176e-06, 2.4940818548202515e-06, 3.6694109439849854e-06, 4.844740033149719e-06, 6.020069122314453e-06, 7.195398211479187e-06, 8.370727300643921e-06, 9.546056389808655e-06, 1.0721385478973389e-05, 1.1896714568138123e-05, 1.3072043657302856e-05, 1.424737274646759e-05, 1.5422701835632324e-05, 1.6598030924797058e-05, 1.7773360013961792e-05, 1.8948689103126526e-05, 2.012401819229126e-05, 2.1299347281455994e-05, 2.2474676370620728e-05, 2.365000545978546e-05, 2.4825334548950195e-05, 2.600066363811493e-05, 2.7175992727279663e-05, 2.8351321816444397e-05, 2.952665090560913e-05, 3.0701979994773865e-05, 3.18773090839386e-05, 3.305263817310333e-05, 3.4227967262268066e-05, 3.54032963514328e-05, 3.6578625440597534e-05, 3.775395452976227e-05, 3.8929283618927e-05, 4.0104612708091736e-05, 4.127994179725647e-05, 4.2455270886421204e-05, 4.363059997558594e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 9.0, 12.0, 18.0, 18.0, 25.0, 46.0, 84.0, 133.0, 300.0, 620.0, 2187.0, 10036.0, 69474.0, 568933.0, 351441.0, 36662.0, 6012.0, 1463.0, 523.0, 207.0, 118.0, 69.0, 47.0, 25.0, 29.0, 19.0, 12.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.275146484375, -0.26824188232421875, -0.2613372802734375, -0.25443267822265625, -0.247528076171875, -0.24062347412109375, -0.2337188720703125, -0.22681427001953125, -0.21990966796875, -0.21300506591796875, -0.2061004638671875, -0.19919586181640625, -0.192291259765625, -0.18538665771484375, -0.1784820556640625, -0.17157745361328125, -0.1646728515625, -0.15776824951171875, -0.1508636474609375, -0.14395904541015625, -0.137054443359375, -0.13014984130859375, -0.1232452392578125, -0.11634063720703125, -0.10943603515625, -0.10253143310546875, -0.0956268310546875, -0.08872222900390625, -0.081817626953125, -0.07491302490234375, -0.0680084228515625, -0.06110382080078125, -0.05419921875, -0.04729461669921875, -0.0403900146484375, -0.03348541259765625, -0.026580810546875, -0.01967620849609375, -0.0127716064453125, -0.00586700439453125, 0.00103759765625, 0.00794219970703125, 0.0148468017578125, 0.02175140380859375, 0.028656005859375, 0.03556060791015625, 0.0424652099609375, 0.04936981201171875, 0.0562744140625, 0.06317901611328125, 0.0700836181640625, 0.07698822021484375, 0.083892822265625, 0.09079742431640625, 0.0977020263671875, 0.10460662841796875, 0.11151123046875, 0.11841583251953125, 0.1253204345703125, 0.13222503662109375, 0.139129638671875, 0.14603424072265625, 0.1529388427734375, 0.15984344482421875, 0.166748046875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 6.0, 13.0, 15.0, 16.0, 24.0, 31.0, 38.0, 46.0, 56.0, 52.0, 59.0, 77.0, 73.0, 84.0, 55.0, 56.0, 58.0, 59.0, 38.0, 42.0, 31.0, 18.0, 14.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076904296875, -0.07480812072753906, -0.07271194458007812, -0.07061576843261719, -0.06851959228515625, -0.06642341613769531, -0.06432723999023438, -0.06223106384277344, -0.0601348876953125, -0.05803871154785156, -0.055942535400390625, -0.05384635925292969, -0.05175018310546875, -0.04965400695800781, -0.047557830810546875, -0.04546165466308594, -0.043365478515625, -0.04126930236816406, -0.039173126220703125, -0.03707695007324219, -0.03498077392578125, -0.03288459777832031, -0.030788421630859375, -0.028692245483398438, -0.0265960693359375, -0.024499893188476562, -0.022403717041015625, -0.020307540893554688, -0.01821136474609375, -0.016115188598632812, -0.014019012451171875, -0.011922836303710938, -0.00982666015625, -0.0077304840087890625, -0.005634307861328125, -0.0035381317138671875, -0.00144195556640625, 0.0006542205810546875, 0.002750396728515625, 0.0048465728759765625, 0.0069427490234375, 0.009038925170898438, 0.011135101318359375, 0.013231277465820312, 0.01532745361328125, 0.017423629760742188, 0.019519805908203125, 0.021615982055664062, 0.023712158203125, 0.025808334350585938, 0.027904510498046875, 0.030000686645507812, 0.03209686279296875, 0.03419303894042969, 0.036289215087890625, 0.03838539123535156, 0.0404815673828125, 0.04257774353027344, 0.044673919677734375, 0.04677009582519531, 0.04886627197265625, 0.05096244812011719, 0.053058624267578125, 0.05515480041503906, 0.0572509765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 8.0, 15.0, 51.0, 140.0, 293.0, 283.0, 150.0, 49.0, 17.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923243522644043, -2.864720344543457, -2.806197166442871, -2.747673988342285, -2.689150810241699, -2.6306276321411133, -2.5721044540405273, -2.5135812759399414, -2.4550580978393555, -2.3965349197387695, -2.3380117416381836, -2.2794885635375977, -2.2209653854370117, -2.162442207336426, -2.10391902923584, -2.045395851135254, -1.9868724346160889, -1.928349256515503, -1.869826078414917, -1.811302900314331, -1.7527797222137451, -1.6942565441131592, -1.6357332468032837, -1.5772100687026978, -1.5186868906021118, -1.4601637125015259, -1.40164053440094, -1.343117356300354, -1.2845940589904785, -1.2260708808898926, -1.1675477027893066, -1.1090245246887207, -1.0505013465881348, -0.9919781684875488, -0.9334549903869629, -0.8749317526817322, -0.8164085745811462, -0.7578853964805603, -0.6993621587753296, -0.6408389806747437, -0.5823158025741577, -0.5237926244735718, -0.46526941657066345, -0.4067462086677551, -0.3482230305671692, -0.28969985246658325, -0.23117664456367493, -0.1726534366607666, -0.11413025856018066, -0.05560706555843353, 0.0029161274433135986, 0.06143932044506073, 0.11996251344680786, 0.1784856915473938, 0.23700889945030212, 0.29553210735321045, 0.3540552854537964, 0.4125784635543823, 0.47110167145729065, 0.529624879360199, 0.5881480574607849, 0.6466712355613708, 0.7051944732666016, 0.7637176513671875, 0.8222408294677734]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 9.0, 16.0, 21.0, 29.0, 33.0, 38.0, 47.0, 59.0, 54.0, 69.0, 59.0, 79.0, 80.0, 59.0, 65.0, 54.0, 40.0, 38.0, 26.0, 28.0, 25.0, 18.0, 19.0, 12.0, 6.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.759178638458252, -0.7336363196372986, -0.7080939412117004, -0.6825516223907471, -0.6570092439651489, -0.6314669251441956, -0.6059246063232422, -0.580382227897644, -0.5548399090766907, -0.5292975902557373, -0.5037552118301392, -0.4782128930091858, -0.45267054438591003, -0.4271281957626343, -0.4015858769416809, -0.37604352831840515, -0.3505011796951294, -0.32495883107185364, -0.2994164824485779, -0.2738741636276245, -0.24833181500434875, -0.222789466381073, -0.19724713265895844, -0.17170479893684387, -0.14616245031356812, -0.12062010914087296, -0.0950777679681778, -0.06953542679548264, -0.043993085622787476, -0.01845073699951172, 0.007091596722602844, 0.03263393044471741, 0.058176279067993164, 0.08371862024068832, 0.10926096141338348, 0.13480329513549805, 0.1603456437587738, 0.18588799238204956, 0.21143032610416412, 0.2369726598262787, 0.26251500844955444, 0.2880573570728302, 0.31359970569610596, 0.3391420245170593, 0.3646843731403351, 0.39022672176361084, 0.4157690405845642, 0.44131138920783997, 0.4668537378311157, 0.4923960864543915, 0.5179384350776672, 0.5434807538986206, 0.5690231323242188, 0.5945654511451721, 0.6201077699661255, 0.6456501483917236, 0.671192467212677, 0.6967347860336304, 0.7222771644592285, 0.7478194832801819, 0.7733618021011353, 0.7989041805267334, 0.8244464993476868, 0.8499888181686401, 0.8755311965942383]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 5.0, 13.0, 17.0, 31.0, 40.0, 66.0, 189.0, 578.0, 2901.0, 35093.0, 4096720.0, 54071.0, 3341.0, 896.0, 194.0, 62.0, 32.0, 10.0, 9.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71240234375, -0.6939125061035156, -0.6754226684570312, -0.6569328308105469, -0.6384429931640625, -0.6199531555175781, -0.6014633178710938, -0.5829734802246094, -0.564483642578125, -0.5459938049316406, -0.5275039672851562, -0.5090141296386719, -0.4905242919921875, -0.4720344543457031, -0.45354461669921875, -0.4350547790527344, -0.41656494140625, -0.3980751037597656, -0.37958526611328125, -0.3610954284667969, -0.3426055908203125, -0.3241157531738281, -0.30562591552734375, -0.2871360778808594, -0.268646240234375, -0.2501564025878906, -0.23166656494140625, -0.21317672729492188, -0.1946868896484375, -0.17619705200195312, -0.15770721435546875, -0.13921737670898438, -0.1207275390625, -0.10223770141601562, -0.08374786376953125, -0.06525802612304688, -0.0467681884765625, -0.028278350830078125, -0.00978851318359375, 0.008701324462890625, 0.027191162109375, 0.045680999755859375, 0.06417083740234375, 0.08266067504882812, 0.1011505126953125, 0.11964035034179688, 0.13813018798828125, 0.15662002563476562, 0.17510986328125, 0.19359970092773438, 0.21208953857421875, 0.23057937622070312, 0.2490692138671875, 0.2675590515136719, 0.28604888916015625, 0.3045387268066406, 0.323028564453125, 0.3415184020996094, 0.36000823974609375, 0.3784980773925781, 0.3969879150390625, 0.4154777526855469, 0.43396759033203125, 0.4524574279785156, 0.470947265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 15.0, 48.0, 131.0, 274.0, 299.0, 153.0, 49.0, 20.0, 12.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364990234375, -0.3551368713378906, -0.34528350830078125, -0.3354301452636719, -0.3255767822265625, -0.3157234191894531, -0.30587005615234375, -0.2960166931152344, -0.286163330078125, -0.2763099670410156, -0.26645660400390625, -0.2566032409667969, -0.2467498779296875, -0.23689651489257812, -0.22704315185546875, -0.21718978881835938, -0.20733642578125, -0.19748306274414062, -0.18762969970703125, -0.17777633666992188, -0.1679229736328125, -0.15806961059570312, -0.14821624755859375, -0.13836288452148438, -0.128509521484375, -0.11865615844726562, -0.10880279541015625, -0.09894943237304688, -0.0890960693359375, -0.07924270629882812, -0.06938934326171875, -0.059535980224609375, -0.0496826171875, -0.039829254150390625, -0.02997589111328125, -0.020122528076171875, -0.0102691650390625, -0.000415802001953125, 0.00943756103515625, 0.019290924072265625, 0.029144287109375, 0.038997650146484375, 0.04885101318359375, 0.058704376220703125, 0.0685577392578125, 0.07841110229492188, 0.08826446533203125, 0.09811782836914062, 0.10797119140625, 0.11782455444335938, 0.12767791748046875, 0.13753128051757812, 0.1473846435546875, 0.15723800659179688, 0.16709136962890625, 0.17694473266601562, 0.186798095703125, 0.19665145874023438, 0.20650482177734375, 0.21635818481445312, 0.2262115478515625, 0.23606491088867188, 0.24591827392578125, 0.2557716369628906, 0.265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 8.0, 22.0, 32.0, 59.0, 93.0, 162.0, 353.0, 876.0, 3589.0, 34745.0, 995505.0, 3046312.0, 102855.0, 7470.0, 1312.0, 417.0, 180.0, 107.0, 70.0, 43.0, 23.0, 26.0, 10.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.369384765625, -0.3591766357421875, -0.348968505859375, -0.3387603759765625, -0.32855224609375, -0.3183441162109375, -0.308135986328125, -0.2979278564453125, -0.2877197265625, -0.2775115966796875, -0.267303466796875, -0.2570953369140625, -0.24688720703125, -0.2366790771484375, -0.226470947265625, -0.2162628173828125, -0.2060546875, -0.1958465576171875, -0.185638427734375, -0.1754302978515625, -0.16522216796875, -0.1550140380859375, -0.144805908203125, -0.1345977783203125, -0.1243896484375, -0.1141815185546875, -0.103973388671875, -0.0937652587890625, -0.08355712890625, -0.0733489990234375, -0.063140869140625, -0.0529327392578125, -0.042724609375, -0.0325164794921875, -0.022308349609375, -0.0121002197265625, -0.00189208984375, 0.0083160400390625, 0.018524169921875, 0.0287322998046875, 0.0389404296875, 0.0491485595703125, 0.059356689453125, 0.0695648193359375, 0.07977294921875, 0.0899810791015625, 0.100189208984375, 0.1103973388671875, 0.12060546875, 0.1308135986328125, 0.141021728515625, 0.1512298583984375, 0.16143798828125, 0.1716461181640625, 0.181854248046875, 0.1920623779296875, 0.2022705078125, 0.2124786376953125, 0.222686767578125, 0.2328948974609375, 0.24310302734375, 0.2533111572265625, 0.263519287109375, 0.2737274169921875, 0.283935546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 8.0, 9.0, 18.0, 23.0, 40.0, 60.0, 92.0, 146.0, 263.0, 398.0, 597.0, 689.0, 602.0, 438.0, 264.0, 171.0, 107.0, 66.0, 38.0, 23.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0772705078125, -0.07196998596191406, -0.06666946411132812, -0.06136894226074219, -0.05606842041015625, -0.05076789855957031, -0.045467376708984375, -0.04016685485839844, -0.0348663330078125, -0.029565811157226562, -0.024265289306640625, -0.018964767456054688, -0.01366424560546875, -0.008363723754882812, -0.003063201904296875, 0.0022373199462890625, 0.007537841796875, 0.012838363647460938, 0.018138885498046875, 0.023439407348632812, 0.02873992919921875, 0.03404045104980469, 0.039340972900390625, 0.04464149475097656, 0.0499420166015625, 0.05524253845214844, 0.060543060302734375, 0.06584358215332031, 0.07114410400390625, 0.07644462585449219, 0.08174514770507812, 0.08704566955566406, 0.09234619140625, 0.09764671325683594, 0.10294723510742188, 0.10824775695800781, 0.11354827880859375, 0.11884880065917969, 0.12414932250976562, 0.12944984436035156, 0.1347503662109375, 0.14005088806152344, 0.14535140991210938, 0.1506519317626953, 0.15595245361328125, 0.1612529754638672, 0.16655349731445312, 0.17185401916503906, 0.177154541015625, 0.18245506286621094, 0.18775558471679688, 0.1930561065673828, 0.19835662841796875, 0.2036571502685547, 0.20895767211914062, 0.21425819396972656, 0.2195587158203125, 0.22485923767089844, 0.23015975952148438, 0.2354602813720703, 0.24076080322265625, 0.2460613250732422, 0.2513618469238281, 0.25666236877441406, 0.261962890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 15.0, 116.0, 448.0, 352.0, 61.0, 12.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9357850551605225, -0.8502916097640991, -0.7647981643676758, -0.6793047785758972, -0.5938113331794739, -0.5083178877830505, -0.422824501991272, -0.33733105659484863, -0.2518376111984253, -0.16634418070316315, -0.080850750207901, 0.004642665386199951, 0.09013611078262329, 0.17562955617904663, 0.2611229419708252, 0.34661638736724854, 0.4321098327636719, 0.5176032781600952, 0.6030967235565186, 0.6885901093482971, 0.7740835547447205, 0.8595770001411438, 0.9450703859329224, 1.0305638313293457, 1.116057276725769, 1.2015507221221924, 1.2870441675186157, 1.372537612915039, 1.4580309391021729, 1.5435245037078857, 1.6290178298950195, 1.7145112752914429, 1.800004482269287, 1.8854979276657104, 1.9709913730621338, 2.0564846992492676, 2.1419782638549805, 2.2274715900421143, 2.312964916229248, 2.398458480834961, 2.483952045440674, 2.5694453716278076, 2.6549389362335205, 2.7404322624206543, 2.825925827026367, 2.911419153213501, 2.9969124794006348, 3.0824060440063477, 3.1678993701934814, 3.2533926963806152, 3.338886260986328, 3.424379587173462, 3.509873151779175, 3.5953664779663086, 3.6808600425720215, 3.7663533687591553, 3.851846694946289, 3.937340021133423, 4.022833347320557, 4.1083269119262695, 4.193820476531982, 4.279314041137695, 4.36480712890625, 4.450300693511963, 4.535794258117676]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 7.0, 4.0, 7.0, 16.0, 16.0, 14.0, 27.0, 22.0, 30.0, 44.0, 39.0, 48.0, 39.0, 47.0, 57.0, 55.0, 64.0, 58.0, 49.0, 57.0, 53.0, 41.0, 46.0, 47.0, 20.0, 23.0, 19.0, 16.0, 9.0, 13.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4985332489013672, -0.4811267852783203, -0.46372032165527344, -0.44631385803222656, -0.4289074242115021, -0.4115009605884552, -0.3940944969654083, -0.37668803334236145, -0.35928159952163696, -0.3418751358985901, -0.3244686722755432, -0.30706220865249634, -0.28965577483177185, -0.272249311208725, -0.2548428475856781, -0.23743638396263123, -0.22002992033958435, -0.20262345671653748, -0.1852170079946518, -0.16781054437160492, -0.15040409564971924, -0.13299763202667236, -0.11559116840362549, -0.09818471223115921, -0.08077825605869293, -0.06337179988622665, -0.04596533998847008, -0.0285588800907135, -0.011152423918247223, 0.006254032254219055, 0.02366049587726593, 0.04106695204973221, 0.058473408222198486, 0.07587986439466476, 0.09328632056713104, 0.11069278419017792, 0.1280992329120636, 0.14550569653511047, 0.16291216015815735, 0.18031862378120422, 0.1977250725030899, 0.21513153612613678, 0.23253798484802246, 0.24994444847106934, 0.2673509120941162, 0.2847573757171631, 0.30216383934020996, 0.31957027316093445, 0.3369767367839813, 0.3543832004070282, 0.3717896640300751, 0.38919609785079956, 0.40660256147384644, 0.4240090250968933, 0.4414154887199402, 0.45882195234298706, 0.47622841596603394, 0.4936348795890808, 0.5110413432121277, 0.5284478068351746, 0.5458542704582214, 0.5632606744766235, 0.5806671380996704, 0.5980736017227173, 0.6154800653457642]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 16.0, 22.0, 36.0, 45.0, 102.0, 248.0, 763.0, 4028.0, 141799.0, 884556.0, 14814.0, 1386.0, 384.0, 164.0, 79.0, 37.0, 25.0, 13.0, 6.0, 3.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251953125, -1.2118682861328125, -1.171783447265625, -1.1316986083984375, -1.09161376953125, -1.0515289306640625, -1.011444091796875, -0.9713592529296875, -0.9312744140625, -0.8911895751953125, -0.851104736328125, -0.8110198974609375, -0.77093505859375, -0.7308502197265625, -0.690765380859375, -0.6506805419921875, -0.610595703125, -0.5705108642578125, -0.530426025390625, -0.4903411865234375, -0.45025634765625, -0.4101715087890625, -0.370086669921875, -0.3300018310546875, -0.2899169921875, -0.2498321533203125, -0.209747314453125, -0.1696624755859375, -0.12957763671875, -0.0894927978515625, -0.049407958984375, -0.0093231201171875, 0.03076171875, 0.0708465576171875, 0.110931396484375, 0.1510162353515625, 0.19110107421875, 0.2311859130859375, 0.271270751953125, 0.3113555908203125, 0.3514404296875, 0.3915252685546875, 0.431610107421875, 0.4716949462890625, 0.51177978515625, 0.5518646240234375, 0.591949462890625, 0.6320343017578125, 0.672119140625, 0.7122039794921875, 0.752288818359375, 0.7923736572265625, 0.83245849609375, 0.8725433349609375, 0.912628173828125, 0.9527130126953125, 0.9927978515625, 1.0328826904296875, 1.072967529296875, 1.1130523681640625, 1.15313720703125, 1.1932220458984375, 1.233306884765625, 1.2733917236328125, 1.3134765625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 19.0, 55.0, 143.0, 304.0, 288.0, 127.0, 36.0, 22.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360595703125, -0.3508186340332031, -0.34104156494140625, -0.3312644958496094, -0.3214874267578125, -0.3117103576660156, -0.30193328857421875, -0.2921562194824219, -0.282379150390625, -0.2726020812988281, -0.26282501220703125, -0.2530479431152344, -0.2432708740234375, -0.23349380493164062, -0.22371673583984375, -0.21393966674804688, -0.20416259765625, -0.19438552856445312, -0.18460845947265625, -0.17483139038085938, -0.1650543212890625, -0.15527725219726562, -0.14550018310546875, -0.13572311401367188, -0.125946044921875, -0.11616897583007812, -0.10639190673828125, -0.09661483764648438, -0.0868377685546875, -0.07706069946289062, -0.06728363037109375, -0.057506561279296875, -0.0477294921875, -0.037952423095703125, -0.02817535400390625, -0.018398284912109375, -0.0086212158203125, 0.001155853271484375, 0.01093292236328125, 0.020709991455078125, 0.030487060546875, 0.040264129638671875, 0.05004119873046875, 0.059818267822265625, 0.0695953369140625, 0.07937240600585938, 0.08914947509765625, 0.09892654418945312, 0.10870361328125, 0.11848068237304688, 0.12825775146484375, 0.13803482055664062, 0.1478118896484375, 0.15758895874023438, 0.16736602783203125, 0.17714309692382812, 0.186920166015625, 0.19669723510742188, 0.20647430419921875, 0.21625137329101562, 0.2260284423828125, 0.23580551147460938, 0.24558258056640625, 0.2553596496582031, 0.26513671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 14.0, 17.0, 19.0, 20.0, 27.0, 50.0, 56.0, 87.0, 170.0, 308.0, 598.0, 1420.0, 3901.0, 12482.0, 44818.0, 166161.0, 435236.0, 274962.0, 77338.0, 20957.0, 6185.0, 2015.0, 806.0, 353.0, 189.0, 119.0, 84.0, 40.0, 29.0, 20.0, 20.0, 9.0, 12.0, 6.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.384765625, -0.37335205078125, -0.3619384765625, -0.35052490234375, -0.339111328125, -0.32769775390625, -0.3162841796875, -0.30487060546875, -0.29345703125, -0.28204345703125, -0.2706298828125, -0.25921630859375, -0.247802734375, -0.23638916015625, -0.2249755859375, -0.21356201171875, -0.2021484375, -0.19073486328125, -0.1793212890625, -0.16790771484375, -0.156494140625, -0.14508056640625, -0.1336669921875, -0.12225341796875, -0.11083984375, -0.09942626953125, -0.0880126953125, -0.07659912109375, -0.065185546875, -0.05377197265625, -0.0423583984375, -0.03094482421875, -0.01953125, -0.00811767578125, 0.0032958984375, 0.01470947265625, 0.026123046875, 0.03753662109375, 0.0489501953125, 0.06036376953125, 0.07177734375, 0.08319091796875, 0.0946044921875, 0.10601806640625, 0.117431640625, 0.12884521484375, 0.1402587890625, 0.15167236328125, 0.1630859375, 0.17449951171875, 0.1859130859375, 0.19732666015625, 0.208740234375, 0.22015380859375, 0.2315673828125, 0.24298095703125, 0.25439453125, 0.26580810546875, 0.2772216796875, 0.28863525390625, 0.300048828125, 0.31146240234375, 0.3228759765625, 0.33428955078125, 0.345703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 5.0, 8.0, 9.0, 10.0, 11.0, 12.0, 18.0, 10.0, 16.0, 32.0, 24.0, 24.0, 30.0, 40.0, 40.0, 52.0, 38.0, 46.0, 47.0, 57.0, 36.0, 35.0, 42.0, 36.0, 42.0, 36.0, 29.0, 26.0, 31.0, 27.0, 20.0, 15.0, 13.0, 13.0, 12.0, 12.0, 10.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146484375, -0.14127159118652344, -0.13605880737304688, -0.1308460235595703, -0.12563323974609375, -0.12042045593261719, -0.11520767211914062, -0.10999488830566406, -0.1047821044921875, -0.09956932067871094, -0.09435653686523438, -0.08914375305175781, -0.08393096923828125, -0.07871818542480469, -0.07350540161132812, -0.06829261779785156, -0.063079833984375, -0.05786705017089844, -0.052654266357421875, -0.04744148254394531, -0.04222869873046875, -0.03701591491699219, -0.031803131103515625, -0.026590347290039062, -0.0213775634765625, -0.016164779663085938, -0.010951995849609375, -0.0057392120361328125, -0.00052642822265625, 0.0046863555908203125, 0.009899139404296875, 0.015111923217773438, 0.02032470703125, 0.025537490844726562, 0.030750274658203125, 0.03596305847167969, 0.04117584228515625, 0.04638862609863281, 0.051601409912109375, 0.05681419372558594, 0.0620269775390625, 0.06723976135253906, 0.07245254516601562, 0.07766532897949219, 0.08287811279296875, 0.08809089660644531, 0.09330368041992188, 0.09851646423339844, 0.103729248046875, 0.10894203186035156, 0.11415481567382812, 0.11936759948730469, 0.12458038330078125, 0.1297931671142578, 0.13500595092773438, 0.14021873474121094, 0.1454315185546875, 0.15064430236816406, 0.15585708618164062, 0.1610698699951172, 0.16628265380859375, 0.1714954376220703, 0.17670822143554688, 0.18192100524902344, 0.1871337890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 21.0, 24.0, 35.0, 45.0, 100.0, 142.0, 280.0, 616.0, 1521.0, 5440.0, 26231.0, 192807.0, 632179.0, 159496.0, 22265.0, 4690.0, 1421.0, 584.0, 287.0, 135.0, 68.0, 59.0, 32.0, 17.0, 15.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.288330078125, -0.2791633605957031, -0.26999664306640625, -0.2608299255371094, -0.2516632080078125, -0.24249649047851562, -0.23332977294921875, -0.22416305541992188, -0.214996337890625, -0.20582962036132812, -0.19666290283203125, -0.18749618530273438, -0.1783294677734375, -0.16916275024414062, -0.15999603271484375, -0.15082931518554688, -0.14166259765625, -0.13249588012695312, -0.12332916259765625, -0.11416244506835938, -0.1049957275390625, -0.09582901000976562, -0.08666229248046875, -0.07749557495117188, -0.068328857421875, -0.059162139892578125, -0.04999542236328125, -0.040828704833984375, -0.0316619873046875, -0.022495269775390625, -0.01332855224609375, -0.004161834716796875, 0.0050048828125, 0.014171600341796875, 0.02333831787109375, 0.032505035400390625, 0.0416717529296875, 0.050838470458984375, 0.06000518798828125, 0.06917190551757812, 0.078338623046875, 0.08750534057617188, 0.09667205810546875, 0.10583877563476562, 0.1150054931640625, 0.12417221069335938, 0.13333892822265625, 0.14250564575195312, 0.15167236328125, 0.16083908081054688, 0.17000579833984375, 0.17917251586914062, 0.1883392333984375, 0.19750595092773438, 0.20667266845703125, 0.21583938598632812, 0.225006103515625, 0.23417282104492188, 0.24333953857421875, 0.2525062561035156, 0.2616729736328125, 0.2708396911621094, 0.28000640869140625, 0.2891731262207031, 0.29833984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 7.0, 6.0, 10.0, 11.0, 19.0, 21.0, 27.0, 33.0, 45.0, 47.0, 69.0, 81.0, 88.0, 81.0, 84.0, 71.0, 43.0, 53.0, 46.0, 29.0, 24.0, 20.0, 14.0, 15.0, 5.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2590160369873047e-05, -2.1792016923427582e-05, -2.0993873476982117e-05, -2.019573003053665e-05, -1.9397586584091187e-05, -1.859944313764572e-05, -1.7801299691200256e-05, -1.700315624475479e-05, -1.6205012798309326e-05, -1.540686935186386e-05, -1.4608725905418396e-05, -1.3810582458972931e-05, -1.3012439012527466e-05, -1.2214295566082e-05, -1.1416152119636536e-05, -1.061800867319107e-05, -9.819865226745605e-06, -9.02172178030014e-06, -8.223578333854675e-06, -7.42543488740921e-06, -6.627291440963745e-06, -5.82914799451828e-06, -5.031004548072815e-06, -4.23286110162735e-06, -3.4347176551818848e-06, -2.6365742087364197e-06, -1.8384307622909546e-06, -1.0402873158454895e-06, -2.421438694000244e-07, 5.559995770454407e-07, 1.3541430234909058e-06, 2.152286469936371e-06, 2.950429916381836e-06, 3.748573362827301e-06, 4.546716809272766e-06, 5.344860255718231e-06, 6.143003702163696e-06, 6.941147148609161e-06, 7.739290595054626e-06, 8.537434041500092e-06, 9.335577487945557e-06, 1.0133720934391022e-05, 1.0931864380836487e-05, 1.1730007827281952e-05, 1.2528151273727417e-05, 1.3326294720172882e-05, 1.4124438166618347e-05, 1.4922581613063812e-05, 1.5720725059509277e-05, 1.6518868505954742e-05, 1.7317011952400208e-05, 1.8115155398845673e-05, 1.8913298845291138e-05, 1.9711442291736603e-05, 2.0509585738182068e-05, 2.1307729184627533e-05, 2.2105872631072998e-05, 2.2904016077518463e-05, 2.3702159523963928e-05, 2.4500302970409393e-05, 2.529844641685486e-05, 2.6096589863300323e-05, 2.689473330974579e-05, 2.7692876756191254e-05, 2.849102020263672e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 6.0, 3.0, 4.0, 6.0, 14.0, 21.0, 26.0, 27.0, 56.0, 93.0, 157.0, 300.0, 709.0, 2192.0, 9164.0, 48193.0, 304104.0, 542270.0, 116277.0, 18944.0, 4006.0, 1062.0, 390.0, 186.0, 116.0, 65.0, 53.0, 23.0, 20.0, 17.0, 14.0, 13.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2408447265625, -0.2335987091064453, -0.22635269165039062, -0.21910667419433594, -0.21186065673828125, -0.20461463928222656, -0.19736862182617188, -0.1901226043701172, -0.1828765869140625, -0.1756305694580078, -0.16838455200195312, -0.16113853454589844, -0.15389251708984375, -0.14664649963378906, -0.13940048217773438, -0.1321544647216797, -0.124908447265625, -0.11766242980957031, -0.11041641235351562, -0.10317039489746094, -0.09592437744140625, -0.08867835998535156, -0.08143234252929688, -0.07418632507324219, -0.0669403076171875, -0.05969429016113281, -0.052448272705078125, -0.04520225524902344, -0.03795623779296875, -0.030710220336914062, -0.023464202880859375, -0.016218185424804688, -0.00897216796875, -0.0017261505126953125, 0.005519866943359375, 0.012765884399414062, 0.02001190185546875, 0.027257919311523438, 0.034503936767578125, 0.04174995422363281, 0.0489959716796875, 0.05624198913574219, 0.06348800659179688, 0.07073402404785156, 0.07798004150390625, 0.08522605895996094, 0.09247207641601562, 0.09971809387207031, 0.106964111328125, 0.11421012878417969, 0.12145614624023438, 0.12870216369628906, 0.13594818115234375, 0.14319419860839844, 0.15044021606445312, 0.1576862335205078, 0.1649322509765625, 0.1721782684326172, 0.17942428588867188, 0.18667030334472656, 0.19391632080078125, 0.20116233825683594, 0.20840835571289062, 0.2156543731689453, 0.222900390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 9.0, 18.0, 21.0, 21.0, 18.0, 34.0, 35.0, 40.0, 41.0, 56.0, 83.0, 81.0, 66.0, 77.0, 60.0, 60.0, 47.0, 38.0, 41.0, 33.0, 17.0, 18.0, 16.0, 11.0, 17.0, 9.0, 5.0, 3.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.10858154296875, -0.10569572448730469, -0.10280990600585938, -0.09992408752441406, -0.09703826904296875, -0.09415245056152344, -0.09126663208007812, -0.08838081359863281, -0.0854949951171875, -0.08260917663574219, -0.07972335815429688, -0.07683753967285156, -0.07395172119140625, -0.07106590270996094, -0.06818008422851562, -0.06529426574707031, -0.062408447265625, -0.05952262878417969, -0.056636810302734375, -0.05375099182128906, -0.05086517333984375, -0.04797935485839844, -0.045093536376953125, -0.04220771789550781, -0.0393218994140625, -0.03643608093261719, -0.033550262451171875, -0.030664443969726562, -0.02777862548828125, -0.024892807006835938, -0.022006988525390625, -0.019121170043945312, -0.0162353515625, -0.013349533081054688, -0.010463714599609375, -0.0075778961181640625, -0.00469207763671875, -0.0018062591552734375, 0.001079559326171875, 0.0039653778076171875, 0.0068511962890625, 0.009737014770507812, 0.012622833251953125, 0.015508651733398438, 0.01839447021484375, 0.021280288696289062, 0.024166107177734375, 0.027051925659179688, 0.029937744140625, 0.03282356262207031, 0.035709381103515625, 0.03859519958496094, 0.04148101806640625, 0.04436683654785156, 0.047252655029296875, 0.05013847351074219, 0.0530242919921875, 0.05591011047363281, 0.058795928955078125, 0.06168174743652344, 0.06456756591796875, 0.06745338439941406, 0.07033920288085938, 0.07322502136230469, 0.07611083984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 10.0, 27.0, 62.0, 105.0, 146.0, 209.0, 197.0, 104.0, 74.0, 44.0, 21.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4850101172924042, -0.4345357418060303, -0.38406139612197876, -0.33358702063560486, -0.28311264514923096, -0.23263826966285706, -0.18216392397880554, -0.13168954849243164, -0.08121517300605774, -0.030740804970264435, 0.01973356306552887, 0.07020792365074158, 0.12068229913711548, 0.17115667462348938, 0.2216310203075409, 0.2721053957939148, 0.3225797712802887, 0.3730541467666626, 0.4235284924507141, 0.474002867937088, 0.5244772434234619, 0.5749516487121582, 0.6254259347915649, 0.6759003400802612, 0.7263747453689575, 0.776849091053009, 0.8273234963417053, 0.8777978420257568, 0.9282722473144531, 0.9787465929985046, 1.0292209386825562, 1.0796953439712524, 1.1301696300506592, 1.1806440353393555, 1.2311183214187622, 1.2815927267074585, 1.3320671319961548, 1.3825414180755615, 1.4330158233642578, 1.483490228652954, 1.5339646339416504, 1.5844390392303467, 1.6349133253097534, 1.6853877305984497, 1.735862135887146, 1.7863364219665527, 1.836810827255249, 1.8872852325439453, 1.937759518623352, 1.9882339239120483, 2.038708209991455, 2.0891826152801514, 2.1396570205688477, 2.190131425857544, 2.2406058311462402, 2.2910799980163574, 2.3415544033050537, 2.39202880859375, 2.4425032138824463, 2.4929776191711426, 2.5434517860412598, 2.593926191329956, 2.6444005966186523, 2.6948750019073486, 2.745349407196045]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 14.0, 13.0, 15.0, 25.0, 28.0, 35.0, 42.0, 45.0, 65.0, 48.0, 81.0, 68.0, 68.0, 62.0, 88.0, 62.0, 50.0, 51.0, 35.0, 33.0, 21.0, 19.0, 7.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.847917377948761, -0.8168770670890808, -0.7858368158340454, -0.7547965049743652, -0.7237561941146851, -0.6927159428596497, -0.6616756319999695, -0.6306353807449341, -0.5995950698852539, -0.5685547590255737, -0.5375145077705383, -0.5064741969108582, -0.47543391585350037, -0.4443936347961426, -0.4133533239364624, -0.3823130428791046, -0.3512727618217468, -0.32023248076438904, -0.28919219970703125, -0.2581518888473511, -0.2271116077899933, -0.1960713267326355, -0.16503103077411652, -0.13399073481559753, -0.10295045375823975, -0.07191016525030136, -0.040869876742362976, -0.009829588234424591, 0.021210700273513794, 0.05225098133087158, 0.08329127728939056, 0.11433157324790955, 0.1453719139099121, 0.1764121949672699, 0.20745249092578888, 0.23849278688430786, 0.26953306794166565, 0.30057334899902344, 0.3316136598587036, 0.3626539409160614, 0.3936942219734192, 0.424734503030777, 0.45577478408813477, 0.48681509494781494, 0.5178554058074951, 0.5488956570625305, 0.5799359679222107, 0.6109762191772461, 0.6420165300369263, 0.6730568408966064, 0.7040970921516418, 0.735137403011322, 0.7661776542663574, 0.7972179651260376, 0.8282582759857178, 0.859298586845398, 0.8903388381004333, 0.9213791489601135, 0.9524194002151489, 0.9834597110748291, 1.0145000219345093, 1.0455403327941895, 1.07658052444458, 1.1076208353042603, 1.1386611461639404]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 4.0, 7.0, 6.0, 13.0, 26.0, 34.0, 71.0, 93.0, 182.0, 332.0, 727.0, 2493.0, 12569.0, 1286794.0, 2866121.0, 20162.0, 2725.0, 1110.0, 421.0, 153.0, 106.0, 26.0, 28.0, 24.0, 8.0, 10.0, 1.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455810546875, -0.4428138732910156, -0.42981719970703125, -0.4168205261230469, -0.4038238525390625, -0.3908271789550781, -0.37783050537109375, -0.3648338317871094, -0.351837158203125, -0.3388404846191406, -0.32584381103515625, -0.3128471374511719, -0.2998504638671875, -0.2868537902832031, -0.27385711669921875, -0.2608604431152344, -0.24786376953125, -0.23486709594726562, -0.22187042236328125, -0.20887374877929688, -0.1958770751953125, -0.18288040161132812, -0.16988372802734375, -0.15688705444335938, -0.143890380859375, -0.13089370727539062, -0.11789703369140625, -0.10490036010742188, -0.0919036865234375, -0.07890701293945312, -0.06591033935546875, -0.052913665771484375, -0.0399169921875, -0.026920318603515625, -0.01392364501953125, -0.000926971435546875, 0.0120697021484375, 0.025066375732421875, 0.03806304931640625, 0.051059722900390625, 0.064056396484375, 0.07705307006835938, 0.09004974365234375, 0.10304641723632812, 0.1160430908203125, 0.12903976440429688, 0.14203643798828125, 0.15503311157226562, 0.16802978515625, 0.18102645874023438, 0.19402313232421875, 0.20701980590820312, 0.2200164794921875, 0.23301315307617188, 0.24600982666015625, 0.2590065002441406, 0.272003173828125, 0.2849998474121094, 0.29799652099609375, 0.3109931945800781, 0.3239898681640625, 0.3369865417480469, 0.34998321533203125, 0.3629798889160156, 0.3759765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 21.0, 54.0, 138.0, 273.0, 274.0, 154.0, 56.0, 21.0, 7.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3642578125, -0.3546714782714844, -0.34508514404296875, -0.3354988098144531, -0.3259124755859375, -0.3163261413574219, -0.30673980712890625, -0.2971534729003906, -0.287567138671875, -0.2779808044433594, -0.26839447021484375, -0.2588081359863281, -0.2492218017578125, -0.23963546752929688, -0.23004913330078125, -0.22046279907226562, -0.21087646484375, -0.20129013061523438, -0.19170379638671875, -0.18211746215820312, -0.1725311279296875, -0.16294479370117188, -0.15335845947265625, -0.14377212524414062, -0.134185791015625, -0.12459945678710938, -0.11501312255859375, -0.10542678833007812, -0.0958404541015625, -0.08625411987304688, -0.07666778564453125, -0.06708145141601562, -0.0574951171875, -0.047908782958984375, -0.03832244873046875, -0.028736114501953125, -0.0191497802734375, -0.009563446044921875, 2.288818359375e-05, 0.009609222412109375, 0.019195556640625, 0.028781890869140625, 0.03836822509765625, 0.047954559326171875, 0.0575408935546875, 0.06712722778320312, 0.07671356201171875, 0.08629989624023438, 0.09588623046875, 0.10547256469726562, 0.11505889892578125, 0.12464523315429688, 0.1342315673828125, 0.14381790161132812, 0.15340423583984375, 0.16299057006835938, 0.172576904296875, 0.18216323852539062, 0.19174957275390625, 0.20133590698242188, 0.2109222412109375, 0.22050857543945312, 0.23009490966796875, 0.23968124389648438, 0.249267578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 16.0, 20.0, 31.0, 45.0, 69.0, 120.0, 168.0, 313.0, 686.0, 1687.0, 6392.0, 49147.0, 821422.0, 3045169.0, 243584.0, 19584.0, 3524.0, 1135.0, 488.0, 268.0, 133.0, 104.0, 51.0, 40.0, 25.0, 22.0, 9.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.2555084228515625, -0.247344970703125, -0.2391815185546875, -0.23101806640625, -0.2228546142578125, -0.214691162109375, -0.2065277099609375, -0.1983642578125, -0.1902008056640625, -0.182037353515625, -0.1738739013671875, -0.16571044921875, -0.1575469970703125, -0.149383544921875, -0.1412200927734375, -0.133056640625, -0.1248931884765625, -0.116729736328125, -0.1085662841796875, -0.10040283203125, -0.0922393798828125, -0.084075927734375, -0.0759124755859375, -0.0677490234375, -0.0595855712890625, -0.051422119140625, -0.0432586669921875, -0.03509521484375, -0.0269317626953125, -0.018768310546875, -0.0106048583984375, -0.00244140625, 0.0057220458984375, 0.013885498046875, 0.0220489501953125, 0.03021240234375, 0.0383758544921875, 0.046539306640625, 0.0547027587890625, 0.0628662109375, 0.0710296630859375, 0.079193115234375, 0.0873565673828125, 0.09552001953125, 0.1036834716796875, 0.111846923828125, 0.1200103759765625, 0.128173828125, 0.1363372802734375, 0.144500732421875, 0.1526641845703125, 0.16082763671875, 0.1689910888671875, 0.177154541015625, 0.1853179931640625, 0.1934814453125, 0.2016448974609375, 0.209808349609375, 0.2179718017578125, 0.22613525390625, 0.2342987060546875, 0.242462158203125, 0.2506256103515625, 0.2587890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 6.0, 12.0, 22.0, 25.0, 45.0, 83.0, 123.0, 222.0, 297.0, 419.0, 550.0, 639.0, 540.0, 390.0, 250.0, 162.0, 101.0, 79.0, 39.0, 19.0, 24.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.150146484375, -0.14504623413085938, -0.13994598388671875, -0.13484573364257812, -0.1297454833984375, -0.12464523315429688, -0.11954498291015625, -0.11444473266601562, -0.109344482421875, -0.10424423217773438, -0.09914398193359375, -0.09404373168945312, -0.0889434814453125, -0.08384323120117188, -0.07874298095703125, -0.07364273071289062, -0.06854248046875, -0.06344223022460938, -0.05834197998046875, -0.053241729736328125, -0.0481414794921875, -0.043041229248046875, -0.03794097900390625, -0.032840728759765625, -0.027740478515625, -0.022640228271484375, -0.01753997802734375, -0.012439727783203125, -0.0073394775390625, -0.002239227294921875, 0.00286102294921875, 0.007961273193359375, 0.0130615234375, 0.018161773681640625, 0.02326202392578125, 0.028362274169921875, 0.0334625244140625, 0.038562774658203125, 0.04366302490234375, 0.048763275146484375, 0.053863525390625, 0.058963775634765625, 0.06406402587890625, 0.06916427612304688, 0.0742645263671875, 0.07936477661132812, 0.08446502685546875, 0.08956527709960938, 0.09466552734375, 0.09976577758789062, 0.10486602783203125, 0.10996627807617188, 0.1150665283203125, 0.12016677856445312, 0.12526702880859375, 0.13036727905273438, 0.135467529296875, 0.14056777954101562, 0.14566802978515625, 0.15076828002929688, 0.1558685302734375, 0.16096878051757812, 0.16606903076171875, 0.17116928100585938, 0.17626953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 11.0, 117.0, 375.0, 366.0, 118.0, 18.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6448587775230408, -0.5653609037399292, -0.4858630299568176, -0.40636518597602844, -0.32686731219291687, -0.2473694384098053, -0.1678715944290161, -0.08837372064590454, -0.008875846862792969, 0.070622019469738, 0.15011988580226898, 0.22961774468421936, 0.30911561846733093, 0.3886134922504425, 0.4681113362312317, 0.5476092100143433, 0.6271070837974548, 0.7066049575805664, 0.786102831363678, 0.8656007051467896, 0.9450985193252563, 1.0245964527130127, 1.1040942668914795, 1.1835920810699463, 1.2630900144577026, 1.3425878286361694, 1.4220857620239258, 1.5015835762023926, 1.581081509590149, 1.6605793237686157, 1.740077257156372, 1.8195750713348389, 1.8990728855133057, 1.9785706996917725, 2.0580685138702393, 2.137566566467285, 2.217064380645752, 2.2965621948242188, 2.3760600090026855, 2.4555578231811523, 2.5350558757781982, 2.614553689956665, 2.694051504135132, 2.7735495567321777, 2.8530473709106445, 2.9325451850891113, 3.012042999267578, 3.091540813446045, 3.1710386276245117, 3.2505364418029785, 3.3300342559814453, 3.409532308578491, 3.489030122756958, 3.568527936935425, 3.6480257511138916, 3.7275238037109375, 3.8070216178894043, 3.886519432067871, 3.966017246246338, 4.045515060424805, 4.1250128746032715, 4.2045111656188965, 4.284008979797363, 4.36350679397583, 4.443004608154297]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 9.0, 6.0, 11.0, 19.0, 32.0, 18.0, 30.0, 28.0, 56.0, 45.0, 64.0, 60.0, 59.0, 73.0, 65.0, 49.0, 42.0, 52.0, 44.0, 35.0, 48.0, 21.0, 27.0, 25.0, 22.0, 12.0, 4.0, 7.0, 10.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6183983683586121, -0.6006501317024231, -0.5829019546508789, -0.5651537179946899, -0.547405481338501, -0.529657244682312, -0.5119090676307678, -0.49416083097457886, -0.4764125943183899, -0.4586643874645233, -0.44091615080833435, -0.4231679439544678, -0.4054197072982788, -0.38767150044441223, -0.36992329359054565, -0.3521750569343567, -0.3344268500804901, -0.31667864322662354, -0.29893040657043457, -0.281182199716568, -0.26343396306037903, -0.24568575620651245, -0.22793753445148468, -0.2101893126964569, -0.19244109094142914, -0.17469286918640137, -0.1569446474313736, -0.13919642567634583, -0.12144821137189865, -0.10369998961687088, -0.0859517753124237, -0.06820355355739594, -0.050455331802368164, -0.03270711004734039, -0.01495889201760292, 0.002789326012134552, 0.020537547767162323, 0.038285769522190094, 0.05603398382663727, 0.07378220558166504, 0.09153042733669281, 0.10927864909172058, 0.12702687084674835, 0.14477509260177612, 0.1625232994556427, 0.18027153611183167, 0.19801974296569824, 0.215767964720726, 0.23351618647575378, 0.25126439332962036, 0.2690126299858093, 0.2867608368396759, 0.30450907349586487, 0.32225728034973145, 0.3400055170059204, 0.357753723859787, 0.37550193071365356, 0.39325013756752014, 0.4109983742237091, 0.4287465810775757, 0.44649481773376465, 0.4642430245876312, 0.4819912314414978, 0.49973946809768677, 0.5174877047538757]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 8.0, 14.0, 14.0, 15.0, 32.0, 35.0, 57.0, 68.0, 136.0, 181.0, 306.0, 574.0, 1229.0, 3164.0, 11014.0, 56523.0, 497315.0, 415599.0, 47252.0, 9759.0, 2830.0, 1069.0, 519.0, 285.0, 173.0, 104.0, 83.0, 50.0, 34.0, 33.0, 20.0, 7.0, 8.0, 4.0, 4.0, 11.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.490478515625, -0.4760322570800781, -0.46158599853515625, -0.4471397399902344, -0.4326934814453125, -0.4182472229003906, -0.40380096435546875, -0.3893547058105469, -0.374908447265625, -0.3604621887207031, -0.34601593017578125, -0.3315696716308594, -0.3171234130859375, -0.3026771545410156, -0.28823089599609375, -0.2737846374511719, -0.25933837890625, -0.24489212036132812, -0.23044586181640625, -0.21599960327148438, -0.2015533447265625, -0.18710708618164062, -0.17266082763671875, -0.15821456909179688, -0.143768310546875, -0.12932205200195312, -0.11487579345703125, -0.10042953491210938, -0.0859832763671875, -0.07153701782226562, -0.05709075927734375, -0.042644500732421875, -0.0281982421875, -0.013751983642578125, 0.00069427490234375, 0.015140533447265625, 0.0295867919921875, 0.044033050537109375, 0.05847930908203125, 0.07292556762695312, 0.087371826171875, 0.10181808471679688, 0.11626434326171875, 0.13071060180664062, 0.1451568603515625, 0.15960311889648438, 0.17404937744140625, 0.18849563598632812, 0.20294189453125, 0.21738815307617188, 0.23183441162109375, 0.24628067016601562, 0.2607269287109375, 0.2751731872558594, 0.28961944580078125, 0.3040657043457031, 0.318511962890625, 0.3329582214355469, 0.34740447998046875, 0.3618507385253906, 0.3762969970703125, 0.3907432556152344, 0.40518951416015625, 0.4196357727050781, 0.43408203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 22.0, 62.0, 147.0, 262.0, 263.0, 160.0, 56.0, 23.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.34656524658203125, -0.3369293212890625, -0.32729339599609375, -0.317657470703125, -0.30802154541015625, -0.2983856201171875, -0.28874969482421875, -0.27911376953125, -0.26947784423828125, -0.2598419189453125, -0.25020599365234375, -0.240570068359375, -0.23093414306640625, -0.2212982177734375, -0.21166229248046875, -0.2020263671875, -0.19239044189453125, -0.1827545166015625, -0.17311859130859375, -0.163482666015625, -0.15384674072265625, -0.1442108154296875, -0.13457489013671875, -0.12493896484375, -0.11530303955078125, -0.1056671142578125, -0.09603118896484375, -0.086395263671875, -0.07675933837890625, -0.0671234130859375, -0.05748748779296875, -0.0478515625, -0.03821563720703125, -0.0285797119140625, -0.01894378662109375, -0.009307861328125, 0.00032806396484375, 0.0099639892578125, 0.01959991455078125, 0.02923583984375, 0.03887176513671875, 0.0485076904296875, 0.05814361572265625, 0.067779541015625, 0.07741546630859375, 0.0870513916015625, 0.09668731689453125, 0.1063232421875, 0.11595916748046875, 0.1255950927734375, 0.13523101806640625, 0.144866943359375, 0.15450286865234375, 0.1641387939453125, 0.17377471923828125, 0.18341064453125, 0.19304656982421875, 0.2026824951171875, 0.21231842041015625, 0.221954345703125, 0.23159027099609375, 0.2412261962890625, 0.25086212158203125, 0.260498046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 4.0, 9.0, 6.0, 11.0, 18.0, 17.0, 17.0, 33.0, 53.0, 65.0, 123.0, 174.0, 338.0, 700.0, 1804.0, 7300.0, 38985.0, 236756.0, 563820.0, 163004.0, 27139.0, 5298.0, 1438.0, 573.0, 315.0, 187.0, 92.0, 63.0, 52.0, 41.0, 19.0, 13.0, 6.0, 20.0, 13.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364990234375, -0.3529815673828125, -0.340972900390625, -0.3289642333984375, -0.31695556640625, -0.3049468994140625, -0.292938232421875, -0.2809295654296875, -0.2689208984375, -0.2569122314453125, -0.244903564453125, -0.2328948974609375, -0.22088623046875, -0.2088775634765625, -0.196868896484375, -0.1848602294921875, -0.1728515625, -0.1608428955078125, -0.148834228515625, -0.1368255615234375, -0.12481689453125, -0.1128082275390625, -0.100799560546875, -0.0887908935546875, -0.0767822265625, -0.0647735595703125, -0.052764892578125, -0.0407562255859375, -0.02874755859375, -0.0167388916015625, -0.004730224609375, 0.0072784423828125, 0.019287109375, 0.0312957763671875, 0.043304443359375, 0.0553131103515625, 0.06732177734375, 0.0793304443359375, 0.091339111328125, 0.1033477783203125, 0.1153564453125, 0.1273651123046875, 0.139373779296875, 0.1513824462890625, 0.16339111328125, 0.1753997802734375, 0.187408447265625, 0.1994171142578125, 0.21142578125, 0.2234344482421875, 0.235443115234375, 0.2474517822265625, 0.25946044921875, 0.2714691162109375, 0.283477783203125, 0.2954864501953125, 0.3074951171875, 0.3195037841796875, 0.331512451171875, 0.3435211181640625, 0.35552978515625, 0.3675384521484375, 0.379547119140625, 0.3915557861328125, 0.403564453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 7.0, 8.0, 14.0, 17.0, 16.0, 17.0, 17.0, 18.0, 31.0, 34.0, 35.0, 27.0, 52.0, 42.0, 39.0, 46.0, 56.0, 47.0, 51.0, 47.0, 49.0, 35.0, 37.0, 30.0, 27.0, 27.0, 25.0, 11.0, 25.0, 17.0, 20.0, 16.0, 10.0, 5.0, 8.0, 2.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1717529296875, -0.1659412384033203, -0.16012954711914062, -0.15431785583496094, -0.14850616455078125, -0.14269447326660156, -0.13688278198242188, -0.1310710906982422, -0.1252593994140625, -0.11944770812988281, -0.11363601684570312, -0.10782432556152344, -0.10201263427734375, -0.09620094299316406, -0.09038925170898438, -0.08457756042480469, -0.078765869140625, -0.07295417785644531, -0.06714248657226562, -0.06133079528808594, -0.05551910400390625, -0.04970741271972656, -0.043895721435546875, -0.03808403015136719, -0.0322723388671875, -0.026460647583007812, -0.020648956298828125, -0.014837265014648438, -0.00902557373046875, -0.0032138824462890625, 0.002597808837890625, 0.008409500122070312, 0.01422119140625, 0.020032882690429688, 0.025844573974609375, 0.03165626525878906, 0.03746795654296875, 0.04327964782714844, 0.049091339111328125, 0.05490303039550781, 0.0607147216796875, 0.06652641296386719, 0.07233810424804688, 0.07814979553222656, 0.08396148681640625, 0.08977317810058594, 0.09558486938476562, 0.10139656066894531, 0.107208251953125, 0.11301994323730469, 0.11883163452148438, 0.12464332580566406, 0.13045501708984375, 0.13626670837402344, 0.14207839965820312, 0.1478900909423828, 0.1537017822265625, 0.1595134735107422, 0.16532516479492188, 0.17113685607910156, 0.17694854736328125, 0.18276023864746094, 0.18857192993164062, 0.1943836212158203, 0.2001953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 10.0, 16.0, 26.0, 30.0, 39.0, 75.0, 103.0, 132.0, 232.0, 386.0, 636.0, 1084.0, 1847.0, 3354.0, 6706.0, 15335.0, 40385.0, 119954.0, 311734.0, 333025.0, 135452.0, 45027.0, 16836.0, 7512.0, 3755.0, 1956.0, 1063.0, 679.0, 375.0, 280.0, 154.0, 112.0, 73.0, 34.0, 41.0, 20.0, 18.0, 10.0, 13.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10504150390625, -0.10176467895507812, -0.09848785400390625, -0.09521102905273438, -0.0919342041015625, -0.08865737915039062, -0.08538055419921875, -0.08210372924804688, -0.078826904296875, -0.07555007934570312, -0.07227325439453125, -0.06899642944335938, -0.0657196044921875, -0.062442779541015625, -0.05916595458984375, -0.055889129638671875, -0.0526123046875, -0.049335479736328125, -0.04605865478515625, -0.042781829833984375, -0.0395050048828125, -0.036228179931640625, -0.03295135498046875, -0.029674530029296875, -0.026397705078125, -0.023120880126953125, -0.01984405517578125, -0.016567230224609375, -0.0132904052734375, -0.010013580322265625, -0.00673675537109375, -0.003459930419921875, -0.00018310546875, 0.003093719482421875, 0.00637054443359375, 0.009647369384765625, 0.0129241943359375, 0.016201019287109375, 0.01947784423828125, 0.022754669189453125, 0.026031494140625, 0.029308319091796875, 0.03258514404296875, 0.035861968994140625, 0.0391387939453125, 0.042415618896484375, 0.04569244384765625, 0.048969268798828125, 0.05224609375, 0.055522918701171875, 0.05879974365234375, 0.062076568603515625, 0.0653533935546875, 0.06863021850585938, 0.07190704345703125, 0.07518386840820312, 0.078460693359375, 0.08173751831054688, 0.08501434326171875, 0.08829116821289062, 0.0915679931640625, 0.09484481811523438, 0.09812164306640625, 0.10139846801757812, 0.10467529296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 8.0, 5.0, 4.0, 11.0, 10.0, 11.0, 7.0, 11.0, 16.0, 21.0, 25.0, 27.0, 34.0, 45.0, 56.0, 71.0, 90.0, 69.0, 72.0, 80.0, 61.0, 36.0, 51.0, 33.0, 34.0, 21.0, 21.0, 12.0, 8.0, 10.0, 13.0, 7.0, 6.0, 2.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.728534698486328e-05, -1.6705133020877838e-05, -1.6124919056892395e-05, -1.5544705092906952e-05, -1.4964491128921509e-05, -1.4384277164936066e-05, -1.3804063200950623e-05, -1.322384923696518e-05, -1.2643635272979736e-05, -1.2063421308994293e-05, -1.148320734500885e-05, -1.0902993381023407e-05, -1.0322779417037964e-05, -9.74256545305252e-06, -9.162351489067078e-06, -8.582137525081635e-06, -8.001923561096191e-06, -7.421709597110748e-06, -6.841495633125305e-06, -6.261281669139862e-06, -5.681067705154419e-06, -5.100853741168976e-06, -4.520639777183533e-06, -3.94042581319809e-06, -3.3602118492126465e-06, -2.7799978852272034e-06, -2.1997839212417603e-06, -1.6195699572563171e-06, -1.039355993270874e-06, -4.591420292854309e-07, 1.210719347000122e-07, 7.012858986854553e-07, 1.2814998626708984e-06, 1.8617138266563416e-06, 2.4419277906417847e-06, 3.0221417546272278e-06, 3.602355718612671e-06, 4.182569682598114e-06, 4.762783646583557e-06, 5.342997610569e-06, 5.923211574554443e-06, 6.5034255385398865e-06, 7.08363950252533e-06, 7.663853466510773e-06, 8.244067430496216e-06, 8.824281394481659e-06, 9.404495358467102e-06, 9.984709322452545e-06, 1.0564923286437988e-05, 1.1145137250423431e-05, 1.1725351214408875e-05, 1.2305565178394318e-05, 1.288577914237976e-05, 1.3465993106365204e-05, 1.4046207070350647e-05, 1.462642103433609e-05, 1.5206634998321533e-05, 1.5786848962306976e-05, 1.636706292629242e-05, 1.6947276890277863e-05, 1.7527490854263306e-05, 1.810770481824875e-05, 1.8687918782234192e-05, 1.9268132746219635e-05, 1.9848346710205078e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 14.0, 15.0, 25.0, 42.0, 65.0, 121.0, 218.0, 411.0, 820.0, 1669.0, 3793.0, 10834.0, 39637.0, 180930.0, 510240.0, 228969.0, 49338.0, 13114.0, 4454.0, 1900.0, 908.0, 424.0, 251.0, 137.0, 79.0, 39.0, 28.0, 18.0, 17.0, 11.0, 11.0, 3.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14334678649902344, -0.13850021362304688, -0.1336536407470703, -0.12880706787109375, -0.12396049499511719, -0.11911392211914062, -0.11426734924316406, -0.1094207763671875, -0.10457420349121094, -0.09972763061523438, -0.09488105773925781, -0.09003448486328125, -0.08518791198730469, -0.08034133911132812, -0.07549476623535156, -0.070648193359375, -0.06580162048339844, -0.060955047607421875, -0.05610847473144531, -0.05126190185546875, -0.04641532897949219, -0.041568756103515625, -0.03672218322753906, -0.0318756103515625, -0.027029037475585938, -0.022182464599609375, -0.017335891723632812, -0.01248931884765625, -0.0076427459716796875, -0.002796173095703125, 0.0020503997802734375, 0.00689697265625, 0.011743545532226562, 0.016590118408203125, 0.021436691284179688, 0.02628326416015625, 0.031129837036132812, 0.035976409912109375, 0.04082298278808594, 0.0456695556640625, 0.05051612854003906, 0.055362701416015625, 0.06020927429199219, 0.06505584716796875, 0.06990242004394531, 0.07474899291992188, 0.07959556579589844, 0.084442138671875, 0.08928871154785156, 0.09413528442382812, 0.09898185729980469, 0.10382843017578125, 0.10867500305175781, 0.11352157592773438, 0.11836814880371094, 0.1232147216796875, 0.12806129455566406, 0.13290786743164062, 0.1377544403076172, 0.14260101318359375, 0.1474475860595703, 0.15229415893554688, 0.15714073181152344, 0.1619873046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 5.0, 12.0, 13.0, 27.0, 16.0, 38.0, 64.0, 65.0, 81.0, 107.0, 120.0, 96.0, 82.0, 86.0, 47.0, 42.0, 25.0, 16.0, 12.0, 11.0, 8.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1263427734375, -0.1224813461303711, -0.11861991882324219, -0.11475849151611328, -0.11089706420898438, -0.10703563690185547, -0.10317420959472656, -0.09931278228759766, -0.09545135498046875, -0.09158992767333984, -0.08772850036621094, -0.08386707305908203, -0.08000564575195312, -0.07614421844482422, -0.07228279113769531, -0.0684213638305664, -0.0645599365234375, -0.060698509216308594, -0.05683708190917969, -0.05297565460205078, -0.049114227294921875, -0.04525279998779297, -0.04139137268066406, -0.037529945373535156, -0.03366851806640625, -0.029807090759277344, -0.025945663452148438, -0.02208423614501953, -0.018222808837890625, -0.014361381530761719, -0.010499954223632812, -0.006638526916503906, -0.002777099609375, 0.0010843276977539062, 0.0049457550048828125, 0.008807182312011719, 0.012668609619140625, 0.01653003692626953, 0.020391464233398438, 0.024252891540527344, 0.02811431884765625, 0.031975746154785156, 0.03583717346191406, 0.03969860076904297, 0.043560028076171875, 0.04742145538330078, 0.05128288269042969, 0.055144309997558594, 0.0590057373046875, 0.0628671646118164, 0.06672859191894531, 0.07059001922607422, 0.07445144653320312, 0.07831287384033203, 0.08217430114746094, 0.08603572845458984, 0.08989715576171875, 0.09375858306884766, 0.09762001037597656, 0.10148143768310547, 0.10534286499023438, 0.10920429229736328, 0.11306571960449219, 0.1169271469116211, 0.12078857421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 9.0, 21.0, 79.0, 217.0, 328.0, 240.0, 87.0, 21.0, 11.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357386350631714, -3.2837908267974854, -3.210195302963257, -3.1365997791290283, -3.0630042552948, -2.989408493041992, -2.9158129692077637, -2.842217445373535, -2.7686219215393066, -2.695026397705078, -2.6214308738708496, -2.547835350036621, -2.4742398262023926, -2.400644302368164, -2.3270487785339355, -2.253453016281128, -2.1798577308654785, -2.10626220703125, -2.0326666831970215, -1.959071159362793, -1.885475516319275, -1.8118799924850464, -1.7382844686508179, -1.6646888256072998, -1.5910933017730713, -1.5174977779388428, -1.4439022541046143, -1.3703067302703857, -1.2967110872268677, -1.2231155633926392, -1.1495200395584106, -1.0759243965148926, -1.0023289918899536, -0.9287334680557251, -0.8551378846168518, -0.7815423607826233, -0.70794677734375, -0.6343512535095215, -0.560755729675293, -0.4871601462364197, -0.41356462240219116, -0.33996906876564026, -0.26637351512908936, -0.19277799129486084, -0.11918243765830994, -0.04558688402175903, 0.028008639812469482, 0.10160422325134277, 0.1751997470855713, 0.2487953007221222, 0.3223908543586731, 0.3959863781929016, 0.4695819318294525, 0.5431774854660034, 0.6167730093002319, 0.6903685927391052, 0.7639641165733337, 0.8375596404075623, 0.9111552238464355, 0.9847507476806641, 1.0583462715148926, 1.131941795349121, 1.2055373191833496, 1.2791329622268677, 1.3527284860610962]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 1.0, 3.0, 1.0, 5.0, 6.0, 9.0, 17.0, 27.0, 25.0, 27.0, 30.0, 40.0, 41.0, 44.0, 52.0, 56.0, 71.0, 64.0, 64.0, 59.0, 51.0, 63.0, 47.0, 45.0, 39.0, 38.0, 16.0, 20.0, 12.0, 14.0, 4.0, 11.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6040348410606384, -0.5794890522956848, -0.5549432039260864, -0.5303974151611328, -0.5058515667915344, -0.4813057780265808, -0.4567599594593048, -0.4322141408920288, -0.4076683521270752, -0.3831225335597992, -0.3585767149925232, -0.3340309262275696, -0.3094851076602936, -0.2849392890930176, -0.2603934705257416, -0.23584766685962677, -0.21130183339118958, -0.18675601482391357, -0.16221021115779877, -0.13766439259052277, -0.11311858147382736, -0.08857277035713196, -0.06402695178985596, -0.03948114812374115, -0.014935329556465149, 0.009610483422875404, 0.03415629640221596, 0.05870211124420166, 0.08324792236089706, 0.10779373347759247, 0.13233955204486847, 0.15688535571098328, 0.18143117427825928, 0.20597699284553528, 0.23052279651165009, 0.2550686001777649, 0.2796144187450409, 0.3041602373123169, 0.3287060558795929, 0.3532518744468689, 0.3777976632118225, 0.4023434817790985, 0.4268893003463745, 0.4514350891113281, 0.4759809076786041, 0.5005267262458801, 0.5250725746154785, 0.5496183633804321, 0.5741641521453857, 0.5987099409103394, 0.6232557892799377, 0.6478015780448914, 0.6723474264144897, 0.6968932151794434, 0.721439003944397, 0.7459848523139954, 0.7705307006835938, 0.7950764894485474, 0.8196223378181458, 0.8441681265830994, 0.8687139749526978, 0.8932597637176514, 0.917805552482605, 0.9423514008522034, 0.966897189617157]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 7.0, 13.0, 8.0, 12.0, 21.0, 27.0, 27.0, 49.0, 60.0, 82.0, 131.0, 183.0, 371.0, 644.0, 1291.0, 2727.0, 6530.0, 25047.0, 246263.0, 3489088.0, 370552.0, 36379.0, 8528.0, 2904.0, 1388.0, 886.0, 460.0, 249.0, 138.0, 80.0, 40.0, 30.0, 21.0, 9.0, 8.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.23980331420898438, -0.23265838623046875, -0.22551345825195312, -0.2183685302734375, -0.21122360229492188, -0.20407867431640625, -0.19693374633789062, -0.189788818359375, -0.18264389038085938, -0.17549896240234375, -0.16835403442382812, -0.1612091064453125, -0.15406417846679688, -0.14691925048828125, -0.13977432250976562, -0.13262939453125, -0.12548446655273438, -0.11833953857421875, -0.11119461059570312, -0.1040496826171875, -0.09690475463867188, -0.08975982666015625, -0.08261489868164062, -0.075469970703125, -0.06832504272460938, -0.06118011474609375, -0.054035186767578125, -0.0468902587890625, -0.039745330810546875, -0.03260040283203125, -0.025455474853515625, -0.018310546875, -0.011165618896484375, -0.00402069091796875, 0.003124237060546875, 0.0102691650390625, 0.017414093017578125, 0.02455902099609375, 0.031703948974609375, 0.038848876953125, 0.045993804931640625, 0.05313873291015625, 0.060283660888671875, 0.0674285888671875, 0.07457351684570312, 0.08171844482421875, 0.08886337280273438, 0.09600830078125, 0.10315322875976562, 0.11029815673828125, 0.11744308471679688, 0.1245880126953125, 0.13173294067382812, 0.13887786865234375, 0.14602279663085938, 0.153167724609375, 0.16031265258789062, 0.16745758056640625, 0.17460250854492188, 0.1817474365234375, 0.18889236450195312, 0.19603729248046875, 0.20318222045898438, 0.2103271484375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 41.0, 80.0, 219.0, 290.0, 206.0, 103.0, 39.0, 14.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.3538322448730469, -0.34413909912109375, -0.3344459533691406, -0.3247528076171875, -0.3150596618652344, -0.30536651611328125, -0.2956733703613281, -0.285980224609375, -0.2762870788574219, -0.26659393310546875, -0.2569007873535156, -0.2472076416015625, -0.23751449584960938, -0.22782135009765625, -0.21812820434570312, -0.20843505859375, -0.19874191284179688, -0.18904876708984375, -0.17935562133789062, -0.1696624755859375, -0.15996932983398438, -0.15027618408203125, -0.14058303833007812, -0.130889892578125, -0.12119674682617188, -0.11150360107421875, -0.10181045532226562, -0.0921173095703125, -0.08242416381835938, -0.07273101806640625, -0.06303787231445312, -0.0533447265625, -0.043651580810546875, -0.03395843505859375, -0.024265289306640625, -0.0145721435546875, -0.004878997802734375, 0.00481414794921875, 0.014507293701171875, 0.024200439453125, 0.033893585205078125, 0.04358673095703125, 0.053279876708984375, 0.0629730224609375, 0.07266616821289062, 0.08235931396484375, 0.09205245971679688, 0.10174560546875, 0.11143875122070312, 0.12113189697265625, 0.13082504272460938, 0.1405181884765625, 0.15021133422851562, 0.15990447998046875, 0.16959762573242188, 0.179290771484375, 0.18898391723632812, 0.19867706298828125, 0.20837020874023438, 0.2180633544921875, 0.22775650024414062, 0.23744964599609375, 0.24714279174804688, 0.2568359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 11.0, 7.0, 14.0, 14.0, 15.0, 26.0, 31.0, 50.0, 70.0, 107.0, 214.0, 438.0, 1403.0, 6376.0, 44605.0, 621116.0, 3200659.0, 287903.0, 25349.0, 4073.0, 1027.0, 334.0, 162.0, 87.0, 63.0, 36.0, 24.0, 26.0, 14.0, 7.0, 5.0, 7.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2352294921875, -0.2272205352783203, -0.21921157836914062, -0.21120262145996094, -0.20319366455078125, -0.19518470764160156, -0.18717575073242188, -0.1791667938232422, -0.1711578369140625, -0.1631488800048828, -0.15513992309570312, -0.14713096618652344, -0.13912200927734375, -0.13111305236816406, -0.12310409545898438, -0.11509513854980469, -0.107086181640625, -0.09907722473144531, -0.09106826782226562, -0.08305931091308594, -0.07505035400390625, -0.06704139709472656, -0.059032440185546875, -0.05102348327636719, -0.0430145263671875, -0.03500556945800781, -0.026996612548828125, -0.018987655639648438, -0.01097869873046875, -0.0029697418212890625, 0.005039215087890625, 0.013048171997070312, 0.02105712890625, 0.029066085815429688, 0.037075042724609375, 0.04508399963378906, 0.05309295654296875, 0.06110191345214844, 0.06911087036132812, 0.07711982727050781, 0.0851287841796875, 0.09313774108886719, 0.10114669799804688, 0.10915565490722656, 0.11716461181640625, 0.12517356872558594, 0.13318252563476562, 0.1411914825439453, 0.149200439453125, 0.1572093963623047, 0.16521835327148438, 0.17322731018066406, 0.18123626708984375, 0.18924522399902344, 0.19725418090820312, 0.2052631378173828, 0.2132720947265625, 0.2212810516357422, 0.22929000854492188, 0.23729896545410156, 0.24530792236328125, 0.25331687927246094, 0.2613258361816406, 0.2693347930908203, 0.27734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 8.0, 6.0, 11.0, 12.0, 20.0, 27.0, 51.0, 61.0, 71.0, 83.0, 135.0, 201.0, 338.0, 470.0, 541.0, 506.0, 422.0, 313.0, 213.0, 161.0, 114.0, 83.0, 64.0, 52.0, 31.0, 20.0, 11.0, 16.0, 11.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12359619140625, -0.11972999572753906, -0.11586380004882812, -0.11199760437011719, -0.10813140869140625, -0.10426521301269531, -0.10039901733398438, -0.09653282165527344, -0.0926666259765625, -0.08880043029785156, -0.08493423461914062, -0.08106803894042969, -0.07720184326171875, -0.07333564758300781, -0.06946945190429688, -0.06560325622558594, -0.061737060546875, -0.05787086486816406, -0.054004669189453125, -0.05013847351074219, -0.04627227783203125, -0.04240608215332031, -0.038539886474609375, -0.03467369079589844, -0.0308074951171875, -0.026941299438476562, -0.023075103759765625, -0.019208908081054688, -0.01534271240234375, -0.011476516723632812, -0.007610321044921875, -0.0037441253662109375, 0.0001220703125, 0.0039882659912109375, 0.007854461669921875, 0.011720657348632812, 0.01558685302734375, 0.019453048706054688, 0.023319244384765625, 0.027185440063476562, 0.0310516357421875, 0.03491783142089844, 0.038784027099609375, 0.04265022277832031, 0.04651641845703125, 0.05038261413574219, 0.054248809814453125, 0.05811500549316406, 0.061981201171875, 0.06584739685058594, 0.06971359252929688, 0.07357978820800781, 0.07744598388671875, 0.08131217956542969, 0.08517837524414062, 0.08904457092285156, 0.0929107666015625, 0.09677696228027344, 0.10064315795898438, 0.10450935363769531, 0.10837554931640625, 0.11224174499511719, 0.11610794067382812, 0.11997413635253906, 0.12384033203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 8.0, 25.0, 32.0, 44.0, 77.0, 80.0, 96.0, 127.0, 124.0, 105.0, 91.0, 68.0, 37.0, 28.0, 18.0, 17.0, 8.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4338633418083191, -0.4148024022579193, -0.39574146270751953, -0.37668052315711975, -0.35761958360671997, -0.3385586142539978, -0.319497674703598, -0.30043673515319824, -0.28137579560279846, -0.2623148560523987, -0.2432539165019989, -0.22419296205043793, -0.20513202250003815, -0.18607108294963837, -0.1670101284980774, -0.1479491889476776, -0.12888824939727783, -0.10982730984687805, -0.09076636284589767, -0.0717054158449173, -0.05264447629451752, -0.03358353674411774, -0.01452258974313736, 0.004538357257843018, 0.023599296808242798, 0.04266024008393288, 0.061721183359622955, 0.08078213036060333, 0.09984306991100311, 0.1189040094614029, 0.13796496391296387, 0.15702590346336365, 0.17608678340911865, 0.19514772295951843, 0.2142086625099182, 0.2332696169614792, 0.2523305416107178, 0.27139151096343994, 0.2904524505138397, 0.3095133900642395, 0.3285743296146393, 0.34763526916503906, 0.36669620871543884, 0.3857571482658386, 0.4048181176185608, 0.4238790273666382, 0.44293999671936035, 0.46200093626976013, 0.4810618758201599, 0.5001228451728821, 0.5191837549209595, 0.5382447242736816, 0.557305634021759, 0.5763666033744812, 0.5954275131225586, 0.6144884824752808, 0.6335494518280029, 0.6526104211807251, 0.6716713309288025, 0.6907323002815247, 0.709793210029602, 0.7288541793823242, 0.7479150891304016, 0.7669760584831238, 0.7860369682312012]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 13.0, 21.0, 19.0, 21.0, 29.0, 31.0, 47.0, 56.0, 61.0, 61.0, 63.0, 75.0, 63.0, 55.0, 64.0, 51.0, 46.0, 40.0, 37.0, 29.0, 29.0, 20.0, 19.0, 9.0, 9.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5911972522735596, -0.5745478868484497, -0.5578985214233398, -0.54124915599823, -0.5245997905731201, -0.5079503655433655, -0.4913010001182556, -0.47465163469314575, -0.4580022692680359, -0.441352903842926, -0.42470353841781616, -0.4080541431903839, -0.39140477776527405, -0.3747554123401642, -0.35810601711273193, -0.34145665168762207, -0.3248072862625122, -0.30815792083740234, -0.2915085554122925, -0.27485916018486023, -0.25820979475975037, -0.2415604293346405, -0.22491104900836945, -0.2082616686820984, -0.19161230325698853, -0.17496293783187866, -0.1583135575056076, -0.14166417717933655, -0.12501481175422668, -0.10836543887853622, -0.09171606600284576, -0.0750666931271553, -0.058417320251464844, -0.041767947375774384, -0.025118574500083923, -0.008469201624393463, 0.008180171251296997, 0.024829544126987457, 0.04147891700267792, 0.05812828987836838, 0.07477766275405884, 0.0914270356297493, 0.10807640850543976, 0.12472578138113022, 0.14137515425682068, 0.15802451968193054, 0.1746739000082016, 0.19132328033447266, 0.20797264575958252, 0.22462201118469238, 0.24127139151096344, 0.2579207718372345, 0.27457013726234436, 0.2912195026874542, 0.3078688979148865, 0.32451826333999634, 0.3411676287651062, 0.35781699419021606, 0.3744663596153259, 0.3911157548427582, 0.40776512026786804, 0.4244144856929779, 0.44106388092041016, 0.45771324634552, 0.4743626117706299]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 8.0, 18.0, 16.0, 20.0, 25.0, 42.0, 57.0, 100.0, 123.0, 196.0, 343.0, 512.0, 1026.0, 2669.0, 10041.0, 58214.0, 502696.0, 411339.0, 47828.0, 8637.0, 2377.0, 913.0, 485.0, 276.0, 199.0, 113.0, 78.0, 69.0, 30.0, 29.0, 21.0, 12.0, 7.0, 4.0, 9.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.42995452880859375, -0.4160614013671875, -0.40216827392578125, -0.388275146484375, -0.37438201904296875, -0.3604888916015625, -0.34659576416015625, -0.33270263671875, -0.31880950927734375, -0.3049163818359375, -0.29102325439453125, -0.277130126953125, -0.26323699951171875, -0.2493438720703125, -0.23545074462890625, -0.2215576171875, -0.20766448974609375, -0.1937713623046875, -0.17987823486328125, -0.165985107421875, -0.15209197998046875, -0.1381988525390625, -0.12430572509765625, -0.11041259765625, -0.09651947021484375, -0.0826263427734375, -0.06873321533203125, -0.054840087890625, -0.04094696044921875, -0.0270538330078125, -0.01316070556640625, 0.000732421875, 0.01462554931640625, 0.0285186767578125, 0.04241180419921875, 0.056304931640625, 0.07019805908203125, 0.0840911865234375, 0.09798431396484375, 0.11187744140625, 0.12577056884765625, 0.1396636962890625, 0.15355682373046875, 0.167449951171875, 0.18134307861328125, 0.1952362060546875, 0.20912933349609375, 0.2230224609375, 0.23691558837890625, 0.2508087158203125, 0.26470184326171875, 0.278594970703125, 0.29248809814453125, 0.3063812255859375, 0.32027435302734375, 0.33416748046875, 0.34806060791015625, 0.3619537353515625, 0.37584686279296875, 0.389739990234375, 0.40363311767578125, 0.4175262451171875, 0.43141937255859375, 0.4453125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 37.0, 113.0, 222.0, 302.0, 187.0, 100.0, 22.0, 12.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380126953125, -0.36994171142578125, -0.3597564697265625, -0.34957122802734375, -0.339385986328125, -0.32920074462890625, -0.3190155029296875, -0.30883026123046875, -0.29864501953125, -0.28845977783203125, -0.2782745361328125, -0.26808929443359375, -0.257904052734375, -0.24771881103515625, -0.2375335693359375, -0.22734832763671875, -0.2171630859375, -0.20697784423828125, -0.1967926025390625, -0.18660736083984375, -0.176422119140625, -0.16623687744140625, -0.1560516357421875, -0.14586639404296875, -0.13568115234375, -0.12549591064453125, -0.1153106689453125, -0.10512542724609375, -0.094940185546875, -0.08475494384765625, -0.0745697021484375, -0.06438446044921875, -0.05419921875, -0.04401397705078125, -0.0338287353515625, -0.02364349365234375, -0.013458251953125, -0.00327301025390625, 0.0069122314453125, 0.01709747314453125, 0.02728271484375, 0.03746795654296875, 0.0476531982421875, 0.05783843994140625, 0.068023681640625, 0.07820892333984375, 0.0883941650390625, 0.09857940673828125, 0.1087646484375, 0.11894989013671875, 0.1291351318359375, 0.13932037353515625, 0.149505615234375, 0.15969085693359375, 0.1698760986328125, 0.18006134033203125, 0.19024658203125, 0.20043182373046875, 0.2106170654296875, 0.22080230712890625, 0.230987548828125, 0.24117279052734375, 0.2513580322265625, 0.26154327392578125, 0.271728515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 7.0, 6.0, 6.0, 10.0, 12.0, 14.0, 26.0, 34.0, 62.0, 82.0, 148.0, 278.0, 554.0, 1221.0, 2550.0, 5862.0, 12948.0, 28933.0, 62966.0, 138501.0, 280034.0, 271735.0, 132381.0, 59785.0, 27691.0, 12454.0, 5539.0, 2429.0, 1116.0, 493.0, 279.0, 146.0, 78.0, 51.0, 37.0, 32.0, 18.0, 12.0, 6.0, 3.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16512298583984375, -0.1599578857421875, -0.15479278564453125, -0.149627685546875, -0.14446258544921875, -0.1392974853515625, -0.13413238525390625, -0.12896728515625, -0.12380218505859375, -0.1186370849609375, -0.11347198486328125, -0.108306884765625, -0.10314178466796875, -0.0979766845703125, -0.09281158447265625, -0.087646484375, -0.08248138427734375, -0.0773162841796875, -0.07215118408203125, -0.066986083984375, -0.06182098388671875, -0.0566558837890625, -0.05149078369140625, -0.04632568359375, -0.04116058349609375, -0.0359954833984375, -0.03083038330078125, -0.025665283203125, -0.02050018310546875, -0.0153350830078125, -0.01016998291015625, -0.0050048828125, 0.00016021728515625, 0.0053253173828125, 0.01049041748046875, 0.015655517578125, 0.02082061767578125, 0.0259857177734375, 0.03115081787109375, 0.03631591796875, 0.04148101806640625, 0.0466461181640625, 0.05181121826171875, 0.056976318359375, 0.06214141845703125, 0.0673065185546875, 0.07247161865234375, 0.07763671875, 0.08280181884765625, 0.0879669189453125, 0.09313201904296875, 0.098297119140625, 0.10346221923828125, 0.1086273193359375, 0.11379241943359375, 0.11895751953125, 0.12412261962890625, 0.1292877197265625, 0.13445281982421875, 0.139617919921875, 0.14478302001953125, 0.1499481201171875, 0.15511322021484375, 0.1602783203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 11.0, 15.0, 15.0, 19.0, 13.0, 13.0, 23.0, 34.0, 26.0, 27.0, 37.0, 39.0, 43.0, 34.0, 41.0, 56.0, 41.0, 46.0, 44.0, 33.0, 35.0, 32.0, 29.0, 31.0, 28.0, 27.0, 32.0, 19.0, 26.0, 18.0, 24.0, 17.0, 8.0, 9.0, 11.0, 7.0, 6.0, 5.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.15185546875, -0.14703369140625, -0.1422119140625, -0.13739013671875, -0.132568359375, -0.12774658203125, -0.1229248046875, -0.11810302734375, -0.11328125, -0.10845947265625, -0.1036376953125, -0.09881591796875, -0.093994140625, -0.08917236328125, -0.0843505859375, -0.07952880859375, -0.07470703125, -0.06988525390625, -0.0650634765625, -0.06024169921875, -0.055419921875, -0.05059814453125, -0.0457763671875, -0.04095458984375, -0.0361328125, -0.03131103515625, -0.0264892578125, -0.02166748046875, -0.016845703125, -0.01202392578125, -0.0072021484375, -0.00238037109375, 0.00244140625, 0.00726318359375, 0.0120849609375, 0.01690673828125, 0.021728515625, 0.02655029296875, 0.0313720703125, 0.03619384765625, 0.041015625, 0.04583740234375, 0.0506591796875, 0.05548095703125, 0.060302734375, 0.06512451171875, 0.0699462890625, 0.07476806640625, 0.07958984375, 0.08441162109375, 0.0892333984375, 0.09405517578125, 0.098876953125, 0.10369873046875, 0.1085205078125, 0.11334228515625, 0.1181640625, 0.12298583984375, 0.1278076171875, 0.13262939453125, 0.137451171875, 0.14227294921875, 0.1470947265625, 0.15191650390625, 0.15673828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 11.0, 14.0, 22.0, 28.0, 41.0, 91.0, 127.0, 171.0, 281.0, 390.0, 698.0, 1060.0, 1798.0, 3261.0, 6050.0, 12099.0, 25353.0, 54155.0, 113211.0, 199538.0, 246108.0, 187351.0, 101899.0, 48656.0, 22455.0, 10848.0, 5568.0, 2908.0, 1631.0, 964.0, 639.0, 374.0, 250.0, 165.0, 113.0, 64.0, 53.0, 30.0, 27.0, 16.0, 13.0, 11.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.060516357421875, -0.05865001678466797, -0.05678367614746094, -0.054917335510253906, -0.053050994873046875, -0.051184654235839844, -0.04931831359863281, -0.04745197296142578, -0.04558563232421875, -0.04371929168701172, -0.04185295104980469, -0.039986610412597656, -0.038120269775390625, -0.036253929138183594, -0.03438758850097656, -0.03252124786376953, -0.0306549072265625, -0.02878856658935547, -0.026922225952148438, -0.025055885314941406, -0.023189544677734375, -0.021323204040527344, -0.019456863403320312, -0.01759052276611328, -0.01572418212890625, -0.013857841491699219, -0.011991500854492188, -0.010125160217285156, -0.008258819580078125, -0.006392478942871094, -0.0045261383056640625, -0.0026597976684570312, -0.00079345703125, 0.0010728836059570312, 0.0029392242431640625, 0.004805564880371094, 0.006671905517578125, 0.008538246154785156, 0.010404586791992188, 0.012270927429199219, 0.01413726806640625, 0.01600360870361328, 0.017869949340820312, 0.019736289978027344, 0.021602630615234375, 0.023468971252441406, 0.025335311889648438, 0.02720165252685547, 0.0290679931640625, 0.03093433380126953, 0.03280067443847656, 0.034667015075683594, 0.036533355712890625, 0.038399696350097656, 0.04026603698730469, 0.04213237762451172, 0.04399871826171875, 0.04586505889892578, 0.04773139953613281, 0.049597740173339844, 0.051464080810546875, 0.053330421447753906, 0.05519676208496094, 0.05706310272216797, 0.058929443359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 7.0, 7.0, 10.0, 12.0, 16.0, 16.0, 15.0, 24.0, 27.0, 41.0, 57.0, 49.0, 64.0, 74.0, 88.0, 68.0, 71.0, 80.0, 66.0, 42.0, 20.0, 22.0, 25.0, 13.0, 14.0, 11.0, 6.0, 6.0, 6.0, 6.0, 3.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9371509552001953e-05, -1.8790364265441895e-05, -1.8209218978881836e-05, -1.7628073692321777e-05, -1.704692840576172e-05, -1.646578311920166e-05, -1.58846378326416e-05, -1.5303492546081543e-05, -1.4722347259521484e-05, -1.4141201972961426e-05, -1.3560056686401367e-05, -1.2978911399841309e-05, -1.239776611328125e-05, -1.1816620826721191e-05, -1.1235475540161133e-05, -1.0654330253601074e-05, -1.0073184967041016e-05, -9.492039680480957e-06, -8.910894393920898e-06, -8.32974910736084e-06, -7.748603820800781e-06, -7.167458534240723e-06, -6.586313247680664e-06, -6.0051679611206055e-06, -5.424022674560547e-06, -4.842877388000488e-06, -4.26173210144043e-06, -3.680586814880371e-06, -3.0994415283203125e-06, -2.518296241760254e-06, -1.9371509552001953e-06, -1.3560056686401367e-06, -7.748603820800781e-07, -1.9371509552001953e-07, 3.8743019104003906e-07, 9.685754776000977e-07, 1.5497207641601562e-06, 2.130866050720215e-06, 2.7120113372802734e-06, 3.293156623840332e-06, 3.874301910400391e-06, 4.455447196960449e-06, 5.036592483520508e-06, 5.617737770080566e-06, 6.198883056640625e-06, 6.780028343200684e-06, 7.361173629760742e-06, 7.9423189163208e-06, 8.52346420288086e-06, 9.104609489440918e-06, 9.685754776000977e-06, 1.0266900062561035e-05, 1.0848045349121094e-05, 1.1429190635681152e-05, 1.2010335922241211e-05, 1.259148120880127e-05, 1.3172626495361328e-05, 1.3753771781921387e-05, 1.4334917068481445e-05, 1.4916062355041504e-05, 1.5497207641601562e-05, 1.607835292816162e-05, 1.665949821472168e-05, 1.7240643501281738e-05, 1.7821788787841797e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 13.0, 7.0, 17.0, 21.0, 37.0, 68.0, 102.0, 140.0, 292.0, 428.0, 818.0, 1547.0, 2777.0, 5486.0, 11057.0, 23009.0, 50710.0, 110552.0, 209134.0, 263744.0, 189015.0, 95459.0, 43828.0, 20201.0, 9630.0, 4675.0, 2561.0, 1390.0, 720.0, 448.0, 269.0, 143.0, 101.0, 49.0, 40.0, 19.0, 13.0, 3.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.049957275390625, -0.04813432693481445, -0.046311378479003906, -0.04448843002319336, -0.04266548156738281, -0.040842533111572266, -0.03901958465576172, -0.03719663619995117, -0.035373687744140625, -0.03355073928833008, -0.03172779083251953, -0.029904842376708984, -0.028081893920898438, -0.02625894546508789, -0.024435997009277344, -0.022613048553466797, -0.02079010009765625, -0.018967151641845703, -0.017144203186035156, -0.01532125473022461, -0.013498306274414062, -0.011675357818603516, -0.009852409362792969, -0.008029460906982422, -0.006206512451171875, -0.004383563995361328, -0.0025606155395507812, -0.0007376670837402344, 0.0010852813720703125, 0.0029082298278808594, 0.004731178283691406, 0.006554126739501953, 0.0083770751953125, 0.010200023651123047, 0.012022972106933594, 0.01384592056274414, 0.015668869018554688, 0.017491817474365234, 0.01931476593017578, 0.021137714385986328, 0.022960662841796875, 0.024783611297607422, 0.02660655975341797, 0.028429508209228516, 0.030252456665039062, 0.03207540512084961, 0.033898353576660156, 0.0357213020324707, 0.03754425048828125, 0.0393671989440918, 0.041190147399902344, 0.04301309585571289, 0.04483604431152344, 0.046658992767333984, 0.04848194122314453, 0.05030488967895508, 0.052127838134765625, 0.05395078659057617, 0.05577373504638672, 0.057596683502197266, 0.05941963195800781, 0.06124258041381836, 0.0630655288696289, 0.06488847732543945, 0.06671142578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 5.0, 3.0, 8.0, 14.0, 15.0, 15.0, 24.0, 16.0, 26.0, 37.0, 44.0, 37.0, 42.0, 60.0, 48.0, 52.0, 64.0, 53.0, 49.0, 45.0, 52.0, 49.0, 26.0, 39.0, 32.0, 24.0, 19.0, 17.0, 14.0, 9.0, 10.0, 5.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056304931640625, -0.05462503433227539, -0.05294513702392578, -0.05126523971557617, -0.04958534240722656, -0.04790544509887695, -0.046225547790527344, -0.044545650482177734, -0.042865753173828125, -0.041185855865478516, -0.039505958557128906, -0.0378260612487793, -0.03614616394042969, -0.03446626663208008, -0.03278636932373047, -0.03110647201538086, -0.02942657470703125, -0.02774667739868164, -0.02606678009033203, -0.024386882781982422, -0.022706985473632812, -0.021027088165283203, -0.019347190856933594, -0.017667293548583984, -0.015987396240234375, -0.014307498931884766, -0.012627601623535156, -0.010947704315185547, -0.009267807006835938, -0.007587909698486328, -0.005908012390136719, -0.004228115081787109, -0.0025482177734375, -0.0008683204650878906, 0.0008115768432617188, 0.002491474151611328, 0.0041713714599609375, 0.005851268768310547, 0.007531166076660156, 0.009211063385009766, 0.010890960693359375, 0.012570858001708984, 0.014250755310058594, 0.015930652618408203, 0.017610549926757812, 0.019290447235107422, 0.02097034454345703, 0.02265024185180664, 0.02433013916015625, 0.02601003646850586, 0.02768993377685547, 0.029369831085205078, 0.031049728393554688, 0.0327296257019043, 0.034409523010253906, 0.036089420318603516, 0.037769317626953125, 0.039449214935302734, 0.041129112243652344, 0.04280900955200195, 0.04448890686035156, 0.04616880416870117, 0.04784870147705078, 0.04952859878540039, 0.05120849609375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 9.0, 24.0, 47.0, 114.0, 156.0, 201.0, 200.0, 130.0, 62.0, 33.0, 21.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2694859504699707, -1.2220635414123535, -1.1746411323547363, -1.1272187232971191, -1.079796314239502, -1.0323739051818848, -0.9849514365196228, -0.9375290274620056, -0.8901066184043884, -0.8426842093467712, -0.795261800289154, -0.7478393316268921, -0.7004169225692749, -0.6529945135116577, -0.6055721044540405, -0.5581496953964233, -0.5107272863388062, -0.46330487728118896, -0.4158824682235718, -0.3684600293636322, -0.321037620306015, -0.2736152112483978, -0.22619277238845825, -0.17877036333084106, -0.13134795427322388, -0.08392553776502609, -0.03650312125682831, 0.010919302701950073, 0.05834171175956726, 0.10576412081718445, 0.15318655967712402, 0.2006089687347412, 0.2480313777923584, 0.2954537868499756, 0.3428761959075928, 0.39029863476753235, 0.43772104382514954, 0.4851434528827667, 0.5325658917427063, 0.5799883008003235, 0.6274107098579407, 0.6748331189155579, 0.722255527973175, 0.769677996635437, 0.8171004056930542, 0.8645228147506714, 0.9119452238082886, 0.9593676328659058, 1.006790041923523, 1.0542124509811401, 1.1016348600387573, 1.1490572690963745, 1.1964796781539917, 1.2439020872116089, 1.2913246154785156, 1.3387470245361328, 1.38616943359375, 1.4335918426513672, 1.4810142517089844, 1.5284366607666016, 1.5758590698242188, 1.623281478881836, 1.6707038879394531, 1.7181262969970703, 1.7655487060546875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 11.0, 15.0, 13.0, 21.0, 20.0, 25.0, 30.0, 38.0, 41.0, 45.0, 57.0, 45.0, 47.0, 56.0, 53.0, 57.0, 54.0, 51.0, 43.0, 41.0, 36.0, 37.0, 22.0, 21.0, 24.0, 21.0, 12.0, 12.0, 13.0, 9.0, 7.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8182801604270935, -0.795838475227356, -0.7733968496322632, -0.7509551644325256, -0.7285134792327881, -0.7060718536376953, -0.6836301684379578, -0.6611884832382202, -0.6387468576431274, -0.6163051724433899, -0.5938635468482971, -0.5714218616485596, -0.548980176448822, -0.5265384912490845, -0.5040968656539917, -0.48165518045425415, -0.4592134952545166, -0.43677183985710144, -0.4143301546573639, -0.39188849925994873, -0.3694468140602112, -0.347005158662796, -0.32456350326538086, -0.3021218180656433, -0.27968016266822815, -0.257238507270813, -0.23479682207107544, -0.21235516667366028, -0.18991349637508392, -0.16747182607650757, -0.1450301706790924, -0.12258850038051605, -0.1001468300819397, -0.07770515978336334, -0.055263496935367584, -0.032821834087371826, -0.010380163788795471, 0.012061506509780884, 0.034503161907196045, 0.0569448322057724, 0.07938650250434875, 0.10182817280292511, 0.12426983565092087, 0.14671149849891663, 0.16915316879749298, 0.19159483909606934, 0.2140364944934845, 0.23647816479206085, 0.2589198350906372, 0.28136149048805237, 0.3038031756877899, 0.3262448310852051, 0.3486865162849426, 0.3711281716823578, 0.39356982707977295, 0.4160115122795105, 0.43845316767692566, 0.4608948230743408, 0.48333650827407837, 0.5057781934738159, 0.5282198190689087, 0.5506615042686462, 0.5731031894683838, 0.5955448150634766, 0.6179865002632141]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 9.0, 7.0, 13.0, 16.0, 14.0, 18.0, 40.0, 55.0, 101.0, 179.0, 341.0, 829.0, 2711.0, 14427.0, 558776.0, 3565885.0, 43963.0, 4749.0, 1388.0, 387.0, 169.0, 87.0, 56.0, 28.0, 15.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5307464599609375, -0.516082763671875, -0.5014190673828125, -0.48675537109375, -0.4720916748046875, -0.457427978515625, -0.4427642822265625, -0.4281005859375, -0.4134368896484375, -0.398773193359375, -0.3841094970703125, -0.36944580078125, -0.3547821044921875, -0.340118408203125, -0.3254547119140625, -0.310791015625, -0.2961273193359375, -0.281463623046875, -0.2667999267578125, -0.25213623046875, -0.2374725341796875, -0.222808837890625, -0.2081451416015625, -0.1934814453125, -0.1788177490234375, -0.164154052734375, -0.1494903564453125, -0.13482666015625, -0.1201629638671875, -0.105499267578125, -0.0908355712890625, -0.076171875, -0.0615081787109375, -0.046844482421875, -0.0321807861328125, -0.01751708984375, -0.0028533935546875, 0.011810302734375, 0.0264739990234375, 0.0411376953125, 0.0558013916015625, 0.070465087890625, 0.0851287841796875, 0.09979248046875, 0.1144561767578125, 0.129119873046875, 0.1437835693359375, 0.158447265625, 0.1731109619140625, 0.187774658203125, 0.2024383544921875, 0.21710205078125, 0.2317657470703125, 0.246429443359375, 0.2610931396484375, 0.2757568359375, 0.2904205322265625, 0.305084228515625, 0.3197479248046875, 0.33441162109375, 0.3490753173828125, 0.363739013671875, 0.3784027099609375, 0.39306640625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 17.0, 54.0, 134.0, 250.0, 259.0, 163.0, 80.0, 32.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.3670387268066406, -0.35688018798828125, -0.3467216491699219, -0.3365631103515625, -0.3264045715332031, -0.31624603271484375, -0.3060874938964844, -0.295928955078125, -0.2857704162597656, -0.27561187744140625, -0.2654533386230469, -0.2552947998046875, -0.24513626098632812, -0.23497772216796875, -0.22481918334960938, -0.21466064453125, -0.20450210571289062, -0.19434356689453125, -0.18418502807617188, -0.1740264892578125, -0.16386795043945312, -0.15370941162109375, -0.14355087280273438, -0.133392333984375, -0.12323379516601562, -0.11307525634765625, -0.10291671752929688, -0.0927581787109375, -0.08259963989257812, -0.07244110107421875, -0.062282562255859375, -0.0521240234375, -0.041965484619140625, -0.03180694580078125, -0.021648406982421875, -0.0114898681640625, -0.001331329345703125, 0.00882720947265625, 0.018985748291015625, 0.029144287109375, 0.039302825927734375, 0.04946136474609375, 0.059619903564453125, 0.0697784423828125, 0.07993698120117188, 0.09009552001953125, 0.10025405883789062, 0.11041259765625, 0.12057113647460938, 0.13072967529296875, 0.14088821411132812, 0.1510467529296875, 0.16120529174804688, 0.17136383056640625, 0.18152236938476562, 0.191680908203125, 0.20183944702148438, 0.21199798583984375, 0.22215652465820312, 0.2323150634765625, 0.24247360229492188, 0.25263214111328125, 0.2627906799316406, 0.27294921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 7.0, 16.0, 31.0, 20.0, 32.0, 51.0, 57.0, 105.0, 162.0, 430.0, 1579.0, 9203.0, 96157.0, 2182614.0, 1813118.0, 80670.0, 7888.0, 1338.0, 387.0, 159.0, 85.0, 47.0, 35.0, 29.0, 16.0, 8.0, 7.0, 2.0, 4.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29150390625, -0.28266143798828125, -0.2738189697265625, -0.26497650146484375, -0.256134033203125, -0.24729156494140625, -0.2384490966796875, -0.22960662841796875, -0.22076416015625, -0.21192169189453125, -0.2030792236328125, -0.19423675537109375, -0.185394287109375, -0.17655181884765625, -0.1677093505859375, -0.15886688232421875, -0.1500244140625, -0.14118194580078125, -0.1323394775390625, -0.12349700927734375, -0.114654541015625, -0.10581207275390625, -0.0969696044921875, -0.08812713623046875, -0.07928466796875, -0.07044219970703125, -0.0615997314453125, -0.05275726318359375, -0.043914794921875, -0.03507232666015625, -0.0262298583984375, -0.01738739013671875, -0.008544921875, 0.00029754638671875, 0.0091400146484375, 0.01798248291015625, 0.026824951171875, 0.03566741943359375, 0.0445098876953125, 0.05335235595703125, 0.06219482421875, 0.07103729248046875, 0.0798797607421875, 0.08872222900390625, 0.097564697265625, 0.10640716552734375, 0.1152496337890625, 0.12409210205078125, 0.1329345703125, 0.14177703857421875, 0.1506195068359375, 0.15946197509765625, 0.168304443359375, 0.17714691162109375, 0.1859893798828125, 0.19483184814453125, 0.20367431640625, 0.21251678466796875, 0.2213592529296875, 0.23020172119140625, 0.239044189453125, 0.24788665771484375, 0.2567291259765625, 0.26557159423828125, 0.2744140625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 12.0, 17.0, 34.0, 42.0, 64.0, 72.0, 83.0, 149.0, 195.0, 258.0, 349.0, 412.0, 491.0, 437.0, 352.0, 286.0, 199.0, 144.0, 112.0, 77.0, 67.0, 44.0, 35.0, 21.0, 29.0, 13.0, 14.0, 11.0, 8.0, 7.0, 2.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.11700439453125, -0.11350822448730469, -0.11001205444335938, -0.10651588439941406, -0.10301971435546875, -0.09952354431152344, -0.09602737426757812, -0.09253120422363281, -0.0890350341796875, -0.08553886413574219, -0.08204269409179688, -0.07854652404785156, -0.07505035400390625, -0.07155418395996094, -0.06805801391601562, -0.06456184387207031, -0.061065673828125, -0.05756950378417969, -0.054073333740234375, -0.05057716369628906, -0.04708099365234375, -0.04358482360839844, -0.040088653564453125, -0.03659248352050781, -0.0330963134765625, -0.029600143432617188, -0.026103973388671875, -0.022607803344726562, -0.01911163330078125, -0.015615463256835938, -0.012119293212890625, -0.008623123168945312, -0.005126953125, -0.0016307830810546875, 0.001865386962890625, 0.0053615570068359375, 0.00885772705078125, 0.012353897094726562, 0.015850067138671875, 0.019346237182617188, 0.0228424072265625, 0.026338577270507812, 0.029834747314453125, 0.03333091735839844, 0.03682708740234375, 0.04032325744628906, 0.043819427490234375, 0.04731559753417969, 0.050811767578125, 0.05430793762207031, 0.057804107666015625, 0.06130027770996094, 0.06479644775390625, 0.06829261779785156, 0.07178878784179688, 0.07528495788574219, 0.0787811279296875, 0.08227729797363281, 0.08577346801757812, 0.08926963806152344, 0.09276580810546875, 0.09626197814941406, 0.09975814819335938, 0.10325431823730469, 0.10675048828125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 17.0, 41.0, 100.0, 212.0, 250.0, 200.0, 129.0, 43.0, 12.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4067245721817017, -1.3604570627212524, -1.3141895532608032, -1.267922043800354, -1.2216546535491943, -1.1753871440887451, -1.129119634628296, -1.0828521251678467, -1.0365846157073975, -0.9903171062469482, -0.944049596786499, -0.8977821469306946, -0.8515146374702454, -0.8052471280097961, -0.7589796781539917, -0.7127121686935425, -0.6664446592330933, -0.620177149772644, -0.5739096403121948, -0.5276421904563904, -0.48137468099594116, -0.43510717153549194, -0.3888396918773651, -0.3425722122192383, -0.29630470275878906, -0.25003719329833984, -0.203769713640213, -0.157502219080925, -0.11123472452163696, -0.06496722996234894, -0.018699735403060913, 0.027567744255065918, 0.07383513450622559, 0.12010262906551361, 0.16637012362480164, 0.21263761818408966, 0.2589051127433777, 0.3051726222038269, 0.35144010186195374, 0.39770758152008057, 0.4439750909805298, 0.490242600440979, 0.5365101099014282, 0.5827775597572327, 0.6290450692176819, 0.6753125786781311, 0.7215800285339355, 0.7678475379943848, 0.814115047454834, 0.8603825569152832, 0.9066500663757324, 0.9529175162315369, 0.9991850256919861, 1.0454524755477905, 1.0917199850082397, 1.137987494468689, 1.1842550039291382, 1.2305225133895874, 1.2767900228500366, 1.3230575323104858, 1.3693249225616455, 1.4155924320220947, 1.461859941482544, 1.5081274509429932, 1.5543949604034424]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 11.0, 10.0, 14.0, 10.0, 14.0, 23.0, 23.0, 30.0, 25.0, 30.0, 27.0, 36.0, 37.0, 40.0, 43.0, 28.0, 29.0, 41.0, 56.0, 52.0, 53.0, 34.0, 45.0, 35.0, 30.0, 24.0, 26.0, 22.0, 21.0, 12.0, 22.0, 13.0, 11.0, 19.0, 6.0, 5.0, 5.0, 4.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.34487593173980713, -0.33303433656692505, -0.3211927115917206, -0.3093510866165161, -0.29750949144363403, -0.28566789627075195, -0.2738262712955475, -0.261984646320343, -0.25014305114746094, -0.23830144107341766, -0.2264598309993744, -0.21461822092533112, -0.20277661085128784, -0.19093500077724457, -0.1790933907032013, -0.16725178062915802, -0.15541017055511475, -0.14356856048107147, -0.1317269504070282, -0.11988534033298492, -0.10804373025894165, -0.09620212018489838, -0.0843605101108551, -0.07251890003681183, -0.060677289962768555, -0.04883567988872528, -0.03699406981468201, -0.025152459740638733, -0.013310849666595459, -0.001469239592552185, 0.010372370481491089, 0.022213980555534363, 0.03405559062957764, 0.04589720070362091, 0.057738810777664185, 0.06958042085170746, 0.08142203092575073, 0.093263640999794, 0.10510525107383728, 0.11694686114788055, 0.12878847122192383, 0.1406300812959671, 0.15247169137001038, 0.16431330144405365, 0.17615491151809692, 0.1879965215921402, 0.19983813166618347, 0.21167974174022675, 0.22352135181427002, 0.2353629618883133, 0.24720457196235657, 0.25904619693756104, 0.2708877921104431, 0.2827293872833252, 0.29457101225852966, 0.30641263723373413, 0.3182542324066162, 0.3300958275794983, 0.34193745255470276, 0.3537790775299072, 0.3656206727027893, 0.3774622678756714, 0.38930389285087585, 0.4011455178260803, 0.4129871129989624]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 10.0, 20.0, 14.0, 21.0, 34.0, 46.0, 65.0, 82.0, 140.0, 206.0, 397.0, 610.0, 1382.0, 3810.0, 14039.0, 76726.0, 491818.0, 385656.0, 56277.0, 11277.0, 3125.0, 1188.0, 561.0, 349.0, 195.0, 130.0, 88.0, 76.0, 58.0, 36.0, 24.0, 11.0, 9.0, 10.0, 8.0, 6.0, 6.0, 9.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.57666015625, -0.55859375, -0.54052734375, -0.5224609375, -0.50439453125, -0.486328125, -0.46826171875, -0.4501953125, -0.43212890625, -0.4140625, -0.39599609375, -0.3779296875, -0.35986328125, -0.341796875, -0.32373046875, -0.3056640625, -0.28759765625, -0.26953125, -0.25146484375, -0.2333984375, -0.21533203125, -0.197265625, -0.17919921875, -0.1611328125, -0.14306640625, -0.125, -0.10693359375, -0.0888671875, -0.07080078125, -0.052734375, -0.03466796875, -0.0166015625, 0.00146484375, 0.01953125, 0.03759765625, 0.0556640625, 0.07373046875, 0.091796875, 0.10986328125, 0.1279296875, 0.14599609375, 0.1640625, 0.18212890625, 0.2001953125, 0.21826171875, 0.236328125, 0.25439453125, 0.2724609375, 0.29052734375, 0.30859375, 0.32666015625, 0.3447265625, 0.36279296875, 0.380859375, 0.39892578125, 0.4169921875, 0.43505859375, 0.453125, 0.47119140625, 0.4892578125, 0.50732421875, 0.525390625, 0.54345703125, 0.5615234375, 0.57958984375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 12.0, 55.0, 134.0, 252.0, 269.0, 168.0, 72.0, 32.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38671875, -0.37630462646484375, -0.3658905029296875, -0.35547637939453125, -0.345062255859375, -0.33464813232421875, -0.3242340087890625, -0.31381988525390625, -0.30340576171875, -0.29299163818359375, -0.2825775146484375, -0.27216339111328125, -0.261749267578125, -0.25133514404296875, -0.2409210205078125, -0.23050689697265625, -0.2200927734375, -0.20967864990234375, -0.1992645263671875, -0.18885040283203125, -0.178436279296875, -0.16802215576171875, -0.1576080322265625, -0.14719390869140625, -0.13677978515625, -0.12636566162109375, -0.1159515380859375, -0.10553741455078125, -0.095123291015625, -0.08470916748046875, -0.0742950439453125, -0.06388092041015625, -0.053466796875, -0.04305267333984375, -0.0326385498046875, -0.02222442626953125, -0.011810302734375, -0.00139617919921875, 0.0090179443359375, 0.01943206787109375, 0.02984619140625, 0.04026031494140625, 0.0506744384765625, 0.06108856201171875, 0.071502685546875, 0.08191680908203125, 0.0923309326171875, 0.10274505615234375, 0.1131591796875, 0.12357330322265625, 0.1339874267578125, 0.14440155029296875, 0.154815673828125, 0.16522979736328125, 0.1756439208984375, 0.18605804443359375, 0.19647216796875, 0.20688629150390625, 0.2173004150390625, 0.22771453857421875, 0.238128662109375, 0.24854278564453125, 0.2589569091796875, 0.26937103271484375, 0.27978515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 1.0, 9.0, 7.0, 12.0, 17.0, 26.0, 33.0, 65.0, 123.0, 199.0, 397.0, 877.0, 2027.0, 5887.0, 17714.0, 59275.0, 184625.0, 381048.0, 263777.0, 91045.0, 27478.0, 8603.0, 3036.0, 1183.0, 520.0, 238.0, 117.0, 76.0, 47.0, 28.0, 16.0, 9.0, 14.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.280975341796875, -0.27117919921875, -0.261383056640625, -0.2515869140625, -0.241790771484375, -0.23199462890625, -0.222198486328125, -0.21240234375, -0.202606201171875, -0.19281005859375, -0.183013916015625, -0.1732177734375, -0.163421630859375, -0.15362548828125, -0.143829345703125, -0.134033203125, -0.124237060546875, -0.11444091796875, -0.104644775390625, -0.0948486328125, -0.085052490234375, -0.07525634765625, -0.065460205078125, -0.0556640625, -0.045867919921875, -0.03607177734375, -0.026275634765625, -0.0164794921875, -0.006683349609375, 0.00311279296875, 0.012908935546875, 0.022705078125, 0.032501220703125, 0.04229736328125, 0.052093505859375, 0.0618896484375, 0.071685791015625, 0.08148193359375, 0.091278076171875, 0.10107421875, 0.110870361328125, 0.12066650390625, 0.130462646484375, 0.1402587890625, 0.150054931640625, 0.15985107421875, 0.169647216796875, 0.179443359375, 0.189239501953125, 0.19903564453125, 0.208831787109375, 0.2186279296875, 0.228424072265625, 0.23822021484375, 0.248016357421875, 0.2578125, 0.267608642578125, 0.27740478515625, 0.287200927734375, 0.2969970703125, 0.306793212890625, 0.31658935546875, 0.326385498046875, 0.336181640625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 9.0, 15.0, 9.0, 10.0, 11.0, 14.0, 14.0, 25.0, 32.0, 35.0, 26.0, 33.0, 33.0, 42.0, 39.0, 40.0, 45.0, 43.0, 41.0, 41.0, 47.0, 39.0, 41.0, 32.0, 33.0, 34.0, 33.0, 21.0, 20.0, 22.0, 9.0, 22.0, 15.0, 12.0, 7.0, 10.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.18836402893066406, -0.18190383911132812, -0.1754436492919922, -0.16898345947265625, -0.1625232696533203, -0.15606307983398438, -0.14960289001464844, -0.1431427001953125, -0.13668251037597656, -0.13022232055664062, -0.12376213073730469, -0.11730194091796875, -0.11084175109863281, -0.10438156127929688, -0.09792137145996094, -0.091461181640625, -0.08500099182128906, -0.07854080200195312, -0.07208061218261719, -0.06562042236328125, -0.05916023254394531, -0.052700042724609375, -0.04623985290527344, -0.0397796630859375, -0.03331947326660156, -0.026859283447265625, -0.020399093627929688, -0.01393890380859375, -0.0074787139892578125, -0.001018524169921875, 0.0054416656494140625, 0.01190185546875, 0.018362045288085938, 0.024822235107421875, 0.03128242492675781, 0.03774261474609375, 0.04420280456542969, 0.050662994384765625, 0.05712318420410156, 0.0635833740234375, 0.07004356384277344, 0.07650375366210938, 0.08296394348144531, 0.08942413330078125, 0.09588432312011719, 0.10234451293945312, 0.10880470275878906, 0.115264892578125, 0.12172508239746094, 0.12818527221679688, 0.1346454620361328, 0.14110565185546875, 0.1475658416748047, 0.15402603149414062, 0.16048622131347656, 0.1669464111328125, 0.17340660095214844, 0.17986679077148438, 0.1863269805908203, 0.19278717041015625, 0.1992473602294922, 0.20570755004882812, 0.21216773986816406, 0.2186279296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 10.0, 15.0, 35.0, 51.0, 86.0, 134.0, 246.0, 411.0, 689.0, 1341.0, 2434.0, 5128.0, 10768.0, 25874.0, 66325.0, 171859.0, 320503.0, 257429.0, 110847.0, 42294.0, 17017.0, 7443.0, 3607.0, 1735.0, 966.0, 561.0, 307.0, 176.0, 105.0, 53.0, 40.0, 24.0, 19.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.14208984375, -0.13851642608642578, -0.13494300842285156, -0.13136959075927734, -0.12779617309570312, -0.1242227554321289, -0.12064933776855469, -0.11707592010498047, -0.11350250244140625, -0.10992908477783203, -0.10635566711425781, -0.1027822494506836, -0.09920883178710938, -0.09563541412353516, -0.09206199645996094, -0.08848857879638672, -0.0849151611328125, -0.08134174346923828, -0.07776832580566406, -0.07419490814208984, -0.07062149047851562, -0.0670480728149414, -0.06347465515136719, -0.05990123748779297, -0.05632781982421875, -0.05275440216064453, -0.04918098449707031, -0.045607566833496094, -0.042034149169921875, -0.038460731506347656, -0.03488731384277344, -0.03131389617919922, -0.027740478515625, -0.02416706085205078, -0.020593643188476562, -0.017020225524902344, -0.013446807861328125, -0.009873390197753906, -0.0062999725341796875, -0.0027265548706054688, 0.00084686279296875, 0.004420280456542969, 0.007993698120117188, 0.011567115783691406, 0.015140533447265625, 0.018713951110839844, 0.022287368774414062, 0.02586078643798828, 0.0294342041015625, 0.03300762176513672, 0.03658103942871094, 0.040154457092285156, 0.043727874755859375, 0.047301292419433594, 0.05087471008300781, 0.05444812774658203, 0.05802154541015625, 0.06159496307373047, 0.06516838073730469, 0.0687417984008789, 0.07231521606445312, 0.07588863372802734, 0.07946205139160156, 0.08303546905517578, 0.08660888671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 9.0, 14.0, 17.0, 18.0, 24.0, 16.0, 34.0, 33.0, 41.0, 51.0, 80.0, 76.0, 83.0, 54.0, 65.0, 62.0, 54.0, 33.0, 46.0, 30.0, 28.0, 26.0, 14.0, 14.0, 12.0, 9.0, 6.0, 2.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4378299713134766e-05, -2.3633241653442383e-05, -2.288818359375e-05, -2.2143125534057617e-05, -2.1398067474365234e-05, -2.065300941467285e-05, -1.990795135498047e-05, -1.9162893295288086e-05, -1.8417835235595703e-05, -1.767277717590332e-05, -1.6927719116210938e-05, -1.6182661056518555e-05, -1.5437602996826172e-05, -1.4692544937133789e-05, -1.3947486877441406e-05, -1.3202428817749023e-05, -1.245737075805664e-05, -1.1712312698364258e-05, -1.0967254638671875e-05, -1.0222196578979492e-05, -9.47713851928711e-06, -8.732080459594727e-06, -7.987022399902344e-06, -7.241964340209961e-06, -6.496906280517578e-06, -5.751848220825195e-06, -5.0067901611328125e-06, -4.26173210144043e-06, -3.516674041748047e-06, -2.771615982055664e-06, -2.0265579223632812e-06, -1.2814998626708984e-06, -5.364418029785156e-07, 2.086162567138672e-07, 9.5367431640625e-07, 1.6987323760986328e-06, 2.4437904357910156e-06, 3.1888484954833984e-06, 3.933906555175781e-06, 4.678964614868164e-06, 5.424022674560547e-06, 6.16908073425293e-06, 6.9141387939453125e-06, 7.659196853637695e-06, 8.404254913330078e-06, 9.149312973022461e-06, 9.894371032714844e-06, 1.0639429092407227e-05, 1.138448715209961e-05, 1.2129545211791992e-05, 1.2874603271484375e-05, 1.3619661331176758e-05, 1.436471939086914e-05, 1.5109777450561523e-05, 1.5854835510253906e-05, 1.659989356994629e-05, 1.7344951629638672e-05, 1.8090009689331055e-05, 1.8835067749023438e-05, 1.958012580871582e-05, 2.0325183868408203e-05, 2.1070241928100586e-05, 2.181529998779297e-05, 2.256035804748535e-05, 2.3305416107177734e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 16.0, 25.0, 32.0, 50.0, 76.0, 124.0, 202.0, 342.0, 659.0, 1237.0, 2524.0, 5320.0, 11579.0, 28971.0, 78085.0, 213983.0, 361875.0, 214313.0, 78409.0, 28613.0, 11625.0, 5270.0, 2437.0, 1233.0, 626.0, 334.0, 212.0, 122.0, 86.0, 48.0, 33.0, 17.0, 16.0, 10.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.13525390625, -0.13144397735595703, -0.12763404846191406, -0.1238241195678711, -0.12001419067382812, -0.11620426177978516, -0.11239433288574219, -0.10858440399169922, -0.10477447509765625, -0.10096454620361328, -0.09715461730957031, -0.09334468841552734, -0.08953475952148438, -0.0857248306274414, -0.08191490173339844, -0.07810497283935547, -0.0742950439453125, -0.07048511505126953, -0.06667518615722656, -0.0628652572631836, -0.059055328369140625, -0.055245399475097656, -0.05143547058105469, -0.04762554168701172, -0.04381561279296875, -0.04000568389892578, -0.03619575500488281, -0.032385826110839844, -0.028575897216796875, -0.024765968322753906, -0.020956039428710938, -0.01714611053466797, -0.013336181640625, -0.009526252746582031, -0.0057163238525390625, -0.0019063949584960938, 0.001903533935546875, 0.005713462829589844, 0.009523391723632812, 0.013333320617675781, 0.01714324951171875, 0.02095317840576172, 0.024763107299804688, 0.028573036193847656, 0.032382965087890625, 0.036192893981933594, 0.04000282287597656, 0.04381275177001953, 0.0476226806640625, 0.05143260955810547, 0.05524253845214844, 0.059052467346191406, 0.06286239624023438, 0.06667232513427734, 0.07048225402832031, 0.07429218292236328, 0.07810211181640625, 0.08191204071044922, 0.08572196960449219, 0.08953189849853516, 0.09334182739257812, 0.0971517562866211, 0.10096168518066406, 0.10477161407470703, 0.10858154296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 10.0, 12.0, 8.0, 20.0, 20.0, 32.0, 38.0, 39.0, 69.0, 66.0, 68.0, 86.0, 71.0, 68.0, 87.0, 63.0, 56.0, 38.0, 25.0, 25.0, 24.0, 15.0, 10.0, 11.0, 7.0, 5.0, 5.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0986328125, -0.09517383575439453, -0.09171485900878906, -0.0882558822631836, -0.08479690551757812, -0.08133792877197266, -0.07787895202636719, -0.07441997528076172, -0.07096099853515625, -0.06750202178955078, -0.06404304504394531, -0.060584068298339844, -0.057125091552734375, -0.053666114807128906, -0.05020713806152344, -0.04674816131591797, -0.0432891845703125, -0.03983020782470703, -0.03637123107910156, -0.032912254333496094, -0.029453277587890625, -0.025994300842285156, -0.022535324096679688, -0.01907634735107422, -0.01561737060546875, -0.012158393859863281, -0.008699417114257812, -0.005240440368652344, -0.001781463623046875, 0.0016775131225585938, 0.0051364898681640625, 0.008595466613769531, 0.012054443359375, 0.015513420104980469, 0.018972396850585938, 0.022431373596191406, 0.025890350341796875, 0.029349327087402344, 0.03280830383300781, 0.03626728057861328, 0.03972625732421875, 0.04318523406982422, 0.04664421081542969, 0.050103187561035156, 0.053562164306640625, 0.057021141052246094, 0.06048011779785156, 0.06393909454345703, 0.0673980712890625, 0.07085704803466797, 0.07431602478027344, 0.0777750015258789, 0.08123397827148438, 0.08469295501708984, 0.08815193176269531, 0.09161090850830078, 0.09506988525390625, 0.09852886199951172, 0.10198783874511719, 0.10544681549072266, 0.10890579223632812, 0.1123647689819336, 0.11582374572753906, 0.11928272247314453, 0.12274169921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 13.0, 23.0, 69.0, 97.0, 136.0, 195.0, 173.0, 124.0, 81.0, 49.0, 19.0, 12.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.255275845527649, -1.1950390338897705, -1.1348023414611816, -1.0745655298233032, -1.0143287181854248, -0.9540919065475464, -0.8938551545143127, -0.8336184024810791, -0.7733815908432007, -0.7131447792053223, -0.6529080271720886, -0.592671275138855, -0.5324344635009766, -0.47219768166542053, -0.4119608998298645, -0.35172411799430847, -0.29148733615875244, -0.2312505543231964, -0.17101377248764038, -0.11077699065208435, -0.05054020881652832, 0.00969657301902771, 0.06993335485458374, 0.13017013669013977, 0.1904069185256958, 0.25064370036125183, 0.31088048219680786, 0.3711172640323639, 0.4313540458679199, 0.49159082770347595, 0.551827609539032, 0.6120643615722656, 0.6723012924194336, 0.732538104057312, 0.7927748560905457, 0.8530116081237793, 0.9132484197616577, 0.9734852313995361, 1.033721923828125, 1.0939587354660034, 1.1541955471038818, 1.2144323587417603, 1.2746691703796387, 1.3349058628082275, 1.395142674446106, 1.4553794860839844, 1.5156161785125732, 1.5758529901504517, 1.63608980178833, 1.6963266134262085, 1.756563425064087, 1.8168001174926758, 1.8770369291305542, 1.9372737407684326, 1.9975104331970215, 2.0577473640441895, 2.1179840564727783, 2.178220748901367, 2.238457679748535, 2.298694372177124, 2.358931064605713, 2.419167995452881, 2.4794046878814697, 2.5396416187286377, 2.5998783111572266]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 19.0, 16.0, 27.0, 35.0, 28.0, 34.0, 53.0, 58.0, 40.0, 47.0, 50.0, 50.0, 72.0, 61.0, 54.0, 63.0, 56.0, 37.0, 44.0, 31.0, 26.0, 19.0, 12.0, 16.0, 5.0, 14.0, 5.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1224405765533447, -1.0854933261871338, -1.0485460758209229, -1.011598825454712, -0.974651575088501, -0.93770432472229, -0.9007571339607239, -0.8638098835945129, -0.826862633228302, -0.7899153828620911, -0.7529681324958801, -0.7160208821296692, -0.679073691368103, -0.6421264410018921, -0.6051791906356812, -0.5682319402694702, -0.5312846899032593, -0.49433743953704834, -0.4573901891708374, -0.42044296860694885, -0.3834957182407379, -0.346548467874527, -0.3096012473106384, -0.2726539969444275, -0.23570674657821655, -0.19875949621200562, -0.16181226074695587, -0.12486501783132553, -0.08791777491569519, -0.05097052454948425, -0.01402328908443451, 0.022923946380615234, 0.05987119674682617, 0.09681843966245651, 0.13376568257808685, 0.1707129180431366, 0.20766016840934753, 0.24460741877555847, 0.281554639339447, 0.31850188970565796, 0.3554491400718689, 0.39239639043807983, 0.42934364080429077, 0.4662908613681793, 0.5032380819320679, 0.5401853322982788, 0.5771325826644897, 0.6140798330307007, 0.6510270833969116, 0.6879743337631226, 0.7249215841293335, 0.7618688344955444, 0.7988160848617554, 0.8357633352279663, 0.8727105259895325, 0.9096577763557434, 0.9466050267219543, 0.9835522770881653, 1.0204994678497314, 1.0574467182159424, 1.0943939685821533, 1.1313412189483643, 1.1682884693145752, 1.2052357196807861, 1.242182970046997]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 12.0, 28.0, 63.0, 116.0, 281.0, 816.0, 4180.0, 66592.0, 4017751.0, 98212.0, 4909.0, 943.0, 202.0, 92.0, 42.0, 18.0, 11.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.6829299926757812, -0.6637115478515625, -0.6444931030273438, -0.625274658203125, -0.6060562133789062, -0.5868377685546875, -0.5676193237304688, -0.54840087890625, -0.5291824340820312, -0.5099639892578125, -0.49074554443359375, -0.471527099609375, -0.45230865478515625, -0.4330902099609375, -0.41387176513671875, -0.3946533203125, -0.37543487548828125, -0.3562164306640625, -0.33699798583984375, -0.317779541015625, -0.29856109619140625, -0.2793426513671875, -0.26012420654296875, -0.24090576171875, -0.22168731689453125, -0.2024688720703125, -0.18325042724609375, -0.164031982421875, -0.14481353759765625, -0.1255950927734375, -0.10637664794921875, -0.087158203125, -0.06793975830078125, -0.0487213134765625, -0.02950286865234375, -0.010284423828125, 0.00893402099609375, 0.0281524658203125, 0.04737091064453125, 0.06658935546875, 0.08580780029296875, 0.1050262451171875, 0.12424468994140625, 0.143463134765625, 0.16268157958984375, 0.1819000244140625, 0.20111846923828125, 0.2203369140625, 0.23955535888671875, 0.2587738037109375, 0.27799224853515625, 0.297210693359375, 0.31642913818359375, 0.3356475830078125, 0.35486602783203125, 0.37408447265625, 0.39330291748046875, 0.4125213623046875, 0.43173980712890625, 0.450958251953125, 0.47017669677734375, 0.4893951416015625, 0.5086135864257812, 0.52783203125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 5.0, 7.0, 39.0, 106.0, 157.0, 233.0, 200.0, 151.0, 62.0, 33.0, 14.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396484375, -0.385406494140625, -0.37432861328125, -0.363250732421875, -0.3521728515625, -0.341094970703125, -0.33001708984375, -0.318939208984375, -0.307861328125, -0.296783447265625, -0.28570556640625, -0.274627685546875, -0.2635498046875, -0.252471923828125, -0.24139404296875, -0.230316162109375, -0.21923828125, -0.208160400390625, -0.19708251953125, -0.186004638671875, -0.1749267578125, -0.163848876953125, -0.15277099609375, -0.141693115234375, -0.130615234375, -0.119537353515625, -0.10845947265625, -0.097381591796875, -0.0863037109375, -0.075225830078125, -0.06414794921875, -0.053070068359375, -0.0419921875, -0.030914306640625, -0.01983642578125, -0.008758544921875, 0.0023193359375, 0.013397216796875, 0.02447509765625, 0.035552978515625, 0.046630859375, 0.057708740234375, 0.06878662109375, 0.079864501953125, 0.0909423828125, 0.102020263671875, 0.11309814453125, 0.124176025390625, 0.13525390625, 0.146331787109375, 0.15740966796875, 0.168487548828125, 0.1795654296875, 0.190643310546875, 0.20172119140625, 0.212799072265625, 0.223876953125, 0.234954833984375, 0.24603271484375, 0.257110595703125, 0.2681884765625, 0.279266357421875, 0.29034423828125, 0.301422119140625, 0.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 10.0, 7.0, 11.0, 19.0, 46.0, 135.0, 297.0, 825.0, 3400.0, 20136.0, 283234.0, 3481162.0, 375906.0, 23925.0, 3720.0, 942.0, 291.0, 113.0, 58.0, 26.0, 10.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2274169921875, -0.2168598175048828, -0.20630264282226562, -0.19574546813964844, -0.18518829345703125, -0.17463111877441406, -0.16407394409179688, -0.1535167694091797, -0.1429595947265625, -0.1324024200439453, -0.12184524536132812, -0.11128807067871094, -0.10073089599609375, -0.09017372131347656, -0.07961654663085938, -0.06905937194824219, -0.058502197265625, -0.04794502258300781, -0.037387847900390625, -0.026830673217773438, -0.01627349853515625, -0.0057163238525390625, 0.004840850830078125, 0.015398025512695312, 0.0259552001953125, 0.03651237487792969, 0.047069549560546875, 0.05762672424316406, 0.06818389892578125, 0.07874107360839844, 0.08929824829101562, 0.09985542297363281, 0.11041259765625, 0.12096977233886719, 0.13152694702148438, 0.14208412170410156, 0.15264129638671875, 0.16319847106933594, 0.17375564575195312, 0.1843128204345703, 0.1948699951171875, 0.2054271697998047, 0.21598434448242188, 0.22654151916503906, 0.23709869384765625, 0.24765586853027344, 0.2582130432128906, 0.2687702178955078, 0.279327392578125, 0.2898845672607422, 0.3004417419433594, 0.31099891662597656, 0.32155609130859375, 0.33211326599121094, 0.3426704406738281, 0.3532276153564453, 0.3637847900390625, 0.3743419647216797, 0.3848991394042969, 0.39545631408691406, 0.40601348876953125, 0.41657066345214844, 0.4271278381347656, 0.4376850128173828, 0.4482421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 7.0, 4.0, 15.0, 13.0, 23.0, 22.0, 30.0, 56.0, 67.0, 98.0, 145.0, 207.0, 313.0, 485.0, 596.0, 574.0, 415.0, 268.0, 184.0, 141.0, 112.0, 70.0, 43.0, 47.0, 28.0, 14.0, 23.0, 9.0, 16.0, 12.0, 4.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1468505859375, -0.14250946044921875, -0.1381683349609375, -0.13382720947265625, -0.129486083984375, -0.12514495849609375, -0.1208038330078125, -0.11646270751953125, -0.11212158203125, -0.10778045654296875, -0.1034393310546875, -0.09909820556640625, -0.094757080078125, -0.09041595458984375, -0.0860748291015625, -0.08173370361328125, -0.077392578125, -0.07305145263671875, -0.0687103271484375, -0.06436920166015625, -0.060028076171875, -0.05568695068359375, -0.0513458251953125, -0.04700469970703125, -0.04266357421875, -0.03832244873046875, -0.0339813232421875, -0.02964019775390625, -0.025299072265625, -0.02095794677734375, -0.0166168212890625, -0.01227569580078125, -0.0079345703125, -0.00359344482421875, 0.0007476806640625, 0.00508880615234375, 0.009429931640625, 0.01377105712890625, 0.0181121826171875, 0.02245330810546875, 0.02679443359375, 0.03113555908203125, 0.0354766845703125, 0.03981781005859375, 0.044158935546875, 0.04850006103515625, 0.0528411865234375, 0.05718231201171875, 0.0615234375, 0.06586456298828125, 0.0702056884765625, 0.07454681396484375, 0.078887939453125, 0.08322906494140625, 0.0875701904296875, 0.09191131591796875, 0.09625244140625, 0.10059356689453125, 0.1049346923828125, 0.10927581787109375, 0.113616943359375, 0.11795806884765625, 0.1222991943359375, 0.12664031982421875, 0.1309814453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 15.0, 33.0, 69.0, 131.0, 219.0, 205.0, 168.0, 82.0, 47.0, 23.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.042356014251709, -0.9966728687286377, -0.9509896636009216, -0.9053065180778503, -0.8596233129501343, -0.813940167427063, -0.7682570219039917, -0.7225738763809204, -0.6768906712532043, -0.6312075257301331, -0.585524320602417, -0.5398411750793457, -0.494157999753952, -0.44847482442855835, -0.40279167890548706, -0.3571085035800934, -0.3114253282546997, -0.26574215292930603, -0.22005899250507355, -0.17437583208084106, -0.1286926567554474, -0.08300948143005371, -0.03732633590698242, 0.008356839418411255, 0.05404001474380493, 0.09972318261861801, 0.1454063504934311, 0.19108951091766357, 0.23677268624305725, 0.2824558615684509, 0.3281390070915222, 0.3738221824169159, 0.4195054769515991, 0.4651886522769928, 0.5108718276023865, 0.5565549731254578, 0.6022381782531738, 0.6479213237762451, 0.6936044692993164, 0.7392876148223877, 0.7849708199501038, 0.830653965473175, 0.8763371706008911, 0.9220203161239624, 0.9677034616470337, 1.0133867263793945, 1.0590698719024658, 1.104753017425537, 1.1504361629486084, 1.1961193084716797, 1.241802453994751, 1.2874855995178223, 1.333168864250183, 1.3788520097732544, 1.4245351552963257, 1.470218300819397, 1.5159015655517578, 1.561584711074829, 1.6072678565979004, 1.6529510021209717, 1.6986342668533325, 1.7443174123764038, 1.790000557899475, 1.8356837034225464, 1.8813668489456177]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 3.0, 12.0, 13.0, 10.0, 19.0, 27.0, 24.0, 27.0, 43.0, 38.0, 33.0, 46.0, 51.0, 57.0, 52.0, 65.0, 51.0, 67.0, 57.0, 45.0, 50.0, 35.0, 37.0, 32.0, 21.0, 15.0, 22.0, 6.0, 10.0, 9.0, 6.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6175454258918762, -0.5980497598648071, -0.5785541534423828, -0.5590584874153137, -0.5395628213882446, -0.5200672149658203, -0.5005715489387512, -0.4810759127140045, -0.4615802764892578, -0.4420846402645111, -0.4225890040397644, -0.4030933380126953, -0.3835977017879486, -0.3641020655632019, -0.3446063995361328, -0.3251107633113861, -0.3056151270866394, -0.2861194908618927, -0.266623854637146, -0.2471281886100769, -0.2276325523853302, -0.2081369161605835, -0.1886412650346756, -0.1691456139087677, -0.149649977684021, -0.1301543414592743, -0.1106586903333664, -0.09116304665803909, -0.07166740298271179, -0.05217175930738449, -0.03267611563205719, -0.013180464506149292, 0.0063152313232421875, 0.02581087499856949, 0.04530651867389679, 0.06480216234922409, 0.08429780602455139, 0.10379344969987869, 0.123289093375206, 0.1427847445011139, 0.1622803807258606, 0.1817760169506073, 0.2012716680765152, 0.2207673192024231, 0.2402629554271698, 0.2597585916519165, 0.2792542576789856, 0.2987498939037323, 0.318245530128479, 0.3377411663532257, 0.3572368025779724, 0.3767324686050415, 0.3962281048297882, 0.4157237410545349, 0.435219407081604, 0.4547150433063507, 0.4742106795310974, 0.4937063157558441, 0.5132019519805908, 0.5326976180076599, 0.552193284034729, 0.5716888904571533, 0.5911845564842224, 0.6106802225112915, 0.6301758289337158]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 1.0, 6.0, 4.0, 10.0, 19.0, 28.0, 33.0, 58.0, 79.0, 147.0, 258.0, 437.0, 765.0, 2065.0, 7850.0, 40120.0, 302082.0, 593907.0, 80864.0, 14125.0, 3313.0, 1111.0, 527.0, 309.0, 162.0, 93.0, 64.0, 36.0, 26.0, 23.0, 17.0, 9.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5190048217773438, -0.5023651123046875, -0.48572540283203125, -0.469085693359375, -0.45244598388671875, -0.4358062744140625, -0.41916656494140625, -0.40252685546875, -0.38588714599609375, -0.3692474365234375, -0.35260772705078125, -0.335968017578125, -0.31932830810546875, -0.3026885986328125, -0.28604888916015625, -0.2694091796875, -0.25276947021484375, -0.2361297607421875, -0.21949005126953125, -0.202850341796875, -0.18621063232421875, -0.1695709228515625, -0.15293121337890625, -0.13629150390625, -0.11965179443359375, -0.1030120849609375, -0.08637237548828125, -0.069732666015625, -0.05309295654296875, -0.0364532470703125, -0.01981353759765625, -0.003173828125, 0.01346588134765625, 0.0301055908203125, 0.04674530029296875, 0.063385009765625, 0.08002471923828125, 0.0966644287109375, 0.11330413818359375, 0.12994384765625, 0.14658355712890625, 0.1632232666015625, 0.17986297607421875, 0.196502685546875, 0.21314239501953125, 0.2297821044921875, 0.24642181396484375, 0.2630615234375, 0.27970123291015625, 0.2963409423828125, 0.31298065185546875, 0.329620361328125, 0.34626007080078125, 0.3628997802734375, 0.37953948974609375, 0.39617919921875, 0.41281890869140625, 0.4294586181640625, 0.44609832763671875, 0.462738037109375, 0.47937774658203125, 0.4960174560546875, 0.5126571655273438, 0.529296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 28.0, 79.0, 147.0, 223.0, 229.0, 154.0, 86.0, 35.0, 17.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40283203125, -0.3916435241699219, -0.38045501708984375, -0.3692665100097656, -0.3580780029296875, -0.3468894958496094, -0.33570098876953125, -0.3245124816894531, -0.313323974609375, -0.3021354675292969, -0.29094696044921875, -0.2797584533691406, -0.2685699462890625, -0.2573814392089844, -0.24619293212890625, -0.23500442504882812, -0.22381591796875, -0.21262741088867188, -0.20143890380859375, -0.19025039672851562, -0.1790618896484375, -0.16787338256835938, -0.15668487548828125, -0.14549636840820312, -0.134307861328125, -0.12311935424804688, -0.11193084716796875, -0.10074234008789062, -0.0895538330078125, -0.07836532592773438, -0.06717681884765625, -0.055988311767578125, -0.0447998046875, -0.033611297607421875, -0.02242279052734375, -0.011234283447265625, -4.57763671875e-05, 0.011142730712890625, 0.02233123779296875, 0.033519744873046875, 0.044708251953125, 0.055896759033203125, 0.06708526611328125, 0.07827377319335938, 0.0894622802734375, 0.10065078735351562, 0.11183929443359375, 0.12302780151367188, 0.13421630859375, 0.14540481567382812, 0.15659332275390625, 0.16778182983398438, 0.1789703369140625, 0.19015884399414062, 0.20134735107421875, 0.21253585815429688, 0.223724365234375, 0.23491287231445312, 0.24610137939453125, 0.2572898864746094, 0.2684783935546875, 0.2796669006347656, 0.29085540771484375, 0.3020439147949219, 0.313232421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 10.0, 13.0, 17.0, 36.0, 23.0, 49.0, 78.0, 151.0, 344.0, 738.0, 2697.0, 12578.0, 73312.0, 500695.0, 389335.0, 55051.0, 9827.0, 2278.0, 684.0, 266.0, 136.0, 66.0, 41.0, 35.0, 24.0, 11.0, 9.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39111328125, -0.377105712890625, -0.36309814453125, -0.349090576171875, -0.3350830078125, -0.321075439453125, -0.30706787109375, -0.293060302734375, -0.279052734375, -0.265045166015625, -0.25103759765625, -0.237030029296875, -0.2230224609375, -0.209014892578125, -0.19500732421875, -0.180999755859375, -0.1669921875, -0.152984619140625, -0.13897705078125, -0.124969482421875, -0.1109619140625, -0.096954345703125, -0.08294677734375, -0.068939208984375, -0.054931640625, -0.040924072265625, -0.02691650390625, -0.012908935546875, 0.0010986328125, 0.015106201171875, 0.02911376953125, 0.043121337890625, 0.05712890625, 0.071136474609375, 0.08514404296875, 0.099151611328125, 0.1131591796875, 0.127166748046875, 0.14117431640625, 0.155181884765625, 0.169189453125, 0.183197021484375, 0.19720458984375, 0.211212158203125, 0.2252197265625, 0.239227294921875, 0.25323486328125, 0.267242431640625, 0.28125, 0.295257568359375, 0.30926513671875, 0.323272705078125, 0.3372802734375, 0.351287841796875, 0.36529541015625, 0.379302978515625, 0.393310546875, 0.407318115234375, 0.42132568359375, 0.435333251953125, 0.4493408203125, 0.463348388671875, 0.47735595703125, 0.491363525390625, 0.50537109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 2.0, 6.0, 4.0, 6.0, 5.0, 10.0, 10.0, 16.0, 11.0, 22.0, 28.0, 27.0, 24.0, 39.0, 30.0, 36.0, 49.0, 44.0, 37.0, 47.0, 51.0, 54.0, 56.0, 49.0, 38.0, 42.0, 41.0, 33.0, 29.0, 29.0, 23.0, 28.0, 21.0, 14.0, 5.0, 10.0, 5.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.235107421875, -0.22747802734375, -0.2198486328125, -0.21221923828125, -0.20458984375, -0.19696044921875, -0.1893310546875, -0.18170166015625, -0.174072265625, -0.16644287109375, -0.1588134765625, -0.15118408203125, -0.1435546875, -0.13592529296875, -0.1282958984375, -0.12066650390625, -0.113037109375, -0.10540771484375, -0.0977783203125, -0.09014892578125, -0.08251953125, -0.07489013671875, -0.0672607421875, -0.05963134765625, -0.052001953125, -0.04437255859375, -0.0367431640625, -0.02911376953125, -0.021484375, -0.01385498046875, -0.0062255859375, 0.00140380859375, 0.009033203125, 0.01666259765625, 0.0242919921875, 0.03192138671875, 0.03955078125, 0.04718017578125, 0.0548095703125, 0.06243896484375, 0.070068359375, 0.07769775390625, 0.0853271484375, 0.09295654296875, 0.1005859375, 0.10821533203125, 0.1158447265625, 0.12347412109375, 0.131103515625, 0.13873291015625, 0.1463623046875, 0.15399169921875, 0.16162109375, 0.16925048828125, 0.1768798828125, 0.18450927734375, 0.192138671875, 0.19976806640625, 0.2073974609375, 0.21502685546875, 0.22265625, 0.23028564453125, 0.2379150390625, 0.24554443359375, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 1.0, 3.0, 12.0, 11.0, 30.0, 35.0, 60.0, 112.0, 244.0, 564.0, 1477.0, 4406.0, 13566.0, 44050.0, 152637.0, 472337.0, 257801.0, 69647.0, 21164.0, 6656.0, 2203.0, 818.0, 353.0, 164.0, 75.0, 48.0, 29.0, 14.0, 8.0, 7.0, 9.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1956787109375, -0.19048690795898438, -0.18529510498046875, -0.18010330200195312, -0.1749114990234375, -0.16971969604492188, -0.16452789306640625, -0.15933609008789062, -0.154144287109375, -0.14895248413085938, -0.14376068115234375, -0.13856887817382812, -0.1333770751953125, -0.12818527221679688, -0.12299346923828125, -0.11780166625976562, -0.11260986328125, -0.10741806030273438, -0.10222625732421875, -0.09703445434570312, -0.0918426513671875, -0.08665084838867188, -0.08145904541015625, -0.07626724243164062, -0.071075439453125, -0.06588363647460938, -0.06069183349609375, -0.055500030517578125, -0.0503082275390625, -0.045116424560546875, -0.03992462158203125, -0.034732818603515625, -0.029541015625, -0.024349212646484375, -0.01915740966796875, -0.013965606689453125, -0.0087738037109375, -0.003582000732421875, 0.00160980224609375, 0.006801605224609375, 0.011993408203125, 0.017185211181640625, 0.02237701416015625, 0.027568817138671875, 0.0327606201171875, 0.037952423095703125, 0.04314422607421875, 0.048336029052734375, 0.05352783203125, 0.058719635009765625, 0.06391143798828125, 0.06910324096679688, 0.0742950439453125, 0.07948684692382812, 0.08467864990234375, 0.08987045288085938, 0.095062255859375, 0.10025405883789062, 0.10544586181640625, 0.11063766479492188, 0.1158294677734375, 0.12102127075195312, 0.12621307373046875, 0.13140487670898438, 0.1365966796875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 4.0, 9.0, 9.0, 17.0, 13.0, 23.0, 19.0, 31.0, 37.0, 47.0, 70.0, 102.0, 96.0, 93.0, 98.0, 76.0, 55.0, 39.0, 32.0, 31.0, 22.0, 16.0, 8.0, 7.0, 4.0, 8.0, 4.0, 2.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-05, -2.1871179342269897e-05, -2.1092593669891357e-05, -2.0314007997512817e-05, -1.9535422325134277e-05, -1.8756836652755737e-05, -1.7978250980377197e-05, -1.7199665307998657e-05, -1.6421079635620117e-05, -1.5642493963241577e-05, -1.4863908290863037e-05, -1.4085322618484497e-05, -1.3306736946105957e-05, -1.2528151273727417e-05, -1.1749565601348877e-05, -1.0970979928970337e-05, -1.0192394256591797e-05, -9.413808584213257e-06, -8.635222911834717e-06, -7.856637239456177e-06, -7.078051567077637e-06, -6.299465894699097e-06, -5.520880222320557e-06, -4.742294549942017e-06, -3.9637088775634766e-06, -3.1851232051849365e-06, -2.4065375328063965e-06, -1.6279518604278564e-06, -8.493661880493164e-07, -7.078051567077637e-08, 7.078051567077637e-07, 1.4863908290863037e-06, 2.2649765014648438e-06, 3.043562173843384e-06, 3.822147846221924e-06, 4.600733518600464e-06, 5.379319190979004e-06, 6.157904863357544e-06, 6.936490535736084e-06, 7.715076208114624e-06, 8.493661880493164e-06, 9.272247552871704e-06, 1.0050833225250244e-05, 1.0829418897628784e-05, 1.1608004570007324e-05, 1.2386590242385864e-05, 1.3165175914764404e-05, 1.3943761587142944e-05, 1.4722347259521484e-05, 1.5500932931900024e-05, 1.6279518604278564e-05, 1.7058104276657104e-05, 1.7836689949035645e-05, 1.8615275621414185e-05, 1.9393861293792725e-05, 2.0172446966171265e-05, 2.0951032638549805e-05, 2.1729618310928345e-05, 2.2508203983306885e-05, 2.3286789655685425e-05, 2.4065375328063965e-05, 2.4843961000442505e-05, 2.5622546672821045e-05, 2.6401132345199585e-05, 2.7179718017578125e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 7.0, 11.0, 15.0, 18.0, 45.0, 92.0, 184.0, 435.0, 1150.0, 3725.0, 14973.0, 65603.0, 362984.0, 484281.0, 87747.0, 19975.0, 4927.0, 1443.0, 513.0, 186.0, 91.0, 46.0, 34.0, 16.0, 5.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22900390625, -0.22247886657714844, -0.21595382690429688, -0.2094287872314453, -0.20290374755859375, -0.1963787078857422, -0.18985366821289062, -0.18332862854003906, -0.1768035888671875, -0.17027854919433594, -0.16375350952148438, -0.1572284698486328, -0.15070343017578125, -0.1441783905029297, -0.13765335083007812, -0.13112831115722656, -0.124603271484375, -0.11807823181152344, -0.11155319213867188, -0.10502815246582031, -0.09850311279296875, -0.09197807312011719, -0.08545303344726562, -0.07892799377441406, -0.0724029541015625, -0.06587791442871094, -0.059352874755859375, -0.05282783508300781, -0.04630279541015625, -0.03977775573730469, -0.033252716064453125, -0.026727676391601562, -0.02020263671875, -0.013677597045898438, -0.007152557373046875, -0.0006275177001953125, 0.00589752197265625, 0.012422561645507812, 0.018947601318359375, 0.025472640991210938, 0.0319976806640625, 0.03852272033691406, 0.045047760009765625, 0.05157279968261719, 0.05809783935546875, 0.06462287902832031, 0.07114791870117188, 0.07767295837402344, 0.084197998046875, 0.09072303771972656, 0.09724807739257812, 0.10377311706542969, 0.11029815673828125, 0.11682319641113281, 0.12334823608398438, 0.12987327575683594, 0.1363983154296875, 0.14292335510253906, 0.14944839477539062, 0.1559734344482422, 0.16249847412109375, 0.1690235137939453, 0.17554855346679688, 0.18207359313964844, 0.1885986328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 3.0, 15.0, 11.0, 8.0, 7.0, 12.0, 13.0, 24.0, 11.0, 19.0, 32.0, 34.0, 54.0, 45.0, 48.0, 80.0, 88.0, 77.0, 69.0, 60.0, 44.0, 34.0, 40.0, 21.0, 22.0, 14.0, 16.0, 10.0, 10.0, 8.0, 9.0, 8.0, 10.0, 6.0, 3.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.087890625, -0.08492469787597656, -0.08195877075195312, -0.07899284362792969, -0.07602691650390625, -0.07306098937988281, -0.07009506225585938, -0.06712913513183594, -0.0641632080078125, -0.06119728088378906, -0.058231353759765625, -0.05526542663574219, -0.05229949951171875, -0.04933357238769531, -0.046367645263671875, -0.04340171813964844, -0.040435791015625, -0.03746986389160156, -0.034503936767578125, -0.03153800964355469, -0.02857208251953125, -0.025606155395507812, -0.022640228271484375, -0.019674301147460938, -0.0167083740234375, -0.013742446899414062, -0.010776519775390625, -0.0078105926513671875, -0.00484466552734375, -0.0018787384033203125, 0.001087188720703125, 0.0040531158447265625, 0.00701904296875, 0.009984970092773438, 0.012950897216796875, 0.015916824340820312, 0.01888275146484375, 0.021848678588867188, 0.024814605712890625, 0.027780532836914062, 0.0307464599609375, 0.03371238708496094, 0.036678314208984375, 0.03964424133300781, 0.04261016845703125, 0.04557609558105469, 0.048542022705078125, 0.05150794982910156, 0.054473876953125, 0.05743980407714844, 0.060405731201171875, 0.06337165832519531, 0.06633758544921875, 0.06930351257324219, 0.07226943969726562, 0.07523536682128906, 0.0782012939453125, 0.08116722106933594, 0.08413314819335938, 0.08709907531738281, 0.09006500244140625, 0.09303092956542969, 0.09599685668945312, 0.09896278381347656, 0.1019287109375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 10.0, 21.0, 24.0, 31.0, 45.0, 69.0, 91.0, 110.0, 100.0, 94.0, 94.0, 76.0, 58.0, 60.0, 38.0, 24.0, 10.0, 13.0, 9.0, 11.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4894912242889404, -1.4582393169403076, -1.4269875288009644, -1.3957356214523315, -1.3644837141036987, -1.3332319259643555, -1.3019800186157227, -1.2707281112670898, -1.239476203918457, -1.2082242965698242, -1.176972508430481, -1.1457206010818481, -1.1144686937332153, -1.083216905593872, -1.0519649982452393, -1.0207130908966064, -0.9894613027572632, -0.9582094550132751, -0.9269575476646423, -0.8957056999206543, -0.8644537925720215, -0.8332019448280334, -0.8019500970840454, -0.7706981897354126, -0.7394463419914246, -0.7081944942474365, -0.6769425868988037, -0.6456907391548157, -0.6144388914108276, -0.5831869840621948, -0.5519351363182068, -0.5206832885742188, -0.48943138122558594, -0.4581795036792755, -0.4269276261329651, -0.39567577838897705, -0.3644239008426666, -0.3331720232963562, -0.30192017555236816, -0.27066829800605774, -0.23941642045974731, -0.2081645429134369, -0.17691268026828766, -0.14566081762313843, -0.114408940076828, -0.08315706253051758, -0.05190519988536835, -0.020653337240219116, 0.010598540306091309, 0.041850410401821136, 0.07310228049755096, 0.10435415059328079, 0.13560602068901062, 0.16685789823532104, 0.19810976088047028, 0.2293616235256195, 0.26061350107192993, 0.29186537861824036, 0.3231172561645508, 0.3543691039085388, 0.38562098145484924, 0.41687285900115967, 0.4481247067451477, 0.47937658429145813, 0.5106284618377686]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 11.0, 7.0, 9.0, 17.0, 16.0, 23.0, 20.0, 21.0, 26.0, 23.0, 35.0, 37.0, 46.0, 47.0, 49.0, 29.0, 42.0, 50.0, 47.0, 41.0, 33.0, 37.0, 45.0, 36.0, 38.0, 30.0, 26.0, 27.0, 24.0, 17.0, 25.0, 14.0, 9.0, 8.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.9020313024520874, -0.8772913813591003, -0.8525514006614685, -0.8278114795684814, -0.8030715584754944, -0.7783316373825073, -0.7535916566848755, -0.7288517355918884, -0.7041118144989014, -0.6793718934059143, -0.6546319127082825, -0.6298919916152954, -0.6051520705223083, -0.5804121494293213, -0.5556721687316895, -0.5309322476387024, -0.5061922669410706, -0.4814523160457611, -0.45671239495277405, -0.4319724440574646, -0.40723252296447754, -0.3824925720691681, -0.35775262117385864, -0.3330127000808716, -0.30827274918556213, -0.2835327982902527, -0.2587928771972656, -0.23405292630195618, -0.20931299030780792, -0.18457305431365967, -0.15983310341835022, -0.13509316742420197, -0.11035329103469849, -0.08561335504055023, -0.06087341159582138, -0.03613346815109253, -0.011393532156944275, 0.01334640383720398, 0.03808635473251343, 0.06282629072666168, 0.08756622672080994, 0.11230616271495819, 0.13704609870910645, 0.1617860496044159, 0.18652598559856415, 0.2112659215927124, 0.23600587248802185, 0.2607458233833313, 0.28548574447631836, 0.3102256953716278, 0.33496561646461487, 0.3597055673599243, 0.3844454884529114, 0.4091854393482208, 0.4339253902435303, 0.45866531133651733, 0.4834052622318268, 0.5081452131271362, 0.5328851342201233, 0.5576250553131104, 0.5823650360107422, 0.6071049571037292, 0.6318448781967163, 0.6565848588943481, 0.6813247799873352]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 8.0, 11.0, 18.0, 15.0, 34.0, 39.0, 74.0, 124.0, 233.0, 458.0, 939.0, 2312.0, 7134.0, 32663.0, 514897.0, 3450576.0, 158750.0, 18291.0, 4692.0, 1738.0, 628.0, 288.0, 164.0, 71.0, 40.0, 24.0, 20.0, 6.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406005859375, -0.39382171630859375, -0.3816375732421875, -0.36945343017578125, -0.357269287109375, -0.34508514404296875, -0.3329010009765625, -0.32071685791015625, -0.30853271484375, -0.29634857177734375, -0.2841644287109375, -0.27198028564453125, -0.259796142578125, -0.24761199951171875, -0.2354278564453125, -0.22324371337890625, -0.2110595703125, -0.19887542724609375, -0.1866912841796875, -0.17450714111328125, -0.162322998046875, -0.15013885498046875, -0.1379547119140625, -0.12577056884765625, -0.11358642578125, -0.10140228271484375, -0.0892181396484375, -0.07703399658203125, -0.064849853515625, -0.05266571044921875, -0.0404815673828125, -0.02829742431640625, -0.01611328125, -0.00392913818359375, 0.0082550048828125, 0.02043914794921875, 0.032623291015625, 0.04480743408203125, 0.0569915771484375, 0.06917572021484375, 0.08135986328125, 0.09354400634765625, 0.1057281494140625, 0.11791229248046875, 0.130096435546875, 0.14228057861328125, 0.1544647216796875, 0.16664886474609375, 0.1788330078125, 0.19101715087890625, 0.2032012939453125, 0.21538543701171875, 0.227569580078125, 0.23975372314453125, 0.2519378662109375, 0.26412200927734375, 0.27630615234375, 0.28849029541015625, 0.3006744384765625, 0.31285858154296875, 0.325042724609375, 0.33722686767578125, 0.3494110107421875, 0.36159515380859375, 0.373779296875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 9.0, 35.0, 94.0, 159.0, 216.0, 205.0, 138.0, 93.0, 43.0, 12.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.418212890625, -0.4065666198730469, -0.39492034912109375, -0.3832740783691406, -0.3716278076171875, -0.3599815368652344, -0.34833526611328125, -0.3366889953613281, -0.325042724609375, -0.3133964538574219, -0.30175018310546875, -0.2901039123535156, -0.2784576416015625, -0.2668113708496094, -0.25516510009765625, -0.24351882934570312, -0.23187255859375, -0.22022628784179688, -0.20858001708984375, -0.19693374633789062, -0.1852874755859375, -0.17364120483398438, -0.16199493408203125, -0.15034866333007812, -0.138702392578125, -0.12705612182617188, -0.11540985107421875, -0.10376358032226562, -0.0921173095703125, -0.08047103881835938, -0.06882476806640625, -0.057178497314453125, -0.0455322265625, -0.033885955810546875, -0.02223968505859375, -0.010593414306640625, 0.0010528564453125, 0.012699127197265625, 0.02434539794921875, 0.035991668701171875, 0.047637939453125, 0.059284210205078125, 0.07093048095703125, 0.08257675170898438, 0.0942230224609375, 0.10586929321289062, 0.11751556396484375, 0.12916183471679688, 0.14080810546875, 0.15245437622070312, 0.16410064697265625, 0.17574691772460938, 0.1873931884765625, 0.19903945922851562, 0.21068572998046875, 0.22233200073242188, 0.233978271484375, 0.24562454223632812, 0.25727081298828125, 0.2689170837402344, 0.2805633544921875, 0.2922096252441406, 0.30385589599609375, 0.3155021667480469, 0.3271484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 6.0, 6.0, 14.0, 7.0, 15.0, 18.0, 35.0, 49.0, 64.0, 153.0, 364.0, 1424.0, 7375.0, 71420.0, 2124181.0, 1914017.0, 66022.0, 7067.0, 1350.0, 348.0, 137.0, 68.0, 37.0, 27.0, 22.0, 11.0, 13.0, 6.0, 8.0, 6.0, 5.0, 0.0, 1.0, 1.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384521484375, -0.37078094482421875, -0.3570404052734375, -0.34329986572265625, -0.329559326171875, -0.31581878662109375, -0.3020782470703125, -0.28833770751953125, -0.27459716796875, -0.26085662841796875, -0.2471160888671875, -0.23337554931640625, -0.219635009765625, -0.20589447021484375, -0.1921539306640625, -0.17841339111328125, -0.1646728515625, -0.15093231201171875, -0.1371917724609375, -0.12345123291015625, -0.109710693359375, -0.09597015380859375, -0.0822296142578125, -0.06848907470703125, -0.05474853515625, -0.04100799560546875, -0.0272674560546875, -0.01352691650390625, 0.000213623046875, 0.01395416259765625, 0.0276947021484375, 0.04143524169921875, 0.05517578125, 0.06891632080078125, 0.0826568603515625, 0.09639739990234375, 0.110137939453125, 0.12387847900390625, 0.1376190185546875, 0.15135955810546875, 0.16510009765625, 0.17884063720703125, 0.1925811767578125, 0.20632171630859375, 0.220062255859375, 0.23380279541015625, 0.2475433349609375, 0.26128387451171875, 0.2750244140625, 0.28876495361328125, 0.3025054931640625, 0.31624603271484375, 0.329986572265625, 0.34372711181640625, 0.3574676513671875, 0.37120819091796875, 0.38494873046875, 0.39868927001953125, 0.4124298095703125, 0.42617034912109375, 0.439910888671875, 0.45365142822265625, 0.4673919677734375, 0.48113250732421875, 0.494873046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 29.0, 30.0, 77.0, 135.0, 275.0, 609.0, 1092.0, 933.0, 441.0, 215.0, 111.0, 47.0, 27.0, 22.0, 6.0, 4.0, 7.0, 9.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448974609375, -0.4374122619628906, -0.42584991455078125, -0.4142875671386719, -0.4027252197265625, -0.3911628723144531, -0.37960052490234375, -0.3680381774902344, -0.356475830078125, -0.3449134826660156, -0.33335113525390625, -0.3217887878417969, -0.3102264404296875, -0.2986640930175781, -0.28710174560546875, -0.2755393981933594, -0.26397705078125, -0.2524147033691406, -0.24085235595703125, -0.22929000854492188, -0.2177276611328125, -0.20616531372070312, -0.19460296630859375, -0.18304061889648438, -0.171478271484375, -0.15991592407226562, -0.14835357666015625, -0.13679122924804688, -0.1252288818359375, -0.11366653442382812, -0.10210418701171875, -0.09054183959960938, -0.0789794921875, -0.06741714477539062, -0.05585479736328125, -0.044292449951171875, -0.0327301025390625, -0.021167755126953125, -0.00960540771484375, 0.001956939697265625, 0.013519287109375, 0.025081634521484375, 0.03664398193359375, 0.048206329345703125, 0.0597686767578125, 0.07133102416992188, 0.08289337158203125, 0.09445571899414062, 0.10601806640625, 0.11758041381835938, 0.12914276123046875, 0.14070510864257812, 0.1522674560546875, 0.16382980346679688, 0.17539215087890625, 0.18695449829101562, 0.198516845703125, 0.21007919311523438, 0.22164154052734375, 0.23320388793945312, 0.2447662353515625, 0.2563285827636719, 0.26789093017578125, 0.2794532775878906, 0.291015625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 12.0, 29.0, 68.0, 156.0, 219.0, 214.0, 147.0, 93.0, 41.0, 17.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.8760266304016113, -2.8149070739746094, -2.7537877559661865, -2.6926681995391846, -2.6315488815307617, -2.5704293251037598, -2.509309768676758, -2.448190450668335, -2.387070894241333, -2.325951337814331, -2.264832019805908, -2.2037124633789062, -2.1425931453704834, -2.0814735889434814, -2.0203542709350586, -1.9592347145080566, -1.8981152772903442, -1.8369958400726318, -1.7758764028549194, -1.714756965637207, -1.653637409210205, -1.5925179719924927, -1.5313985347747803, -1.4702790975570679, -1.4091596603393555, -1.348040223121643, -1.2869207859039307, -1.2258012294769287, -1.1646817922592163, -1.103562355041504, -1.0424429178237915, -0.9813234806060791, -0.9202039241790771, -0.8590844869613647, -0.7979649901390076, -0.7368455529212952, -0.675726056098938, -0.6146066188812256, -0.5534871816635132, -0.4923677146434784, -0.4312482476234436, -0.3701287806034088, -0.309009313583374, -0.24788987636566162, -0.18677040934562683, -0.12565094232559204, -0.06453150510787964, -0.0034120380878448486, 0.05770742893218994, 0.11882688850164413, 0.17994634807109833, 0.24106580018997192, 0.3021852672100067, 0.3633047342300415, 0.4244241714477539, 0.4855436384677887, 0.5466631054878235, 0.6077825427055359, 0.6689020395278931, 0.7300214767456055, 0.7911409139633179, 0.852260410785675, 0.9133798480033875, 0.9744993448257446, 1.035618782043457]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 6.0, 12.0, 16.0, 21.0, 33.0, 30.0, 34.0, 45.0, 45.0, 45.0, 61.0, 67.0, 79.0, 83.0, 69.0, 56.0, 53.0, 50.0, 49.0, 35.0, 26.0, 31.0, 14.0, 12.0, 8.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8735185861587524, -0.8428614139556885, -0.8122041821479797, -0.781546950340271, -0.750889778137207, -0.7202326059341431, -0.6895753741264343, -0.6589181423187256, -0.6282609701156616, -0.5976037979125977, -0.5669465661048889, -0.5362893342971802, -0.5056321620941162, -0.47497496008872986, -0.4443177580833435, -0.41366055607795715, -0.3830033540725708, -0.35234615206718445, -0.3216889500617981, -0.29103174805641174, -0.2603745460510254, -0.22971734404563904, -0.19906014204025269, -0.16840294003486633, -0.13774573802947998, -0.10708853602409363, -0.07643133401870728, -0.04577413201332092, -0.01511693000793457, 0.015540271997451782, 0.046197474002838135, 0.07685467600822449, 0.10751187801361084, 0.1381690800189972, 0.16882628202438354, 0.1994834840297699, 0.23014068603515625, 0.2607978880405426, 0.29145509004592896, 0.3221122920513153, 0.35276949405670166, 0.383426696062088, 0.41408389806747437, 0.4447411000728607, 0.47539830207824707, 0.506055474281311, 0.5367127060890198, 0.5673699378967285, 0.5980271100997925, 0.6286842823028564, 0.6593415141105652, 0.6899987459182739, 0.7206559181213379, 0.7513130903244019, 0.7819703221321106, 0.8126275539398193, 0.8432847261428833, 0.8739418983459473, 0.904599130153656, 0.9352563619613647, 0.9659135341644287, 0.9965707063674927, 1.0272278785705566, 1.0578851699829102, 1.0885423421859741]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 15.0, 23.0, 26.0, 25.0, 49.0, 84.0, 86.0, 137.0, 193.0, 284.0, 454.0, 861.0, 1927.0, 5110.0, 14700.0, 46678.0, 162711.0, 436719.0, 266593.0, 75193.0, 23316.0, 7717.0, 2769.0, 1176.0, 583.0, 337.0, 249.0, 171.0, 91.0, 80.0, 55.0, 34.0, 28.0, 26.0, 14.0, 9.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.416015625, -0.4040260314941406, -0.39203643798828125, -0.3800468444824219, -0.3680572509765625, -0.3560676574707031, -0.34407806396484375, -0.3320884704589844, -0.320098876953125, -0.3081092834472656, -0.29611968994140625, -0.2841300964355469, -0.2721405029296875, -0.2601509094238281, -0.24816131591796875, -0.23617172241210938, -0.22418212890625, -0.21219253540039062, -0.20020294189453125, -0.18821334838867188, -0.1762237548828125, -0.16423416137695312, -0.15224456787109375, -0.14025497436523438, -0.128265380859375, -0.11627578735351562, -0.10428619384765625, -0.09229660034179688, -0.0803070068359375, -0.06831741333007812, -0.05632781982421875, -0.044338226318359375, -0.0323486328125, -0.020359039306640625, -0.00836944580078125, 0.003620147705078125, 0.0156097412109375, 0.027599334716796875, 0.03958892822265625, 0.051578521728515625, 0.063568115234375, 0.07555770874023438, 0.08754730224609375, 0.09953689575195312, 0.1115264892578125, 0.12351608276367188, 0.13550567626953125, 0.14749526977539062, 0.15948486328125, 0.17147445678710938, 0.18346405029296875, 0.19545364379882812, 0.2074432373046875, 0.21943283081054688, 0.23142242431640625, 0.24341201782226562, 0.255401611328125, 0.2673912048339844, 0.27938079833984375, 0.2913703918457031, 0.3033599853515625, 0.3153495788574219, 0.32733917236328125, 0.3393287658691406, 0.351318359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 12.0, 30.0, 73.0, 132.0, 191.0, 206.0, 165.0, 98.0, 70.0, 23.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.407958984375, -0.396392822265625, -0.38482666015625, -0.373260498046875, -0.3616943359375, -0.350128173828125, -0.33856201171875, -0.326995849609375, -0.3154296875, -0.303863525390625, -0.29229736328125, -0.280731201171875, -0.2691650390625, -0.257598876953125, -0.24603271484375, -0.234466552734375, -0.222900390625, -0.211334228515625, -0.19976806640625, -0.188201904296875, -0.1766357421875, -0.165069580078125, -0.15350341796875, -0.141937255859375, -0.13037109375, -0.118804931640625, -0.10723876953125, -0.095672607421875, -0.0841064453125, -0.072540283203125, -0.06097412109375, -0.049407958984375, -0.037841796875, -0.026275634765625, -0.01470947265625, -0.003143310546875, 0.0084228515625, 0.019989013671875, 0.03155517578125, 0.043121337890625, 0.0546875, 0.066253662109375, 0.07781982421875, 0.089385986328125, 0.1009521484375, 0.112518310546875, 0.12408447265625, 0.135650634765625, 0.147216796875, 0.158782958984375, 0.17034912109375, 0.181915283203125, 0.1934814453125, 0.205047607421875, 0.21661376953125, 0.228179931640625, 0.23974609375, 0.251312255859375, 0.26287841796875, 0.274444580078125, 0.2860107421875, 0.297576904296875, 0.30914306640625, 0.320709228515625, 0.332275390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 7.0, 16.0, 14.0, 18.0, 29.0, 38.0, 59.0, 116.0, 168.0, 294.0, 626.0, 1251.0, 2744.0, 6264.0, 14247.0, 32725.0, 81344.0, 213430.0, 357342.0, 203810.0, 77527.0, 31308.0, 13684.0, 6080.0, 2715.0, 1292.0, 593.0, 319.0, 182.0, 105.0, 60.0, 40.0, 27.0, 22.0, 10.0, 10.0, 6.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2820854187011719, -0.27339935302734375, -0.2647132873535156, -0.2560272216796875, -0.24734115600585938, -0.23865509033203125, -0.22996902465820312, -0.221282958984375, -0.21259689331054688, -0.20391082763671875, -0.19522476196289062, -0.1865386962890625, -0.17785263061523438, -0.16916656494140625, -0.16048049926757812, -0.15179443359375, -0.14310836791992188, -0.13442230224609375, -0.12573623657226562, -0.1170501708984375, -0.10836410522460938, -0.09967803955078125, -0.09099197387695312, -0.082305908203125, -0.07361984252929688, -0.06493377685546875, -0.056247711181640625, -0.0475616455078125, -0.038875579833984375, -0.03018951416015625, -0.021503448486328125, -0.0128173828125, -0.004131317138671875, 0.00455474853515625, 0.013240814208984375, 0.0219268798828125, 0.030612945556640625, 0.03929901123046875, 0.047985076904296875, 0.056671142578125, 0.06535720825195312, 0.07404327392578125, 0.08272933959960938, 0.0914154052734375, 0.10010147094726562, 0.10878753662109375, 0.11747360229492188, 0.12615966796875, 0.13484573364257812, 0.14353179931640625, 0.15221786499023438, 0.1609039306640625, 0.16958999633789062, 0.17827606201171875, 0.18696212768554688, 0.195648193359375, 0.20433425903320312, 0.21302032470703125, 0.22170639038085938, 0.2303924560546875, 0.23907852172851562, 0.24776458740234375, 0.2564506530761719, 0.26513671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 9.0, 17.0, 15.0, 11.0, 16.0, 19.0, 30.0, 29.0, 39.0, 31.0, 40.0, 40.0, 32.0, 32.0, 40.0, 41.0, 55.0, 44.0, 43.0, 37.0, 32.0, 33.0, 30.0, 26.0, 41.0, 40.0, 18.0, 17.0, 17.0, 17.0, 20.0, 14.0, 10.0, 9.0, 5.0, 6.0, 4.0, 3.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2371826171875, -0.2289142608642578, -0.22064590454101562, -0.21237754821777344, -0.20410919189453125, -0.19584083557128906, -0.18757247924804688, -0.1793041229248047, -0.1710357666015625, -0.1627674102783203, -0.15449905395507812, -0.14623069763183594, -0.13796234130859375, -0.12969398498535156, -0.12142562866210938, -0.11315727233886719, -0.104888916015625, -0.09662055969238281, -0.08835220336914062, -0.08008384704589844, -0.07181549072265625, -0.06354713439941406, -0.055278778076171875, -0.04701042175292969, -0.0387420654296875, -0.030473709106445312, -0.022205352783203125, -0.013936996459960938, -0.00566864013671875, 0.0025997161865234375, 0.010868072509765625, 0.019136428833007812, 0.02740478515625, 0.03567314147949219, 0.043941497802734375, 0.05220985412597656, 0.06047821044921875, 0.06874656677246094, 0.07701492309570312, 0.08528327941894531, 0.0935516357421875, 0.10181999206542969, 0.11008834838867188, 0.11835670471191406, 0.12662506103515625, 0.13489341735839844, 0.14316177368164062, 0.1514301300048828, 0.159698486328125, 0.1679668426513672, 0.17623519897460938, 0.18450355529785156, 0.19277191162109375, 0.20104026794433594, 0.20930862426757812, 0.2175769805908203, 0.2258453369140625, 0.2341136932373047, 0.24238204956054688, 0.25065040588378906, 0.25891876220703125, 0.26718711853027344, 0.2754554748535156, 0.2837238311767578, 0.2919921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 11.0, 8.0, 14.0, 23.0, 42.0, 34.0, 82.0, 131.0, 188.0, 299.0, 460.0, 744.0, 1303.0, 2224.0, 4177.0, 10115.0, 32141.0, 127053.0, 413162.0, 329938.0, 87504.0, 22682.0, 7780.0, 3599.0, 1884.0, 1092.0, 692.0, 429.0, 294.0, 159.0, 101.0, 69.0, 33.0, 27.0, 22.0, 16.0, 5.0, 2.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1939697265625, -0.18747520446777344, -0.18098068237304688, -0.1744861602783203, -0.16799163818359375, -0.1614971160888672, -0.15500259399414062, -0.14850807189941406, -0.1420135498046875, -0.13551902770996094, -0.12902450561523438, -0.12252998352050781, -0.11603546142578125, -0.10954093933105469, -0.10304641723632812, -0.09655189514160156, -0.090057373046875, -0.08356285095214844, -0.07706832885742188, -0.07057380676269531, -0.06407928466796875, -0.05758476257324219, -0.051090240478515625, -0.04459571838378906, -0.0381011962890625, -0.03160667419433594, -0.025112152099609375, -0.018617630004882812, -0.01212310791015625, -0.0056285858154296875, 0.000865936279296875, 0.0073604583740234375, 0.01385498046875, 0.020349502563476562, 0.026844024658203125, 0.03333854675292969, 0.03983306884765625, 0.04632759094238281, 0.052822113037109375, 0.05931663513183594, 0.0658111572265625, 0.07230567932128906, 0.07880020141601562, 0.08529472351074219, 0.09178924560546875, 0.09828376770019531, 0.10477828979492188, 0.11127281188964844, 0.117767333984375, 0.12426185607910156, 0.13075637817382812, 0.1372509002685547, 0.14374542236328125, 0.1502399444580078, 0.15673446655273438, 0.16322898864746094, 0.1697235107421875, 0.17621803283691406, 0.18271255493164062, 0.1892070770263672, 0.19570159912109375, 0.2021961212158203, 0.20869064331054688, 0.21518516540527344, 0.2216796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 9.0, 12.0, 18.0, 20.0, 22.0, 21.0, 26.0, 34.0, 39.0, 55.0, 75.0, 103.0, 71.0, 80.0, 68.0, 62.0, 57.0, 40.0, 24.0, 24.0, 13.0, 27.0, 17.0, 13.0, 6.0, 9.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.266334533691406e-05, -3.177672624588013e-05, -3.089010715484619e-05, -3.0003488063812256e-05, -2.911686897277832e-05, -2.8230249881744385e-05, -2.734363079071045e-05, -2.6457011699676514e-05, -2.5570392608642578e-05, -2.4683773517608643e-05, -2.3797154426574707e-05, -2.291053533554077e-05, -2.2023916244506836e-05, -2.11372971534729e-05, -2.0250678062438965e-05, -1.936405897140503e-05, -1.8477439880371094e-05, -1.7590820789337158e-05, -1.6704201698303223e-05, -1.5817582607269287e-05, -1.4930963516235352e-05, -1.4044344425201416e-05, -1.315772533416748e-05, -1.2271106243133545e-05, -1.138448715209961e-05, -1.0497868061065674e-05, -9.611248970031738e-06, -8.724629878997803e-06, -7.838010787963867e-06, -6.951391696929932e-06, -6.064772605895996e-06, -5.1781535148620605e-06, -4.291534423828125e-06, -3.4049153327941895e-06, -2.518296241760254e-06, -1.6316771507263184e-06, -7.450580596923828e-07, 1.4156103134155273e-07, 1.0281801223754883e-06, 1.914799213409424e-06, 2.8014183044433594e-06, 3.688037395477295e-06, 4.5746564865112305e-06, 5.461275577545166e-06, 6.3478946685791016e-06, 7.234513759613037e-06, 8.121132850646973e-06, 9.007751941680908e-06, 9.894371032714844e-06, 1.078099012374878e-05, 1.1667609214782715e-05, 1.255422830581665e-05, 1.3440847396850586e-05, 1.4327466487884521e-05, 1.5214085578918457e-05, 1.6100704669952393e-05, 1.6987323760986328e-05, 1.7873942852020264e-05, 1.87605619430542e-05, 1.9647181034088135e-05, 2.053380012512207e-05, 2.1420419216156006e-05, 2.230703830718994e-05, 2.3193657398223877e-05, 2.4080276489257812e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 3.0, 18.0, 11.0, 20.0, 30.0, 53.0, 89.0, 127.0, 234.0, 382.0, 676.0, 1187.0, 2103.0, 4172.0, 10631.0, 42322.0, 224482.0, 545155.0, 167704.0, 32298.0, 8709.0, 3704.0, 1903.0, 1083.0, 600.0, 360.0, 188.0, 123.0, 75.0, 33.0, 27.0, 16.0, 12.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.282470703125, -0.2744941711425781, -0.26651763916015625, -0.2585411071777344, -0.2505645751953125, -0.24258804321289062, -0.23461151123046875, -0.22663497924804688, -0.218658447265625, -0.21068191528320312, -0.20270538330078125, -0.19472885131835938, -0.1867523193359375, -0.17877578735351562, -0.17079925537109375, -0.16282272338867188, -0.15484619140625, -0.14686965942382812, -0.13889312744140625, -0.13091659545898438, -0.1229400634765625, -0.11496353149414062, -0.10698699951171875, -0.09901046752929688, -0.091033935546875, -0.08305740356445312, -0.07508087158203125, -0.06710433959960938, -0.0591278076171875, -0.051151275634765625, -0.04317474365234375, -0.035198211669921875, -0.0272216796875, -0.019245147705078125, -0.01126861572265625, -0.003292083740234375, 0.0046844482421875, 0.012660980224609375, 0.02063751220703125, 0.028614044189453125, 0.036590576171875, 0.044567108154296875, 0.05254364013671875, 0.060520172119140625, 0.0684967041015625, 0.07647323608398438, 0.08444976806640625, 0.09242630004882812, 0.10040283203125, 0.10837936401367188, 0.11635589599609375, 0.12433242797851562, 0.1323089599609375, 0.14028549194335938, 0.14826202392578125, 0.15623855590820312, 0.164215087890625, 0.17219161987304688, 0.18016815185546875, 0.18814468383789062, 0.1961212158203125, 0.20409774780273438, 0.21207427978515625, 0.22005081176757812, 0.22802734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 8.0, 17.0, 22.0, 28.0, 36.0, 56.0, 87.0, 123.0, 134.0, 102.0, 117.0, 81.0, 62.0, 41.0, 21.0, 16.0, 16.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.202392578125, -0.19603919982910156, -0.18968582153320312, -0.1833324432373047, -0.17697906494140625, -0.1706256866455078, -0.16427230834960938, -0.15791893005371094, -0.1515655517578125, -0.14521217346191406, -0.13885879516601562, -0.1325054168701172, -0.12615203857421875, -0.11979866027832031, -0.11344528198242188, -0.10709190368652344, -0.100738525390625, -0.09438514709472656, -0.08803176879882812, -0.08167839050292969, -0.07532501220703125, -0.06897163391113281, -0.06261825561523438, -0.05626487731933594, -0.0499114990234375, -0.04355812072753906, -0.037204742431640625, -0.030851364135742188, -0.02449798583984375, -0.018144607543945312, -0.011791229248046875, -0.0054378509521484375, 0.00091552734375, 0.0072689056396484375, 0.013622283935546875, 0.019975662231445312, 0.02632904052734375, 0.03268241882324219, 0.039035797119140625, 0.04538917541503906, 0.0517425537109375, 0.05809593200683594, 0.06444931030273438, 0.07080268859863281, 0.07715606689453125, 0.08350944519042969, 0.08986282348632812, 0.09621620178222656, 0.102569580078125, 0.10892295837402344, 0.11527633666992188, 0.12162971496582031, 0.12798309326171875, 0.1343364715576172, 0.14068984985351562, 0.14704322814941406, 0.1533966064453125, 0.15974998474121094, 0.16610336303710938, 0.1724567413330078, 0.17881011962890625, 0.1851634979248047, 0.19151687622070312, 0.19787025451660156, 0.2042236328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 13.0, 8.0, 25.0, 59.0, 81.0, 108.0, 141.0, 164.0, 140.0, 97.0, 79.0, 41.0, 30.0, 11.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6752134561538696, -1.6113948822021484, -1.5475764274597168, -1.4837578535079956, -1.419939398765564, -1.3561208248138428, -1.2923023700714111, -1.22848379611969, -1.1646652221679688, -1.1008466482162476, -1.037028193473816, -0.9732096195220947, -0.9093911647796631, -0.8455725908279419, -0.7817540764808655, -0.7179355621337891, -0.6541171073913574, -0.590298593044281, -0.5264800786972046, -0.4626615345478058, -0.39884302020072937, -0.33502450585365295, -0.27120596170425415, -0.20738744735717773, -0.14356893301010132, -0.0797504112124443, -0.015931889414787292, 0.04788663983345032, 0.11170515418052673, 0.17552366852760315, 0.23934221267700195, 0.30316072702407837, 0.36697936058044434, 0.43079787492752075, 0.49461638927459717, 0.5584349632263184, 0.62225341796875, 0.6860719919204712, 0.7498905062675476, 0.813709020614624, 0.8775275349617004, 0.9413460493087769, 1.005164623260498, 1.0689830780029297, 1.1328016519546509, 1.1966201066970825, 1.2604386806488037, 1.3242571353912354, 1.3880757093429565, 1.4518942832946777, 1.5157127380371094, 1.5795313119888306, 1.6433497667312622, 1.7071683406829834, 1.770986795425415, 1.8348053693771362, 1.8986239433288574, 1.9624425172805786, 2.0262610912323, 2.0900795459747314, 2.153898000717163, 2.2177164554595947, 2.2815351486206055, 2.345353603363037, 2.4091720581054688]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 5.0, 6.0, 10.0, 4.0, 6.0, 11.0, 8.0, 6.0, 13.0, 21.0, 20.0, 18.0, 12.0, 23.0, 9.0, 26.0, 30.0, 31.0, 26.0, 35.0, 45.0, 35.0, 42.0, 31.0, 33.0, 27.0, 36.0, 47.0, 27.0, 38.0, 35.0, 37.0, 21.0, 24.0, 21.0, 20.0, 15.0, 18.0, 14.0, 21.0, 9.0, 20.0, 10.0, 8.0, 12.0, 14.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0], "bins": [-0.701142430305481, -0.6790093183517456, -0.6568761467933655, -0.6347430348396301, -0.61260986328125, -0.5904767513275146, -0.5683435797691345, -0.5462104678153992, -0.524077296257019, -0.5019441843032837, -0.47981101274490356, -0.4576778709888458, -0.4355447292327881, -0.41341158747673035, -0.3912784457206726, -0.36914533376693726, -0.3470121920108795, -0.3248790502548218, -0.30274590849876404, -0.2806127667427063, -0.25847962498664856, -0.23634648323059082, -0.21421335637569427, -0.19208021461963654, -0.1699470728635788, -0.14781393110752106, -0.12568078935146332, -0.10354765504598618, -0.08141451328992844, -0.0592813715338707, -0.037148237228393555, -0.015015095472335815, 0.007118046283721924, 0.029251186177134514, 0.051384326070547104, 0.07351746410131454, 0.09565060585737228, 0.11778374761343002, 0.13991688191890717, 0.1620500236749649, 0.18418316543102264, 0.20631630718708038, 0.22844944894313812, 0.25058257579803467, 0.2727157175540924, 0.29484885931015015, 0.3169820010662079, 0.3391151428222656, 0.36124828457832336, 0.3833814263343811, 0.40551456809043884, 0.4276477098464966, 0.4497808516025543, 0.47191399335861206, 0.4940471053123474, 0.5161802768707275, 0.5383133888244629, 0.5604465007781982, 0.5825796723365784, 0.6047127842903137, 0.6268459558486938, 0.6489790678024292, 0.6711122393608093, 0.6932453513145447, 0.7153785228729248]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 13.0, 14.0, 15.0, 40.0, 70.0, 99.0, 185.0, 359.0, 970.0, 3744.0, 25131.0, 699223.0, 3367010.0, 86888.0, 8098.0, 1583.0, 429.0, 189.0, 103.0, 51.0, 25.0, 17.0, 6.0, 12.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.5631256103515625, -0.546173095703125, -0.5292205810546875, -0.51226806640625, -0.4953155517578125, -0.478363037109375, -0.4614105224609375, -0.4444580078125, -0.4275054931640625, -0.410552978515625, -0.3936004638671875, -0.37664794921875, -0.3596954345703125, -0.342742919921875, -0.3257904052734375, -0.308837890625, -0.2918853759765625, -0.274932861328125, -0.2579803466796875, -0.24102783203125, -0.2240753173828125, -0.207122802734375, -0.1901702880859375, -0.1732177734375, -0.1562652587890625, -0.139312744140625, -0.1223602294921875, -0.10540771484375, -0.0884552001953125, -0.071502685546875, -0.0545501708984375, -0.03759765625, -0.0206451416015625, -0.003692626953125, 0.0132598876953125, 0.03021240234375, 0.0471649169921875, 0.064117431640625, 0.0810699462890625, 0.0980224609375, 0.1149749755859375, 0.131927490234375, 0.1488800048828125, 0.16583251953125, 0.1827850341796875, 0.199737548828125, 0.2166900634765625, 0.233642578125, 0.2505950927734375, 0.267547607421875, 0.2845001220703125, 0.30145263671875, 0.3184051513671875, 0.335357666015625, 0.3523101806640625, 0.3692626953125, 0.3862152099609375, 0.403167724609375, 0.4201202392578125, 0.43707275390625, 0.4540252685546875, 0.470977783203125, 0.4879302978515625, 0.5048828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 27.0, 68.0, 75.0, 141.0, 192.0, 158.0, 146.0, 88.0, 62.0, 23.0, 17.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41748046875, -0.4055328369140625, -0.393585205078125, -0.3816375732421875, -0.36968994140625, -0.3577423095703125, -0.345794677734375, -0.3338470458984375, -0.3218994140625, -0.3099517822265625, -0.298004150390625, -0.2860565185546875, -0.27410888671875, -0.2621612548828125, -0.250213623046875, -0.2382659912109375, -0.226318359375, -0.2143707275390625, -0.202423095703125, -0.1904754638671875, -0.17852783203125, -0.1665802001953125, -0.154632568359375, -0.1426849365234375, -0.1307373046875, -0.1187896728515625, -0.106842041015625, -0.0948944091796875, -0.08294677734375, -0.0709991455078125, -0.059051513671875, -0.0471038818359375, -0.03515625, -0.0232086181640625, -0.011260986328125, 0.0006866455078125, 0.01263427734375, 0.0245819091796875, 0.036529541015625, 0.0484771728515625, 0.0604248046875, 0.0723724365234375, 0.084320068359375, 0.0962677001953125, 0.10821533203125, 0.1201629638671875, 0.132110595703125, 0.1440582275390625, 0.156005859375, 0.1679534912109375, 0.179901123046875, 0.1918487548828125, 0.20379638671875, 0.2157440185546875, 0.227691650390625, 0.2396392822265625, 0.2515869140625, 0.2635345458984375, 0.275482177734375, 0.2874298095703125, 0.29937744140625, 0.3113250732421875, 0.323272705078125, 0.3352203369140625, 0.34716796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 13.0, 13.0, 16.0, 31.0, 41.0, 64.0, 90.0, 150.0, 215.0, 360.0, 547.0, 961.0, 1694.0, 3134.0, 6140.0, 13265.0, 31256.0, 82325.0, 244989.0, 810417.0, 1840782.0, 783143.0, 237813.0, 80362.0, 30298.0, 12805.0, 6104.0, 3113.0, 1598.0, 983.0, 551.0, 354.0, 234.0, 136.0, 92.0, 60.0, 38.0, 25.0, 19.0, 11.0, 14.0, 6.0, 4.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1966552734375, -0.1907825469970703, -0.18490982055664062, -0.17903709411621094, -0.17316436767578125, -0.16729164123535156, -0.16141891479492188, -0.1555461883544922, -0.1496734619140625, -0.1438007354736328, -0.13792800903320312, -0.13205528259277344, -0.12618255615234375, -0.12030982971191406, -0.11443710327148438, -0.10856437683105469, -0.102691650390625, -0.09681892395019531, -0.09094619750976562, -0.08507347106933594, -0.07920074462890625, -0.07332801818847656, -0.06745529174804688, -0.06158256530761719, -0.0557098388671875, -0.04983711242675781, -0.043964385986328125, -0.03809165954589844, -0.03221893310546875, -0.026346206665039062, -0.020473480224609375, -0.014600753784179688, -0.00872802734375, -0.0028553009033203125, 0.003017425537109375, 0.008890151977539062, 0.01476287841796875, 0.020635604858398438, 0.026508331298828125, 0.03238105773925781, 0.0382537841796875, 0.04412651062011719, 0.049999237060546875, 0.05587196350097656, 0.06174468994140625, 0.06761741638183594, 0.07349014282226562, 0.07936286926269531, 0.085235595703125, 0.09110832214355469, 0.09698104858398438, 0.10285377502441406, 0.10872650146484375, 0.11459922790527344, 0.12047195434570312, 0.1263446807861328, 0.1322174072265625, 0.1380901336669922, 0.14396286010742188, 0.14983558654785156, 0.15570831298828125, 0.16158103942871094, 0.16745376586914062, 0.1733264923095703, 0.17919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 8.0, 13.0, 16.0, 21.0, 49.0, 51.0, 82.0, 121.0, 155.0, 258.0, 384.0, 606.0, 715.0, 547.0, 359.0, 217.0, 149.0, 105.0, 54.0, 46.0, 32.0, 21.0, 9.0, 13.0, 11.0, 4.0, 6.0, 5.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2174072265625, -0.2094745635986328, -0.20154190063476562, -0.19360923767089844, -0.18567657470703125, -0.17774391174316406, -0.16981124877929688, -0.1618785858154297, -0.1539459228515625, -0.1460132598876953, -0.13808059692382812, -0.13014793395996094, -0.12221527099609375, -0.11428260803222656, -0.10634994506835938, -0.09841728210449219, -0.090484619140625, -0.08255195617675781, -0.07461929321289062, -0.06668663024902344, -0.05875396728515625, -0.05082130432128906, -0.042888641357421875, -0.03495597839355469, -0.0270233154296875, -0.019090652465820312, -0.011157989501953125, -0.0032253265380859375, 0.00470733642578125, 0.012639999389648438, 0.020572662353515625, 0.028505325317382812, 0.03643798828125, 0.04437065124511719, 0.052303314208984375, 0.06023597717285156, 0.06816864013671875, 0.07610130310058594, 0.08403396606445312, 0.09196662902832031, 0.0998992919921875, 0.10783195495605469, 0.11576461791992188, 0.12369728088378906, 0.13162994384765625, 0.13956260681152344, 0.14749526977539062, 0.1554279327392578, 0.163360595703125, 0.1712932586669922, 0.17922592163085938, 0.18715858459472656, 0.19509124755859375, 0.20302391052246094, 0.21095657348632812, 0.2188892364501953, 0.2268218994140625, 0.2347545623779297, 0.24268722534179688, 0.25061988830566406, 0.25855255126953125, 0.26648521423339844, 0.2744178771972656, 0.2823505401611328, 0.290283203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 10.0, 11.0, 35.0, 70.0, 107.0, 135.0, 159.0, 155.0, 140.0, 79.0, 39.0, 36.0, 17.0, 9.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7652361392974854, -0.7113974094390869, -0.6575586199760437, -0.6037198901176453, -0.5498811602592468, -0.496042400598526, -0.4422036409378052, -0.38836491107940674, -0.3345261514186859, -0.2806873917579651, -0.22684866189956665, -0.17300990223884583, -0.1191711574792862, -0.06533241271972656, -0.011493653059005737, 0.0423450767993927, 0.09618383646011353, 0.15002258121967316, 0.2038613259792328, 0.2577000856399536, 0.31153881549835205, 0.3653775751590729, 0.4192163348197937, 0.47305506467819214, 0.5268938541412354, 0.5807325839996338, 0.634571373462677, 0.6884101033210754, 0.7422488331794739, 0.7960876226425171, 0.8499263525009155, 0.903765082359314, 0.9576038122177124, 1.0114425420761108, 1.0652812719345093, 1.1191201210021973, 1.1729588508605957, 1.2267975807189941, 1.2806363105773926, 1.334475040435791, 1.3883137702941895, 1.442152500152588, 1.4959912300109863, 1.5498299598693848, 1.6036688089370728, 1.6575075387954712, 1.7113462686538696, 1.765184998512268, 1.819023847579956, 1.8728625774383545, 1.926701307296753, 1.9805400371551514, 2.03437876701355, 2.0882174968719482, 2.142056465148926, 2.195895195007324, 2.2497336864471436, 2.303572416305542, 2.3574111461639404, 2.411249876022339, 2.4650886058807373, 2.5189273357391357, 2.5727663040161133, 2.6266050338745117, 2.68044376373291]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 8.0, 11.0, 11.0, 15.0, 17.0, 14.0, 12.0, 18.0, 17.0, 21.0, 30.0, 32.0, 41.0, 31.0, 36.0, 43.0, 42.0, 40.0, 41.0, 45.0, 39.0, 38.0, 39.0, 38.0, 44.0, 34.0, 35.0, 37.0, 24.0, 27.0, 19.0, 21.0, 21.0, 13.0, 10.0, 7.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.651323139667511, -0.6287564635276794, -0.6061898469924927, -0.5836231708526611, -0.5610565543174744, -0.5384898781776428, -0.515923261642456, -0.4933565855026245, -0.47078990936279297, -0.4482232630252838, -0.42565661668777466, -0.4030899405479431, -0.38052329421043396, -0.3579566478729248, -0.33539000153541565, -0.3128233551979065, -0.29025670886039734, -0.2676900625228882, -0.24512340128421783, -0.22255675494670868, -0.19999009370803833, -0.17742344737052917, -0.15485680103302002, -0.13229013979434967, -0.10972349345684052, -0.08715683966875076, -0.06459018588066101, -0.042023539543151855, -0.019456885755062103, 0.003109768033027649, 0.025676414370536804, 0.04824307560920715, 0.07080972194671631, 0.09337637573480606, 0.11594302952289581, 0.13850967586040497, 0.16107633709907532, 0.18364298343658447, 0.20620962977409363, 0.22877629101276398, 0.2513429522514343, 0.2739095985889435, 0.29647624492645264, 0.3190429210662842, 0.34160956740379333, 0.3641762137413025, 0.38674286007881165, 0.4093095064163208, 0.43187615275382996, 0.4544427990913391, 0.47700944542884827, 0.4995760917663574, 0.522142767906189, 0.5447094440460205, 0.5672760605812073, 0.5898427367210388, 0.6124093532562256, 0.6349760293960571, 0.6575426459312439, 0.6801093220710754, 0.7026759386062622, 0.7252426147460938, 0.7478092908859253, 0.7703759074211121, 0.7929425835609436]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 6.0, 14.0, 9.0, 19.0, 15.0, 40.0, 45.0, 60.0, 63.0, 105.0, 161.0, 208.0, 363.0, 694.0, 1279.0, 2555.0, 5188.0, 10875.0, 23095.0, 52778.0, 139665.0, 350212.0, 283241.0, 101460.0, 40804.0, 18272.0, 8595.0, 4137.0, 1977.0, 1020.0, 549.0, 304.0, 198.0, 144.0, 102.0, 67.0, 62.0, 32.0, 27.0, 21.0, 14.0, 19.0, 13.0, 5.0, 4.0, 9.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2558326721191406, -0.24726104736328125, -0.23868942260742188, -0.2301177978515625, -0.22154617309570312, -0.21297454833984375, -0.20440292358398438, -0.195831298828125, -0.18725967407226562, -0.17868804931640625, -0.17011642456054688, -0.1615447998046875, -0.15297317504882812, -0.14440155029296875, -0.13582992553710938, -0.12725830078125, -0.11868667602539062, -0.11011505126953125, -0.10154342651367188, -0.0929718017578125, -0.08440017700195312, -0.07582855224609375, -0.06725692749023438, -0.058685302734375, -0.050113677978515625, -0.04154205322265625, -0.032970428466796875, -0.0243988037109375, -0.015827178955078125, -0.00725555419921875, 0.001316070556640625, 0.0098876953125, 0.018459320068359375, 0.02703094482421875, 0.035602569580078125, 0.0441741943359375, 0.052745819091796875, 0.06131744384765625, 0.06988906860351562, 0.078460693359375, 0.08703231811523438, 0.09560394287109375, 0.10417556762695312, 0.1127471923828125, 0.12131881713867188, 0.12989044189453125, 0.13846206665039062, 0.14703369140625, 0.15560531616210938, 0.16417694091796875, 0.17274856567382812, 0.1813201904296875, 0.18989181518554688, 0.19846343994140625, 0.20703506469726562, 0.215606689453125, 0.22417831420898438, 0.23274993896484375, 0.24132156372070312, 0.2498931884765625, 0.2584648132324219, 0.26703643798828125, 0.2756080627441406, 0.2841796875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 22.0, 33.0, 73.0, 118.0, 144.0, 169.0, 172.0, 120.0, 82.0, 42.0, 20.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4267578125, -0.4143943786621094, -0.40203094482421875, -0.3896675109863281, -0.3773040771484375, -0.3649406433105469, -0.35257720947265625, -0.3402137756347656, -0.327850341796875, -0.3154869079589844, -0.30312347412109375, -0.2907600402832031, -0.2783966064453125, -0.2660331726074219, -0.25366973876953125, -0.24130630493164062, -0.22894287109375, -0.21657943725585938, -0.20421600341796875, -0.19185256958007812, -0.1794891357421875, -0.16712570190429688, -0.15476226806640625, -0.14239883422851562, -0.130035400390625, -0.11767196655273438, -0.10530853271484375, -0.09294509887695312, -0.0805816650390625, -0.06821823120117188, -0.05585479736328125, -0.043491363525390625, -0.0311279296875, -0.018764495849609375, -0.00640106201171875, 0.005962371826171875, 0.0183258056640625, 0.030689239501953125, 0.04305267333984375, 0.055416107177734375, 0.067779541015625, 0.08014297485351562, 0.09250640869140625, 0.10486984252929688, 0.1172332763671875, 0.12959671020507812, 0.14196014404296875, 0.15432357788085938, 0.16668701171875, 0.17905044555664062, 0.19141387939453125, 0.20377731323242188, 0.2161407470703125, 0.22850418090820312, 0.24086761474609375, 0.2532310485839844, 0.265594482421875, 0.2779579162597656, 0.29032135009765625, 0.3026847839355469, 0.3150482177734375, 0.3274116516113281, 0.33977508544921875, 0.3521385192871094, 0.364501953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 13.0, 17.0, 27.0, 28.0, 56.0, 91.0, 115.0, 214.0, 406.0, 732.0, 1444.0, 3101.0, 6346.0, 13999.0, 32029.0, 84847.0, 288357.0, 406668.0, 130476.0, 44462.0, 18762.0, 8445.0, 4021.0, 1945.0, 890.0, 416.0, 253.0, 130.0, 71.0, 50.0, 38.0, 23.0, 19.0, 23.0, 11.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291015625, -0.28104400634765625, -0.2710723876953125, -0.26110076904296875, -0.251129150390625, -0.24115753173828125, -0.2311859130859375, -0.22121429443359375, -0.21124267578125, -0.20127105712890625, -0.1912994384765625, -0.18132781982421875, -0.171356201171875, -0.16138458251953125, -0.1514129638671875, -0.14144134521484375, -0.1314697265625, -0.12149810791015625, -0.1115264892578125, -0.10155487060546875, -0.091583251953125, -0.08161163330078125, -0.0716400146484375, -0.06166839599609375, -0.05169677734375, -0.04172515869140625, -0.0317535400390625, -0.02178192138671875, -0.011810302734375, -0.00183868408203125, 0.0081329345703125, 0.01810455322265625, 0.028076171875, 0.03804779052734375, 0.0480194091796875, 0.05799102783203125, 0.067962646484375, 0.07793426513671875, 0.0879058837890625, 0.09787750244140625, 0.10784912109375, 0.11782073974609375, 0.1277923583984375, 0.13776397705078125, 0.147735595703125, 0.15770721435546875, 0.1676788330078125, 0.17765045166015625, 0.1876220703125, 0.19759368896484375, 0.2075653076171875, 0.21753692626953125, 0.227508544921875, 0.23748016357421875, 0.2474517822265625, 0.25742340087890625, 0.26739501953125, 0.27736663818359375, 0.2873382568359375, 0.29730987548828125, 0.307281494140625, 0.31725311279296875, 0.3272247314453125, 0.33719635009765625, 0.34716796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 5.0, 9.0, 7.0, 9.0, 17.0, 19.0, 20.0, 20.0, 27.0, 33.0, 32.0, 35.0, 48.0, 42.0, 39.0, 40.0, 47.0, 52.0, 44.0, 66.0, 40.0, 43.0, 32.0, 38.0, 36.0, 25.0, 30.0, 27.0, 19.0, 19.0, 13.0, 10.0, 11.0, 9.0, 4.0, 7.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.3062019348144531, -0.29575347900390625, -0.2853050231933594, -0.2748565673828125, -0.2644081115722656, -0.25395965576171875, -0.24351119995117188, -0.233062744140625, -0.22261428833007812, -0.21216583251953125, -0.20171737670898438, -0.1912689208984375, -0.18082046508789062, -0.17037200927734375, -0.15992355346679688, -0.14947509765625, -0.13902664184570312, -0.12857818603515625, -0.11812973022460938, -0.1076812744140625, -0.09723281860351562, -0.08678436279296875, -0.07633590698242188, -0.065887451171875, -0.055438995361328125, -0.04499053955078125, -0.034542083740234375, -0.0240936279296875, -0.013645172119140625, -0.00319671630859375, 0.007251739501953125, 0.0177001953125, 0.028148651123046875, 0.03859710693359375, 0.049045562744140625, 0.0594940185546875, 0.06994247436523438, 0.08039093017578125, 0.09083938598632812, 0.101287841796875, 0.11173629760742188, 0.12218475341796875, 0.13263320922851562, 0.1430816650390625, 0.15353012084960938, 0.16397857666015625, 0.17442703247070312, 0.18487548828125, 0.19532394409179688, 0.20577239990234375, 0.21622085571289062, 0.2266693115234375, 0.23711776733398438, 0.24756622314453125, 0.2580146789550781, 0.268463134765625, 0.2789115905761719, 0.28936004638671875, 0.2998085021972656, 0.3102569580078125, 0.3207054138183594, 0.33115386962890625, 0.3416023254394531, 0.35205078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 11.0, 16.0, 28.0, 40.0, 72.0, 134.0, 257.0, 567.0, 1148.0, 2741.0, 6573.0, 16269.0, 43979.0, 185231.0, 557262.0, 166920.0, 41188.0, 15030.0, 6181.0, 2589.0, 1172.0, 546.0, 265.0, 134.0, 73.0, 40.0, 33.0, 13.0, 15.0, 6.0, 1.0, 6.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2423095703125, -0.23460960388183594, -0.22690963745117188, -0.2192096710205078, -0.21150970458984375, -0.2038097381591797, -0.19610977172851562, -0.18840980529785156, -0.1807098388671875, -0.17300987243652344, -0.16530990600585938, -0.1576099395751953, -0.14990997314453125, -0.1422100067138672, -0.13451004028320312, -0.12681007385253906, -0.119110107421875, -0.11141014099121094, -0.10371017456054688, -0.09601020812988281, -0.08831024169921875, -0.08061027526855469, -0.07291030883789062, -0.06521034240722656, -0.0575103759765625, -0.04981040954589844, -0.042110443115234375, -0.03441047668457031, -0.02671051025390625, -0.019010543823242188, -0.011310577392578125, -0.0036106109619140625, 0.00408935546875, 0.011789321899414062, 0.019489288330078125, 0.027189254760742188, 0.03488922119140625, 0.04258918762207031, 0.050289154052734375, 0.05798912048339844, 0.0656890869140625, 0.07338905334472656, 0.08108901977539062, 0.08878898620605469, 0.09648895263671875, 0.10418891906738281, 0.11188888549804688, 0.11958885192871094, 0.127288818359375, 0.13498878479003906, 0.14268875122070312, 0.1503887176513672, 0.15808868408203125, 0.1657886505126953, 0.17348861694335938, 0.18118858337402344, 0.1888885498046875, 0.19658851623535156, 0.20428848266601562, 0.2119884490966797, 0.21968841552734375, 0.2273883819580078, 0.23508834838867188, 0.24278831481933594, 0.25048828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 10.0, 1.0, 9.0, 9.0, 10.0, 17.0, 13.0, 18.0, 25.0, 35.0, 43.0, 50.0, 85.0, 94.0, 88.0, 87.0, 66.0, 71.0, 52.0, 30.0, 25.0, 37.0, 17.0, 15.0, 11.0, 12.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 2.0, 7.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.6464462280273438e-05, -2.5627203285694122e-05, -2.4789944291114807e-05, -2.3952685296535492e-05, -2.3115426301956177e-05, -2.227816730737686e-05, -2.1440908312797546e-05, -2.060364931821823e-05, -1.9766390323638916e-05, -1.89291313290596e-05, -1.8091872334480286e-05, -1.725461333990097e-05, -1.6417354345321655e-05, -1.558009535074234e-05, -1.4742836356163025e-05, -1.390557736158371e-05, -1.3068318367004395e-05, -1.223105937242508e-05, -1.1393800377845764e-05, -1.0556541383266449e-05, -9.719282388687134e-06, -8.882023394107819e-06, -8.044764399528503e-06, -7.207505404949188e-06, -6.370246410369873e-06, -5.532987415790558e-06, -4.695728421211243e-06, -3.8584694266319275e-06, -3.0212104320526123e-06, -2.183951437473297e-06, -1.346692442893982e-06, -5.094334483146667e-07, 3.2782554626464844e-07, 1.1650845408439636e-06, 2.002343535423279e-06, 2.839602530002594e-06, 3.676861524581909e-06, 4.514120519161224e-06, 5.3513795137405396e-06, 6.188638508319855e-06, 7.02589750289917e-06, 7.863156497478485e-06, 8.7004154920578e-06, 9.537674486637115e-06, 1.037493348121643e-05, 1.1212192475795746e-05, 1.2049451470375061e-05, 1.2886710464954376e-05, 1.3723969459533691e-05, 1.4561228454113007e-05, 1.5398487448692322e-05, 1.6235746443271637e-05, 1.7073005437850952e-05, 1.7910264432430267e-05, 1.8747523427009583e-05, 1.9584782421588898e-05, 2.0422041416168213e-05, 2.1259300410747528e-05, 2.2096559405326843e-05, 2.293381839990616e-05, 2.3771077394485474e-05, 2.460833638906479e-05, 2.5445595383644104e-05, 2.628285437822342e-05, 2.7120113372802734e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 10.0, 11.0, 11.0, 20.0, 40.0, 57.0, 111.0, 229.0, 448.0, 1189.0, 3537.0, 11835.0, 45504.0, 325320.0, 562583.0, 73250.0, 16889.0, 4730.0, 1594.0, 616.0, 252.0, 119.0, 81.0, 43.0, 22.0, 20.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.350830078125, -0.3402442932128906, -0.32965850830078125, -0.3190727233886719, -0.3084869384765625, -0.2979011535644531, -0.28731536865234375, -0.2767295837402344, -0.266143798828125, -0.2555580139160156, -0.24497222900390625, -0.23438644409179688, -0.2238006591796875, -0.21321487426757812, -0.20262908935546875, -0.19204330444335938, -0.18145751953125, -0.17087173461914062, -0.16028594970703125, -0.14970016479492188, -0.1391143798828125, -0.12852859497070312, -0.11794281005859375, -0.10735702514648438, -0.096771240234375, -0.08618545532226562, -0.07559967041015625, -0.06501388549804688, -0.0544281005859375, -0.043842315673828125, -0.03325653076171875, -0.022670745849609375, -0.0120849609375, -0.001499176025390625, 0.00908660888671875, 0.019672393798828125, 0.0302581787109375, 0.040843963623046875, 0.05142974853515625, 0.062015533447265625, 0.072601318359375, 0.08318710327148438, 0.09377288818359375, 0.10435867309570312, 0.1149444580078125, 0.12553024291992188, 0.13611602783203125, 0.14670181274414062, 0.15728759765625, 0.16787338256835938, 0.17845916748046875, 0.18904495239257812, 0.1996307373046875, 0.21021652221679688, 0.22080230712890625, 0.23138809204101562, 0.241973876953125, 0.2525596618652344, 0.26314544677734375, 0.2737312316894531, 0.2843170166015625, 0.2949028015136719, 0.30548858642578125, 0.3160743713378906, 0.32666015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 12.0, 27.0, 18.0, 36.0, 62.0, 71.0, 83.0, 120.0, 119.0, 110.0, 81.0, 56.0, 39.0, 19.0, 18.0, 23.0, 12.0, 10.0, 11.0, 9.0, 8.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.20703125, -0.20079994201660156, -0.19456863403320312, -0.1883373260498047, -0.18210601806640625, -0.1758747100830078, -0.16964340209960938, -0.16341209411621094, -0.1571807861328125, -0.15094947814941406, -0.14471817016601562, -0.1384868621826172, -0.13225555419921875, -0.1260242462158203, -0.11979293823242188, -0.11356163024902344, -0.107330322265625, -0.10109901428222656, -0.09486770629882812, -0.08863639831542969, -0.08240509033203125, -0.07617378234863281, -0.06994247436523438, -0.06371116638183594, -0.0574798583984375, -0.05124855041503906, -0.045017242431640625, -0.03878593444824219, -0.03255462646484375, -0.026323318481445312, -0.020092010498046875, -0.013860702514648438, -0.00762939453125, -0.0013980865478515625, 0.004833221435546875, 0.011064529418945312, 0.01729583740234375, 0.023527145385742188, 0.029758453369140625, 0.03598976135253906, 0.0422210693359375, 0.04845237731933594, 0.054683685302734375, 0.06091499328613281, 0.06714630126953125, 0.07337760925292969, 0.07960891723632812, 0.08584022521972656, 0.092071533203125, 0.09830284118652344, 0.10453414916992188, 0.11076545715332031, 0.11699676513671875, 0.12322807312011719, 0.12945938110351562, 0.13569068908691406, 0.1419219970703125, 0.14815330505371094, 0.15438461303710938, 0.1606159210205078, 0.16684722900390625, 0.1730785369873047, 0.17930984497070312, 0.18554115295410156, 0.1917724609375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 36.0, 236.0, 375.0, 249.0, 98.0, 10.0, 5.0], "bins": [-11.049266815185547, -10.863822937011719, -10.678378105163574, -10.492934226989746, -10.307490348815918, -10.122045516967773, -9.936601638793945, -9.751157760620117, -9.565712928771973, -9.380269050598145, -9.19482421875, -9.009380340576172, -8.823936462402344, -8.6384916305542, -8.453047752380371, -8.267602920532227, -8.082159042358398, -7.896714687347412, -7.711270809173584, -7.525826454162598, -7.340382099151611, -7.154937744140625, -6.969493865966797, -6.7840495109558105, -6.598605632781982, -6.413161277770996, -6.227717399597168, -6.042273044586182, -5.856828689575195, -5.671384334564209, -5.485940456390381, -5.3004961013793945, -5.115051746368408, -4.929607391357422, -4.744163513183594, -4.558719158172607, -4.373274803161621, -4.187830448150635, -4.002386569976807, -3.8169422149658203, -3.631497859954834, -3.4460537433624268, -3.2606093883514404, -3.075165271759033, -2.889720916748047, -2.7042768001556396, -2.5188326835632324, -2.333388328552246, -2.1479439735412598, -1.962499737739563, -1.7770555019378662, -1.591611385345459, -1.4061670303344727, -1.2207229137420654, -1.0352786779403687, -0.8498344421386719, -0.6643903255462646, -0.47894608974456787, -0.2935018837451935, -0.10805767774581909, 0.07738655805587769, 0.26283079385757446, 0.44827497005462646, 0.6337192058563232, 0.81916344165802]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 5.0, 3.0, 5.0, 4.0, 15.0, 10.0, 9.0, 9.0, 18.0, 22.0, 15.0, 18.0, 24.0, 22.0, 34.0, 36.0, 38.0, 37.0, 50.0, 41.0, 30.0, 46.0, 36.0, 37.0, 36.0, 32.0, 39.0, 35.0, 34.0, 31.0, 33.0, 26.0, 18.0, 9.0, 20.0, 18.0, 8.0, 17.0, 18.0, 14.0, 12.0, 8.0, 2.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9292447566986084, -0.899410605430603, -0.8695763945579529, -0.8397422432899475, -0.8099080920219421, -0.780073881149292, -0.7502397298812866, -0.7204055786132812, -0.6905714273452759, -0.6607372760772705, -0.6309030652046204, -0.601068913936615, -0.5712347626686096, -0.5414005517959595, -0.5115664005279541, -0.48173224925994873, -0.45189806818962097, -0.4220638871192932, -0.39222973585128784, -0.3623955547809601, -0.3325614035129547, -0.30272722244262695, -0.2728930711746216, -0.24305889010429382, -0.21322472393512726, -0.1833905577659607, -0.15355639159679413, -0.12372221797704697, -0.0938880518078804, -0.06405387818813324, -0.034219712018966675, -0.00438554584980011, 0.025448620319366455, 0.05528278648853302, 0.08511695265769958, 0.11495112627744675, 0.14478528499603271, 0.17461946606636047, 0.20445363223552704, 0.2342877984046936, 0.264121949672699, 0.29395613074302673, 0.3237902820110321, 0.35362446308135986, 0.38345861434936523, 0.413292795419693, 0.44312697649002075, 0.4729611277580261, 0.5027953386306763, 0.5326294898986816, 0.5624637007713318, 0.5922978520393372, 0.6221320033073425, 0.6519662141799927, 0.681800365447998, 0.7116345167160034, 0.7414686679840088, 0.7713028192520142, 0.8011370301246643, 0.8309711813926697, 0.860805332660675, 0.8906395435333252, 0.9204736948013306, 0.9503078460693359, 0.9801419973373413]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 17.0, 28.0, 27.0, 47.0, 72.0, 125.0, 204.0, 387.0, 959.0, 3021.0, 13789.0, 116582.0, 2795870.0, 1184342.0, 66063.0, 9277.0, 2107.0, 695.0, 261.0, 155.0, 78.0, 55.0, 39.0, 20.0, 22.0, 12.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4632682800292969, -0.44826507568359375, -0.4332618713378906, -0.4182586669921875, -0.4032554626464844, -0.38825225830078125, -0.3732490539550781, -0.358245849609375, -0.3432426452636719, -0.32823944091796875, -0.3132362365722656, -0.2982330322265625, -0.2832298278808594, -0.26822662353515625, -0.2532234191894531, -0.23822021484375, -0.22321701049804688, -0.20821380615234375, -0.19321060180664062, -0.1782073974609375, -0.16320419311523438, -0.14820098876953125, -0.13319778442382812, -0.118194580078125, -0.10319137573242188, -0.08818817138671875, -0.07318496704101562, -0.0581817626953125, -0.043178558349609375, -0.02817535400390625, -0.013172149658203125, 0.0018310546875, 0.016834259033203125, 0.03183746337890625, 0.046840667724609375, 0.0618438720703125, 0.07684707641601562, 0.09185028076171875, 0.10685348510742188, 0.121856689453125, 0.13685989379882812, 0.15186309814453125, 0.16686630249023438, 0.1818695068359375, 0.19687271118164062, 0.21187591552734375, 0.22687911987304688, 0.24188232421875, 0.2568855285644531, 0.27188873291015625, 0.2868919372558594, 0.3018951416015625, 0.3168983459472656, 0.33190155029296875, 0.3469047546386719, 0.361907958984375, 0.3769111633300781, 0.39191436767578125, 0.4069175720214844, 0.4219207763671875, 0.4369239807128906, 0.45192718505859375, 0.4669303894042969, 0.48193359375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 8.0, 23.0, 26.0, 57.0, 84.0, 136.0, 124.0, 157.0, 136.0, 113.0, 62.0, 40.0, 25.0, 15.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.425537109375, -0.4130744934082031, -0.40061187744140625, -0.3881492614746094, -0.3756866455078125, -0.3632240295410156, -0.35076141357421875, -0.3382987976074219, -0.325836181640625, -0.3133735656738281, -0.30091094970703125, -0.2884483337402344, -0.2759857177734375, -0.2635231018066406, -0.25106048583984375, -0.23859786987304688, -0.22613525390625, -0.21367263793945312, -0.20121002197265625, -0.18874740600585938, -0.1762847900390625, -0.16382217407226562, -0.15135955810546875, -0.13889694213867188, -0.126434326171875, -0.11397171020507812, -0.10150909423828125, -0.08904647827148438, -0.0765838623046875, -0.06412124633789062, -0.05165863037109375, -0.039196014404296875, -0.0267333984375, -0.014270782470703125, -0.00180816650390625, 0.010654449462890625, 0.0231170654296875, 0.035579681396484375, 0.04804229736328125, 0.060504913330078125, 0.072967529296875, 0.08543014526367188, 0.09789276123046875, 0.11035537719726562, 0.1228179931640625, 0.13528060913085938, 0.14774322509765625, 0.16020584106445312, 0.17266845703125, 0.18513107299804688, 0.19759368896484375, 0.21005630493164062, 0.2225189208984375, 0.23498153686523438, 0.24744415283203125, 0.2599067687988281, 0.272369384765625, 0.2848320007324219, 0.29729461669921875, 0.3097572326660156, 0.3222198486328125, 0.3346824645996094, 0.34714508056640625, 0.3596076965332031, 0.3720703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 0.0, 6.0, 5.0, 5.0, 10.0, 21.0, 21.0, 32.0, 34.0, 75.0, 93.0, 134.0, 188.0, 284.0, 434.0, 666.0, 1113.0, 1976.0, 3440.0, 6826.0, 14063.0, 31575.0, 78221.0, 207900.0, 612055.0, 1718573.0, 991115.0, 322623.0, 116904.0, 46023.0, 19659.0, 9344.0, 4564.0, 2430.0, 1435.0, 832.0, 532.0, 341.0, 210.0, 154.0, 112.0, 84.0, 57.0, 35.0, 17.0, 23.0, 11.0, 11.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20263671875, -0.1958160400390625, -0.188995361328125, -0.1821746826171875, -0.17535400390625, -0.1685333251953125, -0.161712646484375, -0.1548919677734375, -0.1480712890625, -0.1412506103515625, -0.134429931640625, -0.1276092529296875, -0.12078857421875, -0.1139678955078125, -0.107147216796875, -0.1003265380859375, -0.093505859375, -0.0866851806640625, -0.079864501953125, -0.0730438232421875, -0.06622314453125, -0.0594024658203125, -0.052581787109375, -0.0457611083984375, -0.0389404296875, -0.0321197509765625, -0.025299072265625, -0.0184783935546875, -0.01165771484375, -0.0048370361328125, 0.001983642578125, 0.0088043212890625, 0.015625, 0.0224456787109375, 0.029266357421875, 0.0360870361328125, 0.04290771484375, 0.0497283935546875, 0.056549072265625, 0.0633697509765625, 0.0701904296875, 0.0770111083984375, 0.083831787109375, 0.0906524658203125, 0.09747314453125, 0.1042938232421875, 0.111114501953125, 0.1179351806640625, 0.124755859375, 0.1315765380859375, 0.138397216796875, 0.1452178955078125, 0.15203857421875, 0.1588592529296875, 0.165679931640625, 0.1725006103515625, 0.1793212890625, 0.1861419677734375, 0.192962646484375, 0.1997833251953125, 0.20660400390625, 0.2134246826171875, 0.220245361328125, 0.2270660400390625, 0.23388671875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 12.0, 17.0, 33.0, 31.0, 52.0, 78.0, 113.0, 192.0, 328.0, 416.0, 577.0, 700.0, 500.0, 311.0, 192.0, 155.0, 110.0, 75.0, 43.0, 28.0, 29.0, 17.0, 12.0, 11.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.23226165771484375, -0.2242889404296875, -0.21631622314453125, -0.208343505859375, -0.20037078857421875, -0.1923980712890625, -0.18442535400390625, -0.17645263671875, -0.16847991943359375, -0.1605072021484375, -0.15253448486328125, -0.144561767578125, -0.13658905029296875, -0.1286163330078125, -0.12064361572265625, -0.1126708984375, -0.10469818115234375, -0.0967254638671875, -0.08875274658203125, -0.080780029296875, -0.07280731201171875, -0.0648345947265625, -0.05686187744140625, -0.04888916015625, -0.04091644287109375, -0.0329437255859375, -0.02497100830078125, -0.016998291015625, -0.00902557373046875, -0.0010528564453125, 0.00691986083984375, 0.014892578125, 0.02286529541015625, 0.0308380126953125, 0.03881072998046875, 0.046783447265625, 0.05475616455078125, 0.0627288818359375, 0.07070159912109375, 0.07867431640625, 0.08664703369140625, 0.0946197509765625, 0.10259246826171875, 0.110565185546875, 0.11853790283203125, 0.1265106201171875, 0.13448333740234375, 0.1424560546875, 0.15042877197265625, 0.1584014892578125, 0.16637420654296875, 0.174346923828125, 0.18231964111328125, 0.1902923583984375, 0.19826507568359375, 0.20623779296875, 0.21421051025390625, 0.2221832275390625, 0.23015594482421875, 0.238128662109375, 0.24610137939453125, 0.2540740966796875, 0.26204681396484375, 0.27001953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 6.0, 8.0, 5.0, 12.0, 12.0, 32.0, 28.0, 40.0, 43.0, 52.0, 48.0, 69.0, 70.0, 77.0, 71.0, 72.0, 62.0, 58.0, 49.0, 40.0, 41.0, 24.0, 26.0, 15.0, 12.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.718791127204895, -0.6925047636032104, -0.6662184000015259, -0.6399320960044861, -0.6136457324028015, -0.5873593688011169, -0.5610730648040771, -0.5347867012023926, -0.508500337600708, -0.48221397399902344, -0.45592764019966125, -0.4296413064002991, -0.4033549427986145, -0.37706857919692993, -0.35078224539756775, -0.32449591159820557, -0.298209547996521, -0.2719231843948364, -0.24563685059547424, -0.21935050189495087, -0.1930641531944275, -0.1667778044939041, -0.14049145579338074, -0.11420510709285736, -0.08791875839233398, -0.06163240969181061, -0.03534606099128723, -0.009059712290763855, 0.01722663640975952, 0.0435129851102829, 0.06979933381080627, 0.09608568251132965, 0.1223720908164978, 0.14865843951702118, 0.17494478821754456, 0.20123113691806793, 0.2275174856185913, 0.2538038492202759, 0.28009018301963806, 0.30637651681900024, 0.3326628804206848, 0.3589492440223694, 0.38523557782173157, 0.41152191162109375, 0.4378082752227783, 0.4640946388244629, 0.4903809726238251, 0.5166673064231873, 0.5429536700248718, 0.5692400336265564, 0.5955263376235962, 0.6218127012252808, 0.6480990648269653, 0.6743854284286499, 0.7006717920303345, 0.7269580960273743, 0.7532444596290588, 0.7795308232307434, 0.8058171272277832, 0.8321034908294678, 0.8583898544311523, 0.8846762180328369, 0.9109625816345215, 0.9372488856315613, 0.9635352492332458]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 9.0, 13.0, 16.0, 16.0, 10.0, 20.0, 14.0, 24.0, 21.0, 31.0, 30.0, 27.0, 37.0, 43.0, 39.0, 35.0, 39.0, 41.0, 36.0, 40.0, 47.0, 26.0, 30.0, 44.0, 40.0, 40.0, 33.0, 24.0, 23.0, 28.0, 13.0, 21.0, 17.0, 11.0, 6.0, 7.0, 14.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5934332013130188, -0.5736249089241028, -0.5538166761398315, -0.5340083837509155, -0.5142000913619995, -0.4943918287754059, -0.47458356618881226, -0.45477527379989624, -0.4349669814109802, -0.4151587188243866, -0.3953504264354706, -0.37554216384887695, -0.35573387145996094, -0.3359256088733673, -0.3161173462867737, -0.29630905389785767, -0.27650079131126404, -0.2566925287246704, -0.2368842363357544, -0.21707597374916077, -0.19726768136024475, -0.17745941877365112, -0.1576511412858963, -0.13784286379814148, -0.11803458631038666, -0.09822630882263184, -0.07841803133487701, -0.05860976129770279, -0.03880148380994797, -0.018993206322193146, 0.0008150637149810791, 0.0206233412027359, 0.04043161869049072, 0.060239896178245544, 0.08004817366600037, 0.09985644370317459, 0.11966472119092941, 0.13947299122810364, 0.15928126871585846, 0.17908954620361328, 0.1988978236913681, 0.21870610117912292, 0.23851437866687775, 0.25832265615463257, 0.2781309187412262, 0.2979392111301422, 0.31774747371673584, 0.33755576610565186, 0.3573640286922455, 0.3771722912788391, 0.3969805836677551, 0.41678884625434875, 0.43659713864326477, 0.4564054012298584, 0.4762136936187744, 0.49602195620536804, 0.5158302187919617, 0.5356385111808777, 0.5554467439651489, 0.5752550363540649, 0.595063328742981, 0.614871621131897, 0.6346798539161682, 0.6544881463050842, 0.6742964386940002]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 11.0, 11.0, 8.0, 16.0, 29.0, 23.0, 42.0, 65.0, 108.0, 183.0, 284.0, 580.0, 1067.0, 2029.0, 4099.0, 8075.0, 16303.0, 34254.0, 84400.0, 271090.0, 403650.0, 130118.0, 48288.0, 21687.0, 10808.0, 5506.0, 2692.0, 1422.0, 699.0, 386.0, 220.0, 120.0, 80.0, 60.0, 37.0, 27.0, 17.0, 11.0, 18.0, 7.0, 3.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2729454040527344, -0.26390838623046875, -0.2548713684082031, -0.2458343505859375, -0.23679733276367188, -0.22776031494140625, -0.21872329711914062, -0.209686279296875, -0.20064926147460938, -0.19161224365234375, -0.18257522583007812, -0.1735382080078125, -0.16450119018554688, -0.15546417236328125, -0.14642715454101562, -0.13739013671875, -0.12835311889648438, -0.11931610107421875, -0.11027908325195312, -0.1012420654296875, -0.09220504760742188, -0.08316802978515625, -0.07413101196289062, -0.065093994140625, -0.056056976318359375, -0.04701995849609375, -0.037982940673828125, -0.0289459228515625, -0.019908905029296875, -0.01087188720703125, -0.001834869384765625, 0.0072021484375, 0.016239166259765625, 0.02527618408203125, 0.034313201904296875, 0.0433502197265625, 0.052387237548828125, 0.06142425537109375, 0.07046127319335938, 0.079498291015625, 0.08853530883789062, 0.09757232666015625, 0.10660934448242188, 0.1156463623046875, 0.12468338012695312, 0.13372039794921875, 0.14275741577148438, 0.15179443359375, 0.16083145141601562, 0.16986846923828125, 0.17890548706054688, 0.1879425048828125, 0.19697952270507812, 0.20601654052734375, 0.21505355834960938, 0.224090576171875, 0.23312759399414062, 0.24216461181640625, 0.2512016296386719, 0.2602386474609375, 0.2692756652832031, 0.27831268310546875, 0.2873497009277344, 0.29638671875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 7.0, 10.0, 32.0, 50.0, 69.0, 103.0, 126.0, 151.0, 143.0, 107.0, 90.0, 63.0, 30.0, 18.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42529296875, -0.4129981994628906, -0.40070343017578125, -0.3884086608886719, -0.3761138916015625, -0.3638191223144531, -0.35152435302734375, -0.3392295837402344, -0.326934814453125, -0.3146400451660156, -0.30234527587890625, -0.2900505065917969, -0.2777557373046875, -0.2654609680175781, -0.25316619873046875, -0.24087142944335938, -0.22857666015625, -0.21628189086914062, -0.20398712158203125, -0.19169235229492188, -0.1793975830078125, -0.16710281372070312, -0.15480804443359375, -0.14251327514648438, -0.130218505859375, -0.11792373657226562, -0.10562896728515625, -0.09333419799804688, -0.0810394287109375, -0.06874465942382812, -0.05644989013671875, -0.044155120849609375, -0.0318603515625, -0.019565582275390625, -0.00727081298828125, 0.005023956298828125, 0.0173187255859375, 0.029613494873046875, 0.04190826416015625, 0.054203033447265625, 0.066497802734375, 0.07879257202148438, 0.09108734130859375, 0.10338211059570312, 0.1156768798828125, 0.12797164916992188, 0.14026641845703125, 0.15256118774414062, 0.16485595703125, 0.17715072631835938, 0.18944549560546875, 0.20174026489257812, 0.2140350341796875, 0.22632980346679688, 0.23862457275390625, 0.2509193420410156, 0.263214111328125, 0.2755088806152344, 0.28780364990234375, 0.3000984191894531, 0.3123931884765625, 0.3246879577636719, 0.33698272705078125, 0.3492774963378906, 0.361572265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 7.0, 6.0, 10.0, 22.0, 33.0, 43.0, 65.0, 91.0, 171.0, 388.0, 1223.0, 4165.0, 15203.0, 58280.0, 458490.0, 433039.0, 56458.0, 14753.0, 4079.0, 1167.0, 403.0, 179.0, 90.0, 54.0, 35.0, 28.0, 26.0, 18.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5498046875, -0.5308380126953125, -0.511871337890625, -0.4929046630859375, -0.47393798828125, -0.4549713134765625, -0.436004638671875, -0.4170379638671875, -0.3980712890625, -0.3791046142578125, -0.360137939453125, -0.3411712646484375, -0.32220458984375, -0.3032379150390625, -0.284271240234375, -0.2653045654296875, -0.246337890625, -0.2273712158203125, -0.208404541015625, -0.1894378662109375, -0.17047119140625, -0.1515045166015625, -0.132537841796875, -0.1135711669921875, -0.0946044921875, -0.0756378173828125, -0.056671142578125, -0.0377044677734375, -0.01873779296875, 0.0002288818359375, 0.019195556640625, 0.0381622314453125, 0.05712890625, 0.0760955810546875, 0.095062255859375, 0.1140289306640625, 0.13299560546875, 0.1519622802734375, 0.170928955078125, 0.1898956298828125, 0.2088623046875, 0.2278289794921875, 0.246795654296875, 0.2657623291015625, 0.28472900390625, 0.3036956787109375, 0.322662353515625, 0.3416290283203125, 0.360595703125, 0.3795623779296875, 0.398529052734375, 0.4174957275390625, 0.43646240234375, 0.4554290771484375, 0.474395751953125, 0.4933624267578125, 0.5123291015625, 0.5312957763671875, 0.550262451171875, 0.5692291259765625, 0.58819580078125, 0.6071624755859375, 0.626129150390625, 0.6450958251953125, 0.6640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 6.0, 5.0, 6.0, 11.0, 12.0, 19.0, 19.0, 10.0, 14.0, 21.0, 23.0, 27.0, 42.0, 47.0, 44.0, 58.0, 52.0, 54.0, 57.0, 54.0, 54.0, 48.0, 53.0, 36.0, 41.0, 32.0, 26.0, 28.0, 18.0, 19.0, 11.0, 13.0, 8.0, 6.0, 1.0, 5.0, 6.0, 1.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43505859375, -0.422027587890625, -0.40899658203125, -0.395965576171875, -0.3829345703125, -0.369903564453125, -0.35687255859375, -0.343841552734375, -0.330810546875, -0.317779541015625, -0.30474853515625, -0.291717529296875, -0.2786865234375, -0.265655517578125, -0.25262451171875, -0.239593505859375, -0.2265625, -0.213531494140625, -0.20050048828125, -0.187469482421875, -0.1744384765625, -0.161407470703125, -0.14837646484375, -0.135345458984375, -0.122314453125, -0.109283447265625, -0.09625244140625, -0.083221435546875, -0.0701904296875, -0.057159423828125, -0.04412841796875, -0.031097412109375, -0.01806640625, -0.005035400390625, 0.00799560546875, 0.021026611328125, 0.0340576171875, 0.047088623046875, 0.06011962890625, 0.073150634765625, 0.086181640625, 0.099212646484375, 0.11224365234375, 0.125274658203125, 0.1383056640625, 0.151336669921875, 0.16436767578125, 0.177398681640625, 0.1904296875, 0.203460693359375, 0.21649169921875, 0.229522705078125, 0.2425537109375, 0.255584716796875, 0.26861572265625, 0.281646728515625, 0.294677734375, 0.307708740234375, 0.32073974609375, 0.333770751953125, 0.3468017578125, 0.359832763671875, 0.37286376953125, 0.385894775390625, 0.39892578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 6.0, 8.0, 13.0, 15.0, 21.0, 37.0, 62.0, 79.0, 90.0, 180.0, 367.0, 572.0, 1012.0, 1799.0, 3107.0, 5459.0, 10004.0, 18081.0, 34507.0, 91580.0, 443158.0, 305591.0, 68187.0, 29480.0, 15334.0, 8636.0, 4774.0, 2701.0, 1473.0, 838.0, 542.0, 300.0, 181.0, 121.0, 67.0, 46.0, 37.0, 25.0, 15.0, 11.0, 16.0, 3.0, 4.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1895751953125, -0.18362808227539062, -0.17768096923828125, -0.17173385620117188, -0.1657867431640625, -0.15983963012695312, -0.15389251708984375, -0.14794540405273438, -0.141998291015625, -0.13605117797851562, -0.13010406494140625, -0.12415695190429688, -0.1182098388671875, -0.11226272583007812, -0.10631561279296875, -0.10036849975585938, -0.09442138671875, -0.08847427368164062, -0.08252716064453125, -0.07658004760742188, -0.0706329345703125, -0.06468582153320312, -0.05873870849609375, -0.052791595458984375, -0.046844482421875, -0.040897369384765625, -0.03495025634765625, -0.029003143310546875, -0.0230560302734375, -0.017108917236328125, -0.01116180419921875, -0.005214691162109375, 0.000732421875, 0.006679534912109375, 0.01262664794921875, 0.018573760986328125, 0.0245208740234375, 0.030467987060546875, 0.03641510009765625, 0.042362213134765625, 0.048309326171875, 0.054256439208984375, 0.06020355224609375, 0.06615066528320312, 0.0720977783203125, 0.07804489135742188, 0.08399200439453125, 0.08993911743164062, 0.09588623046875, 0.10183334350585938, 0.10778045654296875, 0.11372756958007812, 0.1196746826171875, 0.12562179565429688, 0.13156890869140625, 0.13751602172851562, 0.143463134765625, 0.14941024780273438, 0.15535736083984375, 0.16130447387695312, 0.1672515869140625, 0.17319869995117188, 0.17914581298828125, 0.18509292602539062, 0.1910400390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 9.0, 21.0, 17.0, 24.0, 38.0, 72.0, 170.0, 240.0, 182.0, 60.0, 38.0, 27.0, 22.0, 16.0, 19.0, 8.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.750490188598633e-05, -4.548113793134689e-05, -4.345737397670746e-05, -4.1433610022068024e-05, -3.940984606742859e-05, -3.7386082112789154e-05, -3.536231815814972e-05, -3.3338554203510284e-05, -3.131479024887085e-05, -2.9291026294231415e-05, -2.726726233959198e-05, -2.5243498384952545e-05, -2.321973443031311e-05, -2.1195970475673676e-05, -1.917220652103424e-05, -1.7148442566394806e-05, -1.5124678611755371e-05, -1.3100914657115936e-05, -1.1077150702476501e-05, -9.053386747837067e-06, -7.029622793197632e-06, -5.005858838558197e-06, -2.982094883918762e-06, -9.583309292793274e-07, 1.0654330253601074e-06, 3.0891969799995422e-06, 5.112960934638977e-06, 7.136724889278412e-06, 9.160488843917847e-06, 1.1184252798557281e-05, 1.3208016753196716e-05, 1.5231780707836151e-05, 1.7255544662475586e-05, 1.927930861711502e-05, 2.1303072571754456e-05, 2.332683652639389e-05, 2.5350600481033325e-05, 2.737436443567276e-05, 2.9398128390312195e-05, 3.142189234495163e-05, 3.3445656299591064e-05, 3.54694202542305e-05, 3.7493184208869934e-05, 3.951694816350937e-05, 4.1540712118148804e-05, 4.356447607278824e-05, 4.558824002742767e-05, 4.761200398206711e-05, 4.963576793670654e-05, 5.165953189134598e-05, 5.368329584598541e-05, 5.570705980062485e-05, 5.773082375526428e-05, 5.975458770990372e-05, 6.177835166454315e-05, 6.380211561918259e-05, 6.582587957382202e-05, 6.784964352846146e-05, 6.987340748310089e-05, 7.189717143774033e-05, 7.392093539237976e-05, 7.59446993470192e-05, 7.796846330165863e-05, 7.999222725629807e-05, 8.20159912109375e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 9.0, 10.0, 8.0, 12.0, 25.0, 32.0, 44.0, 88.0, 166.0, 309.0, 635.0, 1386.0, 3171.0, 7381.0, 17104.0, 41535.0, 148957.0, 604995.0, 149988.0, 42172.0, 17017.0, 7468.0, 3221.0, 1427.0, 680.0, 323.0, 155.0, 76.0, 52.0, 25.0, 18.0, 17.0, 17.0, 4.0, 7.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.25927734375, -0.25197410583496094, -0.24467086791992188, -0.2373676300048828, -0.23006439208984375, -0.2227611541748047, -0.21545791625976562, -0.20815467834472656, -0.2008514404296875, -0.19354820251464844, -0.18624496459960938, -0.1789417266845703, -0.17163848876953125, -0.1643352508544922, -0.15703201293945312, -0.14972877502441406, -0.142425537109375, -0.13512229919433594, -0.12781906127929688, -0.12051582336425781, -0.11321258544921875, -0.10590934753417969, -0.09860610961914062, -0.09130287170410156, -0.0839996337890625, -0.07669639587402344, -0.06939315795898438, -0.06208992004394531, -0.05478668212890625, -0.04748344421386719, -0.040180206298828125, -0.03287696838378906, -0.02557373046875, -0.018270492553710938, -0.010967254638671875, -0.0036640167236328125, 0.00363922119140625, 0.010942459106445312, 0.018245697021484375, 0.025548934936523438, 0.0328521728515625, 0.04015541076660156, 0.047458648681640625, 0.05476188659667969, 0.06206512451171875, 0.06936836242675781, 0.07667160034179688, 0.08397483825683594, 0.091278076171875, 0.09858131408691406, 0.10588455200195312, 0.11318778991699219, 0.12049102783203125, 0.1277942657470703, 0.13509750366210938, 0.14240074157714844, 0.1497039794921875, 0.15700721740722656, 0.16431045532226562, 0.1716136932373047, 0.17891693115234375, 0.1862201690673828, 0.19352340698242188, 0.20082664489746094, 0.2081298828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 8.0, 8.0, 7.0, 8.0, 2.0, 11.0, 20.0, 26.0, 31.0, 59.0, 54.0, 95.0, 139.0, 152.0, 107.0, 85.0, 43.0, 35.0, 20.0, 17.0, 11.0, 5.0, 15.0, 11.0, 7.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1734619140625, -0.1680755615234375, -0.162689208984375, -0.1573028564453125, -0.15191650390625, -0.1465301513671875, -0.141143798828125, -0.1357574462890625, -0.13037109375, -0.1249847412109375, -0.119598388671875, -0.1142120361328125, -0.10882568359375, -0.1034393310546875, -0.098052978515625, -0.0926666259765625, -0.0872802734375, -0.0818939208984375, -0.076507568359375, -0.0711212158203125, -0.06573486328125, -0.0603485107421875, -0.054962158203125, -0.0495758056640625, -0.044189453125, -0.0388031005859375, -0.033416748046875, -0.0280303955078125, -0.02264404296875, -0.0172576904296875, -0.011871337890625, -0.0064849853515625, -0.0010986328125, 0.0042877197265625, 0.009674072265625, 0.0150604248046875, 0.02044677734375, 0.0258331298828125, 0.031219482421875, 0.0366058349609375, 0.0419921875, 0.0473785400390625, 0.052764892578125, 0.0581512451171875, 0.06353759765625, 0.0689239501953125, 0.074310302734375, 0.0796966552734375, 0.0850830078125, 0.0904693603515625, 0.095855712890625, 0.1012420654296875, 0.10662841796875, 0.1120147705078125, 0.117401123046875, 0.1227874755859375, 0.128173828125, 0.1335601806640625, 0.138946533203125, 0.1443328857421875, 0.14971923828125, 0.1551055908203125, 0.160491943359375, 0.1658782958984375, 0.1712646484375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 15.0, 47.0, 98.0, 250.0, 286.0, 217.0, 78.0, 16.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.158699035644531, -8.005964279174805, -7.8532304763793945, -7.700496196746826, -7.547761917114258, -7.3950276374816895, -7.242293357849121, -7.089559078216553, -6.936824798583984, -6.784090518951416, -6.631356239318848, -6.478621959686279, -6.325887680053711, -6.173153400421143, -6.020419120788574, -5.867684841156006, -5.7149505615234375, -5.562216281890869, -5.409482002258301, -5.256747722625732, -5.104013442993164, -4.951279163360596, -4.798544883728027, -4.645810604095459, -4.493075847625732, -4.340341567993164, -4.187607288360596, -4.034873008728027, -3.882138729095459, -3.7294044494628906, -3.5766701698303223, -3.423935890197754, -3.2712018489837646, -3.1184675693511963, -2.965733289718628, -2.8129990100860596, -2.660264730453491, -2.507530450820923, -2.3547959327697754, -2.202061653137207, -2.0493273735046387, -1.8965930938720703, -1.743858814239502, -1.5911245346069336, -1.4383902549743652, -1.2856559753417969, -1.132921576499939, -0.9801872968673706, -0.8274531364440918, -0.6747188568115234, -0.5219845771789551, -0.36925023794174194, -0.21651595830917358, -0.06378167867660522, 0.08895266056060791, 0.24168694019317627, 0.39442121982574463, 0.547155499458313, 0.6998897790908813, 0.8526241183280945, 1.0053584575653076, 1.158092737197876, 1.3108270168304443, 1.4635612964630127, 1.616295576095581]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 4.0, 10.0, 14.0, 19.0, 15.0, 33.0, 13.0, 21.0, 31.0, 31.0, 36.0, 49.0, 33.0, 39.0, 47.0, 40.0, 37.0, 65.0, 47.0, 55.0, 41.0, 30.0, 53.0, 30.0, 19.0, 29.0, 15.0, 27.0, 21.0, 9.0, 19.0, 16.0, 8.0, 9.0, 5.0, 4.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.187944769859314, -1.1518250703811646, -1.1157053709030151, -1.0795856714248657, -1.0434659719467163, -1.007346272468567, -0.9712266325950623, -0.9351069331169128, -0.8989872336387634, -0.862867534160614, -0.8267478346824646, -0.7906281352043152, -0.7545084953308105, -0.7183887958526611, -0.6822690963745117, -0.6461493968963623, -0.6100296974182129, -0.5739099979400635, -0.5377902984619141, -0.5016705989837646, -0.4655509293079376, -0.4294312298297882, -0.3933115601539612, -0.35719186067581177, -0.32107216119766235, -0.28495246171951294, -0.24883277714252472, -0.2127130925655365, -0.17659339308738708, -0.14047369360923767, -0.10435400903224945, -0.06823432445526123, -0.032114505767822266, 0.0040051862597465515, 0.04012487828731537, 0.07624457031488419, 0.112364262342453, 0.14848396182060242, 0.18460364639759064, 0.22072333097457886, 0.25684303045272827, 0.2929627299308777, 0.3290824294090271, 0.3652020990848541, 0.40132179856300354, 0.43744149804115295, 0.47356116771698, 0.5096808671951294, 0.5458005666732788, 0.5819202661514282, 0.6180399656295776, 0.654159665107727, 0.6902793645858765, 0.7263990640640259, 0.7625187039375305, 0.7986384034156799, 0.8347581028938293, 0.8708778023719788, 0.9069975018501282, 0.9431172013282776, 0.9792368412017822, 1.0153565406799316, 1.051476240158081, 1.0875959396362305, 1.1237156391143799]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 11.0, 8.0, 9.0, 25.0, 17.0, 38.0, 42.0, 63.0, 99.0, 180.0, 349.0, 586.0, 1301.0, 2787.0, 6972.0, 19202.0, 59939.0, 229760.0, 1385139.0, 2073609.0, 300874.0, 75555.0, 23302.0, 8345.0, 3283.0, 1415.0, 654.0, 296.0, 166.0, 90.0, 53.0, 34.0, 23.0, 19.0, 10.0, 8.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29736328125, -0.2883758544921875, -0.279388427734375, -0.2704010009765625, -0.26141357421875, -0.2524261474609375, -0.243438720703125, -0.2344512939453125, -0.2254638671875, -0.2164764404296875, -0.207489013671875, -0.1985015869140625, -0.18951416015625, -0.1805267333984375, -0.171539306640625, -0.1625518798828125, -0.153564453125, -0.1445770263671875, -0.135589599609375, -0.1266021728515625, -0.11761474609375, -0.1086273193359375, -0.099639892578125, -0.0906524658203125, -0.0816650390625, -0.0726776123046875, -0.063690185546875, -0.0547027587890625, -0.04571533203125, -0.0367279052734375, -0.027740478515625, -0.0187530517578125, -0.009765625, -0.0007781982421875, 0.008209228515625, 0.0171966552734375, 0.02618408203125, 0.0351715087890625, 0.044158935546875, 0.0531463623046875, 0.0621337890625, 0.0711212158203125, 0.080108642578125, 0.0890960693359375, 0.09808349609375, 0.1070709228515625, 0.116058349609375, 0.1250457763671875, 0.134033203125, 0.1430206298828125, 0.152008056640625, 0.1609954833984375, 0.16998291015625, 0.1789703369140625, 0.187957763671875, 0.1969451904296875, 0.2059326171875, 0.2149200439453125, 0.223907470703125, 0.2328948974609375, 0.24188232421875, 0.2508697509765625, 0.259857177734375, 0.2688446044921875, 0.27783203125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 34.0, 59.0, 70.0, 91.0, 104.0, 143.0, 121.0, 118.0, 94.0, 62.0, 43.0, 21.0, 15.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431884765625, -0.4194297790527344, -0.40697479248046875, -0.3945198059082031, -0.3820648193359375, -0.3696098327636719, -0.35715484619140625, -0.3446998596191406, -0.332244873046875, -0.3197898864746094, -0.30733489990234375, -0.2948799133300781, -0.2824249267578125, -0.2699699401855469, -0.25751495361328125, -0.24505996704101562, -0.23260498046875, -0.22014999389648438, -0.20769500732421875, -0.19524002075195312, -0.1827850341796875, -0.17033004760742188, -0.15787506103515625, -0.14542007446289062, -0.132965087890625, -0.12051010131835938, -0.10805511474609375, -0.09560012817382812, -0.0831451416015625, -0.07069015502929688, -0.05823516845703125, -0.045780181884765625, -0.0333251953125, -0.020870208740234375, -0.00841522216796875, 0.004039764404296875, 0.0164947509765625, 0.028949737548828125, 0.04140472412109375, 0.053859710693359375, 0.066314697265625, 0.07876968383789062, 0.09122467041015625, 0.10367965698242188, 0.1161346435546875, 0.12858963012695312, 0.14104461669921875, 0.15349960327148438, 0.16595458984375, 0.17840957641601562, 0.19086456298828125, 0.20331954956054688, 0.2157745361328125, 0.22822952270507812, 0.24068450927734375, 0.2531394958496094, 0.265594482421875, 0.2780494689941406, 0.29050445556640625, 0.3029594421386719, 0.3154144287109375, 0.3278694152832031, 0.34032440185546875, 0.3527793884277344, 0.365234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 12.0, 11.0, 21.0, 23.0, 42.0, 45.0, 73.0, 111.0, 169.0, 232.0, 372.0, 554.0, 855.0, 1445.0, 2629.0, 5218.0, 11087.0, 26405.0, 73440.0, 237142.0, 947420.0, 2110080.0, 542464.0, 149091.0, 48955.0, 18719.0, 8177.0, 4036.0, 2071.0, 1201.0, 717.0, 481.0, 313.0, 201.0, 120.0, 114.0, 74.0, 44.0, 40.0, 14.0, 23.0, 6.0, 9.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.343505859375, -0.3328742980957031, -0.32224273681640625, -0.3116111755371094, -0.3009796142578125, -0.2903480529785156, -0.27971649169921875, -0.2690849304199219, -0.258453369140625, -0.24782180786132812, -0.23719024658203125, -0.22655868530273438, -0.2159271240234375, -0.20529556274414062, -0.19466400146484375, -0.18403244018554688, -0.17340087890625, -0.16276931762695312, -0.15213775634765625, -0.14150619506835938, -0.1308746337890625, -0.12024307250976562, -0.10961151123046875, -0.09897994995117188, -0.088348388671875, -0.07771682739257812, -0.06708526611328125, -0.056453704833984375, -0.0458221435546875, -0.035190582275390625, -0.02455902099609375, -0.013927459716796875, -0.0032958984375, 0.007335662841796875, 0.01796722412109375, 0.028598785400390625, 0.0392303466796875, 0.049861907958984375, 0.06049346923828125, 0.07112503051757812, 0.081756591796875, 0.09238815307617188, 0.10301971435546875, 0.11365127563476562, 0.1242828369140625, 0.13491439819335938, 0.14554595947265625, 0.15617752075195312, 0.16680908203125, 0.17744064331054688, 0.18807220458984375, 0.19870376586914062, 0.2093353271484375, 0.21996688842773438, 0.23059844970703125, 0.24123001098632812, 0.251861572265625, 0.2624931335449219, 0.27312469482421875, 0.2837562561035156, 0.2943878173828125, 0.3050193786621094, 0.31565093994140625, 0.3262825012207031, 0.3369140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 9.0, 4.0, 9.0, 11.0, 14.0, 27.0, 42.0, 62.0, 97.0, 174.0, 282.0, 484.0, 841.0, 735.0, 475.0, 294.0, 162.0, 121.0, 77.0, 57.0, 25.0, 22.0, 14.0, 12.0, 10.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351806640625, -0.34043121337890625, -0.3290557861328125, -0.31768035888671875, -0.306304931640625, -0.29492950439453125, -0.2835540771484375, -0.27217864990234375, -0.26080322265625, -0.24942779541015625, -0.2380523681640625, -0.22667694091796875, -0.215301513671875, -0.20392608642578125, -0.1925506591796875, -0.18117523193359375, -0.1697998046875, -0.15842437744140625, -0.1470489501953125, -0.13567352294921875, -0.124298095703125, -0.11292266845703125, -0.1015472412109375, -0.09017181396484375, -0.07879638671875, -0.06742095947265625, -0.0560455322265625, -0.04467010498046875, -0.033294677734375, -0.02191925048828125, -0.0105438232421875, 0.00083160400390625, 0.01220703125, 0.02358245849609375, 0.0349578857421875, 0.04633331298828125, 0.057708740234375, 0.06908416748046875, 0.0804595947265625, 0.09183502197265625, 0.10321044921875, 0.11458587646484375, 0.1259613037109375, 0.13733673095703125, 0.148712158203125, 0.16008758544921875, 0.1714630126953125, 0.18283843994140625, 0.1942138671875, 0.20558929443359375, 0.2169647216796875, 0.22834014892578125, 0.239715576171875, 0.25109100341796875, 0.2624664306640625, 0.27384185791015625, 0.28521728515625, 0.29659271240234375, 0.3079681396484375, 0.31934356689453125, 0.330718994140625, 0.34209442138671875, 0.3534698486328125, 0.36484527587890625, 0.376220703125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 12.0, 18.0, 18.0, 41.0, 63.0, 68.0, 78.0, 100.0, 97.0, 96.0, 65.0, 64.0, 66.0, 67.0, 33.0, 36.0, 20.0, 14.0, 11.0, 5.0, 2.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8440837860107422, -0.800579309463501, -0.7570748329162598, -0.7135703563690186, -0.6700658798217773, -0.6265614032745361, -0.5830568671226501, -0.5395523905754089, -0.4960479140281677, -0.4525434374809265, -0.4090389609336853, -0.3655344545841217, -0.3220299780368805, -0.2785255014896393, -0.23502099514007568, -0.19151651859283447, -0.14801204204559326, -0.10450755804777145, -0.061003074049949646, -0.01749858260154724, 0.02600589394569397, 0.06951037049293518, 0.11301487684249878, 0.15651935338974, 0.2000238299369812, 0.2435283064842224, 0.2870327830314636, 0.3305372893810272, 0.37404176592826843, 0.41754624247550964, 0.46105074882507324, 0.5045552253723145, 0.5480598211288452, 0.5915642976760864, 0.6350687742233276, 0.6785732507705688, 0.7220777273178101, 0.7655822038650513, 0.8090867400169373, 0.8525912165641785, 0.8960956931114197, 0.9396001696586609, 0.9831046462059021, 1.026609182357788, 1.0701136589050293, 1.1136181354522705, 1.1571226119995117, 1.200627088546753, 1.2441315650939941, 1.2876360416412354, 1.3311405181884766, 1.3746449947357178, 1.418149471282959, 1.4616539478302002, 1.5051584243774414, 1.5486629009246826, 1.5921673774719238, 1.635671854019165, 1.6791763305664062, 1.7226808071136475, 1.7661852836608887, 1.8096897602081299, 1.853194236755371, 1.8966987133026123, 1.940203309059143]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 9.0, 4.0, 9.0, 12.0, 14.0, 18.0, 12.0, 20.0, 28.0, 31.0, 24.0, 30.0, 28.0, 34.0, 43.0, 38.0, 53.0, 56.0, 40.0, 37.0, 29.0, 30.0, 40.0, 42.0, 28.0, 33.0, 38.0, 31.0, 26.0, 23.0, 21.0, 20.0, 11.0, 10.0, 17.0, 7.0, 7.0, 10.0, 6.0, 5.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.9024205207824707, -0.8757908940315247, -0.8491612672805786, -0.8225316405296326, -0.7959020137786865, -0.7692723870277405, -0.7426427602767944, -0.7160131335258484, -0.6893835067749023, -0.6627538800239563, -0.6361242532730103, -0.6094946265220642, -0.5828649997711182, -0.5562353730201721, -0.5296057462692261, -0.50297611951828, -0.476346492767334, -0.44971686601638794, -0.4230872392654419, -0.39645761251449585, -0.3698279857635498, -0.34319835901260376, -0.3165687322616577, -0.28993910551071167, -0.2633094787597656, -0.23667985200881958, -0.21005022525787354, -0.1834205985069275, -0.15679097175598145, -0.1301613450050354, -0.10353171825408936, -0.07690209150314331, -0.05027240514755249, -0.023642778396606445, 0.0029868483543395996, 0.029616475105285645, 0.05624610185623169, 0.08287572860717773, 0.10950535535812378, 0.13613498210906982, 0.16276460886001587, 0.18939423561096191, 0.21602386236190796, 0.242653489112854, 0.26928311586380005, 0.2959127426147461, 0.32254236936569214, 0.3491719961166382, 0.37580162286758423, 0.4024312496185303, 0.4290608763694763, 0.45569050312042236, 0.4823201298713684, 0.5089497566223145, 0.5355793833732605, 0.5622090101242065, 0.5888386368751526, 0.6154682636260986, 0.6420978903770447, 0.6687275171279907, 0.6953571438789368, 0.7219867706298828, 0.7486163973808289, 0.7752460241317749, 0.801875650882721]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 7.0, 4.0, 5.0, 5.0, 13.0, 18.0, 18.0, 38.0, 42.0, 72.0, 111.0, 180.0, 214.0, 432.0, 655.0, 1146.0, 1909.0, 3401.0, 6229.0, 11375.0, 21008.0, 39666.0, 77108.0, 166414.0, 295474.0, 215712.0, 99865.0, 49321.0, 26201.0, 14133.0, 7753.0, 4185.0, 2414.0, 1323.0, 821.0, 477.0, 279.0, 182.0, 100.0, 74.0, 46.0, 42.0, 27.0, 14.0, 10.0, 8.0, 9.0, 5.0, 6.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.207275390625, -0.20004653930664062, -0.19281768798828125, -0.18558883666992188, -0.1783599853515625, -0.17113113403320312, -0.16390228271484375, -0.15667343139648438, -0.149444580078125, -0.14221572875976562, -0.13498687744140625, -0.12775802612304688, -0.1205291748046875, -0.11330032348632812, -0.10607147216796875, -0.09884262084960938, -0.09161376953125, -0.08438491821289062, -0.07715606689453125, -0.06992721557617188, -0.0626983642578125, -0.055469512939453125, -0.04824066162109375, -0.041011810302734375, -0.033782958984375, -0.026554107666015625, -0.01932525634765625, -0.012096405029296875, -0.0048675537109375, 0.002361297607421875, 0.00959014892578125, 0.016819000244140625, 0.0240478515625, 0.031276702880859375, 0.03850555419921875, 0.045734405517578125, 0.0529632568359375, 0.060192108154296875, 0.06742095947265625, 0.07464981079101562, 0.081878662109375, 0.08910751342773438, 0.09633636474609375, 0.10356521606445312, 0.1107940673828125, 0.11802291870117188, 0.12525177001953125, 0.13248062133789062, 0.13970947265625, 0.14693832397460938, 0.15416717529296875, 0.16139602661132812, 0.1686248779296875, 0.17585372924804688, 0.18308258056640625, 0.19031143188476562, 0.197540283203125, 0.20476913452148438, 0.21199798583984375, 0.21922683715820312, 0.2264556884765625, 0.23368453979492188, 0.24091339111328125, 0.24814224243164062, 0.25537109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 23.0, 45.0, 40.0, 58.0, 91.0, 102.0, 110.0, 124.0, 123.0, 105.0, 73.0, 55.0, 17.0, 20.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427734375, -0.41512298583984375, -0.4025115966796875, -0.38990020751953125, -0.377288818359375, -0.36467742919921875, -0.3520660400390625, -0.33945465087890625, -0.32684326171875, -0.31423187255859375, -0.3016204833984375, -0.28900909423828125, -0.276397705078125, -0.26378631591796875, -0.2511749267578125, -0.23856353759765625, -0.2259521484375, -0.21334075927734375, -0.2007293701171875, -0.18811798095703125, -0.175506591796875, -0.16289520263671875, -0.1502838134765625, -0.13767242431640625, -0.12506103515625, -0.11244964599609375, -0.0998382568359375, -0.08722686767578125, -0.074615478515625, -0.06200408935546875, -0.0493927001953125, -0.03678131103515625, -0.024169921875, -0.01155853271484375, 0.0010528564453125, 0.01366424560546875, 0.026275634765625, 0.03888702392578125, 0.0514984130859375, 0.06410980224609375, 0.07672119140625, 0.08933258056640625, 0.1019439697265625, 0.11455535888671875, 0.127166748046875, 0.13977813720703125, 0.1523895263671875, 0.16500091552734375, 0.1776123046875, 0.19022369384765625, 0.2028350830078125, 0.21544647216796875, 0.228057861328125, 0.24066925048828125, 0.2532806396484375, 0.26589202880859375, 0.27850341796875, 0.29111480712890625, 0.3037261962890625, 0.31633758544921875, 0.328948974609375, 0.34156036376953125, 0.3541717529296875, 0.36678314208984375, 0.37939453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 8.0, 4.0, 11.0, 7.0, 15.0, 19.0, 24.0, 25.0, 45.0, 39.0, 77.0, 146.0, 244.0, 553.0, 1327.0, 3412.0, 9900.0, 30837.0, 113839.0, 530273.0, 271465.0, 58585.0, 17749.0, 5942.0, 2128.0, 872.0, 397.0, 196.0, 114.0, 75.0, 49.0, 46.0, 23.0, 30.0, 21.0, 16.0, 12.0, 6.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.546875, -0.530181884765625, -0.51348876953125, -0.496795654296875, -0.4801025390625, -0.463409423828125, -0.44671630859375, -0.430023193359375, -0.413330078125, -0.396636962890625, -0.37994384765625, -0.363250732421875, -0.3465576171875, -0.329864501953125, -0.31317138671875, -0.296478271484375, -0.27978515625, -0.263092041015625, -0.24639892578125, -0.229705810546875, -0.2130126953125, -0.196319580078125, -0.17962646484375, -0.162933349609375, -0.146240234375, -0.129547119140625, -0.11285400390625, -0.096160888671875, -0.0794677734375, -0.062774658203125, -0.04608154296875, -0.029388427734375, -0.0126953125, 0.003997802734375, 0.02069091796875, 0.037384033203125, 0.0540771484375, 0.070770263671875, 0.08746337890625, 0.104156494140625, 0.120849609375, 0.137542724609375, 0.15423583984375, 0.170928955078125, 0.1876220703125, 0.204315185546875, 0.22100830078125, 0.237701416015625, 0.25439453125, 0.271087646484375, 0.28778076171875, 0.304473876953125, 0.3211669921875, 0.337860107421875, 0.35455322265625, 0.371246337890625, 0.387939453125, 0.404632568359375, 0.42132568359375, 0.438018798828125, 0.4547119140625, 0.471405029296875, 0.48809814453125, 0.504791259765625, 0.521484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 9.0, 7.0, 13.0, 11.0, 22.0, 31.0, 12.0, 34.0, 40.0, 28.0, 28.0, 43.0, 41.0, 32.0, 43.0, 51.0, 53.0, 45.0, 59.0, 50.0, 42.0, 45.0, 39.0, 41.0, 31.0, 20.0, 23.0, 18.0, 14.0, 14.0, 9.0, 4.0, 8.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.50439453125, -0.4898796081542969, -0.47536468505859375, -0.4608497619628906, -0.4463348388671875, -0.4318199157714844, -0.41730499267578125, -0.4027900695800781, -0.388275146484375, -0.3737602233886719, -0.35924530029296875, -0.3447303771972656, -0.3302154541015625, -0.3157005310058594, -0.30118560791015625, -0.2866706848144531, -0.27215576171875, -0.2576408386230469, -0.24312591552734375, -0.22861099243164062, -0.2140960693359375, -0.19958114624023438, -0.18506622314453125, -0.17055130004882812, -0.156036376953125, -0.14152145385742188, -0.12700653076171875, -0.11249160766601562, -0.0979766845703125, -0.08346176147460938, -0.06894683837890625, -0.054431915283203125, -0.0399169921875, -0.025402069091796875, -0.01088714599609375, 0.003627777099609375, 0.0181427001953125, 0.032657623291015625, 0.04717254638671875, 0.061687469482421875, 0.076202392578125, 0.09071731567382812, 0.10523223876953125, 0.11974716186523438, 0.1342620849609375, 0.14877700805664062, 0.16329193115234375, 0.17780685424804688, 0.19232177734375, 0.20683670043945312, 0.22135162353515625, 0.23586654663085938, 0.2503814697265625, 0.2648963928222656, 0.27941131591796875, 0.2939262390136719, 0.308441162109375, 0.3229560852050781, 0.33747100830078125, 0.3519859313964844, 0.3665008544921875, 0.3810157775878906, 0.39553070068359375, 0.4100456237792969, 0.424560546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 13.0, 21.0, 30.0, 30.0, 69.0, 104.0, 176.0, 283.0, 435.0, 882.0, 1642.0, 3108.0, 6475.0, 13230.0, 27433.0, 54547.0, 129858.0, 430889.0, 230364.0, 75819.0, 37128.0, 18208.0, 8827.0, 4263.0, 2169.0, 1122.0, 593.0, 324.0, 194.0, 117.0, 83.0, 34.0, 23.0, 19.0, 19.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1783447265625, -0.1721343994140625, -0.165924072265625, -0.1597137451171875, -0.15350341796875, -0.1472930908203125, -0.141082763671875, -0.1348724365234375, -0.128662109375, -0.1224517822265625, -0.116241455078125, -0.1100311279296875, -0.10382080078125, -0.0976104736328125, -0.091400146484375, -0.0851898193359375, -0.0789794921875, -0.0727691650390625, -0.066558837890625, -0.0603485107421875, -0.05413818359375, -0.0479278564453125, -0.041717529296875, -0.0355072021484375, -0.029296875, -0.0230865478515625, -0.016876220703125, -0.0106658935546875, -0.00445556640625, 0.0017547607421875, 0.007965087890625, 0.0141754150390625, 0.0203857421875, 0.0265960693359375, 0.032806396484375, 0.0390167236328125, 0.04522705078125, 0.0514373779296875, 0.057647705078125, 0.0638580322265625, 0.070068359375, 0.0762786865234375, 0.082489013671875, 0.0886993408203125, 0.09490966796875, 0.1011199951171875, 0.107330322265625, 0.1135406494140625, 0.1197509765625, 0.1259613037109375, 0.132171630859375, 0.1383819580078125, 0.14459228515625, 0.1508026123046875, 0.157012939453125, 0.1632232666015625, 0.16943359375, 0.1756439208984375, 0.181854248046875, 0.1880645751953125, 0.19427490234375, 0.2004852294921875, 0.206695556640625, 0.2129058837890625, 0.2191162109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 4.0, 14.0, 12.0, 13.0, 24.0, 15.0, 28.0, 46.0, 48.0, 80.0, 119.0, 137.0, 133.0, 105.0, 45.0, 30.0, 27.0, 5.0, 15.0, 20.0, 14.0, 10.0, 7.0, 6.0, 7.0, 4.0, 6.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.310773849487305e-05, -5.172844976186752e-05, -5.0349161028862e-05, -4.8969872295856476e-05, -4.759058356285095e-05, -4.621129482984543e-05, -4.4832006096839905e-05, -4.345271736383438e-05, -4.207342863082886e-05, -4.0694139897823334e-05, -3.931485116481781e-05, -3.7935562431812286e-05, -3.655627369880676e-05, -3.517698496580124e-05, -3.3797696232795715e-05, -3.241840749979019e-05, -3.103911876678467e-05, -2.9659830033779144e-05, -2.828054130077362e-05, -2.6901252567768097e-05, -2.5521963834762573e-05, -2.414267510175705e-05, -2.2763386368751526e-05, -2.1384097635746002e-05, -2.000480890274048e-05, -1.8625520169734955e-05, -1.724623143672943e-05, -1.5866942703723907e-05, -1.4487653970718384e-05, -1.310836523771286e-05, -1.1729076504707336e-05, -1.0349787771701813e-05, -8.970499038696289e-06, -7.591210305690765e-06, -6.211921572685242e-06, -4.832632839679718e-06, -3.4533441066741943e-06, -2.0740553736686707e-06, -6.94766640663147e-07, 6.845220923423767e-07, 2.0638108253479004e-06, 3.443099558353424e-06, 4.822388291358948e-06, 6.2016770243644714e-06, 7.580965757369995e-06, 8.960254490375519e-06, 1.0339543223381042e-05, 1.1718831956386566e-05, 1.309812068939209e-05, 1.4477409422397614e-05, 1.5856698155403137e-05, 1.723598688840866e-05, 1.8615275621414185e-05, 1.9994564354419708e-05, 2.1373853087425232e-05, 2.2753141820430756e-05, 2.413243055343628e-05, 2.5511719286441803e-05, 2.6891008019447327e-05, 2.827029675245285e-05, 2.9649585485458374e-05, 3.10288742184639e-05, 3.240816295146942e-05, 3.3787451684474945e-05, 3.516674041748047e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 11.0, 20.0, 27.0, 57.0, 106.0, 289.0, 1003.0, 6478.0, 63109.0, 760397.0, 195366.0, 18672.0, 2218.0, 445.0, 166.0, 66.0, 42.0, 27.0, 22.0, 9.0, 5.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6687850952148438, -0.6500701904296875, -0.6313552856445312, -0.612640380859375, -0.5939254760742188, -0.5752105712890625, -0.5564956665039062, -0.53778076171875, -0.5190658569335938, -0.5003509521484375, -0.48163604736328125, -0.462921142578125, -0.44420623779296875, -0.4254913330078125, -0.40677642822265625, -0.3880615234375, -0.36934661865234375, -0.3506317138671875, -0.33191680908203125, -0.313201904296875, -0.29448699951171875, -0.2757720947265625, -0.25705718994140625, -0.23834228515625, -0.21962738037109375, -0.2009124755859375, -0.18219757080078125, -0.163482666015625, -0.14476776123046875, -0.1260528564453125, -0.10733795166015625, -0.088623046875, -0.06990814208984375, -0.0511932373046875, -0.03247833251953125, -0.013763427734375, 0.00495147705078125, 0.0236663818359375, 0.04238128662109375, 0.06109619140625, 0.07981109619140625, 0.0985260009765625, 0.11724090576171875, 0.135955810546875, 0.15467071533203125, 0.1733856201171875, 0.19210052490234375, 0.2108154296875, 0.22953033447265625, 0.2482452392578125, 0.26696014404296875, 0.285675048828125, 0.30438995361328125, 0.3231048583984375, 0.34181976318359375, 0.36053466796875, 0.37924957275390625, 0.3979644775390625, 0.41667938232421875, 0.435394287109375, 0.45410919189453125, 0.4728240966796875, 0.49153900146484375, 0.51025390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 12.0, 11.0, 16.0, 19.0, 22.0, 27.0, 31.0, 45.0, 68.0, 85.0, 105.0, 118.0, 90.0, 71.0, 60.0, 34.0, 22.0, 17.0, 23.0, 11.0, 18.0, 10.0, 11.0, 15.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.220947265625, -0.21503067016601562, -0.20911407470703125, -0.20319747924804688, -0.1972808837890625, -0.19136428833007812, -0.18544769287109375, -0.17953109741210938, -0.173614501953125, -0.16769790649414062, -0.16178131103515625, -0.15586471557617188, -0.1499481201171875, -0.14403152465820312, -0.13811492919921875, -0.13219833374023438, -0.12628173828125, -0.12036514282226562, -0.11444854736328125, -0.10853195190429688, -0.1026153564453125, -0.09669876098632812, -0.09078216552734375, -0.08486557006835938, -0.078948974609375, -0.07303237915039062, -0.06711578369140625, -0.061199188232421875, -0.0552825927734375, -0.049365997314453125, -0.04344940185546875, -0.037532806396484375, -0.0316162109375, -0.025699615478515625, -0.01978302001953125, -0.013866424560546875, -0.0079498291015625, -0.002033233642578125, 0.00388336181640625, 0.009799957275390625, 0.015716552734375, 0.021633148193359375, 0.02754974365234375, 0.033466339111328125, 0.0393829345703125, 0.045299530029296875, 0.05121612548828125, 0.057132720947265625, 0.06304931640625, 0.06896591186523438, 0.07488250732421875, 0.08079910278320312, 0.0867156982421875, 0.09263229370117188, 0.09854888916015625, 0.10446548461914062, 0.110382080078125, 0.11629867553710938, 0.12221527099609375, 0.12813186645507812, 0.1340484619140625, 0.13996505737304688, 0.14588165283203125, 0.15179824829101562, 0.15771484375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 11.0, 13.0, 43.0, 80.0, 162.0, 219.0, 204.0, 158.0, 68.0, 26.0, 15.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1647193431854248, -1.0363401174545288, -0.9079607725143433, -0.7795815467834473, -0.6512022614479065, -0.5228229761123657, -0.3944437503814697, -0.26606446504592896, -0.13768517971038818, -0.009305909276008606, 0.11907336115837097, 0.24745261669158936, 0.3758319020271301, 0.5042111873626709, 0.6325904130935669, 0.7609696984291077, 0.8893489837646484, 1.0177282094955444, 1.14610755443573, 1.274486780166626, 1.4028661251068115, 1.5312453508377075, 1.6596245765686035, 1.788003921508789, 1.916383147239685, 2.044762372970581, 2.1731417179107666, 2.301520824432373, 2.4299001693725586, 2.558279514312744, 2.6866588592529297, 2.815037965774536, 2.9434170722961426, 3.071796417236328, 3.2001755237579346, 3.32855486869812, 3.4569342136383057, 3.585313320159912, 3.7136926651000977, 3.842072010040283, 3.9704513549804688, 4.098830699920654, 4.22721004486084, 4.355588912963867, 4.483968257904053, 4.612347602844238, 4.740726947784424, 4.869106292724609, 4.997485160827637, 5.125864505767822, 5.254243850708008, 5.382622718811035, 5.511002063751221, 5.639381408691406, 5.767760753631592, 5.896140098571777, 6.024519443511963, 6.152898788452148, 6.281278133392334, 6.4096574783325195, 6.538036346435547, 6.666415691375732, 6.794795036315918, 6.9231743812561035, 7.051553726196289]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 6.0, 4.0, 8.0, 6.0, 4.0, 16.0, 11.0, 23.0, 19.0, 24.0, 21.0, 20.0, 28.0, 23.0, 29.0, 33.0, 37.0, 47.0, 34.0, 38.0, 41.0, 36.0, 42.0, 42.0, 36.0, 46.0, 39.0, 32.0, 16.0, 26.0, 21.0, 28.0, 28.0, 14.0, 19.0, 14.0, 21.0, 20.0, 10.0, 9.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1130900382995605, -1.0770313739776611, -1.0409727096557617, -1.0049141645431519, -0.9688555002212524, -0.932796835899353, -0.8967382311820984, -0.8606796264648438, -0.8246209621429443, -0.7885622978210449, -0.7525036931037903, -0.7164450883865356, -0.6803864240646362, -0.6443277597427368, -0.6082691550254822, -0.5722105503082275, -0.5361518859863281, -0.5000932216644287, -0.4640346169471741, -0.42797598242759705, -0.39191734790802, -0.355858713388443, -0.31980007886886597, -0.28374144434928894, -0.24768280982971191, -0.2116241753101349, -0.17556554079055786, -0.13950690627098083, -0.10344827175140381, -0.06738963723182678, -0.031331002712249756, 0.0047276318073272705, 0.04078638553619385, 0.07684502005577087, 0.1129036545753479, 0.14896228909492493, 0.18502092361450195, 0.22107955813407898, 0.257138192653656, 0.29319682717323303, 0.32925546169281006, 0.3653140962123871, 0.4013727307319641, 0.43743136525154114, 0.47348999977111816, 0.5095486640930176, 0.5456072688102722, 0.5816658735275269, 0.6177245378494263, 0.6537832021713257, 0.6898418068885803, 0.725900411605835, 0.7619590759277344, 0.7980177402496338, 0.8340763449668884, 0.8701349496841431, 0.9061936140060425, 0.9422522783279419, 0.9783108830451965, 1.0143694877624512, 1.0504281520843506, 1.08648681640625, 1.1225454807281494, 1.1586040258407593, 1.1946626901626587]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 8.0, 7.0, 15.0, 28.0, 36.0, 38.0, 67.0, 99.0, 144.0, 215.0, 375.0, 585.0, 1207.0, 2325.0, 5276.0, 13163.0, 39148.0, 145319.0, 798953.0, 2560778.0, 478129.0, 101210.0, 28824.0, 10172.0, 4128.0, 1896.0, 872.0, 476.0, 284.0, 188.0, 121.0, 69.0, 43.0, 28.0, 14.0, 12.0, 9.0, 4.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.38134765625, -0.3708610534667969, -0.36037445068359375, -0.3498878479003906, -0.3394012451171875, -0.3289146423339844, -0.31842803955078125, -0.3079414367675781, -0.297454833984375, -0.2869682312011719, -0.27648162841796875, -0.2659950256347656, -0.2555084228515625, -0.24502182006835938, -0.23453521728515625, -0.22404861450195312, -0.21356201171875, -0.20307540893554688, -0.19258880615234375, -0.18210220336914062, -0.1716156005859375, -0.16112899780273438, -0.15064239501953125, -0.14015579223632812, -0.129669189453125, -0.11918258666992188, -0.10869598388671875, -0.09820938110351562, -0.0877227783203125, -0.07723617553710938, -0.06674957275390625, -0.056262969970703125, -0.0457763671875, -0.035289764404296875, -0.02480316162109375, -0.014316558837890625, -0.0038299560546875, 0.006656646728515625, 0.01714324951171875, 0.027629852294921875, 0.038116455078125, 0.048603057861328125, 0.05908966064453125, 0.06957626342773438, 0.0800628662109375, 0.09054946899414062, 0.10103607177734375, 0.11152267456054688, 0.12200927734375, 0.13249588012695312, 0.14298248291015625, 0.15346908569335938, 0.1639556884765625, 0.17444229125976562, 0.18492889404296875, 0.19541549682617188, 0.205902099609375, 0.21638870239257812, 0.22687530517578125, 0.23736190795898438, 0.2478485107421875, 0.2583351135253906, 0.26882171630859375, 0.2793083190917969, 0.289794921875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 12.0, 17.0, 34.0, 42.0, 58.0, 67.0, 79.0, 90.0, 118.0, 123.0, 110.0, 89.0, 57.0, 39.0, 27.0, 24.0, 10.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432861328125, -0.4203224182128906, -0.40778350830078125, -0.3952445983886719, -0.3827056884765625, -0.3701667785644531, -0.35762786865234375, -0.3450889587402344, -0.332550048828125, -0.3200111389160156, -0.30747222900390625, -0.2949333190917969, -0.2823944091796875, -0.2698554992675781, -0.25731658935546875, -0.24477767944335938, -0.23223876953125, -0.21969985961914062, -0.20716094970703125, -0.19462203979492188, -0.1820831298828125, -0.16954421997070312, -0.15700531005859375, -0.14446640014648438, -0.131927490234375, -0.11938858032226562, -0.10684967041015625, -0.09431076049804688, -0.0817718505859375, -0.06923294067382812, -0.05669403076171875, -0.044155120849609375, -0.0316162109375, -0.019077301025390625, -0.00653839111328125, 0.006000518798828125, 0.0185394287109375, 0.031078338623046875, 0.04361724853515625, 0.056156158447265625, 0.068695068359375, 0.08123397827148438, 0.09377288818359375, 0.10631179809570312, 0.1188507080078125, 0.13138961791992188, 0.14392852783203125, 0.15646743774414062, 0.16900634765625, 0.18154525756835938, 0.19408416748046875, 0.20662307739257812, 0.2191619873046875, 0.23170089721679688, 0.24423980712890625, 0.2567787170410156, 0.269317626953125, 0.2818565368652344, 0.29439544677734375, 0.3069343566894531, 0.3194732666015625, 0.3320121765136719, 0.34455108642578125, 0.3570899963378906, 0.36962890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 6.0, 9.0, 16.0, 17.0, 18.0, 37.0, 37.0, 78.0, 88.0, 140.0, 163.0, 247.0, 344.0, 523.0, 779.0, 1277.0, 2034.0, 3685.0, 6887.0, 14522.0, 35404.0, 104234.0, 391988.0, 2052066.0, 1215764.0, 242478.0, 70516.0, 26066.0, 11259.0, 5484.0, 3013.0, 1750.0, 1111.0, 668.0, 441.0, 345.0, 212.0, 157.0, 110.0, 67.0, 56.0, 51.0, 35.0, 25.0, 12.0, 13.0, 16.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0], "bins": [-0.447265625, -0.43442535400390625, -0.4215850830078125, -0.40874481201171875, -0.395904541015625, -0.38306427001953125, -0.3702239990234375, -0.35738372802734375, -0.34454345703125, -0.33170318603515625, -0.3188629150390625, -0.30602264404296875, -0.293182373046875, -0.28034210205078125, -0.2675018310546875, -0.25466156005859375, -0.2418212890625, -0.22898101806640625, -0.2161407470703125, -0.20330047607421875, -0.190460205078125, -0.17761993408203125, -0.1647796630859375, -0.15193939208984375, -0.13909912109375, -0.12625885009765625, -0.1134185791015625, -0.10057830810546875, -0.087738037109375, -0.07489776611328125, -0.0620574951171875, -0.04921722412109375, -0.036376953125, -0.02353668212890625, -0.0106964111328125, 0.00214385986328125, 0.014984130859375, 0.02782440185546875, 0.0406646728515625, 0.05350494384765625, 0.06634521484375, 0.07918548583984375, 0.0920257568359375, 0.10486602783203125, 0.117706298828125, 0.13054656982421875, 0.1433868408203125, 0.15622711181640625, 0.1690673828125, 0.18190765380859375, 0.1947479248046875, 0.20758819580078125, 0.220428466796875, 0.23326873779296875, 0.2461090087890625, 0.25894927978515625, 0.27178955078125, 0.28462982177734375, 0.2974700927734375, 0.31031036376953125, 0.323150634765625, 0.33599090576171875, 0.3488311767578125, 0.36167144775390625, 0.37451171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 5.0, 12.0, 18.0, 24.0, 33.0, 46.0, 75.0, 137.0, 203.0, 380.0, 750.0, 900.0, 549.0, 331.0, 214.0, 133.0, 70.0, 48.0, 46.0, 20.0, 23.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.609375, -0.5942611694335938, -0.5791473388671875, -0.5640335083007812, -0.548919677734375, -0.5338058471679688, -0.5186920166015625, -0.5035781860351562, -0.48846435546875, -0.47335052490234375, -0.4582366943359375, -0.44312286376953125, -0.428009033203125, -0.41289520263671875, -0.3977813720703125, -0.38266754150390625, -0.3675537109375, -0.35243988037109375, -0.3373260498046875, -0.32221221923828125, -0.307098388671875, -0.29198455810546875, -0.2768707275390625, -0.26175689697265625, -0.24664306640625, -0.23152923583984375, -0.2164154052734375, -0.20130157470703125, -0.186187744140625, -0.17107391357421875, -0.1559600830078125, -0.14084625244140625, -0.125732421875, -0.11061859130859375, -0.0955047607421875, -0.08039093017578125, -0.065277099609375, -0.05016326904296875, -0.0350494384765625, -0.01993560791015625, -0.00482177734375, 0.01029205322265625, 0.0254058837890625, 0.04051971435546875, 0.055633544921875, 0.07074737548828125, 0.0858612060546875, 0.10097503662109375, 0.1160888671875, 0.13120269775390625, 0.1463165283203125, 0.16143035888671875, 0.176544189453125, 0.19165802001953125, 0.2067718505859375, 0.22188568115234375, 0.23699951171875, 0.25211334228515625, 0.2672271728515625, 0.28234100341796875, 0.297454833984375, 0.31256866455078125, 0.3276824951171875, 0.34279632568359375, 0.35791015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 17.0, 9.0, 20.0, 38.0, 47.0, 63.0, 76.0, 84.0, 84.0, 95.0, 112.0, 86.0, 63.0, 52.0, 50.0, 27.0, 19.0, 17.0, 9.0, 14.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1602160930633545, -1.0958607196807861, -1.0315054655075073, -0.9671501517295837, -0.9027948379516602, -0.8384395241737366, -0.774084210395813, -0.7097288966178894, -0.6453735828399658, -0.5810182690620422, -0.5166629552841187, -0.45230764150619507, -0.3879523277282715, -0.3235970139503479, -0.2592417001724243, -0.19488638639450073, -0.13053107261657715, -0.06617575883865356, -0.0018204450607299805, 0.0625348687171936, 0.1268901824951172, 0.19124549627304077, 0.25560081005096436, 0.31995612382888794, 0.3843114376068115, 0.4486667513847351, 0.5130220651626587, 0.5773773789405823, 0.6417326927185059, 0.7060880064964294, 0.770443320274353, 0.8347986340522766, 0.8991537094116211, 0.9635090231895447, 1.0278643369674683, 1.092219591140747, 1.1565749645233154, 1.2209303379058838, 1.2852855920791626, 1.3496408462524414, 1.4139962196350098, 1.4783515930175781, 1.542706847190857, 1.6070621013641357, 1.671417474746704, 1.7357728481292725, 1.8001281023025513, 1.86448335647583, 1.9288387298583984, 1.9931941032409668, 2.057549476623535, 2.1219046115875244, 2.1862599849700928, 2.250615358352661, 2.3149704933166504, 2.3793258666992188, 2.443681240081787, 2.5080366134643555, 2.572391986846924, 2.636747121810913, 2.7011024951934814, 2.76545786857605, 2.829813003540039, 2.8941683769226074, 2.958523750305176]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 8.0, 6.0, 6.0, 9.0, 13.0, 7.0, 9.0, 15.0, 22.0, 20.0, 19.0, 26.0, 20.0, 29.0, 30.0, 29.0, 30.0, 41.0, 48.0, 40.0, 27.0, 36.0, 32.0, 46.0, 41.0, 33.0, 32.0, 37.0, 32.0, 31.0, 27.0, 21.0, 26.0, 22.0, 26.0, 19.0, 15.0, 15.0, 6.0, 8.0, 8.0, 8.0, 8.0, 6.0, 1.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9450762271881104, -0.9114661812782288, -0.8778561353683472, -0.8442460894584656, -0.810636043548584, -0.7770260572433472, -0.7434160113334656, -0.709805965423584, -0.6761959195137024, -0.6425858736038208, -0.6089758276939392, -0.5753657817840576, -0.5417557954788208, -0.5081456899642944, -0.4745357036590576, -0.440925657749176, -0.40731561183929443, -0.37370556592941284, -0.34009552001953125, -0.30648550391197205, -0.27287545800209045, -0.23926541209220886, -0.20565538108348846, -0.17204535007476807, -0.13843530416488647, -0.10482526570558548, -0.07121522724628448, -0.03760518878698349, -0.003995150327682495, 0.029614895582199097, 0.0632249265909195, 0.09683495759963989, 0.13044500350952148, 0.16405504941940308, 0.19766508042812347, 0.23127511143684387, 0.26488515734672546, 0.29849520325660706, 0.33210521936416626, 0.36571526527404785, 0.39932531118392944, 0.43293535709381104, 0.4665454030036926, 0.5001554489135742, 0.533765435218811, 0.5673755407333374, 0.6009855270385742, 0.6345955729484558, 0.6682056188583374, 0.701815664768219, 0.7354257106781006, 0.7690357565879822, 0.8026458024978638, 0.8362557888031006, 0.8698658347129822, 0.9034758806228638, 0.9370859265327454, 0.970695972442627, 1.0043059587478638, 1.0379160642623901, 1.071526050567627, 1.1051361560821533, 1.1387461423873901, 1.172356128692627, 1.2059662342071533]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 10.0, 15.0, 7.0, 29.0, 45.0, 65.0, 79.0, 133.0, 156.0, 287.0, 362.0, 658.0, 931.0, 1588.0, 2396.0, 3781.0, 6108.0, 9785.0, 15301.0, 24997.0, 40275.0, 68239.0, 117066.0, 199456.0, 220555.0, 135719.0, 78477.0, 46526.0, 28136.0, 17572.0, 11125.0, 6848.0, 4292.0, 2621.0, 1726.0, 1101.0, 725.0, 443.0, 306.0, 188.0, 127.0, 96.0, 62.0, 47.0, 22.0, 21.0, 15.0, 14.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2498779296875, -0.24210166931152344, -0.23432540893554688, -0.2265491485595703, -0.21877288818359375, -0.2109966278076172, -0.20322036743164062, -0.19544410705566406, -0.1876678466796875, -0.17989158630371094, -0.17211532592773438, -0.1643390655517578, -0.15656280517578125, -0.1487865447998047, -0.14101028442382812, -0.13323402404785156, -0.125457763671875, -0.11768150329589844, -0.10990524291992188, -0.10212898254394531, -0.09435272216796875, -0.08657646179199219, -0.07880020141601562, -0.07102394104003906, -0.0632476806640625, -0.05547142028808594, -0.047695159912109375, -0.03991889953613281, -0.03214263916015625, -0.024366378784179688, -0.016590118408203125, -0.008813858032226562, -0.00103759765625, 0.0067386627197265625, 0.014514923095703125, 0.022291183471679688, 0.03006744384765625, 0.03784370422363281, 0.045619964599609375, 0.05339622497558594, 0.0611724853515625, 0.06894874572753906, 0.07672500610351562, 0.08450126647949219, 0.09227752685546875, 0.10005378723144531, 0.10783004760742188, 0.11560630798339844, 0.123382568359375, 0.13115882873535156, 0.13893508911132812, 0.1467113494873047, 0.15448760986328125, 0.1622638702392578, 0.17004013061523438, 0.17781639099121094, 0.1855926513671875, 0.19336891174316406, 0.20114517211914062, 0.2089214324951172, 0.21669769287109375, 0.2244739532470703, 0.23225021362304688, 0.24002647399902344, 0.247802734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 13.0, 9.0, 14.0, 20.0, 36.0, 42.0, 68.0, 70.0, 85.0, 96.0, 112.0, 96.0, 97.0, 77.0, 57.0, 46.0, 27.0, 25.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41552734375, -0.4034156799316406, -0.39130401611328125, -0.3791923522949219, -0.3670806884765625, -0.3549690246582031, -0.34285736083984375, -0.3307456970214844, -0.318634033203125, -0.3065223693847656, -0.29441070556640625, -0.2822990417480469, -0.2701873779296875, -0.2580757141113281, -0.24596405029296875, -0.23385238647460938, -0.22174072265625, -0.20962905883789062, -0.19751739501953125, -0.18540573120117188, -0.1732940673828125, -0.16118240356445312, -0.14907073974609375, -0.13695907592773438, -0.124847412109375, -0.11273574829101562, -0.10062408447265625, -0.08851242065429688, -0.0764007568359375, -0.06428909301757812, -0.05217742919921875, -0.040065765380859375, -0.0279541015625, -0.015842437744140625, -0.00373077392578125, 0.008380889892578125, 0.0204925537109375, 0.032604217529296875, 0.04471588134765625, 0.056827545166015625, 0.068939208984375, 0.08105087280273438, 0.09316253662109375, 0.10527420043945312, 0.1173858642578125, 0.12949752807617188, 0.14160919189453125, 0.15372085571289062, 0.16583251953125, 0.17794418334960938, 0.19005584716796875, 0.20216751098632812, 0.2142791748046875, 0.22639083862304688, 0.23850250244140625, 0.2506141662597656, 0.262725830078125, 0.2748374938964844, 0.28694915771484375, 0.2990608215332031, 0.3111724853515625, 0.3232841491699219, 0.33539581298828125, 0.3475074768066406, 0.359619140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 6.0, 11.0, 11.0, 10.0, 19.0, 19.0, 26.0, 46.0, 56.0, 68.0, 149.0, 244.0, 561.0, 1575.0, 6111.0, 30738.0, 189659.0, 646876.0, 141178.0, 23780.0, 4986.0, 1302.0, 483.0, 203.0, 132.0, 82.0, 52.0, 37.0, 39.0, 27.0, 6.0, 19.0, 8.0, 4.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.048828125, -1.0174484252929688, -0.9860687255859375, -0.9546890258789062, -0.923309326171875, -0.8919296264648438, -0.8605499267578125, -0.8291702270507812, -0.79779052734375, -0.7664108276367188, -0.7350311279296875, -0.7036514282226562, -0.672271728515625, -0.6408920288085938, -0.6095123291015625, -0.5781326293945312, -0.5467529296875, -0.5153732299804688, -0.4839935302734375, -0.45261383056640625, -0.421234130859375, -0.38985443115234375, -0.3584747314453125, -0.32709503173828125, -0.29571533203125, -0.26433563232421875, -0.2329559326171875, -0.20157623291015625, -0.170196533203125, -0.13881683349609375, -0.1074371337890625, -0.07605743408203125, -0.044677734375, -0.01329803466796875, 0.0180816650390625, 0.04946136474609375, 0.080841064453125, 0.11222076416015625, 0.1436004638671875, 0.17498016357421875, 0.20635986328125, 0.23773956298828125, 0.2691192626953125, 0.30049896240234375, 0.331878662109375, 0.36325836181640625, 0.3946380615234375, 0.42601776123046875, 0.4573974609375, 0.48877716064453125, 0.5201568603515625, 0.5515365600585938, 0.582916259765625, 0.6142959594726562, 0.6456756591796875, 0.6770553588867188, 0.70843505859375, 0.7398147583007812, 0.7711944580078125, 0.8025741577148438, 0.833953857421875, 0.8653335571289062, 0.8967132568359375, 0.9280929565429688, 0.95947265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 1.0, 4.0, 5.0, 12.0, 12.0, 9.0, 13.0, 14.0, 11.0, 16.0, 19.0, 25.0, 37.0, 37.0, 31.0, 30.0, 40.0, 40.0, 57.0, 51.0, 60.0, 49.0, 52.0, 51.0, 41.0, 37.0, 30.0, 35.0, 25.0, 26.0, 18.0, 26.0, 17.0, 11.0, 9.0, 8.0, 8.0, 10.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.65673828125, -0.6376495361328125, -0.618560791015625, -0.5994720458984375, -0.58038330078125, -0.5612945556640625, -0.542205810546875, -0.5231170654296875, -0.5040283203125, -0.4849395751953125, -0.465850830078125, -0.4467620849609375, -0.42767333984375, -0.4085845947265625, -0.389495849609375, -0.3704071044921875, -0.351318359375, -0.3322296142578125, -0.313140869140625, -0.2940521240234375, -0.27496337890625, -0.2558746337890625, -0.236785888671875, -0.2176971435546875, -0.1986083984375, -0.1795196533203125, -0.160430908203125, -0.1413421630859375, -0.12225341796875, -0.1031646728515625, -0.084075927734375, -0.0649871826171875, -0.0458984375, -0.0268096923828125, -0.007720947265625, 0.0113677978515625, 0.03045654296875, 0.0495452880859375, 0.068634033203125, 0.0877227783203125, 0.1068115234375, 0.1259002685546875, 0.144989013671875, 0.1640777587890625, 0.18316650390625, 0.2022552490234375, 0.221343994140625, 0.2404327392578125, 0.259521484375, 0.2786102294921875, 0.297698974609375, 0.3167877197265625, 0.33587646484375, 0.3549652099609375, 0.374053955078125, 0.3931427001953125, 0.4122314453125, 0.4313201904296875, 0.450408935546875, 0.4694976806640625, 0.48858642578125, 0.5076751708984375, 0.526763916015625, 0.5458526611328125, 0.56494140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 7.0, 9.0, 8.0, 10.0, 17.0, 29.0, 51.0, 62.0, 136.0, 187.0, 340.0, 546.0, 994.0, 1815.0, 3561.0, 7694.0, 17346.0, 40157.0, 98762.0, 253664.0, 368283.0, 148321.0, 60004.0, 25277.0, 10900.0, 4937.0, 2451.0, 1225.0, 693.0, 398.0, 274.0, 130.0, 88.0, 51.0, 39.0, 29.0, 18.0, 14.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.270263671875, -0.2625904083251953, -0.2549171447753906, -0.24724388122558594, -0.23957061767578125, -0.23189735412597656, -0.22422409057617188, -0.2165508270263672, -0.2088775634765625, -0.2012042999267578, -0.19353103637695312, -0.18585777282714844, -0.17818450927734375, -0.17051124572753906, -0.16283798217773438, -0.1551647186279297, -0.147491455078125, -0.1398181915283203, -0.13214492797851562, -0.12447166442871094, -0.11679840087890625, -0.10912513732910156, -0.10145187377929688, -0.09377861022949219, -0.0861053466796875, -0.07843208312988281, -0.07075881958007812, -0.06308555603027344, -0.05541229248046875, -0.04773902893066406, -0.040065765380859375, -0.03239250183105469, -0.02471923828125, -0.017045974731445312, -0.009372711181640625, -0.0016994476318359375, 0.00597381591796875, 0.013647079467773438, 0.021320343017578125, 0.028993606567382812, 0.0366668701171875, 0.04434013366699219, 0.052013397216796875, 0.05968666076660156, 0.06735992431640625, 0.07503318786621094, 0.08270645141601562, 0.09037971496582031, 0.098052978515625, 0.10572624206542969, 0.11339950561523438, 0.12107276916503906, 0.12874603271484375, 0.13641929626464844, 0.14409255981445312, 0.1517658233642578, 0.1594390869140625, 0.1671123504638672, 0.17478561401367188, 0.18245887756347656, 0.19013214111328125, 0.19780540466308594, 0.20547866821289062, 0.2131519317626953, 0.2208251953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 10.0, 8.0, 18.0, 17.0, 20.0, 25.0, 28.0, 47.0, 62.0, 76.0, 98.0, 107.0, 101.0, 89.0, 50.0, 46.0, 39.0, 31.0, 18.0, 20.0, 16.0, 13.0, 13.0, 10.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.935264587402344e-05, -4.7637149691581726e-05, -4.5921653509140015e-05, -4.42061573266983e-05, -4.249066114425659e-05, -4.077516496181488e-05, -3.905966877937317e-05, -3.734417259693146e-05, -3.5628676414489746e-05, -3.3913180232048035e-05, -3.219768404960632e-05, -3.0482187867164612e-05, -2.87666916847229e-05, -2.705119550228119e-05, -2.5335699319839478e-05, -2.3620203137397766e-05, -2.1904706954956055e-05, -2.0189210772514343e-05, -1.8473714590072632e-05, -1.675821840763092e-05, -1.5042722225189209e-05, -1.3327226042747498e-05, -1.1611729860305786e-05, -9.896233677864075e-06, -8.180737495422363e-06, -6.465241312980652e-06, -4.7497451305389404e-06, -3.034248948097229e-06, -1.3187527656555176e-06, 3.9674341678619385e-07, 2.1122395992279053e-06, 3.827735781669617e-06, 5.543231964111328e-06, 7.2587281465530396e-06, 8.974224328994751e-06, 1.0689720511436462e-05, 1.2405216693878174e-05, 1.4120712876319885e-05, 1.5836209058761597e-05, 1.7551705241203308e-05, 1.926720142364502e-05, 2.098269760608673e-05, 2.2698193788528442e-05, 2.4413689970970154e-05, 2.6129186153411865e-05, 2.7844682335853577e-05, 2.9560178518295288e-05, 3.1275674700737e-05, 3.299117088317871e-05, 3.470666706562042e-05, 3.6422163248062134e-05, 3.8137659430503845e-05, 3.985315561294556e-05, 4.156865179538727e-05, 4.328414797782898e-05, 4.499964416027069e-05, 4.67151403427124e-05, 4.8430636525154114e-05, 5.0146132707595825e-05, 5.186162889003754e-05, 5.357712507247925e-05, 5.529262125492096e-05, 5.700811743736267e-05, 5.872361361980438e-05, 6.0439109802246094e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 4.0, 8.0, 16.0, 22.0, 25.0, 35.0, 46.0, 86.0, 162.0, 351.0, 1021.0, 3546.0, 15040.0, 79866.0, 467330.0, 396879.0, 66563.0, 12971.0, 2964.0, 860.0, 321.0, 173.0, 74.0, 62.0, 40.0, 25.0, 21.0, 14.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4453125, -0.4309234619140625, -0.416534423828125, -0.4021453857421875, -0.38775634765625, -0.3733673095703125, -0.358978271484375, -0.3445892333984375, -0.3302001953125, -0.3158111572265625, -0.301422119140625, -0.2870330810546875, -0.27264404296875, -0.2582550048828125, -0.243865966796875, -0.2294769287109375, -0.215087890625, -0.2006988525390625, -0.186309814453125, -0.1719207763671875, -0.15753173828125, -0.1431427001953125, -0.128753662109375, -0.1143646240234375, -0.0999755859375, -0.0855865478515625, -0.071197509765625, -0.0568084716796875, -0.04241943359375, -0.0280303955078125, -0.013641357421875, 0.0007476806640625, 0.01513671875, 0.0295257568359375, 0.043914794921875, 0.0583038330078125, 0.07269287109375, 0.0870819091796875, 0.101470947265625, 0.1158599853515625, 0.1302490234375, 0.1446380615234375, 0.159027099609375, 0.1734161376953125, 0.18780517578125, 0.2021942138671875, 0.216583251953125, 0.2309722900390625, 0.245361328125, 0.2597503662109375, 0.274139404296875, 0.2885284423828125, 0.30291748046875, 0.3173065185546875, 0.331695556640625, 0.3460845947265625, 0.3604736328125, 0.3748626708984375, 0.389251708984375, 0.4036407470703125, 0.41802978515625, 0.4324188232421875, 0.446807861328125, 0.4611968994140625, 0.4755859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 12.0, 8.0, 14.0, 6.0, 21.0, 18.0, 22.0, 38.0, 32.0, 39.0, 40.0, 49.0, 83.0, 60.0, 78.0, 74.0, 65.0, 51.0, 41.0, 41.0, 34.0, 25.0, 21.0, 20.0, 21.0, 8.0, 15.0, 5.0, 6.0, 6.0, 4.0, 3.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1983642578125, -0.191802978515625, -0.18524169921875, -0.178680419921875, -0.172119140625, -0.165557861328125, -0.15899658203125, -0.152435302734375, -0.1458740234375, -0.139312744140625, -0.13275146484375, -0.126190185546875, -0.11962890625, -0.113067626953125, -0.10650634765625, -0.099945068359375, -0.0933837890625, -0.086822509765625, -0.08026123046875, -0.073699951171875, -0.067138671875, -0.060577392578125, -0.05401611328125, -0.047454833984375, -0.0408935546875, -0.034332275390625, -0.02777099609375, -0.021209716796875, -0.0146484375, -0.008087158203125, -0.00152587890625, 0.005035400390625, 0.0115966796875, 0.018157958984375, 0.02471923828125, 0.031280517578125, 0.037841796875, 0.044403076171875, 0.05096435546875, 0.057525634765625, 0.0640869140625, 0.070648193359375, 0.07720947265625, 0.083770751953125, 0.09033203125, 0.096893310546875, 0.10345458984375, 0.110015869140625, 0.1165771484375, 0.123138427734375, 0.12969970703125, 0.136260986328125, 0.142822265625, 0.149383544921875, 0.15594482421875, 0.162506103515625, 0.1690673828125, 0.175628662109375, 0.18218994140625, 0.188751220703125, 0.1953125, 0.201873779296875, 0.20843505859375, 0.214996337890625, 0.2215576171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 17.0, 55.0, 168.0, 280.0, 253.0, 174.0, 45.0, 11.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.262722969055176, -13.021618843078613, -12.78051471710205, -12.539409637451172, -12.29830551147461, -12.057201385498047, -11.816097259521484, -11.574993133544922, -11.333888053894043, -11.09278392791748, -10.851679801940918, -10.610574722290039, -10.369470596313477, -10.128366470336914, -9.887262344360352, -9.646158218383789, -9.405054092407227, -9.163949966430664, -8.922845840454102, -8.681740760803223, -8.44063663482666, -8.199532508850098, -7.958428382873535, -7.7173237800598145, -7.476219177246094, -7.235115051269531, -6.9940104484558105, -6.752906322479248, -6.511801719665527, -6.270697593688965, -6.029593467712402, -5.788488864898682, -5.547384262084961, -5.306280136108398, -5.065175533294678, -4.824071407318115, -4.5829668045043945, -4.341862678527832, -4.1007585525512695, -3.859653949737549, -3.6185495853424072, -3.3774452209472656, -3.136340856552124, -2.8952364921569824, -2.65413236618042, -2.413027763366699, -2.1719236373901367, -1.9308192729949951, -1.6897149085998535, -1.448610544204712, -1.2075061798095703, -0.9664019346237183, -0.7252975702285767, -0.48419320583343506, -0.243088960647583, -0.0019845962524414062, 0.2391197681427002, 0.4802241027355194, 0.7213284373283386, 0.9624327421188354, 1.203537106513977, 1.4446414709091187, 1.6857457160949707, 1.9268500804901123, 2.167954444885254]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 1.0, 5.0, 2.0, 6.0, 8.0, 6.0, 17.0, 20.0, 22.0, 9.0, 13.0, 30.0, 19.0, 26.0, 28.0, 33.0, 37.0, 37.0, 51.0, 46.0, 40.0, 37.0, 41.0, 43.0, 49.0, 44.0, 33.0, 31.0, 30.0, 30.0, 32.0, 20.0, 28.0, 22.0, 15.0, 13.0, 19.0, 6.0, 9.0, 6.0, 8.0, 11.0, 4.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.836522102355957, -1.7824931144714355, -1.728464126586914, -1.6744352579116821, -1.6204062700271606, -1.5663772821426392, -1.5123482942581177, -1.4583194255828857, -1.4042904376983643, -1.3502614498138428, -1.2962324619293213, -1.2422035932540894, -1.1881746053695679, -1.1341456174850464, -1.080116629600525, -1.026087760925293, -0.9720587134361267, -0.9180297255516052, -0.8640007972717285, -0.809971809387207, -0.7559428811073303, -0.7019138932228088, -0.6478849649429321, -0.5938559770584106, -0.5398269891738892, -0.48579803109169006, -0.43176907300949097, -0.3777400851249695, -0.3237111568450928, -0.2696821689605713, -0.2156532108783722, -0.1616242527961731, -0.10759532451629639, -0.05356636270880699, 0.00046259909868240356, 0.0544915646314621, 0.1085205227136612, 0.16254949569702148, 0.21657845377922058, 0.2706074118614197, 0.3246363699436188, 0.37866532802581787, 0.43269428610801697, 0.48672324419021606, 0.5407522320747375, 0.5947811603546143, 0.6488101482391357, 0.7028391361236572, 0.7568680644035339, 0.8108970522880554, 0.8649259805679321, 0.9189549684524536, 0.9729838967323303, 1.027012825012207, 1.0810418128967285, 1.13507080078125, 1.1890997886657715, 1.243128776550293, 1.2971577644348145, 1.3511866331100464, 1.4052156209945679, 1.4592446088790894, 1.5132735967636108, 1.5673024654388428, 1.6213314533233643]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 7.0, 19.0, 24.0, 21.0, 35.0, 48.0, 66.0, 109.0, 144.0, 199.0, 337.0, 475.0, 739.0, 1211.0, 1980.0, 3338.0, 5976.0, 11259.0, 22655.0, 46548.0, 105453.0, 275239.0, 950687.0, 1871056.0, 559750.0, 188213.0, 77012.0, 34995.0, 16715.0, 8751.0, 4632.0, 2527.0, 1496.0, 875.0, 592.0, 351.0, 247.0, 144.0, 118.0, 73.0, 56.0, 27.0, 21.0, 19.0, 6.0, 18.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.28369140625, -0.27565574645996094, -0.2676200866699219, -0.2595844268798828, -0.25154876708984375, -0.2435131072998047, -0.23547744750976562, -0.22744178771972656, -0.2194061279296875, -0.21137046813964844, -0.20333480834960938, -0.1952991485595703, -0.18726348876953125, -0.1792278289794922, -0.17119216918945312, -0.16315650939941406, -0.155120849609375, -0.14708518981933594, -0.13904953002929688, -0.1310138702392578, -0.12297821044921875, -0.11494255065917969, -0.10690689086914062, -0.09887123107910156, -0.0908355712890625, -0.08279991149902344, -0.07476425170898438, -0.06672859191894531, -0.05869293212890625, -0.05065727233886719, -0.042621612548828125, -0.03458595275878906, -0.02655029296875, -0.018514633178710938, -0.010478973388671875, -0.0024433135986328125, 0.00559234619140625, 0.013628005981445312, 0.021663665771484375, 0.029699325561523438, 0.0377349853515625, 0.04577064514160156, 0.053806304931640625, 0.06184196472167969, 0.06987762451171875, 0.07791328430175781, 0.08594894409179688, 0.09398460388183594, 0.102020263671875, 0.11005592346191406, 0.11809158325195312, 0.1261272430419922, 0.13416290283203125, 0.1421985626220703, 0.15023422241210938, 0.15826988220214844, 0.1663055419921875, 0.17434120178222656, 0.18237686157226562, 0.1904125213623047, 0.19844818115234375, 0.2064838409423828, 0.21451950073242188, 0.22255516052246094, 0.2305908203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 10.0, 9.0, 18.0, 22.0, 33.0, 44.0, 50.0, 61.0, 75.0, 92.0, 93.0, 95.0, 89.0, 76.0, 66.0, 54.0, 42.0, 38.0, 20.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44189453125, -0.4292030334472656, -0.41651153564453125, -0.4038200378417969, -0.3911285400390625, -0.3784370422363281, -0.36574554443359375, -0.3530540466308594, -0.340362548828125, -0.3276710510253906, -0.31497955322265625, -0.3022880554199219, -0.2895965576171875, -0.2769050598144531, -0.26421356201171875, -0.2515220642089844, -0.23883056640625, -0.22613906860351562, -0.21344757080078125, -0.20075607299804688, -0.1880645751953125, -0.17537307739257812, -0.16268157958984375, -0.14999008178710938, -0.137298583984375, -0.12460708618164062, -0.11191558837890625, -0.09922409057617188, -0.0865325927734375, -0.07384109497070312, -0.06114959716796875, -0.048458099365234375, -0.0357666015625, -0.023075103759765625, -0.01038360595703125, 0.002307891845703125, 0.0149993896484375, 0.027690887451171875, 0.04038238525390625, 0.053073883056640625, 0.065765380859375, 0.07845687866210938, 0.09114837646484375, 0.10383987426757812, 0.1165313720703125, 0.12922286987304688, 0.14191436767578125, 0.15460586547851562, 0.16729736328125, 0.17998886108398438, 0.19268035888671875, 0.20537185668945312, 0.2180633544921875, 0.23075485229492188, 0.24344635009765625, 0.2561378479003906, 0.268829345703125, 0.2815208435058594, 0.29421234130859375, 0.3069038391113281, 0.3195953369140625, 0.3322868347167969, 0.34497833251953125, 0.3576698303222656, 0.370361328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 11.0, 8.0, 14.0, 31.0, 45.0, 45.0, 100.0, 137.0, 206.0, 367.0, 659.0, 1260.0, 2989.0, 8025.0, 27168.0, 113866.0, 673191.0, 2719638.0, 517253.0, 93601.0, 22858.0, 7188.0, 2739.0, 1274.0, 620.0, 327.0, 244.0, 138.0, 96.0, 40.0, 38.0, 32.0, 20.0, 11.0, 8.0, 12.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73974609375, -0.717620849609375, -0.69549560546875, -0.673370361328125, -0.6512451171875, -0.629119873046875, -0.60699462890625, -0.584869384765625, -0.562744140625, -0.540618896484375, -0.51849365234375, -0.496368408203125, -0.4742431640625, -0.452117919921875, -0.42999267578125, -0.407867431640625, -0.3857421875, -0.363616943359375, -0.34149169921875, -0.319366455078125, -0.2972412109375, -0.275115966796875, -0.25299072265625, -0.230865478515625, -0.208740234375, -0.186614990234375, -0.16448974609375, -0.142364501953125, -0.1202392578125, -0.098114013671875, -0.07598876953125, -0.053863525390625, -0.03173828125, -0.009613037109375, 0.01251220703125, 0.034637451171875, 0.0567626953125, 0.078887939453125, 0.10101318359375, 0.123138427734375, 0.145263671875, 0.167388916015625, 0.18951416015625, 0.211639404296875, 0.2337646484375, 0.255889892578125, 0.27801513671875, 0.300140380859375, 0.322265625, 0.344390869140625, 0.36651611328125, 0.388641357421875, 0.4107666015625, 0.432891845703125, 0.45501708984375, 0.477142333984375, 0.499267578125, 0.521392822265625, 0.54351806640625, 0.565643310546875, 0.5877685546875, 0.609893798828125, 0.63201904296875, 0.654144287109375, 0.67626953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 10.0, 8.0, 34.0, 27.0, 61.0, 76.0, 151.0, 211.0, 417.0, 626.0, 881.0, 601.0, 334.0, 193.0, 156.0, 83.0, 70.0, 37.0, 22.0, 16.0, 13.0, 10.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6083984375, -0.588409423828125, -0.56842041015625, -0.548431396484375, -0.5284423828125, -0.508453369140625, -0.48846435546875, -0.468475341796875, -0.448486328125, -0.428497314453125, -0.40850830078125, -0.388519287109375, -0.3685302734375, -0.348541259765625, -0.32855224609375, -0.308563232421875, -0.28857421875, -0.268585205078125, -0.24859619140625, -0.228607177734375, -0.2086181640625, -0.188629150390625, -0.16864013671875, -0.148651123046875, -0.128662109375, -0.108673095703125, -0.08868408203125, -0.068695068359375, -0.0487060546875, -0.028717041015625, -0.00872802734375, 0.011260986328125, 0.03125, 0.051239013671875, 0.07122802734375, 0.091217041015625, 0.1112060546875, 0.131195068359375, 0.15118408203125, 0.171173095703125, 0.191162109375, 0.211151123046875, 0.23114013671875, 0.251129150390625, 0.2711181640625, 0.291107177734375, 0.31109619140625, 0.331085205078125, 0.35107421875, 0.371063232421875, 0.39105224609375, 0.411041259765625, 0.4310302734375, 0.451019287109375, 0.47100830078125, 0.490997314453125, 0.510986328125, 0.530975341796875, 0.55096435546875, 0.570953369140625, 0.5909423828125, 0.610931396484375, 0.63092041015625, 0.650909423828125, 0.6708984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 18.0, 20.0, 26.0, 53.0, 79.0, 76.0, 121.0, 90.0, 114.0, 88.0, 107.0, 64.0, 45.0, 34.0, 19.0, 12.0, 8.0, 6.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.621370553970337, -3.5297844409942627, -3.4381985664367676, -3.3466124534606934, -3.255026340484619, -3.163440465927124, -3.07185435295105, -2.9802684783935547, -2.8886823654174805, -2.7970962524414062, -2.705510377883911, -2.613924264907837, -2.522338390350342, -2.4307522773742676, -2.3391661643981934, -2.247580051422119, -2.155994176864624, -2.06440806388855, -1.9728221893310547, -1.8812360763549805, -1.7896500825881958, -1.6980640888214111, -1.606477975845337, -1.5148919820785522, -1.4233059883117676, -1.331719994544983, -1.2401340007781982, -1.148547887802124, -1.0569618940353394, -0.9653759002685547, -0.8737898468971252, -0.7822037935256958, -0.690617561340332, -0.5990315675735474, -0.5074455142021179, -0.41585949063301086, -0.3242734670639038, -0.23268744349479675, -0.1411014199256897, -0.049515366554260254, 0.042070627212524414, 0.13365665078163147, 0.22524267435073853, 0.3168286979198456, 0.40841472148895264, 0.5000007152557373, 0.5915867686271667, 0.6831728219985962, 0.7747588157653809, 0.8663448095321655, 0.957930862903595, 1.0495169162750244, 1.141102910041809, 1.2326889038085938, 1.324275016784668, 1.4158610105514526, 1.5074470043182373, 1.599032998085022, 1.6906189918518066, 1.7822051048278809, 1.8737910985946655, 1.9653770923614502, 2.0569632053375244, 2.1485490798950195, 2.2401351928710938]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 1.0, 5.0, 10.0, 4.0, 19.0, 17.0, 12.0, 15.0, 24.0, 28.0, 27.0, 25.0, 28.0, 33.0, 29.0, 46.0, 42.0, 44.0, 47.0, 29.0, 44.0, 33.0, 40.0, 34.0, 40.0, 38.0, 23.0, 44.0, 26.0, 23.0, 24.0, 18.0, 15.0, 21.0, 17.0, 9.0, 16.0, 14.0, 4.0, 6.0, 7.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3691236972808838, -1.320310354232788, -1.271497130393982, -1.2226837873458862, -1.17387056350708, -1.1250572204589844, -1.0762438774108887, -1.027430534362793, -0.9786173105239868, -0.9298040270805359, -0.880990743637085, -0.8321774005889893, -0.7833641171455383, -0.7345508337020874, -0.6857374906539917, -0.6369242072105408, -0.5881109237670898, -0.5392976403236389, -0.4904843270778656, -0.4416710138320923, -0.39285773038864136, -0.34404444694519043, -0.2952311336994171, -0.2464178204536438, -0.19760453701019287, -0.14879123866558075, -0.09997794032096863, -0.051164641976356506, -0.0023513436317443848, 0.04646195471286774, 0.09527525305747986, 0.14408856630325317, 0.1929018497467041, 0.24171514809131622, 0.29052844643592834, 0.33934175968170166, 0.3881550431251526, 0.4369683265686035, 0.48578163981437683, 0.5345949530601501, 0.5834082365036011, 0.632221519947052, 0.6810348033905029, 0.7298481464385986, 0.7786614298820496, 0.8274747133255005, 0.8762880563735962, 0.9251013398170471, 0.973914623260498, 1.0227279663085938, 1.0715411901474, 1.1203545331954956, 1.1691677570343018, 1.2179811000823975, 1.2667944431304932, 1.3156077861785889, 1.364421010017395, 1.4132343530654907, 1.4620475769042969, 1.5108609199523926, 1.5596742630004883, 1.6084874868392944, 1.6573008298873901, 1.7061140537261963, 1.754927396774292]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 12.0, 27.0, 40.0, 33.0, 50.0, 60.0, 93.0, 151.0, 229.0, 284.0, 440.0, 606.0, 912.0, 1339.0, 1940.0, 2766.0, 4122.0, 6220.0, 9234.0, 14561.0, 23109.0, 38833.0, 72497.0, 160517.0, 299418.0, 202332.0, 88015.0, 45727.0, 26540.0, 16367.0, 10622.0, 6891.0, 4548.0, 3252.0, 2082.0, 1422.0, 999.0, 701.0, 505.0, 300.0, 216.0, 152.0, 115.0, 81.0, 55.0, 43.0, 32.0, 21.0, 11.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.287109375, -0.2780342102050781, -0.26895904541015625, -0.2598838806152344, -0.2508087158203125, -0.24173355102539062, -0.23265838623046875, -0.22358322143554688, -0.214508056640625, -0.20543289184570312, -0.19635772705078125, -0.18728256225585938, -0.1782073974609375, -0.16913223266601562, -0.16005706787109375, -0.15098190307617188, -0.14190673828125, -0.13283157348632812, -0.12375640869140625, -0.11468124389648438, -0.1056060791015625, -0.09653091430664062, -0.08745574951171875, -0.07838058471679688, -0.069305419921875, -0.060230255126953125, -0.05115509033203125, -0.042079925537109375, -0.0330047607421875, -0.023929595947265625, -0.01485443115234375, -0.005779266357421875, 0.0032958984375, 0.012371063232421875, 0.02144622802734375, 0.030521392822265625, 0.0395965576171875, 0.048671722412109375, 0.05774688720703125, 0.06682205200195312, 0.075897216796875, 0.08497238159179688, 0.09404754638671875, 0.10312271118164062, 0.1121978759765625, 0.12127304077148438, 0.13034820556640625, 0.13942337036132812, 0.14849853515625, 0.15757369995117188, 0.16664886474609375, 0.17572402954101562, 0.1847991943359375, 0.19387435913085938, 0.20294952392578125, 0.21202468872070312, 0.221099853515625, 0.23017501831054688, 0.23925018310546875, 0.24832534790039062, 0.2574005126953125, 0.2664756774902344, 0.27555084228515625, 0.2846260070800781, 0.293701171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 10.0, 11.0, 16.0, 24.0, 30.0, 33.0, 42.0, 46.0, 66.0, 70.0, 63.0, 74.0, 87.0, 64.0, 65.0, 65.0, 52.0, 53.0, 39.0, 28.0, 23.0, 20.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41796875, -0.406005859375, -0.39404296875, -0.382080078125, -0.3701171875, -0.358154296875, -0.34619140625, -0.334228515625, -0.322265625, -0.310302734375, -0.29833984375, -0.286376953125, -0.2744140625, -0.262451171875, -0.25048828125, -0.238525390625, -0.2265625, -0.214599609375, -0.20263671875, -0.190673828125, -0.1787109375, -0.166748046875, -0.15478515625, -0.142822265625, -0.130859375, -0.118896484375, -0.10693359375, -0.094970703125, -0.0830078125, -0.071044921875, -0.05908203125, -0.047119140625, -0.03515625, -0.023193359375, -0.01123046875, 0.000732421875, 0.0126953125, 0.024658203125, 0.03662109375, 0.048583984375, 0.060546875, 0.072509765625, 0.08447265625, 0.096435546875, 0.1083984375, 0.120361328125, 0.13232421875, 0.144287109375, 0.15625, 0.168212890625, 0.18017578125, 0.192138671875, 0.2041015625, 0.216064453125, 0.22802734375, 0.239990234375, 0.251953125, 0.263916015625, 0.27587890625, 0.287841796875, 0.2998046875, 0.311767578125, 0.32373046875, 0.335693359375, 0.34765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 5.0, 11.0, 5.0, 9.0, 13.0, 23.0, 35.0, 63.0, 94.0, 164.0, 303.0, 654.0, 1564.0, 3806.0, 10171.0, 29169.0, 98894.0, 549273.0, 268523.0, 56047.0, 18529.0, 6475.0, 2564.0, 1128.0, 452.0, 232.0, 122.0, 71.0, 41.0, 21.0, 24.0, 18.0, 14.0, 5.0, 7.0, 6.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8544921875, -0.8306121826171875, -0.806732177734375, -0.7828521728515625, -0.75897216796875, -0.7350921630859375, -0.711212158203125, -0.6873321533203125, -0.6634521484375, -0.6395721435546875, -0.615692138671875, -0.5918121337890625, -0.56793212890625, -0.5440521240234375, -0.520172119140625, -0.4962921142578125, -0.472412109375, -0.4485321044921875, -0.424652099609375, -0.4007720947265625, -0.37689208984375, -0.3530120849609375, -0.329132080078125, -0.3052520751953125, -0.2813720703125, -0.2574920654296875, -0.233612060546875, -0.2097320556640625, -0.18585205078125, -0.1619720458984375, -0.138092041015625, -0.1142120361328125, -0.09033203125, -0.0664520263671875, -0.042572021484375, -0.0186920166015625, 0.00518798828125, 0.0290679931640625, 0.052947998046875, 0.0768280029296875, 0.1007080078125, 0.1245880126953125, 0.148468017578125, 0.1723480224609375, 0.19622802734375, 0.2201080322265625, 0.243988037109375, 0.2678680419921875, 0.291748046875, 0.3156280517578125, 0.339508056640625, 0.3633880615234375, 0.38726806640625, 0.4111480712890625, 0.435028076171875, 0.4589080810546875, 0.4827880859375, 0.5066680908203125, 0.530548095703125, 0.5544281005859375, 0.57830810546875, 0.6021881103515625, 0.626068115234375, 0.6499481201171875, 0.673828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 3.0, 9.0, 6.0, 6.0, 9.0, 11.0, 12.0, 14.0, 19.0, 22.0, 28.0, 31.0, 24.0, 29.0, 36.0, 44.0, 27.0, 42.0, 51.0, 48.0, 47.0, 34.0, 49.0, 52.0, 41.0, 40.0, 38.0, 39.0, 22.0, 24.0, 17.0, 21.0, 17.0, 15.0, 16.0, 12.0, 6.0, 11.0, 8.0, 1.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.736328125, -0.7141036987304688, -0.6918792724609375, -0.6696548461914062, -0.647430419921875, -0.6252059936523438, -0.6029815673828125, -0.5807571411132812, -0.55853271484375, -0.5363082885742188, -0.5140838623046875, -0.49185943603515625, -0.469635009765625, -0.44741058349609375, -0.4251861572265625, -0.40296173095703125, -0.3807373046875, -0.35851287841796875, -0.3362884521484375, -0.31406402587890625, -0.291839599609375, -0.26961517333984375, -0.2473907470703125, -0.22516632080078125, -0.20294189453125, -0.18071746826171875, -0.1584930419921875, -0.13626861572265625, -0.114044189453125, -0.09181976318359375, -0.0695953369140625, -0.04737091064453125, -0.025146484375, -0.00292205810546875, 0.0193023681640625, 0.04152679443359375, 0.063751220703125, 0.08597564697265625, 0.1082000732421875, 0.13042449951171875, 0.15264892578125, 0.17487335205078125, 0.1970977783203125, 0.21932220458984375, 0.241546630859375, 0.26377105712890625, 0.2859954833984375, 0.30821990966796875, 0.3304443359375, 0.35266876220703125, 0.3748931884765625, 0.39711761474609375, 0.419342041015625, 0.44156646728515625, 0.4637908935546875, 0.48601531982421875, 0.50823974609375, 0.5304641723632812, 0.5526885986328125, 0.5749130249023438, 0.597137451171875, 0.6193618774414062, 0.6415863037109375, 0.6638107299804688, 0.68603515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 7.0, 10.0, 10.0, 11.0, 26.0, 36.0, 57.0, 96.0, 192.0, 382.0, 812.0, 1765.0, 3991.0, 9278.0, 21493.0, 50190.0, 125017.0, 433173.0, 258021.0, 82897.0, 34573.0, 14892.0, 6423.0, 2766.0, 1234.0, 568.0, 280.0, 136.0, 93.0, 36.0, 32.0, 15.0, 17.0, 6.0, 2.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1854248046875, -0.17875099182128906, -0.17207717895507812, -0.1654033660888672, -0.15872955322265625, -0.1520557403564453, -0.14538192749023438, -0.13870811462402344, -0.1320343017578125, -0.12536048889160156, -0.11868667602539062, -0.11201286315917969, -0.10533905029296875, -0.09866523742675781, -0.09199142456054688, -0.08531761169433594, -0.078643798828125, -0.07196998596191406, -0.06529617309570312, -0.05862236022949219, -0.05194854736328125, -0.04527473449707031, -0.038600921630859375, -0.03192710876464844, -0.0252532958984375, -0.018579483032226562, -0.011905670166015625, -0.0052318572998046875, 0.00144195556640625, 0.008115768432617188, 0.014789581298828125, 0.021463394165039062, 0.02813720703125, 0.03481101989746094, 0.041484832763671875, 0.04815864562988281, 0.05483245849609375, 0.06150627136230469, 0.06818008422851562, 0.07485389709472656, 0.0815277099609375, 0.08820152282714844, 0.09487533569335938, 0.10154914855957031, 0.10822296142578125, 0.11489677429199219, 0.12157058715820312, 0.12824440002441406, 0.134918212890625, 0.14159202575683594, 0.14826583862304688, 0.1549396514892578, 0.16161346435546875, 0.1682872772216797, 0.17496109008789062, 0.18163490295410156, 0.1883087158203125, 0.19498252868652344, 0.20165634155273438, 0.2083301544189453, 0.21500396728515625, 0.2216777801513672, 0.22835159301757812, 0.23502540588378906, 0.24169921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 8.0, 7.0, 9.0, 6.0, 9.0, 18.0, 32.0, 45.0, 62.0, 110.0, 152.0, 165.0, 120.0, 75.0, 48.0, 23.0, 15.0, 21.0, 22.0, 10.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64320182800293e-05, -4.471186548471451e-05, -4.299171268939972e-05, -4.127155989408493e-05, -3.955140709877014e-05, -3.783125430345535e-05, -3.6111101508140564e-05, -3.4390948712825775e-05, -3.2670795917510986e-05, -3.09506431221962e-05, -2.923049032688141e-05, -2.751033753156662e-05, -2.579018473625183e-05, -2.4070031940937042e-05, -2.2349879145622253e-05, -2.0629726350307465e-05, -1.8909573554992676e-05, -1.7189420759677887e-05, -1.5469267964363098e-05, -1.374911516904831e-05, -1.202896237373352e-05, -1.0308809578418732e-05, -8.588656783103943e-06, -6.868503987789154e-06, -5.148351192474365e-06, -3.4281983971595764e-06, -1.7080456018447876e-06, 1.210719347000122e-08, 1.73225998878479e-06, 3.452412784099579e-06, 5.172565579414368e-06, 6.8927183747291565e-06, 8.612871170043945e-06, 1.0333023965358734e-05, 1.2053176760673523e-05, 1.3773329555988312e-05, 1.54934823513031e-05, 1.721363514661789e-05, 1.8933787941932678e-05, 2.0653940737247467e-05, 2.2374093532562256e-05, 2.4094246327877045e-05, 2.5814399123191833e-05, 2.7534551918506622e-05, 2.925470471382141e-05, 3.09748575091362e-05, 3.269501030445099e-05, 3.441516309976578e-05, 3.6135315895080566e-05, 3.7855468690395355e-05, 3.9575621485710144e-05, 4.129577428102493e-05, 4.301592707633972e-05, 4.473607987165451e-05, 4.64562326669693e-05, 4.817638546228409e-05, 4.989653825759888e-05, 5.1616691052913666e-05, 5.3336843848228455e-05, 5.5056996643543243e-05, 5.677714943885803e-05, 5.849730223417282e-05, 6.021745502948761e-05, 6.19376078248024e-05, 6.365776062011719e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 12.0, 24.0, 46.0, 92.0, 178.0, 440.0, 1213.0, 4530.0, 20780.0, 105283.0, 613257.0, 246730.0, 43408.0, 9148.0, 2213.0, 665.0, 252.0, 128.0, 66.0, 28.0, 18.0, 12.0, 3.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.400390625, -0.38886260986328125, -0.3773345947265625, -0.36580657958984375, -0.354278564453125, -0.34275054931640625, -0.3312225341796875, -0.31969451904296875, -0.30816650390625, -0.29663848876953125, -0.2851104736328125, -0.27358245849609375, -0.262054443359375, -0.25052642822265625, -0.2389984130859375, -0.22747039794921875, -0.2159423828125, -0.20441436767578125, -0.1928863525390625, -0.18135833740234375, -0.169830322265625, -0.15830230712890625, -0.1467742919921875, -0.13524627685546875, -0.12371826171875, -0.11219024658203125, -0.1006622314453125, -0.08913421630859375, -0.077606201171875, -0.06607818603515625, -0.0545501708984375, -0.04302215576171875, -0.031494140625, -0.01996612548828125, -0.0084381103515625, 0.00308990478515625, 0.014617919921875, 0.02614593505859375, 0.0376739501953125, 0.04920196533203125, 0.06072998046875, 0.07225799560546875, 0.0837860107421875, 0.09531402587890625, 0.106842041015625, 0.11837005615234375, 0.1298980712890625, 0.14142608642578125, 0.1529541015625, 0.16448211669921875, 0.1760101318359375, 0.18753814697265625, 0.199066162109375, 0.21059417724609375, 0.2221221923828125, 0.23365020751953125, 0.24517822265625, 0.25670623779296875, 0.2682342529296875, 0.27976226806640625, 0.291290283203125, 0.30281829833984375, 0.3143463134765625, 0.32587432861328125, 0.33740234375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 6.0, 6.0, 5.0, 6.0, 6.0, 7.0, 15.0, 16.0, 19.0, 28.0, 29.0, 36.0, 48.0, 74.0, 89.0, 124.0, 104.0, 82.0, 64.0, 41.0, 35.0, 29.0, 36.0, 22.0, 17.0, 12.0, 11.0, 8.0, 5.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.194976806640625, -0.18902587890625, -0.183074951171875, -0.1771240234375, -0.171173095703125, -0.16522216796875, -0.159271240234375, -0.1533203125, -0.147369384765625, -0.14141845703125, -0.135467529296875, -0.1295166015625, -0.123565673828125, -0.11761474609375, -0.111663818359375, -0.105712890625, -0.099761962890625, -0.09381103515625, -0.087860107421875, -0.0819091796875, -0.075958251953125, -0.07000732421875, -0.064056396484375, -0.05810546875, -0.052154541015625, -0.04620361328125, -0.040252685546875, -0.0343017578125, -0.028350830078125, -0.02239990234375, -0.016448974609375, -0.010498046875, -0.004547119140625, 0.00140380859375, 0.007354736328125, 0.0133056640625, 0.019256591796875, 0.02520751953125, 0.031158447265625, 0.037109375, 0.043060302734375, 0.04901123046875, 0.054962158203125, 0.0609130859375, 0.066864013671875, 0.07281494140625, 0.078765869140625, 0.084716796875, 0.090667724609375, 0.09661865234375, 0.102569580078125, 0.1085205078125, 0.114471435546875, 0.12042236328125, 0.126373291015625, 0.13232421875, 0.138275146484375, 0.14422607421875, 0.150177001953125, 0.1561279296875, 0.162078857421875, 0.16802978515625, 0.173980712890625, 0.179931640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 12.0, 18.0, 49.0, 112.0, 160.0, 181.0, 176.0, 144.0, 81.0, 37.0, 14.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021129608154297, -2.889021635055542, -2.756913661956787, -2.6248059272766113, -2.4926979541778564, -2.3605899810791016, -2.2284820079803467, -2.096374034881592, -1.9642661809921265, -1.8321582078933716, -1.7000503540039062, -1.5679423809051514, -1.4358344078063965, -1.3037265539169312, -1.1716185808181763, -1.039510726928711, -0.907402753829956, -0.775294840335846, -0.6431869268417358, -0.511078953742981, -0.37897104024887085, -0.24686312675476074, -0.11475515365600586, 0.017352759838104248, 0.14946067333221436, 0.28156858682632446, 0.41367653012275696, 0.5457844734191895, 0.6778923869132996, 0.8100003004074097, 0.9421082735061646, 1.0742161273956299, 1.2063241004943848, 1.3384320735931396, 1.470539927482605, 1.6026479005813599, 1.7347557544708252, 1.86686372756958, 1.998971700668335, 2.13107967376709, 2.2631874084472656, 2.3952953815460205, 2.5274033546447754, 2.659511089324951, 2.791619062423706, 2.923727035522461, 3.055835008621216, 3.1879429817199707, 3.3200509548187256, 3.4521589279174805, 3.5842669010162354, 3.7163748741149902, 3.848482608795166, 3.980590581893921, 4.112698554992676, 4.244806289672852, 4.3769145011901855, 4.509022235870361, 4.641130447387695, 4.773238182067871, 4.905346393585205, 5.037454128265381, 5.169562339782715, 5.301670074462891, 5.433777809143066]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 11.0, 17.0, 12.0, 17.0, 16.0, 23.0, 25.0, 26.0, 25.0, 34.0, 33.0, 34.0, 41.0, 52.0, 44.0, 39.0, 48.0, 44.0, 29.0, 47.0, 33.0, 44.0, 43.0, 28.0, 32.0, 23.0, 31.0, 11.0, 22.0, 20.0, 12.0, 20.0, 9.0, 15.0, 10.0, 2.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9440405368804932, -1.8873573541641235, -1.830674171447754, -1.7739911079406738, -1.7173079252243042, -1.6606247425079346, -1.6039416790008545, -1.5472584962844849, -1.4905753135681152, -1.4338921308517456, -1.377208948135376, -1.320525884628296, -1.2638427019119263, -1.2071595191955566, -1.1504764556884766, -1.093793272972107, -1.0371100902557373, -0.9804269075393677, -0.9237437844276428, -0.867060661315918, -0.8103774785995483, -0.7536942958831787, -0.6970111727714539, -0.640328049659729, -0.5836448669433594, -0.5269616842269897, -0.4702785611152649, -0.41359540820121765, -0.3569122552871704, -0.30022910237312317, -0.24354594945907593, -0.1868627965450287, -0.13017964363098145, -0.0734964907169342, -0.016813337802886963, 0.03986981511116028, 0.09655296802520752, 0.15323612093925476, 0.209919273853302, 0.26660242676734924, 0.3232855796813965, 0.3799687325954437, 0.43665188550949097, 0.4933350384235382, 0.5500181913375854, 0.6067013740539551, 0.6633844971656799, 0.7200676202774048, 0.7767508029937744, 0.833433985710144, 0.8901171088218689, 0.9468002319335938, 1.0034834146499634, 1.060166597366333, 1.116849660873413, 1.1735328435897827, 1.2302160263061523, 1.286899209022522, 1.3435823917388916, 1.4002654552459717, 1.4569486379623413, 1.513631820678711, 1.570314884185791, 1.6269980669021606, 1.6836812496185303]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 15.0, 20.0, 46.0, 111.0, 253.0, 624.0, 1484.0, 3970.0, 12620.0, 52589.0, 357149.0, 3210992.0, 468855.0, 63729.0, 14883.0, 4480.0, 1523.0, 584.0, 215.0, 91.0, 38.0, 16.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8575363159179688, -0.8347015380859375, -0.8118667602539062, -0.789031982421875, -0.7661972045898438, -0.7433624267578125, -0.7205276489257812, -0.69769287109375, -0.6748580932617188, -0.6520233154296875, -0.6291885375976562, -0.606353759765625, -0.5835189819335938, -0.5606842041015625, -0.5378494262695312, -0.5150146484375, -0.49217987060546875, -0.4693450927734375, -0.44651031494140625, -0.423675537109375, -0.40084075927734375, -0.3780059814453125, -0.35517120361328125, -0.33233642578125, -0.30950164794921875, -0.2866668701171875, -0.26383209228515625, -0.240997314453125, -0.21816253662109375, -0.1953277587890625, -0.17249298095703125, -0.149658203125, -0.12682342529296875, -0.1039886474609375, -0.08115386962890625, -0.058319091796875, -0.03548431396484375, -0.0126495361328125, 0.01018524169921875, 0.03302001953125, 0.05585479736328125, 0.0786895751953125, 0.10152435302734375, 0.124359130859375, 0.14719390869140625, 0.1700286865234375, 0.19286346435546875, 0.2156982421875, 0.23853302001953125, 0.2613677978515625, 0.28420257568359375, 0.307037353515625, 0.32987213134765625, 0.3527069091796875, 0.37554168701171875, 0.39837646484375, 0.42121124267578125, 0.4440460205078125, 0.46688079833984375, 0.489715576171875, 0.5125503540039062, 0.5353851318359375, 0.5582199096679688, 0.5810546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 9.0, 15.0, 20.0, 23.0, 24.0, 42.0, 46.0, 47.0, 63.0, 79.0, 84.0, 62.0, 77.0, 72.0, 71.0, 60.0, 44.0, 46.0, 37.0, 22.0, 27.0, 9.0, 13.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422607421875, -0.4104118347167969, -0.39821624755859375, -0.3860206604003906, -0.3738250732421875, -0.3616294860839844, -0.34943389892578125, -0.3372383117675781, -0.325042724609375, -0.3128471374511719, -0.30065155029296875, -0.2884559631347656, -0.2762603759765625, -0.2640647888183594, -0.25186920166015625, -0.23967361450195312, -0.22747802734375, -0.21528244018554688, -0.20308685302734375, -0.19089126586914062, -0.1786956787109375, -0.16650009155273438, -0.15430450439453125, -0.14210891723632812, -0.129913330078125, -0.11771774291992188, -0.10552215576171875, -0.09332656860351562, -0.0811309814453125, -0.06893539428710938, -0.05673980712890625, -0.044544219970703125, -0.0323486328125, -0.020153045654296875, -0.00795745849609375, 0.004238128662109375, 0.0164337158203125, 0.028629302978515625, 0.04082489013671875, 0.053020477294921875, 0.065216064453125, 0.07741165161132812, 0.08960723876953125, 0.10180282592773438, 0.1139984130859375, 0.12619400024414062, 0.13838958740234375, 0.15058517456054688, 0.16278076171875, 0.17497634887695312, 0.18717193603515625, 0.19936752319335938, 0.2115631103515625, 0.22375869750976562, 0.23595428466796875, 0.24814987182617188, 0.260345458984375, 0.2725410461425781, 0.28473663330078125, 0.2969322204589844, 0.3091278076171875, 0.3213233947753906, 0.33351898193359375, 0.3457145690917969, 0.35791015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 20.0, 11.0, 18.0, 27.0, 46.0, 51.0, 74.0, 144.0, 197.0, 242.0, 425.0, 616.0, 1070.0, 1764.0, 3275.0, 6661.0, 14304.0, 35281.0, 103070.0, 408623.0, 2428584.0, 912084.0, 181075.0, 55614.0, 21170.0, 9233.0, 4551.0, 2398.0, 1312.0, 811.0, 464.0, 308.0, 217.0, 141.0, 117.0, 84.0, 43.0, 36.0, 30.0, 17.0, 12.0, 12.0, 13.0, 10.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.56982421875, -0.5506515502929688, -0.5314788818359375, -0.5123062133789062, -0.493133544921875, -0.47396087646484375, -0.4547882080078125, -0.43561553955078125, -0.41644287109375, -0.39727020263671875, -0.3780975341796875, -0.35892486572265625, -0.339752197265625, -0.32057952880859375, -0.3014068603515625, -0.28223419189453125, -0.2630615234375, -0.24388885498046875, -0.2247161865234375, -0.20554351806640625, -0.186370849609375, -0.16719818115234375, -0.1480255126953125, -0.12885284423828125, -0.10968017578125, -0.09050750732421875, -0.0713348388671875, -0.05216217041015625, -0.032989501953125, -0.01381683349609375, 0.0053558349609375, 0.02452850341796875, 0.043701171875, 0.06287384033203125, 0.0820465087890625, 0.10121917724609375, 0.120391845703125, 0.13956451416015625, 0.1587371826171875, 0.17790985107421875, 0.19708251953125, 0.21625518798828125, 0.2354278564453125, 0.25460052490234375, 0.273773193359375, 0.29294586181640625, 0.3121185302734375, 0.33129119873046875, 0.3504638671875, 0.36963653564453125, 0.3888092041015625, 0.40798187255859375, 0.427154541015625, 0.44632720947265625, 0.4654998779296875, 0.48467254638671875, 0.50384521484375, 0.5230178833007812, 0.5421905517578125, 0.5613632202148438, 0.580535888671875, 0.5997085571289062, 0.6188812255859375, 0.6380538940429688, 0.6572265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 13.0, 12.0, 10.0, 21.0, 44.0, 53.0, 59.0, 106.0, 151.0, 266.0, 504.0, 952.0, 755.0, 384.0, 238.0, 136.0, 93.0, 70.0, 51.0, 29.0, 36.0, 16.0, 11.0, 18.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.55810546875, -0.5373153686523438, -0.5165252685546875, -0.49573516845703125, -0.474945068359375, -0.45415496826171875, -0.4333648681640625, -0.41257476806640625, -0.39178466796875, -0.37099456787109375, -0.3502044677734375, -0.32941436767578125, -0.308624267578125, -0.28783416748046875, -0.2670440673828125, -0.24625396728515625, -0.2254638671875, -0.20467376708984375, -0.1838836669921875, -0.16309356689453125, -0.142303466796875, -0.12151336669921875, -0.1007232666015625, -0.07993316650390625, -0.05914306640625, -0.03835296630859375, -0.0175628662109375, 0.00322723388671875, 0.024017333984375, 0.04480743408203125, 0.0655975341796875, 0.08638763427734375, 0.107177734375, 0.12796783447265625, 0.1487579345703125, 0.16954803466796875, 0.190338134765625, 0.21112823486328125, 0.2319183349609375, 0.25270843505859375, 0.27349853515625, 0.29428863525390625, 0.3150787353515625, 0.33586883544921875, 0.356658935546875, 0.37744903564453125, 0.3982391357421875, 0.41902923583984375, 0.4398193359375, 0.46060943603515625, 0.4813995361328125, 0.5021896362304688, 0.522979736328125, 0.5437698364257812, 0.5645599365234375, 0.5853500366210938, 0.60614013671875, 0.6269302368164062, 0.6477203369140625, 0.6685104370117188, 0.689300537109375, 0.7100906372070312, 0.7308807373046875, 0.7516708374023438, 0.7724609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 15.0, 24.0, 24.0, 45.0, 57.0, 70.0, 80.0, 82.0, 90.0, 103.0, 72.0, 84.0, 65.0, 52.0, 39.0, 28.0, 21.0, 13.0, 11.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2211592197418213, -2.1372456550598145, -2.0533323287963867, -1.9694187641143799, -1.8855053186416626, -1.8015918731689453, -1.7176783084869385, -1.6337648630142212, -1.549851417541504, -1.4659379720687866, -1.3820245265960693, -1.2981109619140625, -1.2141975164413452, -1.130284070968628, -1.046370506286621, -0.9624570608139038, -0.8785436153411865, -0.7946301698684692, -0.7107166647911072, -0.6268031597137451, -0.5428897142410278, -0.45897623896598816, -0.3750627636909485, -0.2911492586135864, -0.20723581314086914, -0.12332233786582947, -0.039408862590789795, 0.04450461268424988, 0.12841808795928955, 0.21233156323432922, 0.2962450385093689, 0.38015854358673096, 0.46407175064086914, 0.5479851961135864, 0.6318987011909485, 0.7158122062683105, 0.7997256517410278, 0.8836390972137451, 0.9675526022911072, 1.0514661073684692, 1.1353795528411865, 1.2192929983139038, 1.303206443786621, 1.387120008468628, 1.4710334539413452, 1.5549468994140625, 1.6388604640960693, 1.7227739095687866, 1.806687355041504, 1.8906008005142212, 1.9745142459869385, 2.0584278106689453, 2.142341136932373, 2.22625470161438, 2.3101682662963867, 2.3940815925598145, 2.4779951572418213, 2.561908721923828, 2.645822048187256, 2.7297356128692627, 2.8136491775512695, 2.8975625038146973, 2.981476068496704, 3.065389633178711, 3.1493029594421387]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 8.0, 8.0, 7.0, 11.0, 10.0, 18.0, 20.0, 20.0, 30.0, 16.0, 32.0, 32.0, 30.0, 43.0, 32.0, 44.0, 31.0, 41.0, 50.0, 43.0, 35.0, 38.0, 60.0, 40.0, 34.0, 30.0, 39.0, 17.0, 20.0, 20.0, 19.0, 20.0, 22.0, 23.0, 9.0, 12.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5522727966308594, -1.4985096454620361, -1.444746494293213, -1.3909833431243896, -1.3372201919555664, -1.2834570407867432, -1.22969388961792, -1.1759307384490967, -1.1221675872802734, -1.0684044361114502, -1.014641284942627, -0.9608781337738037, -0.9071149826049805, -0.8533518314361572, -0.799588680267334, -0.7458255290985107, -0.6920623779296875, -0.6382992267608643, -0.584536075592041, -0.5307729244232178, -0.47700977325439453, -0.4232466220855713, -0.36948347091674805, -0.3157203197479248, -0.26195716857910156, -0.20819401741027832, -0.15443086624145508, -0.10066771507263184, -0.046904563903808594, 0.0068585872650146484, 0.06062173843383789, 0.11438488960266113, 0.16814815998077393, 0.22191131114959717, 0.2756744623184204, 0.32943761348724365, 0.3832007646560669, 0.43696391582489014, 0.4907270669937134, 0.5444902181625366, 0.5982533693313599, 0.6520165205001831, 0.7057796716690063, 0.7595428228378296, 0.8133059740066528, 0.8670691251754761, 0.9208322763442993, 0.9745954275131226, 1.0283585786819458, 1.082121729850769, 1.1358848810195923, 1.1896480321884155, 1.2434111833572388, 1.297174334526062, 1.3509374856948853, 1.4047006368637085, 1.4584637880325317, 1.512226939201355, 1.5659900903701782, 1.6197532415390015, 1.6735163927078247, 1.727279543876648, 1.7810426950454712, 1.8348058462142944, 1.8885689973831177]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 15.0, 25.0, 38.0, 39.0, 64.0, 66.0, 148.0, 201.0, 309.0, 466.0, 761.0, 1223.0, 2033.0, 3412.0, 5820.0, 10210.0, 18177.0, 35856.0, 79569.0, 197294.0, 338029.0, 196745.0, 79359.0, 35792.0, 18355.0, 10099.0, 5629.0, 3422.0, 1934.0, 1244.0, 809.0, 454.0, 323.0, 197.0, 146.0, 85.0, 54.0, 48.0, 31.0, 18.0, 12.0, 9.0, 5.0, 1.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.41796875, -0.4054908752441406, -0.39301300048828125, -0.3805351257324219, -0.3680572509765625, -0.3555793762207031, -0.34310150146484375, -0.3306236267089844, -0.318145751953125, -0.3056678771972656, -0.29319000244140625, -0.2807121276855469, -0.2682342529296875, -0.2557563781738281, -0.24327850341796875, -0.23080062866210938, -0.21832275390625, -0.20584487915039062, -0.19336700439453125, -0.18088912963867188, -0.1684112548828125, -0.15593338012695312, -0.14345550537109375, -0.13097763061523438, -0.118499755859375, -0.10602188110351562, -0.09354400634765625, -0.08106613159179688, -0.0685882568359375, -0.056110382080078125, -0.04363250732421875, -0.031154632568359375, -0.0186767578125, -0.006198883056640625, 0.00627899169921875, 0.018756866455078125, 0.0312347412109375, 0.043712615966796875, 0.05619049072265625, 0.06866836547851562, 0.081146240234375, 0.09362411499023438, 0.10610198974609375, 0.11857986450195312, 0.1310577392578125, 0.14353561401367188, 0.15601348876953125, 0.16849136352539062, 0.18096923828125, 0.19344711303710938, 0.20592498779296875, 0.21840286254882812, 0.2308807373046875, 0.24335861206054688, 0.25583648681640625, 0.2683143615722656, 0.280792236328125, 0.2932701110839844, 0.30574798583984375, 0.3182258605957031, 0.3307037353515625, 0.3431816101074219, 0.35565948486328125, 0.3681373596191406, 0.380615234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 7.0, 7.0, 13.0, 11.0, 29.0, 32.0, 35.0, 41.0, 40.0, 56.0, 63.0, 63.0, 69.0, 55.0, 53.0, 62.0, 65.0, 58.0, 37.0, 54.0, 36.0, 29.0, 30.0, 17.0, 12.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.4022483825683594, -0.39092254638671875, -0.3795967102050781, -0.3682708740234375, -0.3569450378417969, -0.34561920166015625, -0.3342933654785156, -0.322967529296875, -0.3116416931152344, -0.30031585693359375, -0.2889900207519531, -0.2776641845703125, -0.2663383483886719, -0.25501251220703125, -0.24368667602539062, -0.23236083984375, -0.22103500366210938, -0.20970916748046875, -0.19838333129882812, -0.1870574951171875, -0.17573165893554688, -0.16440582275390625, -0.15307998657226562, -0.141754150390625, -0.13042831420898438, -0.11910247802734375, -0.10777664184570312, -0.0964508056640625, -0.08512496948242188, -0.07379913330078125, -0.062473297119140625, -0.0511474609375, -0.039821624755859375, -0.02849578857421875, -0.017169952392578125, -0.0058441162109375, 0.005481719970703125, 0.01680755615234375, 0.028133392333984375, 0.039459228515625, 0.050785064697265625, 0.06211090087890625, 0.07343673706054688, 0.0847625732421875, 0.09608840942382812, 0.10741424560546875, 0.11874008178710938, 0.13006591796875, 0.14139175415039062, 0.15271759033203125, 0.16404342651367188, 0.1753692626953125, 0.18669509887695312, 0.19802093505859375, 0.20934677124023438, 0.220672607421875, 0.23199844360351562, 0.24332427978515625, 0.2546501159667969, 0.2659759521484375, 0.2773017883300781, 0.28862762451171875, 0.2999534606933594, 0.311279296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 10.0, 9.0, 15.0, 11.0, 32.0, 26.0, 44.0, 48.0, 66.0, 164.0, 311.0, 686.0, 1647.0, 5024.0, 15638.0, 54298.0, 234964.0, 530032.0, 150351.0, 37675.0, 11372.0, 3677.0, 1304.0, 525.0, 261.0, 136.0, 65.0, 44.0, 33.0, 28.0, 17.0, 7.0, 10.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.662109375, -0.639556884765625, -0.61700439453125, -0.594451904296875, -0.5718994140625, -0.549346923828125, -0.52679443359375, -0.504241943359375, -0.481689453125, -0.459136962890625, -0.43658447265625, -0.414031982421875, -0.3914794921875, -0.368927001953125, -0.34637451171875, -0.323822021484375, -0.30126953125, -0.278717041015625, -0.25616455078125, -0.233612060546875, -0.2110595703125, -0.188507080078125, -0.16595458984375, -0.143402099609375, -0.120849609375, -0.098297119140625, -0.07574462890625, -0.053192138671875, -0.0306396484375, -0.008087158203125, 0.01446533203125, 0.037017822265625, 0.0595703125, 0.082122802734375, 0.10467529296875, 0.127227783203125, 0.1497802734375, 0.172332763671875, 0.19488525390625, 0.217437744140625, 0.239990234375, 0.262542724609375, 0.28509521484375, 0.307647705078125, 0.3302001953125, 0.352752685546875, 0.37530517578125, 0.397857666015625, 0.42041015625, 0.442962646484375, 0.46551513671875, 0.488067626953125, 0.5106201171875, 0.533172607421875, 0.55572509765625, 0.578277587890625, 0.600830078125, 0.623382568359375, 0.64593505859375, 0.668487548828125, 0.6910400390625, 0.713592529296875, 0.73614501953125, 0.758697509765625, 0.78125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 6.0, 7.0, 10.0, 9.0, 16.0, 9.0, 18.0, 16.0, 19.0, 28.0, 29.0, 19.0, 27.0, 32.0, 34.0, 42.0, 49.0, 55.0, 35.0, 44.0, 54.0, 45.0, 44.0, 25.0, 40.0, 41.0, 27.0, 38.0, 23.0, 32.0, 26.0, 11.0, 16.0, 13.0, 12.0, 7.0, 8.0, 9.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.689453125, -0.667266845703125, -0.64508056640625, -0.622894287109375, -0.6007080078125, -0.578521728515625, -0.55633544921875, -0.534149169921875, -0.511962890625, -0.489776611328125, -0.46759033203125, -0.445404052734375, -0.4232177734375, -0.401031494140625, -0.37884521484375, -0.356658935546875, -0.33447265625, -0.312286376953125, -0.29010009765625, -0.267913818359375, -0.2457275390625, -0.223541259765625, -0.20135498046875, -0.179168701171875, -0.156982421875, -0.134796142578125, -0.11260986328125, -0.090423583984375, -0.0682373046875, -0.046051025390625, -0.02386474609375, -0.001678466796875, 0.0205078125, 0.042694091796875, 0.06488037109375, 0.087066650390625, 0.1092529296875, 0.131439208984375, 0.15362548828125, 0.175811767578125, 0.197998046875, 0.220184326171875, 0.24237060546875, 0.264556884765625, 0.2867431640625, 0.308929443359375, 0.33111572265625, 0.353302001953125, 0.37548828125, 0.397674560546875, 0.41986083984375, 0.442047119140625, 0.4642333984375, 0.486419677734375, 0.50860595703125, 0.530792236328125, 0.552978515625, 0.575164794921875, 0.59735107421875, 0.619537353515625, 0.6417236328125, 0.663909912109375, 0.68609619140625, 0.708282470703125, 0.73046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 14.0, 15.0, 28.0, 49.0, 70.0, 135.0, 209.0, 356.0, 752.0, 1682.0, 3824.0, 8623.0, 21312.0, 55140.0, 166337.0, 417975.0, 244594.0, 77778.0, 28860.0, 11606.0, 4815.0, 2246.0, 1010.0, 489.0, 240.0, 143.0, 73.0, 52.0, 31.0, 22.0, 8.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.254150390625, -0.24681854248046875, -0.2394866943359375, -0.23215484619140625, -0.224822998046875, -0.21749114990234375, -0.2101593017578125, -0.20282745361328125, -0.19549560546875, -0.18816375732421875, -0.1808319091796875, -0.17350006103515625, -0.166168212890625, -0.15883636474609375, -0.1515045166015625, -0.14417266845703125, -0.1368408203125, -0.12950897216796875, -0.1221771240234375, -0.11484527587890625, -0.107513427734375, -0.10018157958984375, -0.0928497314453125, -0.08551788330078125, -0.07818603515625, -0.07085418701171875, -0.0635223388671875, -0.05619049072265625, -0.048858642578125, -0.04152679443359375, -0.0341949462890625, -0.02686309814453125, -0.01953125, -0.01219940185546875, -0.0048675537109375, 0.00246429443359375, 0.009796142578125, 0.01712799072265625, 0.0244598388671875, 0.03179168701171875, 0.03912353515625, 0.04645538330078125, 0.0537872314453125, 0.06111907958984375, 0.068450927734375, 0.07578277587890625, 0.0831146240234375, 0.09044647216796875, 0.0977783203125, 0.10511016845703125, 0.1124420166015625, 0.11977386474609375, 0.127105712890625, 0.13443756103515625, 0.1417694091796875, 0.14910125732421875, 0.15643310546875, 0.16376495361328125, 0.1710968017578125, 0.17842864990234375, 0.185760498046875, 0.19309234619140625, 0.2004241943359375, 0.20775604248046875, 0.215087890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 3.0, 5.0, 8.0, 5.0, 5.0, 9.0, 8.0, 6.0, 13.0, 7.0, 19.0, 20.0, 29.0, 25.0, 39.0, 57.0, 83.0, 117.0, 99.0, 96.0, 101.0, 59.0, 42.0, 34.0, 17.0, 19.0, 15.0, 8.0, 5.0, 10.0, 5.0, 4.0, 3.0, 5.0, 5.0, 0.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-4.6193599700927734e-05, -4.488416016101837e-05, -4.357472062110901e-05, -4.2265281081199646e-05, -4.095584154129028e-05, -3.964640200138092e-05, -3.833696246147156e-05, -3.7027522921562195e-05, -3.571808338165283e-05, -3.440864384174347e-05, -3.3099204301834106e-05, -3.1789764761924744e-05, -3.048032522201538e-05, -2.9170885682106018e-05, -2.7861446142196655e-05, -2.6552006602287292e-05, -2.524256706237793e-05, -2.3933127522468567e-05, -2.2623687982559204e-05, -2.131424844264984e-05, -2.000480890274048e-05, -1.8695369362831116e-05, -1.7385929822921753e-05, -1.607649028301239e-05, -1.4767050743103027e-05, -1.3457611203193665e-05, -1.2148171663284302e-05, -1.0838732123374939e-05, -9.529292583465576e-06, -8.219853043556213e-06, -6.910413503646851e-06, -5.600973963737488e-06, -4.291534423828125e-06, -2.982094883918762e-06, -1.6726553440093994e-06, -3.632158041000366e-07, 9.462237358093262e-07, 2.255663275718689e-06, 3.5651028156280518e-06, 4.8745423555374146e-06, 6.183981895446777e-06, 7.49342143535614e-06, 8.802860975265503e-06, 1.0112300515174866e-05, 1.1421740055084229e-05, 1.2731179594993591e-05, 1.4040619134902954e-05, 1.5350058674812317e-05, 1.665949821472168e-05, 1.7968937754631042e-05, 1.9278377294540405e-05, 2.0587816834449768e-05, 2.189725637435913e-05, 2.3206695914268494e-05, 2.4516135454177856e-05, 2.582557499408722e-05, 2.7135014533996582e-05, 2.8444454073905945e-05, 2.9753893613815308e-05, 3.106333315372467e-05, 3.237277269363403e-05, 3.3682212233543396e-05, 3.499165177345276e-05, 3.630109131336212e-05, 3.7610530853271484e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 12.0, 22.0, 24.0, 45.0, 57.0, 86.0, 171.0, 274.0, 572.0, 1086.0, 2174.0, 4979.0, 12339.0, 33243.0, 106461.0, 339930.0, 366477.0, 120045.0, 37211.0, 12982.0, 5424.0, 2368.0, 1139.0, 628.0, 299.0, 183.0, 113.0, 65.0, 40.0, 22.0, 19.0, 10.0, 5.0, 4.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.25634765625, -0.24859046936035156, -0.24083328247070312, -0.2330760955810547, -0.22531890869140625, -0.2175617218017578, -0.20980453491210938, -0.20204734802246094, -0.1942901611328125, -0.18653297424316406, -0.17877578735351562, -0.1710186004638672, -0.16326141357421875, -0.1555042266845703, -0.14774703979492188, -0.13998985290527344, -0.132232666015625, -0.12447547912597656, -0.11671829223632812, -0.10896110534667969, -0.10120391845703125, -0.09344673156738281, -0.08568954467773438, -0.07793235778808594, -0.0701751708984375, -0.06241798400878906, -0.054660797119140625, -0.04690361022949219, -0.03914642333984375, -0.03138923645019531, -0.023632049560546875, -0.015874862670898438, -0.00811767578125, -0.0003604888916015625, 0.007396697998046875, 0.015153884887695312, 0.02291107177734375, 0.030668258666992188, 0.038425445556640625, 0.04618263244628906, 0.0539398193359375, 0.06169700622558594, 0.06945419311523438, 0.07721138000488281, 0.08496856689453125, 0.09272575378417969, 0.10048294067382812, 0.10824012756347656, 0.115997314453125, 0.12375450134277344, 0.13151168823242188, 0.1392688751220703, 0.14702606201171875, 0.1547832489013672, 0.16254043579101562, 0.17029762268066406, 0.1780548095703125, 0.18581199645996094, 0.19356918334960938, 0.2013263702392578, 0.20908355712890625, 0.2168407440185547, 0.22459793090820312, 0.23235511779785156, 0.2401123046875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 7.0, 8.0, 7.0, 12.0, 15.0, 15.0, 21.0, 28.0, 26.0, 55.0, 68.0, 92.0, 75.0, 93.0, 106.0, 85.0, 69.0, 50.0, 41.0, 29.0, 28.0, 14.0, 7.0, 5.0, 7.0, 8.0, 6.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.275146484375, -0.26784324645996094, -0.2605400085449219, -0.2532367706298828, -0.24593353271484375, -0.2386302947998047, -0.23132705688476562, -0.22402381896972656, -0.2167205810546875, -0.20941734313964844, -0.20211410522460938, -0.1948108673095703, -0.18750762939453125, -0.1802043914794922, -0.17290115356445312, -0.16559791564941406, -0.158294677734375, -0.15099143981933594, -0.14368820190429688, -0.1363849639892578, -0.12908172607421875, -0.12177848815917969, -0.11447525024414062, -0.10717201232910156, -0.0998687744140625, -0.09256553649902344, -0.08526229858398438, -0.07795906066894531, -0.07065582275390625, -0.06335258483886719, -0.056049346923828125, -0.04874610900878906, -0.04144287109375, -0.03413963317871094, -0.026836395263671875, -0.019533157348632812, -0.01222991943359375, -0.0049266815185546875, 0.002376556396484375, 0.009679794311523438, 0.0169830322265625, 0.024286270141601562, 0.031589508056640625, 0.03889274597167969, 0.04619598388671875, 0.05349922180175781, 0.060802459716796875, 0.06810569763183594, 0.075408935546875, 0.08271217346191406, 0.09001541137695312, 0.09731864929199219, 0.10462188720703125, 0.11192512512207031, 0.11922836303710938, 0.12653160095214844, 0.1338348388671875, 0.14113807678222656, 0.14844131469726562, 0.1557445526123047, 0.16304779052734375, 0.1703510284423828, 0.17765426635742188, 0.18495750427246094, 0.1922607421875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 6.0, 14.0, 26.0, 36.0, 53.0, 102.0, 118.0, 161.0, 116.0, 127.0, 76.0, 61.0, 31.0, 25.0, 14.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1253836154937744, -2.0369930267333984, -1.948602318763733, -1.860211730003357, -1.7718210220336914, -1.6834304332733154, -1.5950398445129395, -1.5066492557525635, -1.418258547782898, -1.329867959022522, -1.2414772510528564, -1.1530866622924805, -1.0646960735321045, -0.976305365562439, -0.887914776802063, -0.7995241284370422, -0.7111334800720215, -0.6227428317070007, -0.53435218334198, -0.445961594581604, -0.35757094621658325, -0.2691802978515625, -0.18078970909118652, -0.09239906072616577, -0.0040084123611450195, 0.08438222110271454, 0.1727728545665741, 0.26116347312927246, 0.3495541214942932, 0.43794476985931396, 0.5263353586196899, 0.6147260069847107, 0.7031164169311523, 0.7915070652961731, 0.8798977136611938, 0.9682883024215698, 1.0566790103912354, 1.1450695991516113, 1.2334601879119873, 1.3218507766723633, 1.4102414846420288, 1.4986320734024048, 1.5870227813720703, 1.6754133701324463, 1.7638039588928223, 1.8521946668624878, 1.9405852556228638, 2.0289759635925293, 2.1173665523529053, 2.2057571411132812, 2.2941477298736572, 2.382538318634033, 2.4709291458129883, 2.5593197345733643, 2.6477103233337402, 2.736100912094116, 2.824491500854492, 2.912882089614868, 3.001272678375244, 3.089663505554199, 3.178054094314575, 3.266444683074951, 3.354835271835327, 3.443225860595703, 3.531616687774658]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 4.0, 8.0, 8.0, 11.0, 13.0, 29.0, 31.0, 28.0, 35.0, 32.0, 33.0, 27.0, 48.0, 53.0, 35.0, 58.0, 59.0, 55.0, 52.0, 49.0, 40.0, 39.0, 40.0, 37.0, 26.0, 24.0, 23.0, 19.0, 15.0, 15.0, 13.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1442737579345703, -2.0782127380371094, -2.0121517181396484, -1.946090579032898, -1.880029559135437, -1.813968539237976, -1.7479074001312256, -1.6818463802337646, -1.6157853603363037, -1.5497243404388428, -1.4836633205413818, -1.4176021814346313, -1.3515411615371704, -1.2854801416397095, -1.219419002532959, -1.153357982635498, -1.087296962738037, -1.0212359428405762, -0.9551748633384705, -0.8891137838363647, -0.8230527639389038, -0.7569917440414429, -0.6909306645393372, -0.6248695850372314, -0.5588085651397705, -0.4927475154399872, -0.42668646574020386, -0.36062541604042053, -0.2945643663406372, -0.22850331664085388, -0.16244226694107056, -0.09638121724128723, -0.030319929122924805, 0.03574112057685852, 0.10180217027664185, 0.16786321997642517, 0.2339242696762085, 0.2999853193759918, 0.36604636907577515, 0.43210741877555847, 0.4981684684753418, 0.5642294883728027, 0.6302905678749084, 0.6963516473770142, 0.7624126672744751, 0.828473687171936, 0.8945347666740417, 0.9605958461761475, 1.0266568660736084, 1.0927178859710693, 1.1587789058685303, 1.2248400449752808, 1.2909010648727417, 1.3569620847702026, 1.4230232238769531, 1.489084243774414, 1.555145263671875, 1.621206283569336, 1.6872673034667969, 1.7533284425735474, 1.8193894624710083, 1.8854504823684692, 1.9515116214752197, 2.0175726413726807, 2.0836336612701416]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 17.0, 21.0, 43.0, 61.0, 124.0, 213.0, 430.0, 977.0, 2277.0, 6788.0, 26024.0, 154624.0, 2330886.0, 1526977.0, 115514.0, 20621.0, 5443.0, 1802.0, 728.0, 328.0, 182.0, 93.0, 49.0, 32.0, 13.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.119140625, -1.0911102294921875, -1.063079833984375, -1.0350494384765625, -1.00701904296875, -0.9789886474609375, -0.950958251953125, -0.9229278564453125, -0.8948974609375, -0.8668670654296875, -0.838836669921875, -0.8108062744140625, -0.78277587890625, -0.7547454833984375, -0.726715087890625, -0.6986846923828125, -0.670654296875, -0.6426239013671875, -0.614593505859375, -0.5865631103515625, -0.55853271484375, -0.5305023193359375, -0.502471923828125, -0.4744415283203125, -0.4464111328125, -0.4183807373046875, -0.390350341796875, -0.3623199462890625, -0.33428955078125, -0.3062591552734375, -0.278228759765625, -0.2501983642578125, -0.22216796875, -0.1941375732421875, -0.166107177734375, -0.1380767822265625, -0.11004638671875, -0.0820159912109375, -0.053985595703125, -0.0259552001953125, 0.0020751953125, 0.0301055908203125, 0.058135986328125, 0.0861663818359375, 0.11419677734375, 0.1422271728515625, 0.170257568359375, 0.1982879638671875, 0.226318359375, 0.2543487548828125, 0.282379150390625, 0.3104095458984375, 0.33843994140625, 0.3664703369140625, 0.394500732421875, 0.4225311279296875, 0.4505615234375, 0.4785919189453125, 0.506622314453125, 0.5346527099609375, 0.56268310546875, 0.5907135009765625, 0.618743896484375, 0.6467742919921875, 0.6748046875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 7.0, 7.0, 13.0, 26.0, 30.0, 32.0, 29.0, 45.0, 61.0, 48.0, 68.0, 58.0, 71.0, 58.0, 62.0, 71.0, 66.0, 46.0, 36.0, 43.0, 39.0, 25.0, 20.0, 10.0, 11.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.40349578857421875, -0.3919525146484375, -0.38040924072265625, -0.368865966796875, -0.35732269287109375, -0.3457794189453125, -0.33423614501953125, -0.32269287109375, -0.31114959716796875, -0.2996063232421875, -0.28806304931640625, -0.276519775390625, -0.26497650146484375, -0.2534332275390625, -0.24188995361328125, -0.2303466796875, -0.21880340576171875, -0.2072601318359375, -0.19571685791015625, -0.184173583984375, -0.17263031005859375, -0.1610870361328125, -0.14954376220703125, -0.13800048828125, -0.12645721435546875, -0.1149139404296875, -0.10337066650390625, -0.091827392578125, -0.08028411865234375, -0.0687408447265625, -0.05719757080078125, -0.045654296875, -0.03411102294921875, -0.0225677490234375, -0.01102447509765625, 0.000518798828125, 0.01206207275390625, 0.0236053466796875, 0.03514862060546875, 0.04669189453125, 0.05823516845703125, 0.0697784423828125, 0.08132171630859375, 0.092864990234375, 0.10440826416015625, 0.1159515380859375, 0.12749481201171875, 0.1390380859375, 0.15058135986328125, 0.1621246337890625, 0.17366790771484375, 0.185211181640625, 0.19675445556640625, 0.2082977294921875, 0.21984100341796875, 0.23138427734375, 0.24292755126953125, 0.2544708251953125, 0.26601409912109375, 0.277557373046875, 0.28910064697265625, 0.3006439208984375, 0.31218719482421875, 0.32373046875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 7.0, 10.0, 16.0, 24.0, 29.0, 47.0, 59.0, 86.0, 119.0, 187.0, 292.0, 506.0, 738.0, 1094.0, 1832.0, 2991.0, 5009.0, 8523.0, 15125.0, 28068.0, 55429.0, 118009.0, 280618.0, 843910.0, 1777442.0, 628173.0, 225936.0, 97462.0, 46621.0, 23768.0, 13005.0, 7321.0, 4374.0, 2735.0, 1647.0, 1050.0, 673.0, 440.0, 293.0, 197.0, 124.0, 104.0, 51.0, 43.0, 27.0, 17.0, 13.0, 13.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.3427734375, -0.3321876525878906, -0.32160186767578125, -0.3110160827636719, -0.3004302978515625, -0.2898445129394531, -0.27925872802734375, -0.2686729431152344, -0.258087158203125, -0.24750137329101562, -0.23691558837890625, -0.22632980346679688, -0.2157440185546875, -0.20515823364257812, -0.19457244873046875, -0.18398666381835938, -0.17340087890625, -0.16281509399414062, -0.15222930908203125, -0.14164352416992188, -0.1310577392578125, -0.12047195434570312, -0.10988616943359375, -0.09930038452148438, -0.088714599609375, -0.07812881469726562, -0.06754302978515625, -0.056957244873046875, -0.0463714599609375, -0.035785675048828125, -0.02519989013671875, -0.014614105224609375, -0.0040283203125, 0.006557464599609375, 0.01714324951171875, 0.027729034423828125, 0.0383148193359375, 0.048900604248046875, 0.05948638916015625, 0.07007217407226562, 0.080657958984375, 0.09124374389648438, 0.10182952880859375, 0.11241531372070312, 0.1230010986328125, 0.13358688354492188, 0.14417266845703125, 0.15475845336914062, 0.16534423828125, 0.17593002319335938, 0.18651580810546875, 0.19710159301757812, 0.2076873779296875, 0.21827316284179688, 0.22885894775390625, 0.23944473266601562, 0.250030517578125, 0.2606163024902344, 0.27120208740234375, 0.2817878723144531, 0.2923736572265625, 0.3029594421386719, 0.31354522705078125, 0.3241310119628906, 0.334716796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 11.0, 14.0, 19.0, 22.0, 24.0, 39.0, 53.0, 81.0, 95.0, 117.0, 172.0, 263.0, 422.0, 675.0, 668.0, 405.0, 290.0, 196.0, 130.0, 80.0, 70.0, 46.0, 32.0, 23.0, 33.0, 18.0, 20.0, 13.0, 2.0, 6.0, 4.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.54498291015625, -0.5279541015625, -0.51092529296875, -0.493896484375, -0.47686767578125, -0.4598388671875, -0.44281005859375, -0.42578125, -0.40875244140625, -0.3917236328125, -0.37469482421875, -0.357666015625, -0.34063720703125, -0.3236083984375, -0.30657958984375, -0.28955078125, -0.27252197265625, -0.2554931640625, -0.23846435546875, -0.221435546875, -0.20440673828125, -0.1873779296875, -0.17034912109375, -0.1533203125, -0.13629150390625, -0.1192626953125, -0.10223388671875, -0.085205078125, -0.06817626953125, -0.0511474609375, -0.03411865234375, -0.01708984375, -6.103515625e-05, 0.0169677734375, 0.03399658203125, 0.051025390625, 0.06805419921875, 0.0850830078125, 0.10211181640625, 0.119140625, 0.13616943359375, 0.1531982421875, 0.17022705078125, 0.187255859375, 0.20428466796875, 0.2213134765625, 0.23834228515625, 0.25537109375, 0.27239990234375, 0.2894287109375, 0.30645751953125, 0.323486328125, 0.34051513671875, 0.3575439453125, 0.37457275390625, 0.3916015625, 0.40863037109375, 0.4256591796875, 0.44268798828125, 0.459716796875, 0.47674560546875, 0.4937744140625, 0.51080322265625, 0.52783203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 13.0, 12.0, 21.0, 43.0, 71.0, 106.0, 134.0, 146.0, 128.0, 119.0, 82.0, 54.0, 31.0, 21.0, 12.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.866886615753174, -3.7438747882843018, -3.6208627223968506, -3.4978508949279785, -3.3748390674591064, -3.2518270015716553, -3.128815174102783, -3.005803108215332, -2.88279128074646, -2.759779453277588, -2.6367673873901367, -2.5137555599212646, -2.3907437324523926, -2.2677316665649414, -2.1447198390960693, -2.0217080116271973, -1.8986960649490356, -1.775684118270874, -1.652672290802002, -1.5296603441238403, -1.4066483974456787, -1.2836365699768066, -1.160624623298645, -1.0376126766204834, -0.9146007895469666, -0.7915889024734497, -0.6685769557952881, -0.5455650687217712, -0.422553151845932, -0.2995412349700928, -0.17652934789657593, -0.05351740121841431, 0.06949448585510254, 0.19250640273094177, 0.315518319606781, 0.43853020668029785, 0.5615421533584595, 0.6845540404319763, 0.8075659275054932, 0.9305778741836548, 1.0535898208618164, 1.176601767539978, 1.29961359500885, 1.4226255416870117, 1.5456374883651733, 1.668649435043335, 1.791661262512207, 1.9146732091903687, 2.037684917449951, 2.1606967449188232, 2.2837088108062744, 2.4067206382751465, 2.5297324657440186, 2.6527445316314697, 2.775756359100342, 2.898768424987793, 3.021780252456665, 3.144792079925537, 3.2678041458129883, 3.3908159732818604, 3.5138278007507324, 3.6368398666381836, 3.7598516941070557, 3.8828635215759277, 4.005875587463379]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 1.0, 7.0, 6.0, 13.0, 13.0, 13.0, 18.0, 16.0, 22.0, 17.0, 28.0, 16.0, 23.0, 34.0, 41.0, 43.0, 39.0, 41.0, 41.0, 46.0, 45.0, 34.0, 33.0, 35.0, 37.0, 33.0, 36.0, 33.0, 30.0, 23.0, 22.0, 28.0, 25.0, 15.0, 19.0, 8.0, 14.0, 11.0, 8.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5481631755828857, -1.4985090494155884, -1.4488550424575806, -1.3992009162902832, -1.3495467901229858, -1.2998926639556885, -1.2502386569976807, -1.2005845308303833, -1.150930404663086, -1.1012762784957886, -1.0516222715377808, -1.0019681453704834, -0.952314019203186, -0.9026599526405334, -0.8530058860778809, -0.8033517599105835, -0.7536977529525757, -0.7040436863899231, -0.6543895602226257, -0.6047354936599731, -0.5550813674926758, -0.5054273009300232, -0.4557732343673706, -0.40611913800239563, -0.35646504163742065, -0.3068109452724457, -0.2571568489074707, -0.20750278234481812, -0.15784868597984314, -0.10819458961486816, -0.058540523052215576, -0.0088864266872406, 0.040767669677734375, 0.09042175859212875, 0.14007584750652313, 0.18972992897033691, 0.2393840253353119, 0.28903812170028687, 0.33869218826293945, 0.38834628462791443, 0.4380003809928894, 0.4876544773578644, 0.5373085737228394, 0.5869626402854919, 0.6366167068481445, 0.6862708330154419, 0.7359248995780945, 0.7855789661407471, 0.8352330923080444, 0.884887158870697, 0.9345412850379944, 0.984195351600647, 1.0338494777679443, 1.0835034847259521, 1.1331576108932495, 1.1828117370605469, 1.2324657440185547, 1.282119870185852, 1.3317738771438599, 1.3814280033111572, 1.4310821294784546, 1.480736255645752, 1.5303902626037598, 1.5800443887710571, 1.6296985149383545]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 14.0, 20.0, 34.0, 45.0, 82.0, 121.0, 200.0, 345.0, 483.0, 725.0, 1216.0, 1919.0, 2997.0, 4802.0, 7856.0, 13043.0, 24217.0, 54023.0, 166400.0, 429433.0, 211698.0, 63840.0, 27845.0, 14559.0, 8436.0, 5159.0, 3316.0, 2097.0, 1324.0, 850.0, 506.0, 345.0, 225.0, 136.0, 87.0, 61.0, 42.0, 16.0, 14.0, 12.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5380859375, -0.521575927734375, -0.50506591796875, -0.488555908203125, -0.4720458984375, -0.455535888671875, -0.43902587890625, -0.422515869140625, -0.406005859375, -0.389495849609375, -0.37298583984375, -0.356475830078125, -0.3399658203125, -0.323455810546875, -0.30694580078125, -0.290435791015625, -0.27392578125, -0.257415771484375, -0.24090576171875, -0.224395751953125, -0.2078857421875, -0.191375732421875, -0.17486572265625, -0.158355712890625, -0.141845703125, -0.125335693359375, -0.10882568359375, -0.092315673828125, -0.0758056640625, -0.059295654296875, -0.04278564453125, -0.026275634765625, -0.009765625, 0.006744384765625, 0.02325439453125, 0.039764404296875, 0.0562744140625, 0.072784423828125, 0.08929443359375, 0.105804443359375, 0.122314453125, 0.138824462890625, 0.15533447265625, 0.171844482421875, 0.1883544921875, 0.204864501953125, 0.22137451171875, 0.237884521484375, 0.25439453125, 0.270904541015625, 0.28741455078125, 0.303924560546875, 0.3204345703125, 0.336944580078125, 0.35345458984375, 0.369964599609375, 0.386474609375, 0.402984619140625, 0.41949462890625, 0.436004638671875, 0.4525146484375, 0.469024658203125, 0.48553466796875, 0.502044677734375, 0.5185546875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 9.0, 11.0, 6.0, 16.0, 19.0, 22.0, 25.0, 43.0, 51.0, 49.0, 62.0, 56.0, 70.0, 78.0, 75.0, 64.0, 63.0, 58.0, 54.0, 35.0, 30.0, 28.0, 23.0, 21.0, 11.0, 9.0, 10.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.4240150451660156, -0.41248321533203125, -0.4009513854980469, -0.3894195556640625, -0.3778877258300781, -0.36635589599609375, -0.3548240661621094, -0.343292236328125, -0.3317604064941406, -0.32022857666015625, -0.3086967468261719, -0.2971649169921875, -0.2856330871582031, -0.27410125732421875, -0.2625694274902344, -0.25103759765625, -0.23950576782226562, -0.22797393798828125, -0.21644210815429688, -0.2049102783203125, -0.19337844848632812, -0.18184661865234375, -0.17031478881835938, -0.158782958984375, -0.14725112915039062, -0.13571929931640625, -0.12418746948242188, -0.1126556396484375, -0.10112380981445312, -0.08959197998046875, -0.07806015014648438, -0.0665283203125, -0.054996490478515625, -0.04346466064453125, -0.031932830810546875, -0.0204010009765625, -0.008869171142578125, 0.00266265869140625, 0.014194488525390625, 0.025726318359375, 0.037258148193359375, 0.04878997802734375, 0.060321807861328125, 0.0718536376953125, 0.08338546752929688, 0.09491729736328125, 0.10644912719726562, 0.11798095703125, 0.12951278686523438, 0.14104461669921875, 0.15257644653320312, 0.1641082763671875, 0.17564010620117188, 0.18717193603515625, 0.19870376586914062, 0.210235595703125, 0.22176742553710938, 0.23329925537109375, 0.24483108520507812, 0.2563629150390625, 0.2678947448730469, 0.27942657470703125, 0.2909584045410156, 0.302490234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 8.0, 8.0, 11.0, 14.0, 18.0, 30.0, 42.0, 64.0, 108.0, 162.0, 280.0, 663.0, 1714.0, 4496.0, 12588.0, 38067.0, 166277.0, 613578.0, 155000.0, 36188.0, 11827.0, 4304.0, 1638.0, 665.0, 298.0, 184.0, 85.0, 66.0, 49.0, 35.0, 24.0, 16.0, 13.0, 7.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77685546875, -0.7505035400390625, -0.724151611328125, -0.6977996826171875, -0.67144775390625, -0.6450958251953125, -0.618743896484375, -0.5923919677734375, -0.5660400390625, -0.5396881103515625, -0.513336181640625, -0.4869842529296875, -0.46063232421875, -0.4342803955078125, -0.407928466796875, -0.3815765380859375, -0.355224609375, -0.3288726806640625, -0.302520751953125, -0.2761688232421875, -0.24981689453125, -0.2234649658203125, -0.197113037109375, -0.1707611083984375, -0.1444091796875, -0.1180572509765625, -0.091705322265625, -0.0653533935546875, -0.03900146484375, -0.0126495361328125, 0.013702392578125, 0.0400543212890625, 0.06640625, 0.0927581787109375, 0.119110107421875, 0.1454620361328125, 0.17181396484375, 0.1981658935546875, 0.224517822265625, 0.2508697509765625, 0.2772216796875, 0.3035736083984375, 0.329925537109375, 0.3562774658203125, 0.38262939453125, 0.4089813232421875, 0.435333251953125, 0.4616851806640625, 0.488037109375, 0.5143890380859375, 0.540740966796875, 0.5670928955078125, 0.59344482421875, 0.6197967529296875, 0.646148681640625, 0.6725006103515625, 0.6988525390625, 0.7252044677734375, 0.751556396484375, 0.7779083251953125, 0.80426025390625, 0.8306121826171875, 0.856964111328125, 0.8833160400390625, 0.90966796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 8.0, 9.0, 6.0, 10.0, 7.0, 13.0, 17.0, 16.0, 22.0, 30.0, 39.0, 30.0, 38.0, 46.0, 37.0, 39.0, 62.0, 53.0, 48.0, 49.0, 41.0, 40.0, 46.0, 45.0, 33.0, 28.0, 34.0, 29.0, 17.0, 15.0, 22.0, 15.0, 13.0, 12.0, 2.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69384765625, -0.6712493896484375, -0.648651123046875, -0.6260528564453125, -0.60345458984375, -0.5808563232421875, -0.558258056640625, -0.5356597900390625, -0.5130615234375, -0.4904632568359375, -0.467864990234375, -0.4452667236328125, -0.42266845703125, -0.4000701904296875, -0.377471923828125, -0.3548736572265625, -0.332275390625, -0.3096771240234375, -0.287078857421875, -0.2644805908203125, -0.24188232421875, -0.2192840576171875, -0.196685791015625, -0.1740875244140625, -0.1514892578125, -0.1288909912109375, -0.106292724609375, -0.0836944580078125, -0.06109619140625, -0.0384979248046875, -0.015899658203125, 0.0066986083984375, 0.029296875, 0.0518951416015625, 0.074493408203125, 0.0970916748046875, 0.11968994140625, 0.1422882080078125, 0.164886474609375, 0.1874847412109375, 0.2100830078125, 0.2326812744140625, 0.255279541015625, 0.2778778076171875, 0.30047607421875, 0.3230743408203125, 0.345672607421875, 0.3682708740234375, 0.390869140625, 0.4134674072265625, 0.436065673828125, 0.4586639404296875, 0.48126220703125, 0.5038604736328125, 0.526458740234375, 0.5490570068359375, 0.5716552734375, 0.5942535400390625, 0.616851806640625, 0.6394500732421875, 0.66204833984375, 0.6846466064453125, 0.707244873046875, 0.7298431396484375, 0.75244140625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 14.0, 16.0, 22.0, 39.0, 63.0, 110.0, 212.0, 393.0, 751.0, 1612.0, 3249.0, 6903.0, 15430.0, 40213.0, 125773.0, 374731.0, 320361.0, 100708.0, 32964.0, 13255.0, 5961.0, 2830.0, 1409.0, 712.0, 385.0, 183.0, 99.0, 61.0, 28.0, 20.0, 15.0, 11.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2095947265625, -0.20302581787109375, -0.1964569091796875, -0.18988800048828125, -0.183319091796875, -0.17675018310546875, -0.1701812744140625, -0.16361236572265625, -0.15704345703125, -0.15047454833984375, -0.1439056396484375, -0.13733673095703125, -0.130767822265625, -0.12419891357421875, -0.1176300048828125, -0.11106109619140625, -0.1044921875, -0.09792327880859375, -0.0913543701171875, -0.08478546142578125, -0.078216552734375, -0.07164764404296875, -0.0650787353515625, -0.05850982666015625, -0.05194091796875, -0.04537200927734375, -0.0388031005859375, -0.03223419189453125, -0.025665283203125, -0.01909637451171875, -0.0125274658203125, -0.00595855712890625, 0.0006103515625, 0.00717926025390625, 0.0137481689453125, 0.02031707763671875, 0.026885986328125, 0.03345489501953125, 0.0400238037109375, 0.04659271240234375, 0.05316162109375, 0.05973052978515625, 0.0662994384765625, 0.07286834716796875, 0.079437255859375, 0.08600616455078125, 0.0925750732421875, 0.09914398193359375, 0.105712890625, 0.11228179931640625, 0.1188507080078125, 0.12541961669921875, 0.131988525390625, 0.13855743408203125, 0.1451263427734375, 0.15169525146484375, 0.15826416015625, 0.16483306884765625, 0.1714019775390625, 0.17797088623046875, 0.184539794921875, 0.19110870361328125, 0.1976776123046875, 0.20424652099609375, 0.2108154296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 2.0, 9.0, 2.0, 7.0, 7.0, 15.0, 10.0, 12.0, 18.0, 39.0, 51.0, 69.0, 114.0, 145.0, 132.0, 103.0, 68.0, 33.0, 44.0, 18.0, 23.0, 14.0, 6.0, 10.0, 4.0, 8.0, 3.0, 3.0, 2.0, 1.0, 7.0, 3.0, 0.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.898143768310547e-05, -3.735162317752838e-05, -3.5721808671951294e-05, -3.4091994166374207e-05, -3.246217966079712e-05, -3.083236515522003e-05, -2.9202550649642944e-05, -2.7572736144065857e-05, -2.594292163848877e-05, -2.4313107132911682e-05, -2.2683292627334595e-05, -2.1053478121757507e-05, -1.942366361618042e-05, -1.7793849110603333e-05, -1.6164034605026245e-05, -1.4534220099449158e-05, -1.290440559387207e-05, -1.1274591088294983e-05, -9.644776582717896e-06, -8.014962077140808e-06, -6.385147571563721e-06, -4.755333065986633e-06, -3.125518560409546e-06, -1.4957040548324585e-06, 1.341104507446289e-07, 1.7639249563217163e-06, 3.3937394618988037e-06, 5.023553967475891e-06, 6.6533684730529785e-06, 8.283182978630066e-06, 9.912997484207153e-06, 1.154281198978424e-05, 1.3172626495361328e-05, 1.4802441000938416e-05, 1.6432255506515503e-05, 1.806207001209259e-05, 1.9691884517669678e-05, 2.1321699023246765e-05, 2.2951513528823853e-05, 2.458132803440094e-05, 2.6211142539978027e-05, 2.7840957045555115e-05, 2.9470771551132202e-05, 3.110058605670929e-05, 3.273040056228638e-05, 3.4360215067863464e-05, 3.599002957344055e-05, 3.761984407901764e-05, 3.9249658584594727e-05, 4.0879473090171814e-05, 4.25092875957489e-05, 4.413910210132599e-05, 4.5768916606903076e-05, 4.7398731112480164e-05, 4.902854561805725e-05, 5.065836012363434e-05, 5.2288174629211426e-05, 5.391798913478851e-05, 5.55478036403656e-05, 5.717761814594269e-05, 5.8807432651519775e-05, 6.043724715709686e-05, 6.206706166267395e-05, 6.369687616825104e-05, 6.532669067382812e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 10.0, 7.0, 6.0, 9.0, 23.0, 21.0, 47.0, 62.0, 100.0, 217.0, 418.0, 912.0, 2286.0, 6827.0, 21248.0, 76110.0, 308673.0, 446816.0, 133229.0, 34806.0, 10742.0, 3526.0, 1245.0, 538.0, 272.0, 163.0, 84.0, 57.0, 30.0, 25.0, 13.0, 12.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283447265625, -0.27582740783691406, -0.2682075500488281, -0.2605876922607422, -0.25296783447265625, -0.2453479766845703, -0.23772811889648438, -0.23010826110839844, -0.2224884033203125, -0.21486854553222656, -0.20724868774414062, -0.1996288299560547, -0.19200897216796875, -0.1843891143798828, -0.17676925659179688, -0.16914939880371094, -0.161529541015625, -0.15390968322753906, -0.14628982543945312, -0.1386699676513672, -0.13105010986328125, -0.12343025207519531, -0.11581039428710938, -0.10819053649902344, -0.1005706787109375, -0.09295082092285156, -0.08533096313476562, -0.07771110534667969, -0.07009124755859375, -0.06247138977050781, -0.054851531982421875, -0.04723167419433594, -0.03961181640625, -0.03199195861816406, -0.024372100830078125, -0.016752243041992188, -0.00913238525390625, -0.0015125274658203125, 0.006107330322265625, 0.013727188110351562, 0.0213470458984375, 0.028966903686523438, 0.036586761474609375, 0.04420661926269531, 0.05182647705078125, 0.05944633483886719, 0.06706619262695312, 0.07468605041503906, 0.082305908203125, 0.08992576599121094, 0.09754562377929688, 0.10516548156738281, 0.11278533935546875, 0.12040519714355469, 0.12802505493164062, 0.13564491271972656, 0.1432647705078125, 0.15088462829589844, 0.15850448608398438, 0.1661243438720703, 0.17374420166015625, 0.1813640594482422, 0.18898391723632812, 0.19660377502441406, 0.2042236328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 10.0, 12.0, 13.0, 15.0, 18.0, 33.0, 38.0, 54.0, 77.0, 93.0, 91.0, 94.0, 85.0, 92.0, 68.0, 44.0, 36.0, 27.0, 28.0, 19.0, 17.0, 8.0, 3.0, 10.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173583984375, -0.16578292846679688, -0.15798187255859375, -0.15018081665039062, -0.1423797607421875, -0.13457870483398438, -0.12677764892578125, -0.11897659301757812, -0.111175537109375, -0.10337448120117188, -0.09557342529296875, -0.08777236938476562, -0.0799713134765625, -0.07217025756835938, -0.06436920166015625, -0.056568145751953125, -0.04876708984375, -0.040966033935546875, -0.03316497802734375, -0.025363922119140625, -0.0175628662109375, -0.009761810302734375, -0.00196075439453125, 0.005840301513671875, 0.013641357421875, 0.021442413330078125, 0.02924346923828125, 0.037044525146484375, 0.0448455810546875, 0.052646636962890625, 0.06044769287109375, 0.06824874877929688, 0.0760498046875, 0.08385086059570312, 0.09165191650390625, 0.09945297241210938, 0.1072540283203125, 0.11505508422851562, 0.12285614013671875, 0.13065719604492188, 0.138458251953125, 0.14625930786132812, 0.15406036376953125, 0.16186141967773438, 0.1696624755859375, 0.17746353149414062, 0.18526458740234375, 0.19306564331054688, 0.20086669921875, 0.20866775512695312, 0.21646881103515625, 0.22426986694335938, 0.2320709228515625, 0.23987197875976562, 0.24767303466796875, 0.2554740905761719, 0.263275146484375, 0.2710762023925781, 0.27887725830078125, 0.2866783142089844, 0.2944793701171875, 0.3022804260253906, 0.31008148193359375, 0.3178825378417969, 0.32568359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 17.0, 47.0, 108.0, 185.0, 223.0, 203.0, 105.0, 65.0, 26.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.389437198638916, -4.224103927612305, -4.058770656585693, -3.893437385559082, -3.7281041145324707, -3.5627708435058594, -3.397437334060669, -3.2321040630340576, -3.0667707920074463, -2.901437520980835, -2.7361042499542236, -2.5707709789276123, -2.405437469482422, -2.2401041984558105, -2.074770927429199, -1.909437656402588, -1.7441043853759766, -1.5787711143493652, -1.413437843322754, -1.248104453086853, -1.0827711820602417, -0.9174379110336304, -0.7521045804023743, -0.5867712497711182, -0.42143797874450684, -0.2561046779155731, -0.0907713770866394, 0.07456192374229431, 0.23989522457122803, 0.40522849559783936, 0.5705618262290955, 0.7358951568603516, 0.9012289047241211, 1.0665621757507324, 1.2318954467773438, 1.3972288370132446, 1.562562108039856, 1.7278953790664673, 1.8932287693023682, 2.0585620403289795, 2.223895311355591, 2.389228582382202, 2.5545618534088135, 2.719895124435425, 2.8852286338806152, 3.0505619049072266, 3.215895175933838, 3.381228446960449, 3.5465617179870605, 3.711894989013672, 3.877228260040283, 4.0425615310668945, 4.207894802093506, 4.373228073120117, 4.5385613441467285, 4.70389461517334, 4.869228363037109, 5.034561634063721, 5.199894905090332, 5.365228176116943, 5.530561447143555, 5.695894718170166, 5.861227989196777, 6.026561737060547, 6.19189453125]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 5.0, 8.0, 13.0, 18.0, 15.0, 25.0, 17.0, 26.0, 26.0, 32.0, 28.0, 24.0, 45.0, 34.0, 39.0, 49.0, 42.0, 32.0, 39.0, 47.0, 30.0, 36.0, 30.0, 44.0, 44.0, 26.0, 32.0, 34.0, 18.0, 25.0, 18.0, 12.0, 13.0, 11.0, 10.0, 12.0, 8.0, 8.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.109098196029663, -2.046830892562866, -1.9845635890960693, -1.9222962856292725, -1.860028862953186, -1.7977615594863892, -1.7354942560195923, -1.6732269525527954, -1.610959529876709, -1.548692226409912, -1.4864249229431152, -1.4241576194763184, -1.361890196800232, -1.299622893333435, -1.2373555898666382, -1.1750882863998413, -1.1128209829330444, -1.0505536794662476, -0.9882863163948059, -0.926019012928009, -0.8637516498565674, -0.8014843463897705, -0.7392170429229736, -0.6769497394561768, -0.6146823763847351, -0.5524150729179382, -0.4901477098464966, -0.4278804063796997, -0.36561307311058044, -0.3033457398414612, -0.2410784363746643, -0.17881110310554504, -0.11654376983642578, -0.054276444017887115, 0.00799088180065155, 0.07025820016860962, 0.13252553343772888, 0.19479286670684814, 0.257060170173645, 0.3193275034427643, 0.38159483671188354, 0.4438621699810028, 0.5061295032501221, 0.568396806716919, 0.6306641101837158, 0.6929314732551575, 0.7551987767219543, 0.817466139793396, 0.8797334432601929, 0.9420007467269897, 1.0042680501937866, 1.066535472869873, 1.12880277633667, 1.1910700798034668, 1.2533373832702637, 1.3156046867370605, 1.3778719902038574, 1.4401392936706543, 1.5024065971374512, 1.564673900604248, 1.6269413232803345, 1.6892086267471313, 1.7514759302139282, 1.813743233680725, 1.8760106563568115]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 15.0, 21.0, 37.0, 91.0, 161.0, 454.0, 1022.0, 3258.0, 10580.0, 42821.0, 250132.0, 3021699.0, 753663.0, 84168.0, 18823.0, 4976.0, 1447.0, 548.0, 213.0, 91.0, 45.0, 11.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9873046875, -0.9624404907226562, -0.9375762939453125, -0.9127120971679688, -0.887847900390625, -0.8629837036132812, -0.8381195068359375, -0.8132553100585938, -0.78839111328125, -0.7635269165039062, -0.7386627197265625, -0.7137985229492188, -0.688934326171875, -0.6640701293945312, -0.6392059326171875, -0.6143417358398438, -0.5894775390625, -0.5646133422851562, -0.5397491455078125, -0.5148849487304688, -0.490020751953125, -0.46515655517578125, -0.4402923583984375, -0.41542816162109375, -0.39056396484375, -0.36569976806640625, -0.3408355712890625, -0.31597137451171875, -0.291107177734375, -0.26624298095703125, -0.2413787841796875, -0.21651458740234375, -0.191650390625, -0.16678619384765625, -0.1419219970703125, -0.11705780029296875, -0.092193603515625, -0.06732940673828125, -0.0424652099609375, -0.01760101318359375, 0.00726318359375, 0.03212738037109375, 0.0569915771484375, 0.08185577392578125, 0.106719970703125, 0.13158416748046875, 0.1564483642578125, 0.18131256103515625, 0.2061767578125, 0.23104095458984375, 0.2559051513671875, 0.28076934814453125, 0.305633544921875, 0.33049774169921875, 0.3553619384765625, 0.38022613525390625, 0.40509033203125, 0.42995452880859375, 0.4548187255859375, 0.47968292236328125, 0.504547119140625, 0.5294113159179688, 0.5542755126953125, 0.5791397094726562, 0.60400390625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 2.0, 4.0, 15.0, 15.0, 13.0, 17.0, 28.0, 21.0, 42.0, 43.0, 61.0, 59.0, 67.0, 65.0, 52.0, 52.0, 52.0, 63.0, 41.0, 48.0, 48.0, 35.0, 31.0, 32.0, 23.0, 22.0, 15.0, 12.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3974609375, -0.3867645263671875, -0.376068115234375, -0.3653717041015625, -0.35467529296875, -0.3439788818359375, -0.333282470703125, -0.3225860595703125, -0.3118896484375, -0.3011932373046875, -0.290496826171875, -0.2798004150390625, -0.26910400390625, -0.2584075927734375, -0.247711181640625, -0.2370147705078125, -0.226318359375, -0.2156219482421875, -0.204925537109375, -0.1942291259765625, -0.18353271484375, -0.1728363037109375, -0.162139892578125, -0.1514434814453125, -0.1407470703125, -0.1300506591796875, -0.119354248046875, -0.1086578369140625, -0.09796142578125, -0.0872650146484375, -0.076568603515625, -0.0658721923828125, -0.05517578125, -0.0444793701171875, -0.033782958984375, -0.0230865478515625, -0.01239013671875, -0.0016937255859375, 0.009002685546875, 0.0196990966796875, 0.0303955078125, 0.0410919189453125, 0.051788330078125, 0.0624847412109375, 0.07318115234375, 0.0838775634765625, 0.094573974609375, 0.1052703857421875, 0.115966796875, 0.1266632080078125, 0.137359619140625, 0.1480560302734375, 0.15875244140625, 0.1694488525390625, 0.180145263671875, 0.1908416748046875, 0.2015380859375, 0.2122344970703125, 0.222930908203125, 0.2336273193359375, 0.24432373046875, 0.2550201416015625, 0.265716552734375, 0.2764129638671875, 0.287109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 11.0, 21.0, 21.0, 35.0, 59.0, 103.0, 170.0, 335.0, 583.0, 1071.0, 2203.0, 4728.0, 11800.0, 32527.0, 103835.0, 450732.0, 2699648.0, 684311.0, 135912.0, 40668.0, 14464.0, 5755.0, 2546.0, 1252.0, 661.0, 320.0, 200.0, 107.0, 66.0, 47.0, 31.0, 17.0, 19.0, 8.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5065536499023438, -0.4882049560546875, -0.46985626220703125, -0.451507568359375, -0.43315887451171875, -0.4148101806640625, -0.39646148681640625, -0.37811279296875, -0.35976409912109375, -0.3414154052734375, -0.32306671142578125, -0.304718017578125, -0.28636932373046875, -0.2680206298828125, -0.24967193603515625, -0.2313232421875, -0.21297454833984375, -0.1946258544921875, -0.17627716064453125, -0.157928466796875, -0.13957977294921875, -0.1212310791015625, -0.10288238525390625, -0.08453369140625, -0.06618499755859375, -0.0478363037109375, -0.02948760986328125, -0.011138916015625, 0.00720977783203125, 0.0255584716796875, 0.04390716552734375, 0.062255859375, 0.08060455322265625, 0.0989532470703125, 0.11730194091796875, 0.135650634765625, 0.15399932861328125, 0.1723480224609375, 0.19069671630859375, 0.20904541015625, 0.22739410400390625, 0.2457427978515625, 0.26409149169921875, 0.282440185546875, 0.30078887939453125, 0.3191375732421875, 0.33748626708984375, 0.3558349609375, 0.37418365478515625, 0.3925323486328125, 0.41088104248046875, 0.429229736328125, 0.44757843017578125, 0.4659271240234375, 0.48427581787109375, 0.50262451171875, 0.5209732055664062, 0.5393218994140625, 0.5576705932617188, 0.576019287109375, 0.5943679809570312, 0.6127166748046875, 0.6310653686523438, 0.6494140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 7.0, 15.0, 10.0, 11.0, 23.0, 21.0, 36.0, 36.0, 56.0, 78.0, 113.0, 168.0, 267.0, 423.0, 693.0, 740.0, 491.0, 305.0, 146.0, 103.0, 80.0, 67.0, 47.0, 34.0, 26.0, 15.0, 15.0, 10.0, 7.0, 4.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6167068481445312, -0.5986480712890625, -0.5805892944335938, -0.562530517578125, -0.5444717407226562, -0.5264129638671875, -0.5083541870117188, -0.49029541015625, -0.47223663330078125, -0.4541778564453125, -0.43611907958984375, -0.418060302734375, -0.40000152587890625, -0.3819427490234375, -0.36388397216796875, -0.3458251953125, -0.32776641845703125, -0.3097076416015625, -0.29164886474609375, -0.273590087890625, -0.25553131103515625, -0.2374725341796875, -0.21941375732421875, -0.20135498046875, -0.18329620361328125, -0.1652374267578125, -0.14717864990234375, -0.129119873046875, -0.11106109619140625, -0.0930023193359375, -0.07494354248046875, -0.056884765625, -0.03882598876953125, -0.0207672119140625, -0.00270843505859375, 0.015350341796875, 0.03340911865234375, 0.0514678955078125, 0.06952667236328125, 0.08758544921875, 0.10564422607421875, 0.1237030029296875, 0.14176177978515625, 0.159820556640625, 0.17787933349609375, 0.1959381103515625, 0.21399688720703125, 0.2320556640625, 0.25011444091796875, 0.2681732177734375, 0.28623199462890625, 0.304290771484375, 0.32234954833984375, 0.3404083251953125, 0.35846710205078125, 0.37652587890625, 0.39458465576171875, 0.4126434326171875, 0.43070220947265625, 0.448760986328125, 0.46681976318359375, 0.4848785400390625, 0.5029373168945312, 0.52099609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 4.0, 6.0, 15.0, 22.0, 26.0, 54.0, 72.0, 124.0, 126.0, 138.0, 111.0, 91.0, 71.0, 59.0, 36.0, 23.0, 13.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.570553779602051, -4.458034992218018, -4.345516681671143, -4.232997894287109, -4.120479583740234, -4.007960796356201, -3.895442008972168, -3.782923460006714, -3.6704049110412598, -3.5578863620758057, -3.4453678131103516, -3.3328490257263184, -3.2203304767608643, -3.10781192779541, -2.995293140411377, -2.882774591445923, -2.7702560424804688, -2.6577374935150146, -2.5452189445495605, -2.4327001571655273, -2.3201816082000732, -2.207663059234619, -2.095144271850586, -1.9826257228851318, -1.8701071739196777, -1.7575886249542236, -1.64506995677948, -1.5325512886047363, -1.4200327396392822, -1.3075141906738281, -1.1949955224990845, -1.0824768543243408, -0.9699583053588867, -0.8574396967887878, -0.744921088218689, -0.6324024796485901, -0.5198838710784912, -0.40736526250839233, -0.29484665393829346, -0.18232804536819458, -0.0698094367980957, 0.042709171772003174, 0.15522778034210205, 0.2677463889122009, 0.3802649974822998, 0.4927836060523987, 0.6053022146224976, 0.7178208231925964, 0.8303394317626953, 0.9428580403327942, 1.055376648902893, 1.1678953170776367, 1.2804138660430908, 1.392932415008545, 1.5054510831832886, 1.6179697513580322, 1.7304883003234863, 1.8430068492889404, 1.955525517463684, 2.0680441856384277, 2.180562734603882, 2.293081283569336, 2.405600070953369, 2.5181186199188232, 2.6306371688842773]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 8.0, 5.0, 2.0, 13.0, 10.0, 16.0, 11.0, 19.0, 27.0, 21.0, 27.0, 23.0, 34.0, 28.0, 32.0, 42.0, 42.0, 38.0, 45.0, 26.0, 52.0, 41.0, 42.0, 34.0, 52.0, 25.0, 38.0, 39.0, 37.0, 26.0, 28.0, 16.0, 12.0, 19.0, 11.0, 15.0, 9.0, 3.0, 7.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.8439691066741943, -1.784392237663269, -1.7248153686523438, -1.665238380432129, -1.6056615114212036, -1.5460846424102783, -1.486507773399353, -1.4269309043884277, -1.367353916168213, -1.3077770471572876, -1.2482001781463623, -1.1886231899261475, -1.1290463209152222, -1.0694694519042969, -1.0098925828933716, -0.9503156542778015, -0.8907387852668762, -0.8311619162559509, -0.7715849876403809, -0.7120081186294556, -0.6524311900138855, -0.5928543210029602, -0.5332773923873901, -0.47370052337646484, -0.41412362456321716, -0.3545467257499695, -0.2949698269367218, -0.23539294302463531, -0.17581604421138763, -0.11623916029930115, -0.05666226148605347, 0.002914637327194214, 0.062491536140441895, 0.12206843495368958, 0.18164533376693726, 0.24122221767902374, 0.3007991313934326, 0.3603760004043579, 0.4199528992176056, 0.47952979803085327, 0.5391067266464233, 0.5986835956573486, 0.6582605242729187, 0.717837393283844, 0.7774143218994141, 0.8369911909103394, 0.8965680599212646, 0.9561449885368347, 1.0157217979431152, 1.0752986669540405, 1.1348755359649658, 1.1944525241851807, 1.254029393196106, 1.3136062622070312, 1.3731831312179565, 1.4327600002288818, 1.4923369884490967, 1.551913857460022, 1.6114907264709473, 1.671067714691162, 1.7306445837020874, 1.7902214527130127, 1.849798321723938, 1.9093751907348633, 1.9689521789550781]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 12.0, 20.0, 31.0, 44.0, 57.0, 81.0, 158.0, 228.0, 329.0, 487.0, 714.0, 1123.0, 1667.0, 2582.0, 4024.0, 6107.0, 9576.0, 15650.0, 26117.0, 49400.0, 110924.0, 263950.0, 291830.0, 131423.0, 56544.0, 28837.0, 16916.0, 10496.0, 6631.0, 4366.0, 2856.0, 1782.0, 1195.0, 797.0, 561.0, 380.0, 217.0, 141.0, 95.0, 72.0, 32.0, 33.0, 14.0, 13.0, 9.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.407470703125, -0.3951568603515625, -0.382843017578125, -0.3705291748046875, -0.35821533203125, -0.3459014892578125, -0.333587646484375, -0.3212738037109375, -0.3089599609375, -0.2966461181640625, -0.284332275390625, -0.2720184326171875, -0.25970458984375, -0.2473907470703125, -0.235076904296875, -0.2227630615234375, -0.21044921875, -0.1981353759765625, -0.185821533203125, -0.1735076904296875, -0.16119384765625, -0.1488800048828125, -0.136566162109375, -0.1242523193359375, -0.1119384765625, -0.0996246337890625, -0.087310791015625, -0.0749969482421875, -0.06268310546875, -0.0503692626953125, -0.038055419921875, -0.0257415771484375, -0.013427734375, -0.0011138916015625, 0.011199951171875, 0.0235137939453125, 0.03582763671875, 0.0481414794921875, 0.060455322265625, 0.0727691650390625, 0.0850830078125, 0.0973968505859375, 0.109710693359375, 0.1220245361328125, 0.13433837890625, 0.1466522216796875, 0.158966064453125, 0.1712799072265625, 0.18359375, 0.1959075927734375, 0.208221435546875, 0.2205352783203125, 0.23284912109375, 0.2451629638671875, 0.257476806640625, 0.2697906494140625, 0.2821044921875, 0.2944183349609375, 0.306732177734375, 0.3190460205078125, 0.33135986328125, 0.3436737060546875, 0.355987548828125, 0.3683013916015625, 0.380615234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 11.0, 11.0, 13.0, 28.0, 30.0, 31.0, 47.0, 71.0, 52.0, 57.0, 57.0, 69.0, 65.0, 77.0, 61.0, 64.0, 44.0, 60.0, 44.0, 27.0, 18.0, 15.0, 14.0, 12.0, 12.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414794921875, -0.4036674499511719, -0.39253997802734375, -0.3814125061035156, -0.3702850341796875, -0.3591575622558594, -0.34803009033203125, -0.3369026184082031, -0.325775146484375, -0.3146476745605469, -0.30352020263671875, -0.2923927307128906, -0.2812652587890625, -0.2701377868652344, -0.25901031494140625, -0.24788284301757812, -0.23675537109375, -0.22562789916992188, -0.21450042724609375, -0.20337295532226562, -0.1922454833984375, -0.18111801147460938, -0.16999053955078125, -0.15886306762695312, -0.147735595703125, -0.13660812377929688, -0.12548065185546875, -0.11435317993164062, -0.1032257080078125, -0.09209823608398438, -0.08097076416015625, -0.06984329223632812, -0.0587158203125, -0.047588348388671875, -0.03646087646484375, -0.025333404541015625, -0.0142059326171875, -0.003078460693359375, 0.00804901123046875, 0.019176483154296875, 0.030303955078125, 0.041431427001953125, 0.05255889892578125, 0.06368637084960938, 0.0748138427734375, 0.08594131469726562, 0.09706878662109375, 0.10819625854492188, 0.11932373046875, 0.13045120239257812, 0.14157867431640625, 0.15270614624023438, 0.1638336181640625, 0.17496109008789062, 0.18608856201171875, 0.19721603393554688, 0.208343505859375, 0.21947097778320312, 0.23059844970703125, 0.24172592163085938, 0.2528533935546875, 0.2639808654785156, 0.27510833740234375, 0.2862358093261719, 0.29736328125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 15.0, 17.0, 36.0, 38.0, 68.0, 158.0, 291.0, 776.0, 2653.0, 12296.0, 74361.0, 738106.0, 189563.0, 23365.0, 4687.0, 1249.0, 409.0, 193.0, 102.0, 61.0, 35.0, 22.0, 13.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248046875, -0.882171630859375, -0.83953857421875, -0.796905517578125, -0.7542724609375, -0.711639404296875, -0.66900634765625, -0.626373291015625, -0.583740234375, -0.541107177734375, -0.49847412109375, -0.455841064453125, -0.4132080078125, -0.370574951171875, -0.32794189453125, -0.285308837890625, -0.24267578125, -0.200042724609375, -0.15740966796875, -0.114776611328125, -0.0721435546875, -0.029510498046875, 0.01312255859375, 0.055755615234375, 0.098388671875, 0.141021728515625, 0.18365478515625, 0.226287841796875, 0.2689208984375, 0.311553955078125, 0.35418701171875, 0.396820068359375, 0.439453125, 0.482086181640625, 0.52471923828125, 0.567352294921875, 0.6099853515625, 0.652618408203125, 0.69525146484375, 0.737884521484375, 0.780517578125, 0.823150634765625, 0.86578369140625, 0.908416748046875, 0.9510498046875, 0.993682861328125, 1.03631591796875, 1.078948974609375, 1.12158203125, 1.164215087890625, 1.20684814453125, 1.249481201171875, 1.2921142578125, 1.334747314453125, 1.37738037109375, 1.420013427734375, 1.462646484375, 1.505279541015625, 1.54791259765625, 1.590545654296875, 1.6331787109375, 1.675811767578125, 1.71844482421875, 1.761077880859375, 1.8037109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 12.0, 6.0, 5.0, 9.0, 12.0, 13.0, 22.0, 28.0, 26.0, 39.0, 24.0, 39.0, 34.0, 43.0, 35.0, 43.0, 48.0, 46.0, 49.0, 40.0, 45.0, 36.0, 41.0, 38.0, 38.0, 36.0, 29.0, 25.0, 25.0, 13.0, 21.0, 12.0, 5.0, 13.0, 7.0, 12.0, 6.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62646484375, -0.60479736328125, -0.5831298828125, -0.56146240234375, -0.539794921875, -0.51812744140625, -0.4964599609375, -0.47479248046875, -0.453125, -0.43145751953125, -0.4097900390625, -0.38812255859375, -0.366455078125, -0.34478759765625, -0.3231201171875, -0.30145263671875, -0.27978515625, -0.25811767578125, -0.2364501953125, -0.21478271484375, -0.193115234375, -0.17144775390625, -0.1497802734375, -0.12811279296875, -0.1064453125, -0.08477783203125, -0.0631103515625, -0.04144287109375, -0.019775390625, 0.00189208984375, 0.0235595703125, 0.04522705078125, 0.06689453125, 0.08856201171875, 0.1102294921875, 0.13189697265625, 0.153564453125, 0.17523193359375, 0.1968994140625, 0.21856689453125, 0.240234375, 0.26190185546875, 0.2835693359375, 0.30523681640625, 0.326904296875, 0.34857177734375, 0.3702392578125, 0.39190673828125, 0.41357421875, 0.43524169921875, 0.4569091796875, 0.47857666015625, 0.500244140625, 0.52191162109375, 0.5435791015625, 0.56524658203125, 0.5869140625, 0.60858154296875, 0.6302490234375, 0.65191650390625, 0.673583984375, 0.69525146484375, 0.7169189453125, 0.73858642578125, 0.76025390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 1.0, 9.0, 3.0, 10.0, 9.0, 20.0, 20.0, 28.0, 61.0, 74.0, 118.0, 185.0, 289.0, 499.0, 832.0, 1398.0, 2523.0, 4849.0, 9364.0, 19872.0, 45470.0, 127085.0, 448363.0, 257001.0, 72385.0, 29526.0, 13555.0, 6850.0, 3541.0, 1903.0, 1093.0, 604.0, 361.0, 210.0, 153.0, 99.0, 42.0, 45.0, 37.0, 28.0, 13.0, 7.0, 5.0, 6.0, 1.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.226318359375, -0.2191905975341797, -0.21206283569335938, -0.20493507385253906, -0.19780731201171875, -0.19067955017089844, -0.18355178833007812, -0.1764240264892578, -0.1692962646484375, -0.1621685028076172, -0.15504074096679688, -0.14791297912597656, -0.14078521728515625, -0.13365745544433594, -0.12652969360351562, -0.11940193176269531, -0.112274169921875, -0.10514640808105469, -0.09801864624023438, -0.09089088439941406, -0.08376312255859375, -0.07663536071777344, -0.06950759887695312, -0.06237983703613281, -0.0552520751953125, -0.04812431335449219, -0.040996551513671875, -0.03386878967285156, -0.02674102783203125, -0.019613265991210938, -0.012485504150390625, -0.0053577423095703125, 0.00177001953125, 0.008897781372070312, 0.016025543212890625, 0.023153305053710938, 0.03028106689453125, 0.03740882873535156, 0.044536590576171875, 0.05166435241699219, 0.0587921142578125, 0.06591987609863281, 0.07304763793945312, 0.08017539978027344, 0.08730316162109375, 0.09443092346191406, 0.10155868530273438, 0.10868644714355469, 0.115814208984375, 0.12294197082519531, 0.13006973266601562, 0.13719749450683594, 0.14432525634765625, 0.15145301818847656, 0.15858078002929688, 0.1657085418701172, 0.1728363037109375, 0.1799640655517578, 0.18709182739257812, 0.19421958923339844, 0.20134735107421875, 0.20847511291503906, 0.21560287475585938, 0.2227306365966797, 0.2298583984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 4.0, 5.0, 4.0, 8.0, 5.0, 6.0, 13.0, 18.0, 25.0, 34.0, 60.0, 152.0, 208.0, 149.0, 86.0, 44.0, 39.0, 31.0, 19.0, 17.0, 11.0, 10.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.249282836914062e-05, -7.997825741767883e-05, -7.746368646621704e-05, -7.494911551475525e-05, -7.243454456329346e-05, -6.991997361183167e-05, -6.740540266036987e-05, -6.489083170890808e-05, -6.237626075744629e-05, -5.98616898059845e-05, -5.7347118854522705e-05, -5.483254790306091e-05, -5.231797695159912e-05, -4.980340600013733e-05, -4.728883504867554e-05, -4.4774264097213745e-05, -4.225969314575195e-05, -3.974512219429016e-05, -3.723055124282837e-05, -3.471598029136658e-05, -3.2201409339904785e-05, -2.9686838388442993e-05, -2.71722674369812e-05, -2.465769648551941e-05, -2.2143125534057617e-05, -1.9628554582595825e-05, -1.7113983631134033e-05, -1.4599412679672241e-05, -1.208484172821045e-05, -9.570270776748657e-06, -7.055699825286865e-06, -4.541128873825073e-06, -2.0265579223632812e-06, 4.880130290985107e-07, 3.0025839805603027e-06, 5.517154932022095e-06, 8.031725883483887e-06, 1.0546296834945679e-05, 1.306086778640747e-05, 1.5575438737869263e-05, 1.8090009689331055e-05, 2.0604580640792847e-05, 2.311915159225464e-05, 2.563372254371643e-05, 2.8148293495178223e-05, 3.0662864446640015e-05, 3.317743539810181e-05, 3.56920063495636e-05, 3.820657730102539e-05, 4.072114825248718e-05, 4.3235719203948975e-05, 4.5750290155410767e-05, 4.826486110687256e-05, 5.077943205833435e-05, 5.329400300979614e-05, 5.5808573961257935e-05, 5.8323144912719727e-05, 6.083771586418152e-05, 6.335228681564331e-05, 6.58668577671051e-05, 6.83814287185669e-05, 7.089599967002869e-05, 7.341057062149048e-05, 7.592514157295227e-05, 7.843971252441406e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 9.0, 10.0, 6.0, 6.0, 9.0, 14.0, 13.0, 10.0, 27.0, 21.0, 58.0, 74.0, 91.0, 146.0, 208.0, 349.0, 646.0, 1298.0, 2865.0, 6994.0, 18081.0, 52090.0, 174870.0, 486607.0, 209080.0, 59851.0, 20739.0, 7926.0, 3176.0, 1468.0, 714.0, 371.0, 218.0, 147.0, 102.0, 63.0, 44.0, 43.0, 26.0, 16.0, 14.0, 15.0, 6.0, 3.0, 9.0, 6.0, 10.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.26416015625, -0.2565174102783203, -0.24887466430664062, -0.24123191833496094, -0.23358917236328125, -0.22594642639160156, -0.21830368041992188, -0.2106609344482422, -0.2030181884765625, -0.1953754425048828, -0.18773269653320312, -0.18008995056152344, -0.17244720458984375, -0.16480445861816406, -0.15716171264648438, -0.1495189666748047, -0.141876220703125, -0.1342334747314453, -0.12659072875976562, -0.11894798278808594, -0.11130523681640625, -0.10366249084472656, -0.09601974487304688, -0.08837699890136719, -0.0807342529296875, -0.07309150695800781, -0.06544876098632812, -0.05780601501464844, -0.05016326904296875, -0.04252052307128906, -0.034877777099609375, -0.027235031127929688, -0.01959228515625, -0.011949539184570312, -0.004306793212890625, 0.0033359527587890625, 0.01097869873046875, 0.018621444702148438, 0.026264190673828125, 0.03390693664550781, 0.0415496826171875, 0.04919242858886719, 0.056835174560546875, 0.06447792053222656, 0.07212066650390625, 0.07976341247558594, 0.08740615844726562, 0.09504890441894531, 0.102691650390625, 0.11033439636230469, 0.11797714233398438, 0.12561988830566406, 0.13326263427734375, 0.14090538024902344, 0.14854812622070312, 0.1561908721923828, 0.1638336181640625, 0.1714763641357422, 0.17911911010742188, 0.18676185607910156, 0.19440460205078125, 0.20204734802246094, 0.20969009399414062, 0.2173328399658203, 0.2249755859375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 7.0, 2.0, 8.0, 7.0, 12.0, 15.0, 16.0, 26.0, 28.0, 29.0, 50.0, 47.0, 75.0, 67.0, 94.0, 98.0, 77.0, 60.0, 50.0, 48.0, 31.0, 21.0, 17.0, 19.0, 11.0, 21.0, 13.0, 6.0, 6.0, 7.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20849609375, -0.2022228240966797, -0.19594955444335938, -0.18967628479003906, -0.18340301513671875, -0.17712974548339844, -0.17085647583007812, -0.1645832061767578, -0.1583099365234375, -0.1520366668701172, -0.14576339721679688, -0.13949012756347656, -0.13321685791015625, -0.12694358825683594, -0.12067031860351562, -0.11439704895019531, -0.108123779296875, -0.10185050964355469, -0.09557723999023438, -0.08930397033691406, -0.08303070068359375, -0.07675743103027344, -0.07048416137695312, -0.06421089172363281, -0.0579376220703125, -0.05166435241699219, -0.045391082763671875, -0.03911781311035156, -0.03284454345703125, -0.026571273803710938, -0.020298004150390625, -0.014024734497070312, -0.00775146484375, -0.0014781951904296875, 0.004795074462890625, 0.011068344116210938, 0.01734161376953125, 0.023614883422851562, 0.029888153076171875, 0.03616142272949219, 0.0424346923828125, 0.04870796203613281, 0.054981231689453125, 0.06125450134277344, 0.06752777099609375, 0.07380104064941406, 0.08007431030273438, 0.08634757995605469, 0.092620849609375, 0.09889411926269531, 0.10516738891601562, 0.11144065856933594, 0.11771392822265625, 0.12398719787597656, 0.13026046752929688, 0.1365337371826172, 0.1428070068359375, 0.1490802764892578, 0.15535354614257812, 0.16162681579589844, 0.16790008544921875, 0.17417335510253906, 0.18044662475585938, 0.1867198944091797, 0.1929931640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 8.0, 16.0, 36.0, 110.0, 185.0, 279.0, 201.0, 95.0, 39.0, 18.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.517734050750732, -7.321969509124756, -7.126204967498779, -6.930440902709961, -6.734676361083984, -6.538911819458008, -6.343147277832031, -6.147382736206055, -5.951618194580078, -5.755853652954102, -5.560089111328125, -5.364324569702148, -5.16856050491333, -4.9727959632873535, -4.777031421661377, -4.5812668800354, -4.385502815246582, -4.1897382736206055, -3.993973970413208, -3.7982094287872314, -3.602445125579834, -3.4066805839538574, -3.210916042327881, -3.0151515007019043, -2.819387197494507, -2.6236226558685303, -2.427858352661133, -2.2320938110351562, -2.0363292694091797, -1.8405649662017822, -1.6448004245758057, -1.4490360021591187, -1.2532711029052734, -1.0575066804885864, -0.8617421984672546, -0.6659777164459229, -0.47021329402923584, -0.27444887161254883, -0.07868432998657227, 0.11708009243011475, 0.31284451484680176, 0.5086089372634888, 0.7043734192848206, 0.9001379013061523, 1.0959023237228394, 1.2916667461395264, 1.487431287765503, 1.68319571018219, 1.878960132598877, 2.0747246742248535, 2.270488977432251, 2.4662535190582275, 2.662017822265625, 2.8577823638916016, 3.053546905517578, 3.2493114471435547, 3.445075750350952, 3.6408402919769287, 3.836604595184326, 4.032369136810303, 4.228133678436279, 4.423897743225098, 4.619662284851074, 4.815426826477051, 5.011191368103027]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 4.0, 13.0, 11.0, 16.0, 18.0, 14.0, 23.0, 20.0, 28.0, 30.0, 24.0, 27.0, 25.0, 36.0, 37.0, 36.0, 40.0, 43.0, 42.0, 41.0, 37.0, 31.0, 38.0, 36.0, 39.0, 27.0, 30.0, 25.0, 18.0, 14.0, 29.0, 24.0, 20.0, 14.0, 16.0, 10.0, 11.0, 6.0, 10.0, 3.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.614044427871704, -1.5635217428207397, -1.512999176979065, -1.4624764919281006, -1.4119539260864258, -1.3614312410354614, -1.310908555984497, -1.2603859901428223, -1.2098634243011475, -1.159340739250183, -1.1088181734085083, -1.058295488357544, -1.0077729225158691, -0.9572502374649048, -0.9067276120185852, -0.8562049865722656, -0.8056823015213013, -0.7551596760749817, -0.7046370506286621, -0.6541143655776978, -0.603591799736023, -0.5530691146850586, -0.502546489238739, -0.45202386379241943, -0.40150123834609985, -0.3509786128997803, -0.3004559874534607, -0.24993333220481873, -0.19941070675849915, -0.14888808131217957, -0.0983654260635376, -0.04784280061721802, 0.0026798248291015625, 0.05320245772600174, 0.10372509062290192, 0.1542477309703827, 0.20477035641670227, 0.25529298186302185, 0.3058156371116638, 0.3563382625579834, 0.406860888004303, 0.45738351345062256, 0.5079061388969421, 0.5584287643432617, 0.6089514493942261, 0.6594740152359009, 0.7099967002868652, 0.7605193257331848, 0.8110419511795044, 0.861564576625824, 0.9120872020721436, 0.9626098871231079, 1.0131324529647827, 1.063655138015747, 1.1141777038574219, 1.1647003889083862, 1.2152230739593506, 1.265745759010315, 1.3162683248519897, 1.366791009902954, 1.417313575744629, 1.4678362607955933, 1.5183589458465576, 1.5688815116882324, 1.6194040775299072]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 13.0, 11.0, 14.0, 23.0, 25.0, 41.0, 68.0, 122.0, 152.0, 249.0, 366.0, 574.0, 911.0, 1405.0, 2292.0, 3516.0, 6054.0, 10431.0, 19425.0, 38152.0, 79626.0, 192532.0, 596670.0, 1628814.0, 1049493.0, 325847.0, 122129.0, 54598.0, 27174.0, 14049.0, 7808.0, 4417.0, 2700.0, 1646.0, 1084.0, 621.0, 408.0, 255.0, 195.0, 115.0, 82.0, 52.0, 50.0, 25.0, 19.0, 12.0, 3.0, 6.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.26151275634765625, -0.2530059814453125, -0.24449920654296875, -0.235992431640625, -0.22748565673828125, -0.2189788818359375, -0.21047210693359375, -0.20196533203125, -0.19345855712890625, -0.1849517822265625, -0.17644500732421875, -0.167938232421875, -0.15943145751953125, -0.1509246826171875, -0.14241790771484375, -0.1339111328125, -0.12540435791015625, -0.1168975830078125, -0.10839080810546875, -0.099884033203125, -0.09137725830078125, -0.0828704833984375, -0.07436370849609375, -0.06585693359375, -0.05735015869140625, -0.0488433837890625, -0.04033660888671875, -0.031829833984375, -0.02332305908203125, -0.0148162841796875, -0.00630950927734375, 0.002197265625, 0.01070404052734375, 0.0192108154296875, 0.02771759033203125, 0.036224365234375, 0.04473114013671875, 0.0532379150390625, 0.06174468994140625, 0.07025146484375, 0.07875823974609375, 0.0872650146484375, 0.09577178955078125, 0.104278564453125, 0.11278533935546875, 0.1212921142578125, 0.12979888916015625, 0.1383056640625, 0.14681243896484375, 0.1553192138671875, 0.16382598876953125, 0.172332763671875, 0.18083953857421875, 0.1893463134765625, 0.19785308837890625, 0.20635986328125, 0.21486663818359375, 0.2233734130859375, 0.23188018798828125, 0.240386962890625, 0.24889373779296875, 0.2574005126953125, 0.26590728759765625, 0.2744140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 11.0, 19.0, 19.0, 23.0, 38.0, 43.0, 56.0, 58.0, 60.0, 68.0, 83.0, 66.0, 63.0, 79.0, 54.0, 53.0, 50.0, 36.0, 38.0, 25.0, 13.0, 9.0, 12.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4162178039550781, -0.40494537353515625, -0.3936729431152344, -0.3824005126953125, -0.3711280822753906, -0.35985565185546875, -0.3485832214355469, -0.337310791015625, -0.3260383605957031, -0.31476593017578125, -0.3034934997558594, -0.2922210693359375, -0.2809486389160156, -0.26967620849609375, -0.2584037780761719, -0.24713134765625, -0.23585891723632812, -0.22458648681640625, -0.21331405639648438, -0.2020416259765625, -0.19076919555664062, -0.17949676513671875, -0.16822433471679688, -0.156951904296875, -0.14567947387695312, -0.13440704345703125, -0.12313461303710938, -0.1118621826171875, -0.10058975219726562, -0.08931732177734375, -0.07804489135742188, -0.0667724609375, -0.055500030517578125, -0.04422760009765625, -0.032955169677734375, -0.0216827392578125, -0.010410308837890625, 0.00086212158203125, 0.012134552001953125, 0.023406982421875, 0.034679412841796875, 0.04595184326171875, 0.057224273681640625, 0.0684967041015625, 0.07976913452148438, 0.09104156494140625, 0.10231399536132812, 0.11358642578125, 0.12485885620117188, 0.13613128662109375, 0.14740371704101562, 0.1586761474609375, 0.16994857788085938, 0.18122100830078125, 0.19249343872070312, 0.203765869140625, 0.21503829956054688, 0.22631072998046875, 0.23758316040039062, 0.2488555908203125, 0.2601280212402344, 0.27140045166015625, 0.2826728820800781, 0.2939453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 6.0, 3.0, 14.0, 19.0, 26.0, 33.0, 40.0, 76.0, 111.0, 143.0, 322.0, 599.0, 1151.0, 2534.0, 6160.0, 18007.0, 60068.0, 242993.0, 1759414.0, 1767695.0, 244290.0, 60956.0, 17891.0, 6379.0, 2645.0, 1233.0, 622.0, 333.0, 198.0, 115.0, 64.0, 50.0, 32.0, 25.0, 12.0, 9.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.697265625, -0.6784210205078125, -0.659576416015625, -0.6407318115234375, -0.62188720703125, -0.6030426025390625, -0.584197998046875, -0.5653533935546875, -0.5465087890625, -0.5276641845703125, -0.508819580078125, -0.4899749755859375, -0.47113037109375, -0.4522857666015625, -0.433441162109375, -0.4145965576171875, -0.395751953125, -0.3769073486328125, -0.358062744140625, -0.3392181396484375, -0.32037353515625, -0.3015289306640625, -0.282684326171875, -0.2638397216796875, -0.2449951171875, -0.2261505126953125, -0.207305908203125, -0.1884613037109375, -0.16961669921875, -0.1507720947265625, -0.131927490234375, -0.1130828857421875, -0.09423828125, -0.0753936767578125, -0.056549072265625, -0.0377044677734375, -0.01885986328125, -1.52587890625e-05, 0.018829345703125, 0.0376739501953125, 0.0565185546875, 0.0753631591796875, 0.094207763671875, 0.1130523681640625, 0.13189697265625, 0.1507415771484375, 0.169586181640625, 0.1884307861328125, 0.207275390625, 0.2261199951171875, 0.244964599609375, 0.2638092041015625, 0.28265380859375, 0.3014984130859375, 0.320343017578125, 0.3391876220703125, 0.3580322265625, 0.3768768310546875, 0.395721435546875, 0.4145660400390625, 0.43341064453125, 0.4522552490234375, 0.471099853515625, 0.4899444580078125, 0.5087890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 8.0, 14.0, 11.0, 28.0, 42.0, 45.0, 44.0, 77.0, 91.0, 144.0, 195.0, 288.0, 452.0, 621.0, 614.0, 421.0, 247.0, 159.0, 123.0, 101.0, 78.0, 66.0, 42.0, 28.0, 23.0, 26.0, 20.0, 10.0, 9.0, 7.0, 7.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.59423828125, -0.5781364440917969, -0.5620346069335938, -0.5459327697753906, -0.5298309326171875, -0.5137290954589844, -0.49762725830078125, -0.4815254211425781, -0.465423583984375, -0.4493217468261719, -0.43321990966796875, -0.4171180725097656, -0.4010162353515625, -0.3849143981933594, -0.36881256103515625, -0.3527107238769531, -0.33660888671875, -0.3205070495605469, -0.30440521240234375, -0.2883033752441406, -0.2722015380859375, -0.2560997009277344, -0.23999786376953125, -0.22389602661132812, -0.207794189453125, -0.19169235229492188, -0.17559051513671875, -0.15948867797851562, -0.1433868408203125, -0.12728500366210938, -0.11118316650390625, -0.09508132934570312, -0.0789794921875, -0.06287765502929688, -0.04677581787109375, -0.030673980712890625, -0.0145721435546875, 0.001529693603515625, 0.01763153076171875, 0.033733367919921875, 0.049835205078125, 0.06593704223632812, 0.08203887939453125, 0.09814071655273438, 0.1142425537109375, 0.13034439086914062, 0.14644622802734375, 0.16254806518554688, 0.17864990234375, 0.19475173950195312, 0.21085357666015625, 0.22695541381835938, 0.2430572509765625, 0.2591590881347656, 0.27526092529296875, 0.2913627624511719, 0.307464599609375, 0.3235664367675781, 0.33966827392578125, 0.3557701110839844, 0.3718719482421875, 0.3879737854003906, 0.40407562255859375, 0.4201774597167969, 0.436279296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 26.0, 48.0, 79.0, 158.0, 181.0, 193.0, 133.0, 83.0, 49.0, 18.0, 6.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4010376930236816, -3.23771071434021, -3.0743837356567383, -2.9110567569732666, -2.747729778289795, -2.584402561187744, -2.4210755825042725, -2.257748603820801, -2.094421625137329, -1.9310946464538574, -1.7677676677703857, -1.6044405698776245, -1.4411135911941528, -1.2777866125106812, -1.11445951461792, -0.9511325359344482, -0.7878055572509766, -0.6244785785675049, -0.4611515402793884, -0.29782453179359436, -0.1344975233078003, 0.028829455375671387, 0.19215649366378784, 0.3554835319519043, 0.518810510635376, 0.6821374893188477, 0.8454645276069641, 1.0087915658950806, 1.1721185445785522, 1.335445523262024, 1.4987726211547852, 1.6620995998382568, 1.8254270553588867, 1.9887540340423584, 2.15208101272583, 2.3154079914093018, 2.4787349700927734, 2.642062187194824, 2.805389165878296, 2.9687161445617676, 3.1320431232452393, 3.295370101928711, 3.4586970806121826, 3.6220240592956543, 3.785351276397705, 3.9486780166625977, 4.112005233764648, 4.275332450866699, 4.438659191131592, 4.601986408233643, 4.765313148498535, 4.928640365600586, 5.0919671058654785, 5.255294322967529, 5.418621063232422, 5.581948280334473, 5.745275497436523, 5.908602714538574, 6.071929454803467, 6.235256671905518, 6.39858341217041, 6.561910629272461, 6.7252373695373535, 6.888564586639404, 7.051891326904297]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 11.0, 15.0, 16.0, 15.0, 19.0, 17.0, 24.0, 25.0, 30.0, 26.0, 36.0, 35.0, 37.0, 39.0, 38.0, 37.0, 45.0, 38.0, 45.0, 35.0, 35.0, 39.0, 46.0, 32.0, 25.0, 41.0, 34.0, 27.0, 26.0, 14.0, 13.0, 17.0, 12.0, 7.0, 5.0, 7.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9155385494232178, -1.8578332662582397, -1.8001279830932617, -1.7424226999282837, -1.6847174167633057, -1.6270122528076172, -1.5693069696426392, -1.5116016864776611, -1.453896403312683, -1.396191120147705, -1.338485836982727, -1.280780553817749, -1.2230753898620605, -1.165369987487793, -1.1076648235321045, -1.0499595403671265, -0.9922542572021484, -0.9345489740371704, -0.8768436908721924, -0.8191384673118591, -0.7614331841468811, -0.7037279009819031, -0.6460226774215698, -0.5883173942565918, -0.5306121110916138, -0.47290682792663574, -0.4152015745639801, -0.35749632120132446, -0.29979103803634644, -0.2420857548713684, -0.18438050150871277, -0.12667524814605713, -0.06896984577178955, -0.011264577507972717, 0.046440690755844116, 0.10414595901966095, 0.16185122728347778, 0.2195565104484558, 0.27726176381111145, 0.3349670171737671, 0.3926723003387451, 0.45037758350372314, 0.5080828666687012, 0.5657880902290344, 0.6234933733940125, 0.6811986565589905, 0.7389038801193237, 0.7966091632843018, 0.8543144464492798, 0.9120197296142578, 0.9697250127792358, 1.0274302959442139, 1.0851354598999023, 1.14284086227417, 1.2005460262298584, 1.2582513093948364, 1.3159565925598145, 1.3736618757247925, 1.4313671588897705, 1.4890724420547485, 1.5467777252197266, 1.604482889175415, 1.662188172340393, 1.719893455505371, 1.7775987386703491]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 9.0, 13.0, 27.0, 62.0, 63.0, 113.0, 159.0, 222.0, 365.0, 541.0, 918.0, 1408.0, 2193.0, 3610.0, 5658.0, 8755.0, 13802.0, 22093.0, 36544.0, 63807.0, 122388.0, 227840.0, 237700.0, 130937.0, 67851.0, 38548.0, 23272.0, 14730.0, 9050.0, 5773.0, 3701.0, 2310.0, 1485.0, 897.0, 570.0, 403.0, 241.0, 158.0, 104.0, 72.0, 46.0, 32.0, 31.0, 12.0, 8.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.306640625, -0.2967643737792969, -0.28688812255859375, -0.2770118713378906, -0.2671356201171875, -0.2572593688964844, -0.24738311767578125, -0.23750686645507812, -0.227630615234375, -0.21775436401367188, -0.20787811279296875, -0.19800186157226562, -0.1881256103515625, -0.17824935913085938, -0.16837310791015625, -0.15849685668945312, -0.14862060546875, -0.13874435424804688, -0.12886810302734375, -0.11899185180664062, -0.1091156005859375, -0.09923934936523438, -0.08936309814453125, -0.07948684692382812, -0.069610595703125, -0.059734344482421875, -0.04985809326171875, -0.039981842041015625, -0.0301055908203125, -0.020229339599609375, -0.01035308837890625, -0.000476837158203125, 0.0093994140625, 0.019275665283203125, 0.02915191650390625, 0.039028167724609375, 0.0489044189453125, 0.058780670166015625, 0.06865692138671875, 0.07853317260742188, 0.088409423828125, 0.09828567504882812, 0.10816192626953125, 0.11803817749023438, 0.1279144287109375, 0.13779067993164062, 0.14766693115234375, 0.15754318237304688, 0.16741943359375, 0.17729568481445312, 0.18717193603515625, 0.19704818725585938, 0.2069244384765625, 0.21680068969726562, 0.22667694091796875, 0.23655319213867188, 0.246429443359375, 0.2563056945800781, 0.26618194580078125, 0.2760581970214844, 0.2859344482421875, 0.2958106994628906, 0.30568695068359375, 0.3155632019042969, 0.325439453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 8.0, 10.0, 7.0, 8.0, 13.0, 25.0, 30.0, 29.0, 46.0, 37.0, 38.0, 67.0, 71.0, 64.0, 80.0, 53.0, 59.0, 68.0, 52.0, 49.0, 49.0, 27.0, 31.0, 22.0, 16.0, 23.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3935546875, -0.3830909729003906, -0.37262725830078125, -0.3621635437011719, -0.3516998291015625, -0.3412361145019531, -0.33077239990234375, -0.3203086853027344, -0.309844970703125, -0.2993812561035156, -0.28891754150390625, -0.2784538269042969, -0.2679901123046875, -0.2575263977050781, -0.24706268310546875, -0.23659896850585938, -0.22613525390625, -0.21567153930664062, -0.20520782470703125, -0.19474411010742188, -0.1842803955078125, -0.17381668090820312, -0.16335296630859375, -0.15288925170898438, -0.142425537109375, -0.13196182250976562, -0.12149810791015625, -0.11103439331054688, -0.1005706787109375, -0.09010696411132812, -0.07964324951171875, -0.06917953491210938, -0.0587158203125, -0.048252105712890625, -0.03778839111328125, -0.027324676513671875, -0.0168609619140625, -0.006397247314453125, 0.00406646728515625, 0.014530181884765625, 0.024993896484375, 0.035457611083984375, 0.04592132568359375, 0.056385040283203125, 0.0668487548828125, 0.07731246948242188, 0.08777618408203125, 0.09823989868164062, 0.10870361328125, 0.11916732788085938, 0.12963104248046875, 0.14009475708007812, 0.1505584716796875, 0.16102218627929688, 0.17148590087890625, 0.18194961547851562, 0.192413330078125, 0.20287704467773438, 0.21334075927734375, 0.22380447387695312, 0.2342681884765625, 0.24473190307617188, 0.25519561767578125, 0.2656593322753906, 0.276123046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 8.0, 8.0, 12.0, 31.0, 36.0, 42.0, 68.0, 115.0, 163.0, 225.0, 428.0, 725.0, 1580.0, 3660.0, 9934.0, 29628.0, 101030.0, 440239.0, 343262.0, 78872.0, 24151.0, 8156.0, 3203.0, 1301.0, 664.0, 365.0, 191.0, 162.0, 81.0, 62.0, 38.0, 32.0, 20.0, 13.0, 11.0, 8.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.87548828125, -0.851104736328125, -0.82672119140625, -0.802337646484375, -0.7779541015625, -0.753570556640625, -0.72918701171875, -0.704803466796875, -0.680419921875, -0.656036376953125, -0.63165283203125, -0.607269287109375, -0.5828857421875, -0.558502197265625, -0.53411865234375, -0.509735107421875, -0.4853515625, -0.460968017578125, -0.43658447265625, -0.412200927734375, -0.3878173828125, -0.363433837890625, -0.33905029296875, -0.314666748046875, -0.290283203125, -0.265899658203125, -0.24151611328125, -0.217132568359375, -0.1927490234375, -0.168365478515625, -0.14398193359375, -0.119598388671875, -0.09521484375, -0.070831298828125, -0.04644775390625, -0.022064208984375, 0.0023193359375, 0.026702880859375, 0.05108642578125, 0.075469970703125, 0.099853515625, 0.124237060546875, 0.14862060546875, 0.173004150390625, 0.1973876953125, 0.221771240234375, 0.24615478515625, 0.270538330078125, 0.294921875, 0.319305419921875, 0.34368896484375, 0.368072509765625, 0.3924560546875, 0.416839599609375, 0.44122314453125, 0.465606689453125, 0.489990234375, 0.514373779296875, 0.53875732421875, 0.563140869140625, 0.5875244140625, 0.611907958984375, 0.63629150390625, 0.660675048828125, 0.68505859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 6.0, 11.0, 12.0, 13.0, 15.0, 16.0, 24.0, 29.0, 32.0, 31.0, 41.0, 40.0, 42.0, 44.0, 52.0, 49.0, 36.0, 52.0, 44.0, 36.0, 51.0, 52.0, 48.0, 42.0, 26.0, 47.0, 20.0, 12.0, 15.0, 11.0, 10.0, 8.0, 6.0, 4.0, 3.0, 3.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7841796875, -0.7603073120117188, -0.7364349365234375, -0.7125625610351562, -0.688690185546875, -0.6648178100585938, -0.6409454345703125, -0.6170730590820312, -0.59320068359375, -0.5693283081054688, -0.5454559326171875, -0.5215835571289062, -0.497711181640625, -0.47383880615234375, -0.4499664306640625, -0.42609405517578125, -0.4022216796875, -0.37834930419921875, -0.3544769287109375, -0.33060455322265625, -0.306732177734375, -0.28285980224609375, -0.2589874267578125, -0.23511505126953125, -0.21124267578125, -0.18737030029296875, -0.1634979248046875, -0.13962554931640625, -0.115753173828125, -0.09188079833984375, -0.0680084228515625, -0.04413604736328125, -0.020263671875, 0.00360870361328125, 0.0274810791015625, 0.05135345458984375, 0.075225830078125, 0.09909820556640625, 0.1229705810546875, 0.14684295654296875, 0.17071533203125, 0.19458770751953125, 0.2184600830078125, 0.24233245849609375, 0.266204833984375, 0.29007720947265625, 0.3139495849609375, 0.33782196044921875, 0.3616943359375, 0.38556671142578125, 0.4094390869140625, 0.43331146240234375, 0.457183837890625, 0.48105621337890625, 0.5049285888671875, 0.5288009643554688, 0.55267333984375, 0.5765457153320312, 0.6004180908203125, 0.6242904663085938, 0.648162841796875, 0.6720352172851562, 0.6959075927734375, 0.7197799682617188, 0.74365234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 6.0, 14.0, 25.0, 16.0, 34.0, 38.0, 53.0, 83.0, 139.0, 242.0, 390.0, 698.0, 1327.0, 2503.0, 5016.0, 9763.0, 19250.0, 41542.0, 96666.0, 238674.0, 340937.0, 164227.0, 66987.0, 30051.0, 14221.0, 7233.0, 3941.0, 2015.0, 1082.0, 567.0, 288.0, 169.0, 131.0, 76.0, 39.0, 35.0, 25.0, 15.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1326904296875, -0.12782859802246094, -0.12296676635742188, -0.11810493469238281, -0.11324310302734375, -0.10838127136230469, -0.10351943969726562, -0.09865760803222656, -0.0937957763671875, -0.08893394470214844, -0.08407211303710938, -0.07921028137207031, -0.07434844970703125, -0.06948661804199219, -0.06462478637695312, -0.05976295471191406, -0.054901123046875, -0.05003929138183594, -0.045177459716796875, -0.04031562805175781, -0.03545379638671875, -0.030591964721679688, -0.025730133056640625, -0.020868301391601562, -0.0160064697265625, -0.011144638061523438, -0.006282806396484375, -0.0014209747314453125, 0.00344085693359375, 0.008302688598632812, 0.013164520263671875, 0.018026351928710938, 0.02288818359375, 0.027750015258789062, 0.032611846923828125, 0.03747367858886719, 0.04233551025390625, 0.04719734191894531, 0.052059173583984375, 0.05692100524902344, 0.0617828369140625, 0.06664466857910156, 0.07150650024414062, 0.07636833190917969, 0.08123016357421875, 0.08609199523925781, 0.09095382690429688, 0.09581565856933594, 0.100677490234375, 0.10553932189941406, 0.11040115356445312, 0.11526298522949219, 0.12012481689453125, 0.12498664855957031, 0.12984848022460938, 0.13471031188964844, 0.1395721435546875, 0.14443397521972656, 0.14929580688476562, 0.1541576385498047, 0.15901947021484375, 0.1638813018798828, 0.16874313354492188, 0.17360496520996094, 0.178466796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 9.0, 4.0, 5.0, 9.0, 10.0, 17.0, 19.0, 20.0, 26.0, 30.0, 44.0, 48.0, 84.0, 128.0, 120.0, 92.0, 66.0, 46.0, 43.0, 35.0, 25.0, 28.0, 12.0, 12.0, 9.0, 10.0, 8.0, 8.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.08427619934082e-05, -4.93144616484642e-05, -4.77861613035202e-05, -4.62578609585762e-05, -4.47295606136322e-05, -4.32012602686882e-05, -4.16729599237442e-05, -4.01446595788002e-05, -3.86163592338562e-05, -3.70880588889122e-05, -3.55597585439682e-05, -3.40314581990242e-05, -3.25031578540802e-05, -3.09748575091362e-05, -2.94465571641922e-05, -2.79182568192482e-05, -2.63899564743042e-05, -2.48616561293602e-05, -2.33333557844162e-05, -2.18050554394722e-05, -2.0276755094528198e-05, -1.8748454749584198e-05, -1.7220154404640198e-05, -1.5691854059696198e-05, -1.4163553714752197e-05, -1.2635253369808197e-05, -1.1106953024864197e-05, -9.578652679920197e-06, -8.050352334976196e-06, -6.522051990032196e-06, -4.993751645088196e-06, -3.4654513001441956e-06, -1.9371509552001953e-06, -4.0885061025619507e-07, 1.1194497346878052e-06, 2.6477500796318054e-06, 4.176050424575806e-06, 5.704350769519806e-06, 7.232651114463806e-06, 8.760951459407806e-06, 1.0289251804351807e-05, 1.1817552149295807e-05, 1.3345852494239807e-05, 1.4874152839183807e-05, 1.6402453184127808e-05, 1.7930753529071808e-05, 1.9459053874015808e-05, 2.098735421895981e-05, 2.251565456390381e-05, 2.404395490884781e-05, 2.557225525379181e-05, 2.710055559873581e-05, 2.862885594367981e-05, 3.015715628862381e-05, 3.168545663356781e-05, 3.321375697851181e-05, 3.474205732345581e-05, 3.627035766839981e-05, 3.779865801334381e-05, 3.932695835828781e-05, 4.085525870323181e-05, 4.238355904817581e-05, 4.391185939311981e-05, 4.544015973806381e-05, 4.696846008300781e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 0.0, 2.0, 6.0, 4.0, 11.0, 17.0, 22.0, 34.0, 45.0, 63.0, 93.0, 111.0, 208.0, 292.0, 566.0, 982.0, 1971.0, 4383.0, 10676.0, 28286.0, 77688.0, 213414.0, 377126.0, 209099.0, 76548.0, 27831.0, 10428.0, 4341.0, 1939.0, 973.0, 516.0, 278.0, 190.0, 120.0, 74.0, 58.0, 50.0, 31.0, 16.0, 15.0, 6.0, 15.0, 6.0, 11.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17574310302734375, -0.1703338623046875, -0.16492462158203125, -0.159515380859375, -0.15410614013671875, -0.1486968994140625, -0.14328765869140625, -0.13787841796875, -0.13246917724609375, -0.1270599365234375, -0.12165069580078125, -0.116241455078125, -0.11083221435546875, -0.1054229736328125, -0.10001373291015625, -0.0946044921875, -0.08919525146484375, -0.0837860107421875, -0.07837677001953125, -0.072967529296875, -0.06755828857421875, -0.0621490478515625, -0.05673980712890625, -0.05133056640625, -0.04592132568359375, -0.0405120849609375, -0.03510284423828125, -0.029693603515625, -0.02428436279296875, -0.0188751220703125, -0.01346588134765625, -0.008056640625, -0.00264739990234375, 0.0027618408203125, 0.00817108154296875, 0.013580322265625, 0.01898956298828125, 0.0243988037109375, 0.02980804443359375, 0.03521728515625, 0.04062652587890625, 0.0460357666015625, 0.05144500732421875, 0.056854248046875, 0.06226348876953125, 0.0676727294921875, 0.07308197021484375, 0.0784912109375, 0.08390045166015625, 0.0893096923828125, 0.09471893310546875, 0.100128173828125, 0.10553741455078125, 0.1109466552734375, 0.11635589599609375, 0.12176513671875, 0.12717437744140625, 0.1325836181640625, 0.13799285888671875, 0.143402099609375, 0.14881134033203125, 0.1542205810546875, 0.15962982177734375, 0.1650390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 6.0, 12.0, 8.0, 10.0, 8.0, 13.0, 22.0, 27.0, 27.0, 41.0, 51.0, 48.0, 52.0, 71.0, 74.0, 74.0, 77.0, 65.0, 59.0, 45.0, 42.0, 26.0, 32.0, 17.0, 17.0, 9.0, 14.0, 7.0, 9.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1689453125, -0.1636962890625, -0.158447265625, -0.1531982421875, -0.14794921875, -0.1427001953125, -0.137451171875, -0.1322021484375, -0.126953125, -0.1217041015625, -0.116455078125, -0.1112060546875, -0.10595703125, -0.1007080078125, -0.095458984375, -0.0902099609375, -0.0849609375, -0.0797119140625, -0.074462890625, -0.0692138671875, -0.06396484375, -0.0587158203125, -0.053466796875, -0.0482177734375, -0.04296875, -0.0377197265625, -0.032470703125, -0.0272216796875, -0.02197265625, -0.0167236328125, -0.011474609375, -0.0062255859375, -0.0009765625, 0.0042724609375, 0.009521484375, 0.0147705078125, 0.02001953125, 0.0252685546875, 0.030517578125, 0.0357666015625, 0.041015625, 0.0462646484375, 0.051513671875, 0.0567626953125, 0.06201171875, 0.0672607421875, 0.072509765625, 0.0777587890625, 0.0830078125, 0.0882568359375, 0.093505859375, 0.0987548828125, 0.10400390625, 0.1092529296875, 0.114501953125, 0.1197509765625, 0.125, 0.1302490234375, 0.135498046875, 0.1407470703125, 0.14599609375, 0.1512451171875, 0.156494140625, 0.1617431640625, 0.1669921875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 6.0, 6.0, 18.0, 39.0, 98.0, 191.0, 222.0, 224.0, 127.0, 46.0, 18.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.998752593994141, -5.826739311218262, -5.654726028442383, -5.482712745666504, -5.310699462890625, -5.138686180114746, -4.966672897338867, -4.794659614562988, -4.622646331787109, -4.4506330490112305, -4.278619766235352, -4.106606483459473, -3.9345932006835938, -3.762579917907715, -3.590566396713257, -3.418553113937378, -3.24653959274292, -3.074526309967041, -2.902513027191162, -2.730499744415283, -2.5584864616394043, -2.3864731788635254, -2.2144596576690674, -2.0424463748931885, -1.8704330921173096, -1.6984198093414307, -1.5264065265655518, -1.3543931245803833, -1.1823798418045044, -1.0103665590286255, -0.838353157043457, -0.6663398742675781, -0.494326114654541, -0.3223128020763397, -0.15029948949813843, 0.021713852882385254, 0.19372713565826416, 0.36574041843414307, 0.5377538204193115, 0.7097671031951904, 0.8817803859710693, 1.0537936687469482, 1.2258069515228271, 1.3978203535079956, 1.5698336362838745, 1.7418469190597534, 1.9138603210449219, 2.085873603820801, 2.2578868865966797, 2.4299001693725586, 2.6019134521484375, 2.7739267349243164, 2.9459400177001953, 3.117953300476074, 3.2899668216705322, 3.461980104446411, 3.63399338722229, 3.806006669998169, 3.978019952774048, 4.150033473968506, 4.322046756744385, 4.494060039520264, 4.666073322296143, 4.8380866050720215, 5.0100998878479]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 10.0, 18.0, 15.0, 8.0, 11.0, 12.0, 17.0, 16.0, 25.0, 27.0, 21.0, 25.0, 28.0, 28.0, 32.0, 36.0, 34.0, 54.0, 28.0, 41.0, 33.0, 40.0, 52.0, 27.0, 39.0, 45.0, 37.0, 20.0, 29.0, 34.0, 21.0, 17.0, 25.0, 11.0, 14.0, 8.0, 12.0, 8.0, 4.0, 6.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5828663110733032, -1.5257573127746582, -1.4686483144760132, -1.4115393161773682, -1.3544304370880127, -1.2973213195800781, -1.2402124404907227, -1.1831034421920776, -1.1259944438934326, -1.0688854455947876, -1.0117764472961426, -0.9546675086021423, -0.8975585103034973, -0.8404495120048523, -0.783340573310852, -0.726231575012207, -0.669122576713562, -0.612013578414917, -0.554904580116272, -0.49779564142227173, -0.4406866431236267, -0.3835776448249817, -0.32646867632865906, -0.2693597078323364, -0.2122507095336914, -0.15514172613620758, -0.09803274273872375, -0.04092375934123993, 0.016185224056243896, 0.07329422235488892, 0.13040319085121155, 0.18751215934753418, 0.24462127685546875, 0.30173027515411377, 0.3588392436504364, 0.41594821214675903, 0.47305721044540405, 0.5301662087440491, 0.5872751474380493, 0.6443841457366943, 0.7014931440353394, 0.7586021423339844, 0.8157111406326294, 0.8728200793266296, 0.9299290776252747, 0.9870380759239197, 1.04414701461792, 1.101256012916565, 1.15836501121521, 1.215474009513855, 1.2725830078125, 1.329692006111145, 1.38680100440979, 1.4439098834991455, 1.5010188817977905, 1.5581278800964355, 1.6152368783950806, 1.6723458766937256, 1.7294548749923706, 1.7865638732910156, 1.843672752380371, 1.9007818698883057, 1.9578907489776611, 2.0149998664855957, 2.072108745574951]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 9.0, 20.0, 36.0, 61.0, 139.0, 272.0, 592.0, 1158.0, 2771.0, 6575.0, 16943.0, 48988.0, 187585.0, 1133947.0, 2203499.0, 451560.0, 93887.0, 28994.0, 10354.0, 3859.0, 1651.0, 724.0, 336.0, 157.0, 88.0, 38.0, 17.0, 17.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4794921875, -0.46695709228515625, -0.4544219970703125, -0.44188690185546875, -0.429351806640625, -0.41681671142578125, -0.4042816162109375, -0.39174652099609375, -0.37921142578125, -0.36667633056640625, -0.3541412353515625, -0.34160614013671875, -0.329071044921875, -0.31653594970703125, -0.3040008544921875, -0.29146575927734375, -0.2789306640625, -0.26639556884765625, -0.2538604736328125, -0.24132537841796875, -0.228790283203125, -0.21625518798828125, -0.2037200927734375, -0.19118499755859375, -0.17864990234375, -0.16611480712890625, -0.1535797119140625, -0.14104461669921875, -0.128509521484375, -0.11597442626953125, -0.1034393310546875, -0.09090423583984375, -0.078369140625, -0.06583404541015625, -0.0532989501953125, -0.04076385498046875, -0.028228759765625, -0.01569366455078125, -0.0031585693359375, 0.00937652587890625, 0.02191162109375, 0.03444671630859375, 0.0469818115234375, 0.05951690673828125, 0.072052001953125, 0.08458709716796875, 0.0971221923828125, 0.10965728759765625, 0.1221923828125, 0.13472747802734375, 0.1472625732421875, 0.15979766845703125, 0.172332763671875, 0.18486785888671875, 0.1974029541015625, 0.20993804931640625, 0.22247314453125, 0.23500823974609375, 0.2475433349609375, 0.26007843017578125, 0.272613525390625, 0.28514862060546875, 0.2976837158203125, 0.31021881103515625, 0.32275390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 12.0, 16.0, 26.0, 25.0, 32.0, 38.0, 45.0, 48.0, 48.0, 60.0, 77.0, 71.0, 57.0, 62.0, 67.0, 51.0, 46.0, 50.0, 37.0, 36.0, 20.0, 20.0, 14.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3867454528808594, -0.37651824951171875, -0.3662910461425781, -0.3560638427734375, -0.3458366394042969, -0.33560943603515625, -0.3253822326660156, -0.315155029296875, -0.3049278259277344, -0.29470062255859375, -0.2844734191894531, -0.2742462158203125, -0.2640190124511719, -0.25379180908203125, -0.24356460571289062, -0.23333740234375, -0.22311019897460938, -0.21288299560546875, -0.20265579223632812, -0.1924285888671875, -0.18220138549804688, -0.17197418212890625, -0.16174697875976562, -0.151519775390625, -0.14129257202148438, -0.13106536865234375, -0.12083816528320312, -0.1106109619140625, -0.10038375854492188, -0.09015655517578125, -0.07992935180664062, -0.0697021484375, -0.059474945068359375, -0.04924774169921875, -0.039020538330078125, -0.0287933349609375, -0.018566131591796875, -0.00833892822265625, 0.001888275146484375, 0.012115478515625, 0.022342681884765625, 0.03256988525390625, 0.042797088623046875, 0.0530242919921875, 0.06325149536132812, 0.07347869873046875, 0.08370590209960938, 0.09393310546875, 0.10416030883789062, 0.11438751220703125, 0.12461471557617188, 0.1348419189453125, 0.14506912231445312, 0.15529632568359375, 0.16552352905273438, 0.175750732421875, 0.18597793579101562, 0.19620513916015625, 0.20643234252929688, 0.2166595458984375, 0.22688674926757812, 0.23711395263671875, 0.24734115600585938, 0.257568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 19.0, 31.0, 42.0, 49.0, 89.0, 130.0, 240.0, 419.0, 770.0, 1561.0, 3257.0, 8374.0, 26292.0, 101654.0, 554616.0, 2816189.0, 539534.0, 99713.0, 26155.0, 8429.0, 3376.0, 1482.0, 750.0, 417.0, 247.0, 159.0, 99.0, 56.0, 41.0, 15.0, 22.0, 11.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.48369598388671875, -0.4654388427734375, -0.44718170166015625, -0.428924560546875, -0.41066741943359375, -0.3924102783203125, -0.37415313720703125, -0.35589599609375, -0.33763885498046875, -0.3193817138671875, -0.30112457275390625, -0.282867431640625, -0.26461029052734375, -0.2463531494140625, -0.22809600830078125, -0.2098388671875, -0.19158172607421875, -0.1733245849609375, -0.15506744384765625, -0.136810302734375, -0.11855316162109375, -0.1002960205078125, -0.08203887939453125, -0.06378173828125, -0.04552459716796875, -0.0272674560546875, -0.00901031494140625, 0.009246826171875, 0.02750396728515625, 0.0457611083984375, 0.06401824951171875, 0.082275390625, 0.10053253173828125, 0.1187896728515625, 0.13704681396484375, 0.155303955078125, 0.17356109619140625, 0.1918182373046875, 0.21007537841796875, 0.22833251953125, 0.24658966064453125, 0.2648468017578125, 0.28310394287109375, 0.301361083984375, 0.31961822509765625, 0.3378753662109375, 0.35613250732421875, 0.3743896484375, 0.39264678955078125, 0.4109039306640625, 0.42916107177734375, 0.447418212890625, 0.46567535400390625, 0.4839324951171875, 0.5021896362304688, 0.52044677734375, 0.5387039184570312, 0.5569610595703125, 0.5752182006835938, 0.593475341796875, 0.6117324829101562, 0.6299896240234375, 0.6482467651367188, 0.66650390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 4.0, 12.0, 14.0, 10.0, 15.0, 26.0, 27.0, 47.0, 58.0, 77.0, 108.0, 133.0, 220.0, 305.0, 469.0, 642.0, 557.0, 406.0, 259.0, 162.0, 133.0, 91.0, 60.0, 57.0, 32.0, 38.0, 30.0, 26.0, 16.0, 8.0, 4.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4072265625, -0.3925628662109375, -0.377899169921875, -0.3632354736328125, -0.34857177734375, -0.3339080810546875, -0.319244384765625, -0.3045806884765625, -0.2899169921875, -0.2752532958984375, -0.260589599609375, -0.2459259033203125, -0.23126220703125, -0.2165985107421875, -0.201934814453125, -0.1872711181640625, -0.172607421875, -0.1579437255859375, -0.143280029296875, -0.1286163330078125, -0.11395263671875, -0.0992889404296875, -0.084625244140625, -0.0699615478515625, -0.0552978515625, -0.0406341552734375, -0.025970458984375, -0.0113067626953125, 0.00335693359375, 0.0180206298828125, 0.032684326171875, 0.0473480224609375, 0.06201171875, 0.0766754150390625, 0.091339111328125, 0.1060028076171875, 0.12066650390625, 0.1353302001953125, 0.149993896484375, 0.1646575927734375, 0.1793212890625, 0.1939849853515625, 0.208648681640625, 0.2233123779296875, 0.23797607421875, 0.2526397705078125, 0.267303466796875, 0.2819671630859375, 0.296630859375, 0.3112945556640625, 0.325958251953125, 0.3406219482421875, 0.35528564453125, 0.3699493408203125, 0.384613037109375, 0.3992767333984375, 0.4139404296875, 0.4286041259765625, 0.443267822265625, 0.4579315185546875, 0.47259521484375, 0.4872589111328125, 0.501922607421875, 0.5165863037109375, 0.53125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 15.0, 32.0, 67.0, 139.0, 220.0, 216.0, 155.0, 76.0, 42.0, 15.0, 9.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.044751167297363, -6.87268590927124, -6.700620651245117, -6.528554916381836, -6.356489658355713, -6.18442440032959, -6.012358665466309, -5.8402934074401855, -5.6682281494140625, -5.4961628913879395, -5.324097633361816, -5.152031898498535, -4.979966640472412, -4.807901382446289, -4.635835647583008, -4.463770389556885, -4.291705131530762, -4.119639873504639, -3.9475743770599365, -3.7755088806152344, -3.6034436225891113, -3.4313783645629883, -3.259312868118286, -3.087247371673584, -2.915182113647461, -2.743116855621338, -2.5710513591766357, -2.3989858627319336, -2.2269206047058105, -2.0548553466796875, -1.8827898502349854, -1.7107244729995728, -1.538658857345581, -1.3665934801101685, -1.1945281028747559, -1.0224627256393433, -0.8503973484039307, -0.6783319711685181, -0.5062665939331055, -0.33420121669769287, -0.16213583946228027, 0.009929537773132324, 0.18199491500854492, 0.3540602922439575, 0.5261256694793701, 0.6981910467147827, 0.8702564239501953, 1.042321801185608, 1.2143871784210205, 1.386452555656433, 1.5585179328918457, 1.7305833101272583, 1.902648687362671, 2.074714183807373, 2.246779441833496, 2.418844699859619, 2.5909101963043213, 2.7629756927490234, 2.9350409507751465, 3.1071062088012695, 3.2791717052459717, 3.451237201690674, 3.623302459716797, 3.79536771774292, 3.967433214187622]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 3.0, 12.0, 10.0, 20.0, 9.0, 28.0, 20.0, 28.0, 28.0, 40.0, 29.0, 35.0, 45.0, 47.0, 41.0, 45.0, 37.0, 36.0, 54.0, 37.0, 45.0, 35.0, 34.0, 36.0, 27.0, 35.0, 30.0, 20.0, 20.0, 23.0, 16.0, 9.0, 11.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6828688383102417, -1.6299283504486084, -1.5769879817962646, -1.5240474939346313, -1.471107006072998, -1.4181666374206543, -1.365226149559021, -1.3122856616973877, -1.259345293045044, -1.2064048051834106, -1.153464436531067, -1.1005239486694336, -1.0475834608078003, -0.9946430325508118, -0.9417026042938232, -0.8887621164321899, -0.8358216285705566, -0.7828812003135681, -0.7299407124519348, -0.6770002841949463, -0.624059796333313, -0.5711193680763245, -0.5181789398193359, -0.465238481760025, -0.4122980237007141, -0.3593575656414032, -0.3064171075820923, -0.25347667932510376, -0.20053622126579285, -0.14759576320648193, -0.09465533494949341, -0.041714876890182495, 0.011225581169128418, 0.06416603177785873, 0.11710648238658905, 0.17004692554473877, 0.22298738360404968, 0.2759278416633606, 0.3288682699203491, 0.38180872797966003, 0.43474918603897095, 0.48768964409828186, 0.5406301021575928, 0.5935705304145813, 0.6465109586715698, 0.6994514465332031, 0.7523918747901917, 0.8053323030471802, 0.8582727909088135, 0.911213219165802, 0.9641537070274353, 1.0170941352844238, 1.0700346231460571, 1.1229751110076904, 1.1759154796600342, 1.2288559675216675, 1.2817964553833008, 1.334736943244934, 1.3876773118972778, 1.4406177997589111, 1.4935582876205444, 1.5464987754821777, 1.5994391441345215, 1.6523796319961548, 1.7053200006484985]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 8.0, 15.0, 26.0, 39.0, 66.0, 89.0, 150.0, 251.0, 440.0, 897.0, 1621.0, 3770.0, 8253.0, 20748.0, 55089.0, 145916.0, 297247.0, 288993.0, 138283.0, 51854.0, 19763.0, 7965.0, 3487.0, 1667.0, 818.0, 460.0, 269.0, 139.0, 87.0, 49.0, 28.0, 24.0, 16.0, 7.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2955322265625, -0.283203125, -0.2708740234375, -0.258544921875, -0.2462158203125, -0.23388671875, -0.2215576171875, -0.209228515625, -0.1968994140625, -0.1845703125, -0.1722412109375, -0.159912109375, -0.1475830078125, -0.13525390625, -0.1229248046875, -0.110595703125, -0.0982666015625, -0.0859375, -0.0736083984375, -0.061279296875, -0.0489501953125, -0.03662109375, -0.0242919921875, -0.011962890625, 0.0003662109375, 0.0126953125, 0.0250244140625, 0.037353515625, 0.0496826171875, 0.06201171875, 0.0743408203125, 0.086669921875, 0.0989990234375, 0.111328125, 0.1236572265625, 0.135986328125, 0.1483154296875, 0.16064453125, 0.1729736328125, 0.185302734375, 0.1976318359375, 0.2099609375, 0.2222900390625, 0.234619140625, 0.2469482421875, 0.25927734375, 0.2716064453125, 0.283935546875, 0.2962646484375, 0.30859375, 0.3209228515625, 0.333251953125, 0.3455810546875, 0.35791015625, 0.3702392578125, 0.382568359375, 0.3948974609375, 0.4072265625, 0.4195556640625, 0.431884765625, 0.4442138671875, 0.45654296875, 0.4688720703125, 0.481201171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 15.0, 15.0, 14.0, 22.0, 32.0, 39.0, 38.0, 47.0, 58.0, 61.0, 73.0, 71.0, 68.0, 68.0, 68.0, 65.0, 48.0, 47.0, 42.0, 30.0, 19.0, 22.0, 13.0, 8.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.433349609375, -0.4225006103515625, -0.411651611328125, -0.4008026123046875, -0.38995361328125, -0.3791046142578125, -0.368255615234375, -0.3574066162109375, -0.3465576171875, -0.3357086181640625, -0.324859619140625, -0.3140106201171875, -0.30316162109375, -0.2923126220703125, -0.281463623046875, -0.2706146240234375, -0.259765625, -0.2489166259765625, -0.238067626953125, -0.2272186279296875, -0.21636962890625, -0.2055206298828125, -0.194671630859375, -0.1838226318359375, -0.1729736328125, -0.1621246337890625, -0.151275634765625, -0.1404266357421875, -0.12957763671875, -0.1187286376953125, -0.107879638671875, -0.0970306396484375, -0.086181640625, -0.0753326416015625, -0.064483642578125, -0.0536346435546875, -0.04278564453125, -0.0319366455078125, -0.021087646484375, -0.0102386474609375, 0.0006103515625, 0.0114593505859375, 0.022308349609375, 0.0331573486328125, 0.04400634765625, 0.0548553466796875, 0.065704345703125, 0.0765533447265625, 0.08740234375, 0.0982513427734375, 0.109100341796875, 0.1199493408203125, 0.13079833984375, 0.1416473388671875, 0.152496337890625, 0.1633453369140625, 0.1741943359375, 0.1850433349609375, 0.195892333984375, 0.2067413330078125, 0.21759033203125, 0.2284393310546875, 0.239288330078125, 0.2501373291015625, 0.260986328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 10.0, 6.0, 12.0, 17.0, 22.0, 23.0, 44.0, 83.0, 135.0, 220.0, 410.0, 878.0, 1768.0, 4230.0, 10199.0, 26854.0, 78733.0, 244588.0, 401491.0, 184899.0, 58427.0, 20832.0, 8252.0, 3380.0, 1428.0, 720.0, 350.0, 202.0, 132.0, 66.0, 44.0, 33.0, 21.0, 17.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42431640625, -0.4088134765625, -0.393310546875, -0.3778076171875, -0.3623046875, -0.3468017578125, -0.331298828125, -0.3157958984375, -0.30029296875, -0.2847900390625, -0.269287109375, -0.2537841796875, -0.23828125, -0.2227783203125, -0.207275390625, -0.1917724609375, -0.17626953125, -0.1607666015625, -0.145263671875, -0.1297607421875, -0.1142578125, -0.0987548828125, -0.083251953125, -0.0677490234375, -0.05224609375, -0.0367431640625, -0.021240234375, -0.0057373046875, 0.009765625, 0.0252685546875, 0.040771484375, 0.0562744140625, 0.07177734375, 0.0872802734375, 0.102783203125, 0.1182861328125, 0.1337890625, 0.1492919921875, 0.164794921875, 0.1802978515625, 0.19580078125, 0.2113037109375, 0.226806640625, 0.2423095703125, 0.2578125, 0.2733154296875, 0.288818359375, 0.3043212890625, 0.31982421875, 0.3353271484375, 0.350830078125, 0.3663330078125, 0.3818359375, 0.3973388671875, 0.412841796875, 0.4283447265625, 0.44384765625, 0.4593505859375, 0.474853515625, 0.4903564453125, 0.505859375, 0.5213623046875, 0.536865234375, 0.5523681640625, 0.56787109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 10.0, 3.0, 8.0, 7.0, 10.0, 12.0, 9.0, 19.0, 24.0, 21.0, 19.0, 23.0, 41.0, 37.0, 31.0, 43.0, 40.0, 58.0, 54.0, 34.0, 40.0, 54.0, 51.0, 41.0, 33.0, 24.0, 33.0, 32.0, 33.0, 29.0, 18.0, 18.0, 13.0, 16.0, 11.0, 12.0, 2.0, 6.0, 6.0, 10.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.78125, -0.7598724365234375, -0.738494873046875, -0.7171173095703125, -0.69573974609375, -0.6743621826171875, -0.652984619140625, -0.6316070556640625, -0.6102294921875, -0.5888519287109375, -0.567474365234375, -0.5460968017578125, -0.52471923828125, -0.5033416748046875, -0.481964111328125, -0.4605865478515625, -0.439208984375, -0.4178314208984375, -0.396453857421875, -0.3750762939453125, -0.35369873046875, -0.3323211669921875, -0.310943603515625, -0.2895660400390625, -0.2681884765625, -0.2468109130859375, -0.225433349609375, -0.2040557861328125, -0.18267822265625, -0.1613006591796875, -0.139923095703125, -0.1185455322265625, -0.09716796875, -0.0757904052734375, -0.054412841796875, -0.0330352783203125, -0.01165771484375, 0.0097198486328125, 0.031097412109375, 0.0524749755859375, 0.0738525390625, 0.0952301025390625, 0.116607666015625, 0.1379852294921875, 0.15936279296875, 0.1807403564453125, 0.202117919921875, 0.2234954833984375, 0.244873046875, 0.2662506103515625, 0.287628173828125, 0.3090057373046875, 0.33038330078125, 0.3517608642578125, 0.373138427734375, 0.3945159912109375, 0.4158935546875, 0.4372711181640625, 0.458648681640625, 0.4800262451171875, 0.50140380859375, 0.5227813720703125, 0.544158935546875, 0.5655364990234375, 0.5869140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 14.0, 15.0, 22.0, 23.0, 35.0, 52.0, 96.0, 126.0, 185.0, 296.0, 403.0, 721.0, 1185.0, 2024.0, 3648.0, 7540.0, 17273.0, 49378.0, 183777.0, 446121.0, 233991.0, 62649.0, 20553.0, 8563.0, 4211.0, 2209.0, 1273.0, 733.0, 487.0, 290.0, 207.0, 145.0, 91.0, 64.0, 36.0, 38.0, 25.0, 15.0, 8.0, 4.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2481689453125, -0.24005699157714844, -0.23194503784179688, -0.2238330841064453, -0.21572113037109375, -0.2076091766357422, -0.19949722290039062, -0.19138526916503906, -0.1832733154296875, -0.17516136169433594, -0.16704940795898438, -0.1589374542236328, -0.15082550048828125, -0.1427135467529297, -0.13460159301757812, -0.12648963928222656, -0.118377685546875, -0.11026573181152344, -0.10215377807617188, -0.09404182434082031, -0.08592987060546875, -0.07781791687011719, -0.06970596313476562, -0.06159400939941406, -0.0534820556640625, -0.04537010192871094, -0.037258148193359375, -0.029146194458007812, -0.02103424072265625, -0.012922286987304688, -0.004810333251953125, 0.0033016204833984375, 0.01141357421875, 0.019525527954101562, 0.027637481689453125, 0.03574943542480469, 0.04386138916015625, 0.05197334289550781, 0.060085296630859375, 0.06819725036621094, 0.0763092041015625, 0.08442115783691406, 0.09253311157226562, 0.10064506530761719, 0.10875701904296875, 0.11686897277832031, 0.12498092651367188, 0.13309288024902344, 0.141204833984375, 0.14931678771972656, 0.15742874145507812, 0.1655406951904297, 0.17365264892578125, 0.1817646026611328, 0.18987655639648438, 0.19798851013183594, 0.2061004638671875, 0.21421241760253906, 0.22232437133789062, 0.2304363250732422, 0.23854827880859375, 0.2466602325439453, 0.2547721862792969, 0.26288414001464844, 0.27099609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 11.0, 24.0, 32.0, 28.0, 51.0, 69.0, 71.0, 123.0, 137.0, 104.0, 95.0, 77.0, 49.0, 28.0, 19.0, 16.0, 15.0, 9.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.537271499633789e-05, -5.3423456847667694e-05, -5.14741986989975e-05, -4.95249405503273e-05, -4.7575682401657104e-05, -4.562642425298691e-05, -4.367716610431671e-05, -4.1727907955646515e-05, -3.977864980697632e-05, -3.782939165830612e-05, -3.5880133509635925e-05, -3.393087536096573e-05, -3.198161721229553e-05, -3.0032359063625336e-05, -2.808310091495514e-05, -2.6133842766284943e-05, -2.4184584617614746e-05, -2.223532646894455e-05, -2.0286068320274353e-05, -1.8336810171604156e-05, -1.638755202293396e-05, -1.4438293874263763e-05, -1.2489035725593567e-05, -1.053977757692337e-05, -8.590519428253174e-06, -6.641261279582977e-06, -4.692003130912781e-06, -2.7427449822425842e-06, -7.934868335723877e-07, 1.1557713150978088e-06, 3.1050294637680054e-06, 5.054287612438202e-06, 7.0035457611083984e-06, 8.952803909778595e-06, 1.0902062058448792e-05, 1.2851320207118988e-05, 1.4800578355789185e-05, 1.674983650445938e-05, 1.8699094653129578e-05, 2.0648352801799774e-05, 2.259761095046997e-05, 2.4546869099140167e-05, 2.6496127247810364e-05, 2.844538539648056e-05, 3.0394643545150757e-05, 3.234390169382095e-05, 3.429315984249115e-05, 3.6242417991161346e-05, 3.819167613983154e-05, 4.014093428850174e-05, 4.2090192437171936e-05, 4.403945058584213e-05, 4.598870873451233e-05, 4.7937966883182526e-05, 4.988722503185272e-05, 5.183648318052292e-05, 5.3785741329193115e-05, 5.573499947786331e-05, 5.768425762653351e-05, 5.9633515775203705e-05, 6.15827739238739e-05, 6.35320320725441e-05, 6.54812902212143e-05, 6.743054836988449e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 10.0, 11.0, 15.0, 16.0, 34.0, 42.0, 66.0, 102.0, 148.0, 249.0, 431.0, 790.0, 1758.0, 4053.0, 12459.0, 53943.0, 302084.0, 517798.0, 119190.0, 23590.0, 6592.0, 2568.0, 1164.0, 558.0, 324.0, 192.0, 112.0, 92.0, 43.0, 38.0, 28.0, 16.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32568359375, -0.314910888671875, -0.30413818359375, -0.293365478515625, -0.2825927734375, -0.271820068359375, -0.26104736328125, -0.250274658203125, -0.239501953125, -0.228729248046875, -0.21795654296875, -0.207183837890625, -0.1964111328125, -0.185638427734375, -0.17486572265625, -0.164093017578125, -0.1533203125, -0.142547607421875, -0.13177490234375, -0.121002197265625, -0.1102294921875, -0.099456787109375, -0.08868408203125, -0.077911376953125, -0.067138671875, -0.056365966796875, -0.04559326171875, -0.034820556640625, -0.0240478515625, -0.013275146484375, -0.00250244140625, 0.008270263671875, 0.01904296875, 0.029815673828125, 0.04058837890625, 0.051361083984375, 0.0621337890625, 0.072906494140625, 0.08367919921875, 0.094451904296875, 0.105224609375, 0.115997314453125, 0.12677001953125, 0.137542724609375, 0.1483154296875, 0.159088134765625, 0.16986083984375, 0.180633544921875, 0.19140625, 0.202178955078125, 0.21295166015625, 0.223724365234375, 0.2344970703125, 0.245269775390625, 0.25604248046875, 0.266815185546875, 0.277587890625, 0.288360595703125, 0.29913330078125, 0.309906005859375, 0.3206787109375, 0.331451416015625, 0.34222412109375, 0.352996826171875, 0.36376953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 17.0, 30.0, 37.0, 41.0, 55.0, 77.0, 86.0, 128.0, 118.0, 98.0, 89.0, 63.0, 43.0, 38.0, 17.0, 11.0, 11.0, 10.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349609375, -0.3390312194824219, -0.32845306396484375, -0.3178749084472656, -0.3072967529296875, -0.2967185974121094, -0.28614044189453125, -0.2755622863769531, -0.264984130859375, -0.2544059753417969, -0.24382781982421875, -0.23324966430664062, -0.2226715087890625, -0.21209335327148438, -0.20151519775390625, -0.19093704223632812, -0.18035888671875, -0.16978073120117188, -0.15920257568359375, -0.14862442016601562, -0.1380462646484375, -0.12746810913085938, -0.11688995361328125, -0.10631179809570312, -0.095733642578125, -0.08515548706054688, -0.07457733154296875, -0.06399917602539062, -0.0534210205078125, -0.042842864990234375, -0.03226470947265625, -0.021686553955078125, -0.0111083984375, -0.000530242919921875, 0.01004791259765625, 0.020626068115234375, 0.0312042236328125, 0.041782379150390625, 0.05236053466796875, 0.06293869018554688, 0.073516845703125, 0.08409500122070312, 0.09467315673828125, 0.10525131225585938, 0.1158294677734375, 0.12640762329101562, 0.13698577880859375, 0.14756393432617188, 0.15814208984375, 0.16872024536132812, 0.17929840087890625, 0.18987655639648438, 0.2004547119140625, 0.21103286743164062, 0.22161102294921875, 0.23218917846679688, 0.242767333984375, 0.2533454895019531, 0.26392364501953125, 0.2745018005371094, 0.2850799560546875, 0.2956581115722656, 0.30623626708984375, 0.3168144226074219, 0.327392578125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 40.0, 71.0, 101.0, 211.0, 261.0, 170.0, 84.0, 26.0, 17.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.3927106857299805, -6.2385029792785645, -6.084295272827148, -5.930088043212891, -5.775880336761475, -5.621672630310059, -5.467464923858643, -5.313257217407227, -5.159049987792969, -5.004842281341553, -4.850634574890137, -4.696427345275879, -4.542219638824463, -4.388011932373047, -4.233804225921631, -4.079596519470215, -3.925389051437378, -3.771181344985962, -3.616973876953125, -3.462766170501709, -3.308558702468872, -3.154350996017456, -3.000143527984619, -2.845935821533203, -2.691728115081787, -2.537520408630371, -2.383312940597534, -2.229105234146118, -2.0748977661132812, -1.9206900596618652, -1.7664824724197388, -1.6122748851776123, -1.4580671787261963, -1.3038595914840698, -1.1496520042419434, -0.9954443573951721, -0.8412367701530457, -0.6870291829109192, -0.532821536064148, -0.3786139488220215, -0.22440636157989502, -0.07019875943660736, 0.0840088427066803, 0.23821645975112915, 0.3924240469932556, 0.5466316342353821, 0.7008392810821533, 0.8550468683242798, 1.0092544555664062, 1.1634620428085327, 1.3176696300506592, 1.4718773365020752, 1.626084804534912, 1.7802925109863281, 1.9345000982284546, 2.088707685470581, 2.242915153503418, 2.397122859954834, 2.551330327987671, 2.705538034439087, 2.859745502471924, 3.01395320892334, 3.168160915374756, 3.3223683834075928, 3.476576089859009]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 10.0, 7.0, 8.0, 9.0, 13.0, 18.0, 18.0, 19.0, 18.0, 23.0, 24.0, 33.0, 25.0, 33.0, 30.0, 41.0, 44.0, 48.0, 56.0, 50.0, 52.0, 33.0, 46.0, 27.0, 30.0, 31.0, 31.0, 31.0, 32.0, 14.0, 20.0, 24.0, 19.0, 16.0, 8.0, 14.0, 11.0, 6.0, 9.0, 4.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0689220428466797, -2.007063388824463, -1.9452046155929565, -1.8833458423614502, -1.8214870691299438, -1.7596282958984375, -1.6977696418762207, -1.6359108686447144, -1.574052095413208, -1.5121933221817017, -1.4503346681594849, -1.3884758949279785, -1.3266171216964722, -1.2647583484649658, -1.202899694442749, -1.1410409212112427, -1.0791822671890259, -1.0173234939575195, -0.955464780330658, -0.8936060667037964, -0.83174729347229, -0.7698885798454285, -0.7080298662185669, -0.6461710929870605, -0.584312379360199, -0.5224536657333374, -0.46059489250183105, -0.3987361788749695, -0.3368774354457855, -0.27501869201660156, -0.21315997838974, -0.15130123496055603, -0.08944249153137207, -0.027583755552768707, 0.034274980425834656, 0.09613370895385742, 0.15799245238304138, 0.21985119581222534, 0.2817099094390869, 0.3435686528682709, 0.40542739629745483, 0.4672861397266388, 0.5291448831558228, 0.5910035967826843, 0.6528623104095459, 0.7147210836410522, 0.7765797972679138, 0.8384385108947754, 0.9002972841262817, 0.9621559977531433, 1.0240147113800049, 1.0858734846115112, 1.1477322578430176, 1.2095909118652344, 1.2714496850967407, 1.333308458328247, 1.3951671123504639, 1.4570258855819702, 1.518884539604187, 1.5807433128356934, 1.6426020860671997, 1.704460859298706, 1.7663195133209229, 1.8281782865524292, 1.8900370597839355]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 13.0, 16.0, 43.0, 51.0, 92.0, 143.0, 228.0, 407.0, 740.0, 1235.0, 2500.0, 5180.0, 11234.0, 27997.0, 84178.0, 335787.0, 1478608.0, 1678119.0, 409493.0, 100594.0, 32925.0, 13111.0, 5905.0, 2607.0, 1315.0, 738.0, 400.0, 236.0, 122.0, 98.0, 58.0, 34.0, 29.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.399658203125, -0.38942718505859375, -0.3791961669921875, -0.36896514892578125, -0.358734130859375, -0.34850311279296875, -0.3382720947265625, -0.32804107666015625, -0.31781005859375, -0.30757904052734375, -0.2973480224609375, -0.28711700439453125, -0.276885986328125, -0.26665496826171875, -0.2564239501953125, -0.24619293212890625, -0.2359619140625, -0.22573089599609375, -0.2154998779296875, -0.20526885986328125, -0.195037841796875, -0.18480682373046875, -0.1745758056640625, -0.16434478759765625, -0.15411376953125, -0.14388275146484375, -0.1336517333984375, -0.12342071533203125, -0.113189697265625, -0.10295867919921875, -0.0927276611328125, -0.08249664306640625, -0.072265625, -0.06203460693359375, -0.0518035888671875, -0.04157257080078125, -0.031341552734375, -0.02111053466796875, -0.0108795166015625, -0.00064849853515625, 0.00958251953125, 0.01981353759765625, 0.0300445556640625, 0.04027557373046875, 0.050506591796875, 0.06073760986328125, 0.0709686279296875, 0.08119964599609375, 0.0914306640625, 0.10166168212890625, 0.1118927001953125, 0.12212371826171875, 0.132354736328125, 0.14258575439453125, 0.1528167724609375, 0.16304779052734375, 0.17327880859375, 0.18350982666015625, 0.1937408447265625, 0.20397186279296875, 0.214202880859375, 0.22443389892578125, 0.2346649169921875, 0.24489593505859375, 0.255126953125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 9.0, 15.0, 15.0, 25.0, 31.0, 28.0, 41.0, 37.0, 48.0, 43.0, 57.0, 58.0, 62.0, 74.0, 74.0, 63.0, 55.0, 55.0, 33.0, 36.0, 30.0, 19.0, 23.0, 13.0, 13.0, 8.0, 10.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.415771484375, -0.4053497314453125, -0.394927978515625, -0.3845062255859375, -0.37408447265625, -0.3636627197265625, -0.353240966796875, -0.3428192138671875, -0.3323974609375, -0.3219757080078125, -0.311553955078125, -0.3011322021484375, -0.29071044921875, -0.2802886962890625, -0.269866943359375, -0.2594451904296875, -0.2490234375, -0.2386016845703125, -0.228179931640625, -0.2177581787109375, -0.20733642578125, -0.1969146728515625, -0.186492919921875, -0.1760711669921875, -0.1656494140625, -0.1552276611328125, -0.144805908203125, -0.1343841552734375, -0.12396240234375, -0.1135406494140625, -0.103118896484375, -0.0926971435546875, -0.082275390625, -0.0718536376953125, -0.061431884765625, -0.0510101318359375, -0.04058837890625, -0.0301666259765625, -0.019744873046875, -0.0093231201171875, 0.0010986328125, 0.0115203857421875, 0.021942138671875, 0.0323638916015625, 0.04278564453125, 0.0532073974609375, 0.063629150390625, 0.0740509033203125, 0.08447265625, 0.0948944091796875, 0.105316162109375, 0.1157379150390625, 0.12615966796875, 0.1365814208984375, 0.147003173828125, 0.1574249267578125, 0.1678466796875, 0.1782684326171875, 0.188690185546875, 0.1991119384765625, 0.20953369140625, 0.2199554443359375, 0.230377197265625, 0.2407989501953125, 0.251220703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 14.0, 10.0, 12.0, 22.0, 30.0, 52.0, 58.0, 89.0, 155.0, 212.0, 405.0, 665.0, 1088.0, 2086.0, 4347.0, 10183.0, 28425.0, 98878.0, 531444.0, 2745520.0, 609981.0, 109403.0, 30473.0, 10890.0, 4627.0, 2199.0, 1209.0, 655.0, 409.0, 241.0, 145.0, 120.0, 79.0, 45.0, 31.0, 13.0, 21.0, 15.0, 8.0, 6.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.469970703125, -0.4545783996582031, -0.43918609619140625, -0.4237937927246094, -0.4084014892578125, -0.3930091857910156, -0.37761688232421875, -0.3622245788574219, -0.346832275390625, -0.3314399719238281, -0.31604766845703125, -0.3006553649902344, -0.2852630615234375, -0.2698707580566406, -0.25447845458984375, -0.23908615112304688, -0.22369384765625, -0.20830154418945312, -0.19290924072265625, -0.17751693725585938, -0.1621246337890625, -0.14673233032226562, -0.13134002685546875, -0.11594772338867188, -0.100555419921875, -0.08516311645507812, -0.06977081298828125, -0.054378509521484375, -0.0389862060546875, -0.023593902587890625, -0.00820159912109375, 0.007190704345703125, 0.0225830078125, 0.037975311279296875, 0.05336761474609375, 0.06875991821289062, 0.0841522216796875, 0.09954452514648438, 0.11493682861328125, 0.13032913208007812, 0.145721435546875, 0.16111373901367188, 0.17650604248046875, 0.19189834594726562, 0.2072906494140625, 0.22268295288085938, 0.23807525634765625, 0.2534675598144531, 0.26885986328125, 0.2842521667480469, 0.29964447021484375, 0.3150367736816406, 0.3304290771484375, 0.3458213806152344, 0.36121368408203125, 0.3766059875488281, 0.391998291015625, 0.4073905944824219, 0.42278289794921875, 0.4381752014160156, 0.4535675048828125, 0.4689598083496094, 0.48435211181640625, 0.4997444152832031, 0.51513671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 11.0, 5.0, 9.0, 12.0, 32.0, 32.0, 63.0, 73.0, 64.0, 181.0, 235.0, 365.0, 640.0, 744.0, 563.0, 353.0, 201.0, 145.0, 95.0, 60.0, 51.0, 38.0, 28.0, 11.0, 17.0, 6.0, 11.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.469970703125, -0.4545326232910156, -0.43909454345703125, -0.4236564636230469, -0.4082183837890625, -0.3927803039550781, -0.37734222412109375, -0.3619041442871094, -0.346466064453125, -0.3310279846191406, -0.31558990478515625, -0.3001518249511719, -0.2847137451171875, -0.2692756652832031, -0.25383758544921875, -0.23839950561523438, -0.22296142578125, -0.20752334594726562, -0.19208526611328125, -0.17664718627929688, -0.1612091064453125, -0.14577102661132812, -0.13033294677734375, -0.11489486694335938, -0.099456787109375, -0.08401870727539062, -0.06858062744140625, -0.053142547607421875, -0.0377044677734375, -0.022266387939453125, -0.00682830810546875, 0.008609771728515625, 0.0240478515625, 0.039485931396484375, 0.05492401123046875, 0.07036209106445312, 0.0858001708984375, 0.10123825073242188, 0.11667633056640625, 0.13211441040039062, 0.147552490234375, 0.16299057006835938, 0.17842864990234375, 0.19386672973632812, 0.2093048095703125, 0.22474288940429688, 0.24018096923828125, 0.2556190490722656, 0.27105712890625, 0.2864952087402344, 0.30193328857421875, 0.3173713684082031, 0.3328094482421875, 0.3482475280761719, 0.36368560791015625, 0.3791236877441406, 0.394561767578125, 0.4099998474121094, 0.42543792724609375, 0.4408760070800781, 0.4563140869140625, 0.4717521667480469, 0.48719024658203125, 0.5026283264160156, 0.51806640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 10.0, 42.0, 90.0, 150.0, 208.0, 192.0, 161.0, 67.0, 37.0, 15.0, 11.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2460906505584717, -3.109084367752075, -2.9720780849456787, -2.8350720405578613, -2.698065757751465, -2.5610594749450684, -2.424053192138672, -2.2870469093322754, -2.150040626525879, -2.0130343437194824, -1.8760281801223755, -1.739021897315979, -1.602015733718872, -1.4650094509124756, -1.328003168106079, -1.1909968852996826, -1.0539908409118652, -0.9169846177101135, -0.7799783945083618, -0.6429721117019653, -0.5059658885002136, -0.3689596652984619, -0.23195338249206543, -0.09494715929031372, 0.04205906391143799, 0.1790653020143509, 0.3160715401172638, 0.4530777931213379, 0.5900840163230896, 0.7270902395248413, 0.8640965223312378, 1.0011026859283447, 1.138108730316162, 1.2751150131225586, 1.4121211767196655, 1.549127459526062, 1.686133623123169, 1.8231399059295654, 1.960146188735962, 2.0971524715423584, 2.234158515930176, 2.3711647987365723, 2.5081710815429688, 2.6451773643493652, 2.7821834087371826, 2.919189691543579, 3.0561959743499756, 3.193202257156372, 3.3302085399627686, 3.467214822769165, 3.6042211055755615, 3.741227149963379, 3.8782334327697754, 4.015239715576172, 4.152245998382568, 4.289252281188965, 4.426258563995361, 4.563264846801758, 4.700271129608154, 4.837277412414551, 4.974283695220947, 5.111289978027344, 5.248295783996582, 5.3853020668029785, 5.522308349609375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 9.0, 12.0, 12.0, 15.0, 16.0, 19.0, 20.0, 19.0, 25.0, 22.0, 21.0, 27.0, 27.0, 40.0, 32.0, 41.0, 42.0, 40.0, 44.0, 43.0, 40.0, 26.0, 47.0, 32.0, 44.0, 24.0, 26.0, 37.0, 28.0, 20.0, 17.0, 18.0, 18.0, 19.0, 16.0, 7.0, 10.0, 5.0, 5.0, 8.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0], "bins": [-1.3673205375671387, -1.3295714855194092, -1.2918224334716797, -1.2540735006332397, -1.2163244485855103, -1.1785753965377808, -1.1408263444900513, -1.1030774116516113, -1.0653283596038818, -1.0275793075561523, -0.9898303151130676, -0.9520812630653381, -0.9143322706222534, -0.8765832185745239, -0.8388341665267944, -0.8010851740837097, -0.7633361220359802, -0.7255870699882507, -0.687838077545166, -0.6500890254974365, -0.6123400330543518, -0.5745909810066223, -0.5368419885635376, -0.4990929365158081, -0.461343914270401, -0.4235948920249939, -0.3858458697795868, -0.3480968475341797, -0.3103477954864502, -0.2725988030433655, -0.234849750995636, -0.19710072875022888, -0.15935170650482178, -0.12160268425941467, -0.08385365456342697, -0.04610462486743927, -0.008355602622032166, 0.02939341962337494, 0.06714245676994324, 0.10489147901535034, 0.14264050126075745, 0.18038952350616455, 0.21813854575157166, 0.25588756799697876, 0.29363662004470825, 0.33138561248779297, 0.36913466453552246, 0.40688368678092957, 0.44463270902633667, 0.4823817312717438, 0.5201307535171509, 0.5578798055648804, 0.5956287980079651, 0.6333778500556946, 0.6711268424987793, 0.7088758945465088, 0.7466249465942383, 0.7843739986419678, 0.8221229910850525, 0.859872043132782, 0.8976210355758667, 0.9353700876235962, 0.9731191396713257, 1.0108680725097656, 1.0486171245574951]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 14.0, 27.0, 35.0, 59.0, 89.0, 131.0, 220.0, 354.0, 656.0, 1312.0, 2733.0, 6436.0, 15265.0, 41566.0, 129338.0, 359506.0, 322938.0, 108095.0, 35494.0, 13533.0, 5605.0, 2482.0, 1199.0, 647.0, 301.0, 182.0, 116.0, 67.0, 48.0, 29.0, 20.0, 10.0, 6.0, 7.0, 10.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.479248046875, -0.4620857238769531, -0.44492340087890625, -0.4277610778808594, -0.4105987548828125, -0.3934364318847656, -0.37627410888671875, -0.3591117858886719, -0.341949462890625, -0.3247871398925781, -0.30762481689453125, -0.2904624938964844, -0.2733001708984375, -0.2561378479003906, -0.23897552490234375, -0.22181320190429688, -0.20465087890625, -0.18748855590820312, -0.17032623291015625, -0.15316390991210938, -0.1360015869140625, -0.11883926391601562, -0.10167694091796875, -0.08451461791992188, -0.067352294921875, -0.050189971923828125, -0.03302764892578125, -0.015865325927734375, 0.0012969970703125, 0.018459320068359375, 0.03562164306640625, 0.052783966064453125, 0.0699462890625, 0.08710861206054688, 0.10427093505859375, 0.12143325805664062, 0.1385955810546875, 0.15575790405273438, 0.17292022705078125, 0.19008255004882812, 0.207244873046875, 0.22440719604492188, 0.24156951904296875, 0.2587318420410156, 0.2758941650390625, 0.2930564880371094, 0.31021881103515625, 0.3273811340332031, 0.34454345703125, 0.3617057800292969, 0.37886810302734375, 0.3960304260253906, 0.4131927490234375, 0.4303550720214844, 0.44751739501953125, 0.4646797180175781, 0.481842041015625, 0.4990043640136719, 0.5161666870117188, 0.5333290100097656, 0.5504913330078125, 0.5676536560058594, 0.5848159790039062, 0.6019783020019531, 0.619140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 14.0, 20.0, 25.0, 18.0, 24.0, 45.0, 36.0, 44.0, 59.0, 57.0, 51.0, 45.0, 61.0, 76.0, 60.0, 71.0, 63.0, 55.0, 23.0, 33.0, 29.0, 18.0, 17.0, 15.0, 10.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421142578125, -0.4107170104980469, -0.40029144287109375, -0.3898658752441406, -0.3794403076171875, -0.3690147399902344, -0.35858917236328125, -0.3481636047363281, -0.337738037109375, -0.3273124694824219, -0.31688690185546875, -0.3064613342285156, -0.2960357666015625, -0.2856101989746094, -0.27518463134765625, -0.2647590637207031, -0.25433349609375, -0.24390792846679688, -0.23348236083984375, -0.22305679321289062, -0.2126312255859375, -0.20220565795898438, -0.19178009033203125, -0.18135452270507812, -0.170928955078125, -0.16050338745117188, -0.15007781982421875, -0.13965225219726562, -0.1292266845703125, -0.11880111694335938, -0.10837554931640625, -0.09794998168945312, -0.0875244140625, -0.07709884643554688, -0.06667327880859375, -0.056247711181640625, -0.0458221435546875, -0.035396575927734375, -0.02497100830078125, -0.014545440673828125, -0.004119873046875, 0.006305694580078125, 0.01673126220703125, 0.027156829833984375, 0.0375823974609375, 0.048007965087890625, 0.05843353271484375, 0.06885910034179688, 0.07928466796875, 0.08971023559570312, 0.10013580322265625, 0.11056137084960938, 0.1209869384765625, 0.13141250610351562, 0.14183807373046875, 0.15226364135742188, 0.162689208984375, 0.17311477661132812, 0.18354034423828125, 0.19396591186523438, 0.2043914794921875, 0.21481704711914062, 0.22524261474609375, 0.23566818237304688, 0.24609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 15.0, 19.0, 37.0, 42.0, 62.0, 102.0, 189.0, 326.0, 475.0, 825.0, 1496.0, 2803.0, 5868.0, 13002.0, 31791.0, 90264.0, 295600.0, 393608.0, 135126.0, 44074.0, 17270.0, 7371.0, 3715.0, 1900.0, 1001.0, 575.0, 381.0, 227.0, 135.0, 87.0, 43.0, 22.0, 25.0, 15.0, 19.0, 7.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5398101806640625, -0.522491455078125, -0.5051727294921875, -0.48785400390625, -0.4705352783203125, -0.453216552734375, -0.4358978271484375, -0.4185791015625, -0.4012603759765625, -0.383941650390625, -0.3666229248046875, -0.34930419921875, -0.3319854736328125, -0.314666748046875, -0.2973480224609375, -0.280029296875, -0.2627105712890625, -0.245391845703125, -0.2280731201171875, -0.21075439453125, -0.1934356689453125, -0.176116943359375, -0.1587982177734375, -0.1414794921875, -0.1241607666015625, -0.106842041015625, -0.0895233154296875, -0.07220458984375, -0.0548858642578125, -0.037567138671875, -0.0202484130859375, -0.0029296875, 0.0143890380859375, 0.031707763671875, 0.0490264892578125, 0.06634521484375, 0.0836639404296875, 0.100982666015625, 0.1183013916015625, 0.1356201171875, 0.1529388427734375, 0.170257568359375, 0.1875762939453125, 0.20489501953125, 0.2222137451171875, 0.239532470703125, 0.2568511962890625, 0.274169921875, 0.2914886474609375, 0.308807373046875, 0.3261260986328125, 0.34344482421875, 0.3607635498046875, 0.378082275390625, 0.3954010009765625, 0.4127197265625, 0.4300384521484375, 0.447357177734375, 0.4646759033203125, 0.48199462890625, 0.4993133544921875, 0.516632080078125, 0.5339508056640625, 0.55126953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 13.0, 21.0, 11.0, 25.0, 22.0, 26.0, 22.0, 50.0, 29.0, 41.0, 40.0, 54.0, 43.0, 48.0, 50.0, 49.0, 52.0, 49.0, 56.0, 41.0, 34.0, 30.0, 24.0, 22.0, 16.0, 16.0, 18.0, 11.0, 20.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.888671875, -0.863861083984375, -0.83905029296875, -0.814239501953125, -0.7894287109375, -0.764617919921875, -0.73980712890625, -0.714996337890625, -0.690185546875, -0.665374755859375, -0.64056396484375, -0.615753173828125, -0.5909423828125, -0.566131591796875, -0.54132080078125, -0.516510009765625, -0.49169921875, -0.466888427734375, -0.44207763671875, -0.417266845703125, -0.3924560546875, -0.367645263671875, -0.34283447265625, -0.318023681640625, -0.293212890625, -0.268402099609375, -0.24359130859375, -0.218780517578125, -0.1939697265625, -0.169158935546875, -0.14434814453125, -0.119537353515625, -0.0947265625, -0.069915771484375, -0.04510498046875, -0.020294189453125, 0.0045166015625, 0.029327392578125, 0.05413818359375, 0.078948974609375, 0.103759765625, 0.128570556640625, 0.15338134765625, 0.178192138671875, 0.2030029296875, 0.227813720703125, 0.25262451171875, 0.277435302734375, 0.30224609375, 0.327056884765625, 0.35186767578125, 0.376678466796875, 0.4014892578125, 0.426300048828125, 0.45111083984375, 0.475921630859375, 0.500732421875, 0.525543212890625, 0.55035400390625, 0.575164794921875, 0.5999755859375, 0.624786376953125, 0.64959716796875, 0.674407958984375, 0.69921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 9.0, 9.0, 13.0, 20.0, 28.0, 51.0, 56.0, 94.0, 161.0, 252.0, 390.0, 656.0, 1094.0, 1790.0, 3229.0, 6254.0, 12934.0, 30210.0, 82400.0, 242747.0, 382656.0, 178379.0, 59868.0, 23177.0, 10175.0, 5059.0, 2769.0, 1578.0, 895.0, 569.0, 347.0, 227.0, 161.0, 87.0, 67.0, 45.0, 26.0, 22.0, 12.0, 12.0, 2.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1943359375, -0.18867874145507812, -0.18302154541015625, -0.17736434936523438, -0.1717071533203125, -0.16604995727539062, -0.16039276123046875, -0.15473556518554688, -0.149078369140625, -0.14342117309570312, -0.13776397705078125, -0.13210678100585938, -0.1264495849609375, -0.12079238891601562, -0.11513519287109375, -0.10947799682617188, -0.10382080078125, -0.09816360473632812, -0.09250640869140625, -0.08684921264648438, -0.0811920166015625, -0.07553482055664062, -0.06987762451171875, -0.06422042846679688, -0.058563232421875, -0.052906036376953125, -0.04724884033203125, -0.041591644287109375, -0.0359344482421875, -0.030277252197265625, -0.02462005615234375, -0.018962860107421875, -0.0133056640625, -0.007648468017578125, -0.00199127197265625, 0.003665924072265625, 0.0093231201171875, 0.014980316162109375, 0.02063751220703125, 0.026294708251953125, 0.031951904296875, 0.037609100341796875, 0.04326629638671875, 0.048923492431640625, 0.0545806884765625, 0.060237884521484375, 0.06589508056640625, 0.07155227661132812, 0.07720947265625, 0.08286666870117188, 0.08852386474609375, 0.09418106079101562, 0.0998382568359375, 0.10549545288085938, 0.11115264892578125, 0.11680984497070312, 0.122467041015625, 0.12812423706054688, 0.13378143310546875, 0.13943862915039062, 0.1450958251953125, 0.15075302124023438, 0.15641021728515625, 0.16206741333007812, 0.167724609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 4.0, 6.0, 6.0, 9.0, 20.0, 25.0, 48.0, 59.0, 105.0, 168.0, 184.0, 126.0, 81.0, 52.0, 23.0, 19.0, 15.0, 6.0, 9.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.499622344970703e-05, -8.265301585197449e-05, -8.030980825424194e-05, -7.79666006565094e-05, -7.562339305877686e-05, -7.328018546104431e-05, -7.093697786331177e-05, -6.859377026557922e-05, -6.625056266784668e-05, -6.390735507011414e-05, -6.156414747238159e-05, -5.922093987464905e-05, -5.6877732276916504e-05, -5.453452467918396e-05, -5.2191317081451416e-05, -4.984810948371887e-05, -4.750490188598633e-05, -4.5161694288253784e-05, -4.281848669052124e-05, -4.0475279092788696e-05, -3.813207149505615e-05, -3.578886389732361e-05, -3.3445656299591064e-05, -3.110244870185852e-05, -2.8759241104125977e-05, -2.6416033506393433e-05, -2.407282590866089e-05, -2.1729618310928345e-05, -1.93864107131958e-05, -1.7043203115463257e-05, -1.4699995517730713e-05, -1.2356787919998169e-05, -1.0013580322265625e-05, -7.670372724533081e-06, -5.327165126800537e-06, -2.983957529067993e-06, -6.407499313354492e-07, 1.7024576663970947e-06, 4.045665264129639e-06, 6.388872861862183e-06, 8.732080459594727e-06, 1.107528805732727e-05, 1.3418495655059814e-05, 1.576170325279236e-05, 1.8104910850524902e-05, 2.0448118448257446e-05, 2.279132604598999e-05, 2.5134533643722534e-05, 2.7477741241455078e-05, 2.9820948839187622e-05, 3.2164156436920166e-05, 3.450736403465271e-05, 3.6850571632385254e-05, 3.91937792301178e-05, 4.153698682785034e-05, 4.3880194425582886e-05, 4.622340202331543e-05, 4.8566609621047974e-05, 5.090981721878052e-05, 5.325302481651306e-05, 5.5596232414245605e-05, 5.793944001197815e-05, 6.028264760971069e-05, 6.262585520744324e-05, 6.496906280517578e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 10.0, 10.0, 7.0, 30.0, 46.0, 41.0, 87.0, 205.0, 347.0, 769.0, 1503.0, 3488.0, 8775.0, 25547.0, 84296.0, 283816.0, 410054.0, 159184.0, 45468.0, 14731.0, 5634.0, 2298.0, 1048.0, 546.0, 241.0, 151.0, 88.0, 42.0, 36.0, 21.0, 11.0, 8.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218994140625, -0.21198654174804688, -0.20497894287109375, -0.19797134399414062, -0.1909637451171875, -0.18395614624023438, -0.17694854736328125, -0.16994094848632812, -0.162933349609375, -0.15592575073242188, -0.14891815185546875, -0.14191055297851562, -0.1349029541015625, -0.12789535522460938, -0.12088775634765625, -0.11388015747070312, -0.10687255859375, -0.09986495971679688, -0.09285736083984375, -0.08584976196289062, -0.0788421630859375, -0.07183456420898438, -0.06482696533203125, -0.057819366455078125, -0.050811767578125, -0.043804168701171875, -0.03679656982421875, -0.029788970947265625, -0.0227813720703125, -0.015773773193359375, -0.00876617431640625, -0.001758575439453125, 0.0052490234375, 0.012256622314453125, 0.01926422119140625, 0.026271820068359375, 0.0332794189453125, 0.040287017822265625, 0.04729461669921875, 0.054302215576171875, 0.061309814453125, 0.06831741333007812, 0.07532501220703125, 0.08233261108398438, 0.0893402099609375, 0.09634780883789062, 0.10335540771484375, 0.11036300659179688, 0.11737060546875, 0.12437820434570312, 0.13138580322265625, 0.13839340209960938, 0.1454010009765625, 0.15240859985351562, 0.15941619873046875, 0.16642379760742188, 0.173431396484375, 0.18043899536132812, 0.18744659423828125, 0.19445419311523438, 0.2014617919921875, 0.20846939086914062, 0.21547698974609375, 0.22248458862304688, 0.2294921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 10.0, 11.0, 9.0, 16.0, 16.0, 17.0, 19.0, 30.0, 34.0, 38.0, 39.0, 60.0, 51.0, 78.0, 54.0, 75.0, 54.0, 57.0, 53.0, 40.0, 28.0, 29.0, 31.0, 24.0, 26.0, 13.0, 14.0, 8.0, 6.0, 6.0, 4.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 7.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.16778945922851562, -0.16236114501953125, -0.15693283081054688, -0.1515045166015625, -0.14607620239257812, -0.14064788818359375, -0.13521957397460938, -0.129791259765625, -0.12436294555664062, -0.11893463134765625, -0.11350631713867188, -0.1080780029296875, -0.10264968872070312, -0.09722137451171875, -0.09179306030273438, -0.08636474609375, -0.08093643188476562, -0.07550811767578125, -0.07007980346679688, -0.0646514892578125, -0.059223175048828125, -0.05379486083984375, -0.048366546630859375, -0.042938232421875, -0.037509918212890625, -0.03208160400390625, -0.026653289794921875, -0.0212249755859375, -0.015796661376953125, -0.01036834716796875, -0.004940032958984375, 0.00048828125, 0.005916595458984375, 0.01134490966796875, 0.016773223876953125, 0.0222015380859375, 0.027629852294921875, 0.03305816650390625, 0.038486480712890625, 0.043914794921875, 0.049343109130859375, 0.05477142333984375, 0.060199737548828125, 0.0656280517578125, 0.07105636596679688, 0.07648468017578125, 0.08191299438476562, 0.08734130859375, 0.09276962280273438, 0.09819793701171875, 0.10362625122070312, 0.1090545654296875, 0.11448287963867188, 0.11991119384765625, 0.12533950805664062, 0.130767822265625, 0.13619613647460938, 0.14162445068359375, 0.14705276489257812, 0.1524810791015625, 0.15790939331054688, 0.16333770751953125, 0.16876602172851562, 0.1741943359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 10.0, 11.0, 11.0, 29.0, 32.0, 76.0, 120.0, 140.0, 154.0, 121.0, 107.0, 59.0, 56.0, 37.0, 13.0, 14.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.112490177154541, -2.0139505863189697, -1.9154109954833984, -1.8168714046478271, -1.7183319330215454, -1.6197923421859741, -1.5212527513504028, -1.422713279724121, -1.3241736888885498, -1.2256340980529785, -1.1270945072174072, -1.028554916381836, -0.9300154447555542, -0.8314758539199829, -0.7329362630844116, -0.6343967318534851, -0.535857081413269, -0.43731752038002014, -0.33877795934677124, -0.24023836851119995, -0.14169880747795105, -0.04315924644470215, 0.05538034439086914, 0.15391987562179565, 0.25245946645736694, 0.35099902749061584, 0.44953858852386475, 0.548078179359436, 0.6466177701950073, 0.7451573014259338, 0.8436968922615051, 0.9422364234924316, 1.040776014328003, 1.1393156051635742, 1.2378551959991455, 1.3363947868347168, 1.4349342584609985, 1.5334738492965698, 1.6320134401321411, 1.7305529117584229, 1.8290925025939941, 1.9276320934295654, 2.0261716842651367, 2.124711275100708, 2.2232508659362793, 2.3217902183532715, 2.420330047607422, 2.518869400024414, 2.6174092292785645, 2.7159488201141357, 2.814488410949707, 2.9130280017852783, 3.0115675926208496, 3.110106945037842, 3.208646774291992, 3.3071861267089844, 3.4057257175445557, 3.504265308380127, 3.6028048992156982, 3.7013444900512695, 3.799884080886841, 3.898423671722412, 3.9969630241394043, 4.095502853393555, 4.194042205810547]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 6.0, 7.0, 13.0, 11.0, 11.0, 15.0, 21.0, 35.0, 46.0, 39.0, 34.0, 45.0, 42.0, 41.0, 49.0, 44.0, 48.0, 46.0, 42.0, 57.0, 44.0, 41.0, 32.0, 32.0, 41.0, 23.0, 20.0, 30.0, 16.0, 14.0, 14.0, 16.0, 13.0, 5.0, 4.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.191250801086426, -2.1201508045196533, -2.049050807952881, -1.977950930595398, -1.906851053237915, -1.8357510566711426, -1.7646510601043701, -1.6935510635375977, -1.6224511861801147, -1.5513511896133423, -1.4802513122558594, -1.409151315689087, -1.3380513191223145, -1.2669514417648315, -1.195851445198059, -1.1247515678405762, -1.0536515712738037, -0.982551634311676, -0.9114516973495483, -0.8403517007827759, -0.7692517638206482, -0.6981518268585205, -0.627051830291748, -0.5559518933296204, -0.4848519563674927, -0.413752019405365, -0.3426520526409149, -0.27155208587646484, -0.20045214891433716, -0.12935221195220947, -0.0582522451877594, 0.012847721576690674, 0.08394765853881836, 0.15504761040210724, 0.22614756226539612, 0.2972475290298462, 0.3683474659919739, 0.43944740295410156, 0.510547399520874, 0.5816473364830017, 0.6527472734451294, 0.7238472104072571, 0.7949471473693848, 0.8660471439361572, 0.9371470808982849, 1.0082470178604126, 1.079347014427185, 1.150446891784668, 1.2215468883514404, 1.292646884918213, 1.3637467622756958, 1.4348467588424683, 1.5059466361999512, 1.5770466327667236, 1.648146629333496, 1.7192466259002686, 1.7903465032577515, 1.861446499824524, 1.9325463771820068, 2.0036463737487793, 2.0747463703155518, 2.145846366882324, 2.2169461250305176, 2.28804612159729, 2.3591461181640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 16.0, 18.0, 38.0, 69.0, 84.0, 125.0, 211.0, 310.0, 619.0, 1297.0, 2484.0, 4867.0, 10752.0, 27712.0, 96833.0, 470108.0, 1920885.0, 1310901.0, 253241.0, 58726.0, 19500.0, 7818.0, 3594.0, 1836.0, 917.0, 478.0, 292.0, 181.0, 118.0, 83.0, 52.0, 34.0, 22.0, 10.0, 10.0, 5.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.455322265625, -0.44295501708984375, -0.4305877685546875, -0.41822052001953125, -0.405853271484375, -0.39348602294921875, -0.3811187744140625, -0.36875152587890625, -0.35638427734375, -0.34401702880859375, -0.3316497802734375, -0.31928253173828125, -0.306915283203125, -0.29454803466796875, -0.2821807861328125, -0.26981353759765625, -0.2574462890625, -0.24507904052734375, -0.2327117919921875, -0.22034454345703125, -0.207977294921875, -0.19561004638671875, -0.1832427978515625, -0.17087554931640625, -0.15850830078125, -0.14614105224609375, -0.1337738037109375, -0.12140655517578125, -0.109039306640625, -0.09667205810546875, -0.0843048095703125, -0.07193756103515625, -0.0595703125, -0.04720306396484375, -0.0348358154296875, -0.02246856689453125, -0.010101318359375, 0.00226593017578125, 0.0146331787109375, 0.02700042724609375, 0.03936767578125, 0.05173492431640625, 0.0641021728515625, 0.07646942138671875, 0.088836669921875, 0.10120391845703125, 0.1135711669921875, 0.12593841552734375, 0.1383056640625, 0.15067291259765625, 0.1630401611328125, 0.17540740966796875, 0.187774658203125, 0.20014190673828125, 0.2125091552734375, 0.22487640380859375, 0.23724365234375, 0.24961090087890625, 0.2619781494140625, 0.27434539794921875, 0.286712646484375, 0.29907989501953125, 0.3114471435546875, 0.32381439208984375, 0.336181640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 7.0, 5.0, 10.0, 7.0, 8.0, 12.0, 13.0, 20.0, 37.0, 41.0, 43.0, 39.0, 55.0, 56.0, 64.0, 64.0, 62.0, 40.0, 41.0, 56.0, 47.0, 42.0, 45.0, 43.0, 33.0, 27.0, 19.0, 15.0, 18.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.400634765625, -0.39029693603515625, -0.3799591064453125, -0.36962127685546875, -0.359283447265625, -0.34894561767578125, -0.3386077880859375, -0.32826995849609375, -0.31793212890625, -0.30759429931640625, -0.2972564697265625, -0.28691864013671875, -0.276580810546875, -0.26624298095703125, -0.2559051513671875, -0.24556732177734375, -0.2352294921875, -0.22489166259765625, -0.2145538330078125, -0.20421600341796875, -0.193878173828125, -0.18354034423828125, -0.1732025146484375, -0.16286468505859375, -0.15252685546875, -0.14218902587890625, -0.1318511962890625, -0.12151336669921875, -0.111175537109375, -0.10083770751953125, -0.0904998779296875, -0.08016204833984375, -0.06982421875, -0.05948638916015625, -0.0491485595703125, -0.03881072998046875, -0.028472900390625, -0.01813507080078125, -0.0077972412109375, 0.00254058837890625, 0.01287841796875, 0.02321624755859375, 0.0335540771484375, 0.04389190673828125, 0.054229736328125, 0.06456756591796875, 0.0749053955078125, 0.08524322509765625, 0.0955810546875, 0.10591888427734375, 0.1162567138671875, 0.12659454345703125, 0.136932373046875, 0.14727020263671875, 0.1576080322265625, 0.16794586181640625, 0.17828369140625, 0.18862152099609375, 0.1989593505859375, 0.20929718017578125, 0.219635009765625, 0.22997283935546875, 0.2403106689453125, 0.25064849853515625, 0.260986328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 11.0, 13.0, 11.0, 27.0, 31.0, 49.0, 75.0, 111.0, 193.0, 316.0, 534.0, 967.0, 1889.0, 4139.0, 11187.0, 40661.0, 233104.0, 2540313.0, 1199167.0, 121791.0, 25281.0, 7798.0, 3252.0, 1493.0, 752.0, 401.0, 255.0, 145.0, 117.0, 63.0, 40.0, 21.0, 14.0, 10.0, 10.0, 6.0, 6.0, 5.0, 10.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6025390625, -0.5816421508789062, -0.5607452392578125, -0.5398483276367188, -0.518951416015625, -0.49805450439453125, -0.4771575927734375, -0.45626068115234375, -0.43536376953125, -0.41446685791015625, -0.3935699462890625, -0.37267303466796875, -0.351776123046875, -0.33087921142578125, -0.3099822998046875, -0.28908538818359375, -0.2681884765625, -0.24729156494140625, -0.2263946533203125, -0.20549774169921875, -0.184600830078125, -0.16370391845703125, -0.1428070068359375, -0.12191009521484375, -0.10101318359375, -0.08011627197265625, -0.0592193603515625, -0.03832244873046875, -0.017425537109375, 0.00347137451171875, 0.0243682861328125, 0.04526519775390625, 0.066162109375, 0.08705902099609375, 0.1079559326171875, 0.12885284423828125, 0.149749755859375, 0.17064666748046875, 0.1915435791015625, 0.21244049072265625, 0.23333740234375, 0.25423431396484375, 0.2751312255859375, 0.29602813720703125, 0.316925048828125, 0.33782196044921875, 0.3587188720703125, 0.37961578369140625, 0.4005126953125, 0.42140960693359375, 0.4423065185546875, 0.46320343017578125, 0.484100341796875, 0.5049972534179688, 0.5258941650390625, 0.5467910766601562, 0.56768798828125, 0.5885848999023438, 0.6094818115234375, 0.6303787231445312, 0.651275634765625, 0.6721725463867188, 0.6930694580078125, 0.7139663696289062, 0.73486328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 5.0, 8.0, 15.0, 10.0, 33.0, 37.0, 65.0, 76.0, 120.0, 202.0, 313.0, 544.0, 773.0, 719.0, 434.0, 261.0, 150.0, 78.0, 72.0, 50.0, 36.0, 23.0, 12.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5416107177734375, -0.522186279296875, -0.5027618408203125, -0.48333740234375, -0.4639129638671875, -0.444488525390625, -0.4250640869140625, -0.4056396484375, -0.3862152099609375, -0.366790771484375, -0.3473663330078125, -0.32794189453125, -0.3085174560546875, -0.289093017578125, -0.2696685791015625, -0.250244140625, -0.2308197021484375, -0.211395263671875, -0.1919708251953125, -0.17254638671875, -0.1531219482421875, -0.133697509765625, -0.1142730712890625, -0.0948486328125, -0.0754241943359375, -0.055999755859375, -0.0365753173828125, -0.01715087890625, 0.0022735595703125, 0.021697998046875, 0.0411224365234375, 0.060546875, 0.0799713134765625, 0.099395751953125, 0.1188201904296875, 0.13824462890625, 0.1576690673828125, 0.177093505859375, 0.1965179443359375, 0.2159423828125, 0.2353668212890625, 0.254791259765625, 0.2742156982421875, 0.29364013671875, 0.3130645751953125, 0.332489013671875, 0.3519134521484375, 0.371337890625, 0.3907623291015625, 0.410186767578125, 0.4296112060546875, 0.44903564453125, 0.4684600830078125, 0.487884521484375, 0.5073089599609375, 0.5267333984375, 0.5461578369140625, 0.565582275390625, 0.5850067138671875, 0.60443115234375, 0.6238555908203125, 0.643280029296875, 0.6627044677734375, 0.68212890625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 20.0, 22.0, 21.0, 52.0, 88.0, 114.0, 118.0, 138.0, 141.0, 107.0, 59.0, 42.0, 30.0, 14.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1194229125976562, -3.013315200805664, -2.907207489013672, -2.8010995388031006, -2.6949918270111084, -2.588884115219116, -2.482776165008545, -2.3766684532165527, -2.2705607414245605, -2.1644530296325684, -2.058345317840576, -1.9522373676300049, -1.8461296558380127, -1.7400219440460205, -1.6339141130447388, -1.527806282043457, -1.4216985702514648, -1.3155908584594727, -1.209483027458191, -1.1033751964569092, -0.997267484664917, -0.89115971326828, -0.7850519418716431, -0.6789441704750061, -0.5728363990783691, -0.4667286276817322, -0.3606208562850952, -0.25451308488845825, -0.1484053134918213, -0.042297542095184326, 0.06381022930145264, 0.1699180006980896, 0.27602577209472656, 0.3821335434913635, 0.4882413148880005, 0.5943490862846375, 0.7004568576812744, 0.8065646290779114, 0.9126724004745483, 1.01878023147583, 1.1248879432678223, 1.2309956550598145, 1.3371034860610962, 1.443211317062378, 1.5493190288543701, 1.6554267406463623, 1.761534571647644, 1.8676424026489258, 1.973750114440918, 2.07985782623291, 2.1859655380249023, 2.2920734882354736, 2.398181200027466, 2.504288911819458, 2.6103968620300293, 2.7165045738220215, 2.8226122856140137, 2.928719997406006, 3.034827709197998, 3.1409356594085693, 3.2470433712005615, 3.3531510829925537, 3.459259033203125, 3.565366744995117, 3.6714744567871094]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 8.0, 5.0, 8.0, 14.0, 10.0, 10.0, 13.0, 18.0, 14.0, 23.0, 21.0, 24.0, 33.0, 28.0, 28.0, 32.0, 30.0, 36.0, 31.0, 35.0, 36.0, 36.0, 44.0, 45.0, 42.0, 34.0, 43.0, 21.0, 32.0, 25.0, 23.0, 28.0, 16.0, 19.0, 20.0, 14.0, 14.0, 10.0, 12.0, 10.0, 11.0, 5.0, 11.0, 5.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.265763282775879, -1.219376802444458, -1.1729902029037476, -1.1266037225723267, -1.0802171230316162, -1.0338306427001953, -0.9874441623687744, -0.9410576224327087, -0.8946710824966431, -0.8482845425605774, -0.8018980026245117, -0.7555115222930908, -0.7091249823570251, -0.6627384424209595, -0.6163519620895386, -0.5699654221534729, -0.5235788822174072, -0.47719234228134155, -0.43080583214759827, -0.384419322013855, -0.3380327820777893, -0.29164624214172363, -0.24525973200798035, -0.19887322187423706, -0.1524866819381714, -0.1061001569032669, -0.05971363186836243, -0.013327106833457947, 0.03305941820144653, 0.07944594323635101, 0.1258324682712555, 0.17221897840499878, 0.21860551834106445, 0.2649920582771301, 0.3113785684108734, 0.3577650785446167, 0.4041516184806824, 0.45053815841674805, 0.49692466855049133, 0.5433111786842346, 0.5896977186203003, 0.636084258556366, 0.6824707984924316, 0.7288572788238525, 0.7752438187599182, 0.8216303586959839, 0.8680168390274048, 0.9144033789634705, 0.9607899188995361, 1.007176399230957, 1.0535629987716675, 1.0999494791030884, 1.1463360786437988, 1.1927225589752197, 1.2391090393066406, 1.2854955196380615, 1.331882119178772, 1.3782685995101929, 1.4246551990509033, 1.4710416793823242, 1.5174281597137451, 1.5638147592544556, 1.6102012395858765, 1.656587839126587, 1.7029743194580078]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 10.0, 28.0, 26.0, 48.0, 87.0, 157.0, 258.0, 557.0, 948.0, 1891.0, 3918.0, 8209.0, 18327.0, 46886.0, 143545.0, 349539.0, 301123.0, 108063.0, 36575.0, 14911.0, 6620.0, 3302.0, 1648.0, 866.0, 432.0, 255.0, 124.0, 87.0, 49.0, 30.0, 11.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59033203125, -0.5712127685546875, -0.552093505859375, -0.5329742431640625, -0.51385498046875, -0.4947357177734375, -0.475616455078125, -0.4564971923828125, -0.4373779296875, -0.4182586669921875, -0.399139404296875, -0.3800201416015625, -0.36090087890625, -0.3417816162109375, -0.322662353515625, -0.3035430908203125, -0.284423828125, -0.2653045654296875, -0.246185302734375, -0.2270660400390625, -0.20794677734375, -0.1888275146484375, -0.169708251953125, -0.1505889892578125, -0.1314697265625, -0.1123504638671875, -0.093231201171875, -0.0741119384765625, -0.05499267578125, -0.0358734130859375, -0.016754150390625, 0.0023651123046875, 0.021484375, 0.0406036376953125, 0.059722900390625, 0.0788421630859375, 0.09796142578125, 0.1170806884765625, 0.136199951171875, 0.1553192138671875, 0.1744384765625, 0.1935577392578125, 0.212677001953125, 0.2317962646484375, 0.25091552734375, 0.2700347900390625, 0.289154052734375, 0.3082733154296875, 0.327392578125, 0.3465118408203125, 0.365631103515625, 0.3847503662109375, 0.40386962890625, 0.4229888916015625, 0.442108154296875, 0.4612274169921875, 0.4803466796875, 0.4994659423828125, 0.518585205078125, 0.5377044677734375, 0.55682373046875, 0.5759429931640625, 0.595062255859375, 0.6141815185546875, 0.63330078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 10.0, 10.0, 7.0, 12.0, 16.0, 19.0, 30.0, 36.0, 38.0, 58.0, 52.0, 51.0, 64.0, 61.0, 46.0, 60.0, 63.0, 54.0, 54.0, 48.0, 41.0, 44.0, 27.0, 21.0, 15.0, 14.0, 13.0, 19.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3671875, -0.35601806640625, -0.3448486328125, -0.33367919921875, -0.322509765625, -0.31134033203125, -0.3001708984375, -0.28900146484375, -0.27783203125, -0.26666259765625, -0.2554931640625, -0.24432373046875, -0.233154296875, -0.22198486328125, -0.2108154296875, -0.19964599609375, -0.1884765625, -0.17730712890625, -0.1661376953125, -0.15496826171875, -0.143798828125, -0.13262939453125, -0.1214599609375, -0.11029052734375, -0.09912109375, -0.08795166015625, -0.0767822265625, -0.06561279296875, -0.054443359375, -0.04327392578125, -0.0321044921875, -0.02093505859375, -0.009765625, 0.00140380859375, 0.0125732421875, 0.02374267578125, 0.034912109375, 0.04608154296875, 0.0572509765625, 0.06842041015625, 0.07958984375, 0.09075927734375, 0.1019287109375, 0.11309814453125, 0.124267578125, 0.13543701171875, 0.1466064453125, 0.15777587890625, 0.1689453125, 0.18011474609375, 0.1912841796875, 0.20245361328125, 0.213623046875, 0.22479248046875, 0.2359619140625, 0.24713134765625, 0.25830078125, 0.26947021484375, 0.2806396484375, 0.29180908203125, 0.302978515625, 0.31414794921875, 0.3253173828125, 0.33648681640625, 0.34765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 7.0, 1.0, 11.0, 15.0, 23.0, 27.0, 37.0, 46.0, 82.0, 116.0, 179.0, 304.0, 554.0, 991.0, 2146.0, 4746.0, 10988.0, 28398.0, 83124.0, 295072.0, 416215.0, 135123.0, 42233.0, 15630.0, 6349.0, 2953.0, 1387.0, 697.0, 398.0, 239.0, 158.0, 86.0, 52.0, 48.0, 34.0, 29.0, 12.0, 16.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7470703125, -0.7231216430664062, -0.6991729736328125, -0.6752243041992188, -0.651275634765625, -0.6273269653320312, -0.6033782958984375, -0.5794296264648438, -0.55548095703125, -0.5315322875976562, -0.5075836181640625, -0.48363494873046875, -0.459686279296875, -0.43573760986328125, -0.4117889404296875, -0.38784027099609375, -0.3638916015625, -0.33994293212890625, -0.3159942626953125, -0.29204559326171875, -0.268096923828125, -0.24414825439453125, -0.2201995849609375, -0.19625091552734375, -0.17230224609375, -0.14835357666015625, -0.1244049072265625, -0.10045623779296875, -0.076507568359375, -0.05255889892578125, -0.0286102294921875, -0.00466156005859375, 0.019287109375, 0.04323577880859375, 0.0671844482421875, 0.09113311767578125, 0.115081787109375, 0.13903045654296875, 0.1629791259765625, 0.18692779541015625, 0.21087646484375, 0.23482513427734375, 0.2587738037109375, 0.28272247314453125, 0.306671142578125, 0.33061981201171875, 0.3545684814453125, 0.37851715087890625, 0.4024658203125, 0.42641448974609375, 0.4503631591796875, 0.47431182861328125, 0.498260498046875, 0.5222091674804688, 0.5461578369140625, 0.5701065063476562, 0.59405517578125, 0.6180038452148438, 0.6419525146484375, 0.6659011840820312, 0.689849853515625, 0.7137985229492188, 0.7377471923828125, 0.7616958618164062, 0.78564453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 11.0, 12.0, 10.0, 9.0, 21.0, 21.0, 24.0, 37.0, 28.0, 27.0, 34.0, 44.0, 56.0, 57.0, 55.0, 36.0, 49.0, 38.0, 47.0, 44.0, 44.0, 34.0, 38.0, 31.0, 25.0, 37.0, 19.0, 23.0, 20.0, 14.0, 13.0, 7.0, 9.0, 4.0, 7.0, 2.0, 2.0, 1.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9228515625, -0.8945770263671875, -0.866302490234375, -0.8380279541015625, -0.80975341796875, -0.7814788818359375, -0.753204345703125, -0.7249298095703125, -0.6966552734375, -0.6683807373046875, -0.640106201171875, -0.6118316650390625, -0.58355712890625, -0.5552825927734375, -0.527008056640625, -0.4987335205078125, -0.470458984375, -0.4421844482421875, -0.413909912109375, -0.3856353759765625, -0.35736083984375, -0.3290863037109375, -0.300811767578125, -0.2725372314453125, -0.2442626953125, -0.2159881591796875, -0.187713623046875, -0.1594390869140625, -0.13116455078125, -0.1028900146484375, -0.074615478515625, -0.0463409423828125, -0.01806640625, 0.0102081298828125, 0.038482666015625, 0.0667572021484375, 0.09503173828125, 0.1233062744140625, 0.151580810546875, 0.1798553466796875, 0.2081298828125, 0.2364044189453125, 0.264678955078125, 0.2929534912109375, 0.32122802734375, 0.3495025634765625, 0.377777099609375, 0.4060516357421875, 0.434326171875, 0.4626007080078125, 0.490875244140625, 0.5191497802734375, 0.54742431640625, 0.5756988525390625, 0.603973388671875, 0.6322479248046875, 0.6605224609375, 0.6887969970703125, 0.717071533203125, 0.7453460693359375, 0.77362060546875, 0.8018951416015625, 0.830169677734375, 0.8584442138671875, 0.88671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 7.0, 8.0, 11.0, 19.0, 21.0, 42.0, 34.0, 77.0, 113.0, 211.0, 352.0, 596.0, 1018.0, 1871.0, 3343.0, 6043.0, 11691.0, 23216.0, 51671.0, 132738.0, 304296.0, 292080.0, 123882.0, 48876.0, 22111.0, 11153.0, 5752.0, 3140.0, 1739.0, 948.0, 587.0, 344.0, 180.0, 126.0, 95.0, 57.0, 36.0, 20.0, 14.0, 12.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.192138671875, -0.186309814453125, -0.18048095703125, -0.174652099609375, -0.1688232421875, -0.162994384765625, -0.15716552734375, -0.151336669921875, -0.1455078125, -0.139678955078125, -0.13385009765625, -0.128021240234375, -0.1221923828125, -0.116363525390625, -0.11053466796875, -0.104705810546875, -0.098876953125, -0.093048095703125, -0.08721923828125, -0.081390380859375, -0.0755615234375, -0.069732666015625, -0.06390380859375, -0.058074951171875, -0.05224609375, -0.046417236328125, -0.04058837890625, -0.034759521484375, -0.0289306640625, -0.023101806640625, -0.01727294921875, -0.011444091796875, -0.005615234375, 0.000213623046875, 0.00604248046875, 0.011871337890625, 0.0177001953125, 0.023529052734375, 0.02935791015625, 0.035186767578125, 0.041015625, 0.046844482421875, 0.05267333984375, 0.058502197265625, 0.0643310546875, 0.070159912109375, 0.07598876953125, 0.081817626953125, 0.087646484375, 0.093475341796875, 0.09930419921875, 0.105133056640625, 0.1109619140625, 0.116790771484375, 0.12261962890625, 0.128448486328125, 0.13427734375, 0.140106201171875, 0.14593505859375, 0.151763916015625, 0.1575927734375, 0.163421630859375, 0.16925048828125, 0.175079345703125, 0.180908203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 7.0, 12.0, 15.0, 24.0, 42.0, 90.0, 115.0, 190.0, 209.0, 136.0, 65.0, 25.0, 25.0, 13.0, 10.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001270771026611328, -0.00012269988656044006, -0.00011832267045974731, -0.00011394545435905457, -0.00010956823825836182, -0.00010519102215766907, -0.00010081380605697632, -9.643658995628357e-05, -9.205937385559082e-05, -8.768215775489807e-05, -8.330494165420532e-05, -7.892772555351257e-05, -7.455050945281982e-05, -7.017329335212708e-05, -6.579607725143433e-05, -6.141886115074158e-05, -5.704164505004883e-05, -5.266442894935608e-05, -4.828721284866333e-05, -4.390999674797058e-05, -3.953278064727783e-05, -3.515556454658508e-05, -3.0778348445892334e-05, -2.6401132345199585e-05, -2.2023916244506836e-05, -1.7646700143814087e-05, -1.3269484043121338e-05, -8.892267942428589e-06, -4.51505184173584e-06, -1.3783574104309082e-07, 4.239380359649658e-06, 8.616596460342407e-06, 1.2993812561035156e-05, 1.7371028661727905e-05, 2.1748244762420654e-05, 2.6125460863113403e-05, 3.0502676963806152e-05, 3.48798930644989e-05, 3.925710916519165e-05, 4.36343252658844e-05, 4.801154136657715e-05, 5.23887574672699e-05, 5.6765973567962646e-05, 6.11431896686554e-05, 6.552040576934814e-05, 6.98976218700409e-05, 7.427483797073364e-05, 7.865205407142639e-05, 8.302927017211914e-05, 8.740648627281189e-05, 9.178370237350464e-05, 9.616091847419739e-05, 0.00010053813457489014, 0.00010491535067558289, 0.00010929256677627563, 0.00011366978287696838, 0.00011804699897766113, 0.00012242421507835388, 0.00012680143117904663, 0.00013117864727973938, 0.00013555586338043213, 0.00013993307948112488, 0.00014431029558181763, 0.00014868751168251038, 0.00015306472778320312]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 6.0, 8.0, 9.0, 15.0, 19.0, 22.0, 33.0, 56.0, 75.0, 108.0, 194.0, 362.0, 650.0, 1277.0, 3035.0, 7976.0, 24042.0, 91543.0, 351162.0, 405882.0, 115813.0, 30143.0, 9467.0, 3450.0, 1465.0, 747.0, 379.0, 200.0, 136.0, 97.0, 42.0, 43.0, 22.0, 20.0, 8.0, 12.0, 9.0, 8.0, 2.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.3076171875, -0.29859161376953125, -0.2895660400390625, -0.28054046630859375, -0.271514892578125, -0.26248931884765625, -0.2534637451171875, -0.24443817138671875, -0.23541259765625, -0.22638702392578125, -0.2173614501953125, -0.20833587646484375, -0.199310302734375, -0.19028472900390625, -0.1812591552734375, -0.17223358154296875, -0.1632080078125, -0.15418243408203125, -0.1451568603515625, -0.13613128662109375, -0.127105712890625, -0.11808013916015625, -0.1090545654296875, -0.10002899169921875, -0.09100341796875, -0.08197784423828125, -0.0729522705078125, -0.06392669677734375, -0.054901123046875, -0.04587554931640625, -0.0368499755859375, -0.02782440185546875, -0.018798828125, -0.00977325439453125, -0.0007476806640625, 0.00827789306640625, 0.017303466796875, 0.02632904052734375, 0.0353546142578125, 0.04438018798828125, 0.05340576171875, 0.06243133544921875, 0.0714569091796875, 0.08048248291015625, 0.089508056640625, 0.09853363037109375, 0.1075592041015625, 0.11658477783203125, 0.1256103515625, 0.13463592529296875, 0.1436614990234375, 0.15268707275390625, 0.161712646484375, 0.17073822021484375, 0.1797637939453125, 0.18878936767578125, 0.19781494140625, 0.20684051513671875, 0.2158660888671875, 0.22489166259765625, 0.233917236328125, 0.24294281005859375, 0.2519683837890625, 0.26099395751953125, 0.27001953125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 16.0, 15.0, 19.0, 15.0, 18.0, 22.0, 47.0, 34.0, 49.0, 51.0, 59.0, 49.0, 64.0, 54.0, 70.0, 62.0, 55.0, 47.0, 41.0, 34.0, 28.0, 35.0, 23.0, 24.0, 12.0, 9.0, 13.0, 7.0, 3.0, 7.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1736469268798828, -0.16772842407226562, -0.16180992126464844, -0.15589141845703125, -0.14997291564941406, -0.14405441284179688, -0.1381359100341797, -0.1322174072265625, -0.1262989044189453, -0.12038040161132812, -0.11446189880371094, -0.10854339599609375, -0.10262489318847656, -0.09670639038085938, -0.09078788757324219, -0.084869384765625, -0.07895088195800781, -0.07303237915039062, -0.06711387634277344, -0.06119537353515625, -0.05527687072753906, -0.049358367919921875, -0.04343986511230469, -0.0375213623046875, -0.03160285949707031, -0.025684356689453125, -0.019765853881835938, -0.01384735107421875, -0.007928848266601562, -0.002010345458984375, 0.0039081573486328125, 0.00982666015625, 0.015745162963867188, 0.021663665771484375, 0.027582168579101562, 0.03350067138671875, 0.03941917419433594, 0.045337677001953125, 0.05125617980957031, 0.0571746826171875, 0.06309318542480469, 0.06901168823242188, 0.07493019104003906, 0.08084869384765625, 0.08676719665527344, 0.09268569946289062, 0.09860420227050781, 0.104522705078125, 0.11044120788574219, 0.11635971069335938, 0.12227821350097656, 0.12819671630859375, 0.13411521911621094, 0.14003372192382812, 0.1459522247314453, 0.1518707275390625, 0.1577892303466797, 0.16370773315429688, 0.16962623596191406, 0.17554473876953125, 0.18146324157714844, 0.18738174438476562, 0.1933002471923828, 0.19921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 20.0, 34.0, 124.0, 153.0, 227.0, 206.0, 102.0, 67.0, 24.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.521369934082031, -6.332040309906006, -6.1427106857299805, -5.953381061553955, -5.76405143737793, -5.574721813201904, -5.385392189025879, -5.1960625648498535, -5.006732940673828, -4.817403316497803, -4.628073692321777, -4.438744068145752, -4.249414443969727, -4.060084819793701, -3.870755195617676, -3.6814255714416504, -3.492095708847046, -3.3027660846710205, -3.113436460494995, -2.9241068363189697, -2.7347772121429443, -2.545447587966919, -2.3561177253723145, -2.166788101196289, -1.9774585962295532, -1.7881289720535278, -1.5987993478775024, -1.4094696044921875, -1.220139980316162, -1.0308103561401367, -0.8414807319641113, -0.6521511077880859, -0.46282148361206055, -0.27349185943603516, -0.08416220545768738, 0.1051674485206604, 0.2944970726966858, 0.4838266968727112, 0.6731563806533813, 0.8624860048294067, 1.0518156290054321, 1.2411452531814575, 1.430474877357483, 1.6198046207427979, 1.8091342449188232, 1.9984638690948486, 2.187793493270874, 2.3771231174468994, 2.566452741622925, 2.75578236579895, 2.9451119899749756, 3.134441614151001, 3.3237712383270264, 3.5131008625030518, 3.7024307250976562, 3.8917603492736816, 4.081089973449707, 4.270419597625732, 4.459749221801758, 4.649078845977783, 4.838408470153809, 5.027738094329834, 5.217067718505859, 5.406397342681885, 5.59572696685791]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 6.0, 2.0, 9.0, 8.0, 14.0, 17.0, 13.0, 15.0, 25.0, 21.0, 24.0, 25.0, 22.0, 33.0, 27.0, 44.0, 58.0, 29.0, 37.0, 49.0, 39.0, 34.0, 39.0, 45.0, 52.0, 34.0, 32.0, 28.0, 25.0, 22.0, 23.0, 27.0, 17.0, 27.0, 18.0, 11.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.1612682342529297, -2.0968053340911865, -2.0323421955108643, -1.9678791761398315, -1.9034161567687988, -1.8389532566070557, -1.774490237236023, -1.7100272178649902, -1.6455641984939575, -1.5811011791229248, -1.516638159751892, -1.4521751403808594, -1.3877122402191162, -1.323249101638794, -1.2587862014770508, -1.194323182106018, -1.1298601627349854, -1.0653971433639526, -1.00093412399292, -0.936471164226532, -0.8720081448554993, -0.8075451254844666, -0.7430821657180786, -0.6786191463470459, -0.6141561269760132, -0.5496931076049805, -0.48523011803627014, -0.4207671284675598, -0.3563041090965271, -0.2918410897254944, -0.22737810015678406, -0.16291511058807373, -0.09845185279846191, -0.03398884832859039, 0.030474156141281128, 0.09493716061115265, 0.15940016508102417, 0.22386318445205688, 0.2883261740207672, 0.35278916358947754, 0.41725218296051025, 0.48171520233154297, 0.5461782217025757, 0.6106411814689636, 0.6751042008399963, 0.739567220211029, 0.804030179977417, 0.8684931993484497, 0.9329562187194824, 0.9974192380905151, 1.0618822574615479, 1.1263452768325806, 1.1908082962036133, 1.2552711963653564, 1.3197342157363892, 1.3841972351074219, 1.4486602544784546, 1.5131232738494873, 1.57758629322052, 1.6420493125915527, 1.706512212753296, 1.7709753513336182, 1.8354382514953613, 1.899901270866394, 1.9643642902374268]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 4.0, 8.0, 8.0, 9.0, 23.0, 18.0, 33.0, 42.0, 72.0, 135.0, 192.0, 326.0, 593.0, 1173.0, 2590.0, 5739.0, 15333.0, 52140.0, 249831.0, 1335994.0, 1960921.0, 449760.0, 82499.0, 22407.0, 7820.0, 3297.0, 1503.0, 768.0, 398.0, 221.0, 136.0, 74.0, 57.0, 34.0, 17.0, 19.0, 19.0, 15.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45263671875, -0.4385643005371094, -0.42449188232421875, -0.4104194641113281, -0.3963470458984375, -0.3822746276855469, -0.36820220947265625, -0.3541297912597656, -0.340057373046875, -0.3259849548339844, -0.31191253662109375, -0.2978401184082031, -0.2837677001953125, -0.2696952819824219, -0.25562286376953125, -0.24155044555664062, -0.22747802734375, -0.21340560913085938, -0.19933319091796875, -0.18526077270507812, -0.1711883544921875, -0.15711593627929688, -0.14304351806640625, -0.12897109985351562, -0.114898681640625, -0.10082626342773438, -0.08675384521484375, -0.07268142700195312, -0.0586090087890625, -0.044536590576171875, -0.03046417236328125, -0.016391754150390625, -0.0023193359375, 0.011753082275390625, 0.02582550048828125, 0.039897918701171875, 0.0539703369140625, 0.06804275512695312, 0.08211517333984375, 0.09618759155273438, 0.110260009765625, 0.12433242797851562, 0.13840484619140625, 0.15247726440429688, 0.1665496826171875, 0.18062210083007812, 0.19469451904296875, 0.20876693725585938, 0.22283935546875, 0.23691177368164062, 0.25098419189453125, 0.2650566101074219, 0.2791290283203125, 0.2932014465332031, 0.30727386474609375, 0.3213462829589844, 0.335418701171875, 0.3494911193847656, 0.36356353759765625, 0.3776359558105469, 0.3917083740234375, 0.4057807922363281, 0.41985321044921875, 0.4339256286621094, 0.447998046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 6.0, 3.0, 7.0, 13.0, 19.0, 14.0, 15.0, 22.0, 31.0, 40.0, 33.0, 46.0, 39.0, 58.0, 55.0, 52.0, 58.0, 61.0, 39.0, 59.0, 32.0, 44.0, 46.0, 34.0, 26.0, 35.0, 20.0, 16.0, 19.0, 15.0, 10.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.36181640625, -0.3520088195800781, -0.34220123291015625, -0.3323936462402344, -0.3225860595703125, -0.3127784729003906, -0.30297088623046875, -0.2931632995605469, -0.283355712890625, -0.2735481262207031, -0.26374053955078125, -0.2539329528808594, -0.2441253662109375, -0.23431777954101562, -0.22451019287109375, -0.21470260620117188, -0.20489501953125, -0.19508743286132812, -0.18527984619140625, -0.17547225952148438, -0.1656646728515625, -0.15585708618164062, -0.14604949951171875, -0.13624191284179688, -0.126434326171875, -0.11662673950195312, -0.10681915283203125, -0.09701156616210938, -0.0872039794921875, -0.07739639282226562, -0.06758880615234375, -0.057781219482421875, -0.0479736328125, -0.038166046142578125, -0.02835845947265625, -0.018550872802734375, -0.0087432861328125, 0.001064300537109375, 0.01087188720703125, 0.020679473876953125, 0.030487060546875, 0.040294647216796875, 0.05010223388671875, 0.059909820556640625, 0.0697174072265625, 0.07952499389648438, 0.08933258056640625, 0.09914016723632812, 0.10894775390625, 0.11875534057617188, 0.12856292724609375, 0.13837051391601562, 0.1481781005859375, 0.15798568725585938, 0.16779327392578125, 0.17760086059570312, 0.187408447265625, 0.19721603393554688, 0.20702362060546875, 0.21683120727539062, 0.2266387939453125, 0.23644638061523438, 0.24625396728515625, 0.2560615539550781, 0.265869140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 9.0, 17.0, 17.0, 21.0, 18.0, 41.0, 52.0, 81.0, 138.0, 233.0, 551.0, 1243.0, 3698.0, 14428.0, 94772.0, 2134917.0, 1837773.0, 86618.0, 13672.0, 3586.0, 1233.0, 522.0, 240.0, 133.0, 71.0, 56.0, 30.0, 25.0, 20.0, 15.0, 14.0, 11.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.962890625, -0.9307708740234375, -0.898651123046875, -0.8665313720703125, -0.83441162109375, -0.8022918701171875, -0.770172119140625, -0.7380523681640625, -0.7059326171875, -0.6738128662109375, -0.641693115234375, -0.6095733642578125, -0.57745361328125, -0.5453338623046875, -0.513214111328125, -0.4810943603515625, -0.448974609375, -0.4168548583984375, -0.384735107421875, -0.3526153564453125, -0.32049560546875, -0.2883758544921875, -0.256256103515625, -0.2241363525390625, -0.1920166015625, -0.1598968505859375, -0.127777099609375, -0.0956573486328125, -0.06353759765625, -0.0314178466796875, 0.000701904296875, 0.0328216552734375, 0.06494140625, 0.0970611572265625, 0.129180908203125, 0.1613006591796875, 0.19342041015625, 0.2255401611328125, 0.257659912109375, 0.2897796630859375, 0.3218994140625, 0.3540191650390625, 0.386138916015625, 0.4182586669921875, 0.45037841796875, 0.4824981689453125, 0.514617919921875, 0.5467376708984375, 0.578857421875, 0.6109771728515625, 0.643096923828125, 0.6752166748046875, 0.70733642578125, 0.7394561767578125, 0.771575927734375, 0.8036956787109375, 0.8358154296875, 0.8679351806640625, 0.900054931640625, 0.9321746826171875, 0.96429443359375, 0.9964141845703125, 1.028533935546875, 1.0606536865234375, 1.0927734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 2.0, 3.0, 8.0, 9.0, 20.0, 34.0, 45.0, 72.0, 151.0, 236.0, 468.0, 862.0, 956.0, 552.0, 277.0, 145.0, 84.0, 51.0, 41.0, 21.0, 20.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.47289276123046875, -0.4452972412109375, -0.41770172119140625, -0.390106201171875, -0.36251068115234375, -0.3349151611328125, -0.30731964111328125, -0.27972412109375, -0.25212860107421875, -0.2245330810546875, -0.19693756103515625, -0.169342041015625, -0.14174652099609375, -0.1141510009765625, -0.08655548095703125, -0.0589599609375, -0.03136444091796875, -0.0037689208984375, 0.02382659912109375, 0.051422119140625, 0.07901763916015625, 0.1066131591796875, 0.13420867919921875, 0.16180419921875, 0.18939971923828125, 0.2169952392578125, 0.24459075927734375, 0.272186279296875, 0.29978179931640625, 0.3273773193359375, 0.35497283935546875, 0.382568359375, 0.41016387939453125, 0.4377593994140625, 0.46535491943359375, 0.492950439453125, 0.5205459594726562, 0.5481414794921875, 0.5757369995117188, 0.60333251953125, 0.6309280395507812, 0.6585235595703125, 0.6861190795898438, 0.713714599609375, 0.7413101196289062, 0.7689056396484375, 0.7965011596679688, 0.8240966796875, 0.8516921997070312, 0.8792877197265625, 0.9068832397460938, 0.934478759765625, 0.9620742797851562, 0.9896697998046875, 1.0172653198242188, 1.04486083984375, 1.0724563598632812, 1.1000518798828125, 1.1276473999023438, 1.155242919921875, 1.1828384399414062, 1.2104339599609375, 1.2380294799804688, 1.265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 17.0, 20.0, 49.0, 97.0, 205.0, 266.0, 165.0, 106.0, 43.0, 14.0, 11.0, 8.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.213892936706543, -4.008265018463135, -3.8026368618011475, -3.59700870513916, -3.391380786895752, -3.1857526302337646, -2.9801244735717773, -2.774496555328369, -2.568868398666382, -2.3632402420043945, -2.1576123237609863, -1.951984167098999, -1.7463561296463013, -1.5407280921936035, -1.3350999355316162, -1.1294718980789185, -0.9238438606262207, -0.718215823173523, -0.5125877261161804, -0.3069596290588379, -0.10133159160614014, 0.10429644584655762, 0.3099246025085449, 0.5155526399612427, 0.7211806774139404, 0.9268087148666382, 1.132436752319336, 1.3380649089813232, 1.543692946434021, 1.7493209838867188, 1.954949140548706, 2.1605772972106934, 2.3662052154541016, 2.571833372116089, 2.777461290359497, 2.9830894470214844, 3.1887173652648926, 3.39434552192688, 3.599973678588867, 3.8056015968322754, 4.011229515075684, 4.216857433319092, 4.422485828399658, 4.628113746643066, 4.833741664886475, 5.039369583129883, 5.244997978210449, 5.450625896453857, 5.656254291534424, 5.861882209777832, 6.067510604858398, 6.273138523101807, 6.478766441345215, 6.684394836425781, 6.8900227546691895, 7.095650672912598, 7.301279067993164, 7.506906986236572, 7.712535381317139, 7.918163299560547, 8.123791694641113, 8.329419136047363, 8.53504753112793, 8.740675926208496, 8.946303367614746]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 4.0, 1.0, 8.0, 6.0, 2.0, 6.0, 5.0, 11.0, 20.0, 11.0, 18.0, 9.0, 15.0, 29.0, 27.0, 31.0, 38.0, 34.0, 24.0, 36.0, 47.0, 37.0, 28.0, 43.0, 38.0, 34.0, 37.0, 40.0, 46.0, 39.0, 37.0, 25.0, 21.0, 23.0, 21.0, 33.0, 20.0, 13.0, 15.0, 7.0, 14.0, 10.0, 9.0, 8.0, 1.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3493714332580566, -1.299584150314331, -1.2497968673706055, -1.2000095844268799, -1.1502223014831543, -1.1004350185394287, -1.0506477355957031, -1.0008604526519775, -0.951073169708252, -0.9012858867645264, -0.8514986038208008, -0.8017113208770752, -0.7519240379333496, -0.702136754989624, -0.6523494720458984, -0.6025621891021729, -0.5527748465538025, -0.5029875636100769, -0.4532002806663513, -0.40341299772262573, -0.35362571477890015, -0.30383843183517456, -0.2540511190891266, -0.204263836145401, -0.15447655320167542, -0.10468927025794983, -0.054901979863643646, -0.005114689469337463, 0.04467259347438812, 0.09445987641811371, 0.1442471742630005, 0.19403445720672607, 0.24382174015045166, 0.29360902309417725, 0.34339630603790283, 0.3931835889816284, 0.442970871925354, 0.4927581548690796, 0.5425454378128052, 0.5923327207565308, 0.6421200037002563, 0.6919072866439819, 0.7416945695877075, 0.7914818525314331, 0.8412691354751587, 0.8910564184188843, 0.9408437013626099, 0.9906309843063354, 1.0404183864593506, 1.0902056694030762, 1.1399929523468018, 1.1897802352905273, 1.239567518234253, 1.2893548011779785, 1.339142084121704, 1.3889293670654297, 1.4387166500091553, 1.4885039329528809, 1.5382912158966064, 1.588078498840332, 1.6378657817840576, 1.6876530647277832, 1.7374403476715088, 1.7872276306152344, 1.83701491355896]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 9.0, 7.0, 11.0, 9.0, 18.0, 23.0, 44.0, 52.0, 70.0, 114.0, 185.0, 278.0, 383.0, 608.0, 981.0, 1658.0, 3069.0, 6220.0, 13793.0, 34659.0, 98067.0, 247757.0, 338606.0, 186821.0, 68267.0, 25516.0, 10299.0, 4900.0, 2433.0, 1351.0, 799.0, 551.0, 318.0, 222.0, 150.0, 102.0, 68.0, 58.0, 27.0, 19.0, 13.0, 7.0, 6.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6424713134765625, -0.624786376953125, -0.6071014404296875, -0.58941650390625, -0.5717315673828125, -0.554046630859375, -0.5363616943359375, -0.5186767578125, -0.5009918212890625, -0.483306884765625, -0.4656219482421875, -0.44793701171875, -0.4302520751953125, -0.412567138671875, -0.3948822021484375, -0.377197265625, -0.3595123291015625, -0.341827392578125, -0.3241424560546875, -0.30645751953125, -0.2887725830078125, -0.271087646484375, -0.2534027099609375, -0.2357177734375, -0.2180328369140625, -0.200347900390625, -0.1826629638671875, -0.16497802734375, -0.1472930908203125, -0.129608154296875, -0.1119232177734375, -0.09423828125, -0.0765533447265625, -0.058868408203125, -0.0411834716796875, -0.02349853515625, -0.0058135986328125, 0.011871337890625, 0.0295562744140625, 0.0472412109375, 0.0649261474609375, 0.082611083984375, 0.1002960205078125, 0.11798095703125, 0.1356658935546875, 0.153350830078125, 0.1710357666015625, 0.188720703125, 0.2064056396484375, 0.224090576171875, 0.2417755126953125, 0.25946044921875, 0.2771453857421875, 0.294830322265625, 0.3125152587890625, 0.3302001953125, 0.3478851318359375, 0.365570068359375, 0.3832550048828125, 0.40093994140625, 0.4186248779296875, 0.436309814453125, 0.4539947509765625, 0.4716796875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 6.0, 9.0, 14.0, 12.0, 32.0, 21.0, 36.0, 34.0, 40.0, 35.0, 37.0, 40.0, 43.0, 45.0, 47.0, 50.0, 58.0, 54.0, 48.0, 55.0, 41.0, 30.0, 37.0, 30.0, 24.0, 20.0, 14.0, 15.0, 8.0, 12.0, 14.0, 7.0, 5.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3779296875, -0.3674812316894531, -0.35703277587890625, -0.3465843200683594, -0.3361358642578125, -0.3256874084472656, -0.31523895263671875, -0.3047904968261719, -0.294342041015625, -0.2838935852050781, -0.27344512939453125, -0.2629966735839844, -0.2525482177734375, -0.24209976196289062, -0.23165130615234375, -0.22120285034179688, -0.21075439453125, -0.20030593872070312, -0.18985748291015625, -0.17940902709960938, -0.1689605712890625, -0.15851211547851562, -0.14806365966796875, -0.13761520385742188, -0.127166748046875, -0.11671829223632812, -0.10626983642578125, -0.09582138061523438, -0.0853729248046875, -0.07492446899414062, -0.06447601318359375, -0.054027557373046875, -0.0435791015625, -0.033130645751953125, -0.02268218994140625, -0.012233734130859375, -0.0017852783203125, 0.008663177490234375, 0.01911163330078125, 0.029560089111328125, 0.040008544921875, 0.050457000732421875, 0.06090545654296875, 0.07135391235351562, 0.0818023681640625, 0.09225082397460938, 0.10269927978515625, 0.11314773559570312, 0.12359619140625, 0.13404464721679688, 0.14449310302734375, 0.15494155883789062, 0.1653900146484375, 0.17583847045898438, 0.18628692626953125, 0.19673538208007812, 0.207183837890625, 0.21763229370117188, 0.22808074951171875, 0.23852920532226562, 0.2489776611328125, 0.2594261169433594, 0.26987457275390625, 0.2803230285644531, 0.290771484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 11.0, 12.0, 10.0, 34.0, 43.0, 92.0, 146.0, 302.0, 481.0, 902.0, 1851.0, 4130.0, 11000.0, 35097.0, 140587.0, 469673.0, 286686.0, 66674.0, 18758.0, 6586.0, 2641.0, 1288.0, 674.0, 350.0, 201.0, 126.0, 71.0, 43.0, 16.0, 21.0, 13.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.822265625, -0.7978973388671875, -0.773529052734375, -0.7491607666015625, -0.72479248046875, -0.7004241943359375, -0.676055908203125, -0.6516876220703125, -0.6273193359375, -0.6029510498046875, -0.578582763671875, -0.5542144775390625, -0.52984619140625, -0.5054779052734375, -0.481109619140625, -0.4567413330078125, -0.432373046875, -0.4080047607421875, -0.383636474609375, -0.3592681884765625, -0.33489990234375, -0.3105316162109375, -0.286163330078125, -0.2617950439453125, -0.2374267578125, -0.2130584716796875, -0.188690185546875, -0.1643218994140625, -0.13995361328125, -0.1155853271484375, -0.091217041015625, -0.0668487548828125, -0.04248046875, -0.0181121826171875, 0.006256103515625, 0.0306243896484375, 0.05499267578125, 0.0793609619140625, 0.103729248046875, 0.1280975341796875, 0.1524658203125, 0.1768341064453125, 0.201202392578125, 0.2255706787109375, 0.24993896484375, 0.2743072509765625, 0.298675537109375, 0.3230438232421875, 0.347412109375, 0.3717803955078125, 0.396148681640625, 0.4205169677734375, 0.44488525390625, 0.4692535400390625, 0.493621826171875, 0.5179901123046875, 0.5423583984375, 0.5667266845703125, 0.591094970703125, 0.6154632568359375, 0.63983154296875, 0.6641998291015625, 0.688568115234375, 0.7129364013671875, 0.7373046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 10.0, 12.0, 13.0, 16.0, 11.0, 20.0, 18.0, 21.0, 33.0, 28.0, 42.0, 34.0, 45.0, 53.0, 45.0, 55.0, 37.0, 40.0, 39.0, 45.0, 49.0, 36.0, 28.0, 36.0, 35.0, 31.0, 15.0, 25.0, 19.0, 25.0, 21.0, 7.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.72430419921875, -0.6981201171875, -0.67193603515625, -0.645751953125, -0.61956787109375, -0.5933837890625, -0.56719970703125, -0.541015625, -0.51483154296875, -0.4886474609375, -0.46246337890625, -0.436279296875, -0.41009521484375, -0.3839111328125, -0.35772705078125, -0.33154296875, -0.30535888671875, -0.2791748046875, -0.25299072265625, -0.226806640625, -0.20062255859375, -0.1744384765625, -0.14825439453125, -0.1220703125, -0.09588623046875, -0.0697021484375, -0.04351806640625, -0.017333984375, 0.00885009765625, 0.0350341796875, 0.06121826171875, 0.08740234375, 0.11358642578125, 0.1397705078125, 0.16595458984375, 0.192138671875, 0.21832275390625, 0.2445068359375, 0.27069091796875, 0.296875, 0.32305908203125, 0.3492431640625, 0.37542724609375, 0.401611328125, 0.42779541015625, 0.4539794921875, 0.48016357421875, 0.50634765625, 0.53253173828125, 0.5587158203125, 0.58489990234375, 0.611083984375, 0.63726806640625, 0.6634521484375, 0.68963623046875, 0.7158203125, 0.74200439453125, 0.7681884765625, 0.79437255859375, 0.820556640625, 0.84674072265625, 0.8729248046875, 0.89910888671875, 0.92529296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 2.0, 9.0, 7.0, 22.0, 41.0, 69.0, 142.0, 306.0, 747.0, 2132.0, 8586.0, 50296.0, 375422.0, 513172.0, 80725.0, 12177.0, 2974.0, 984.0, 382.0, 191.0, 86.0, 36.0, 15.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.25428009033203125, -0.2441558837890625, -0.23403167724609375, -0.223907470703125, -0.21378326416015625, -0.2036590576171875, -0.19353485107421875, -0.18341064453125, -0.17328643798828125, -0.1631622314453125, -0.15303802490234375, -0.142913818359375, -0.13278961181640625, -0.1226654052734375, -0.11254119873046875, -0.1024169921875, -0.09229278564453125, -0.0821685791015625, -0.07204437255859375, -0.061920166015625, -0.05179595947265625, -0.0416717529296875, -0.03154754638671875, -0.02142333984375, -0.01129913330078125, -0.0011749267578125, 0.00894927978515625, 0.019073486328125, 0.02919769287109375, 0.0393218994140625, 0.04944610595703125, 0.0595703125, 0.06969451904296875, 0.0798187255859375, 0.08994293212890625, 0.100067138671875, 0.11019134521484375, 0.1203155517578125, 0.13043975830078125, 0.14056396484375, 0.15068817138671875, 0.1608123779296875, 0.17093658447265625, 0.181060791015625, 0.19118499755859375, 0.2013092041015625, 0.21143341064453125, 0.2215576171875, 0.23168182373046875, 0.2418060302734375, 0.25193023681640625, 0.262054443359375, 0.27217864990234375, 0.2823028564453125, 0.29242706298828125, 0.30255126953125, 0.31267547607421875, 0.3227996826171875, 0.33292388916015625, 0.343048095703125, 0.35317230224609375, 0.3632965087890625, 0.37342071533203125, 0.383544921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 3.0, 7.0, 6.0, 7.0, 9.0, 14.0, 16.0, 31.0, 38.0, 41.0, 32.0, 44.0, 64.0, 70.0, 75.0, 86.0, 74.0, 68.0, 56.0, 47.0, 42.0, 29.0, 21.0, 24.0, 11.0, 14.0, 17.0, 4.0, 7.0, 7.0, 3.0, 6.0, 10.0, 4.0, 5.0, 5.0, 0.0, 3.0], "bins": [-5.7697296142578125e-05, -5.6298449635505676e-05, -5.489960312843323e-05, -5.350075662136078e-05, -5.210191011428833e-05, -5.070306360721588e-05, -4.930421710014343e-05, -4.7905370593070984e-05, -4.6506524085998535e-05, -4.5107677578926086e-05, -4.370883107185364e-05, -4.230998456478119e-05, -4.091113805770874e-05, -3.951229155063629e-05, -3.811344504356384e-05, -3.6714598536491394e-05, -3.5315752029418945e-05, -3.3916905522346497e-05, -3.251805901527405e-05, -3.11192125082016e-05, -2.972036600112915e-05, -2.83215194940567e-05, -2.6922672986984253e-05, -2.5523826479911804e-05, -2.4124979972839355e-05, -2.2726133465766907e-05, -2.1327286958694458e-05, -1.992844045162201e-05, -1.852959394454956e-05, -1.7130747437477112e-05, -1.5731900930404663e-05, -1.4333054423332214e-05, -1.2934207916259766e-05, -1.1535361409187317e-05, -1.0136514902114868e-05, -8.73766839504242e-06, -7.338821887969971e-06, -5.939975380897522e-06, -4.541128873825073e-06, -3.1422823667526245e-06, -1.7434358596801758e-06, -3.4458935260772705e-07, 1.0542571544647217e-06, 2.4531036615371704e-06, 3.851950168609619e-06, 5.250796675682068e-06, 6.649643182754517e-06, 8.048489689826965e-06, 9.447336196899414e-06, 1.0846182703971863e-05, 1.2245029211044312e-05, 1.364387571811676e-05, 1.5042722225189209e-05, 1.6441568732261658e-05, 1.7840415239334106e-05, 1.9239261746406555e-05, 2.0638108253479004e-05, 2.2036954760551453e-05, 2.34358012676239e-05, 2.483464777469635e-05, 2.62334942817688e-05, 2.7632340788841248e-05, 2.9031187295913696e-05, 3.0430033802986145e-05, 3.1828880310058594e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 8.0, 4.0, 6.0, 10.0, 7.0, 16.0, 20.0, 32.0, 48.0, 63.0, 111.0, 180.0, 286.0, 506.0, 881.0, 1549.0, 3338.0, 7633.0, 21928.0, 74929.0, 258122.0, 415343.0, 184569.0, 51695.0, 15557.0, 5953.0, 2597.0, 1284.0, 732.0, 430.0, 252.0, 179.0, 97.0, 63.0, 43.0, 26.0, 22.0, 14.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1934814453125, -0.1868896484375, -0.1802978515625, -0.1737060546875, -0.1671142578125, -0.1605224609375, -0.1539306640625, -0.1473388671875, -0.1407470703125, -0.1341552734375, -0.1275634765625, -0.1209716796875, -0.1143798828125, -0.1077880859375, -0.1011962890625, -0.0946044921875, -0.0880126953125, -0.0814208984375, -0.0748291015625, -0.0682373046875, -0.0616455078125, -0.0550537109375, -0.0484619140625, -0.0418701171875, -0.0352783203125, -0.0286865234375, -0.0220947265625, -0.0155029296875, -0.0089111328125, -0.0023193359375, 0.0042724609375, 0.0108642578125, 0.0174560546875, 0.0240478515625, 0.0306396484375, 0.0372314453125, 0.0438232421875, 0.0504150390625, 0.0570068359375, 0.0635986328125, 0.0701904296875, 0.0767822265625, 0.0833740234375, 0.0899658203125, 0.0965576171875, 0.1031494140625, 0.1097412109375, 0.1163330078125, 0.1229248046875, 0.1295166015625, 0.1361083984375, 0.1427001953125, 0.1492919921875, 0.1558837890625, 0.1624755859375, 0.1690673828125, 0.1756591796875, 0.1822509765625, 0.1888427734375, 0.1954345703125, 0.2020263671875, 0.2086181640625, 0.2152099609375, 0.2218017578125, 0.2283935546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 16.0, 13.0, 25.0, 33.0, 40.0, 68.0, 74.0, 83.0, 90.0, 88.0, 91.0, 91.0, 69.0, 49.0, 37.0, 28.0, 26.0, 18.0, 11.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.287841796875, -0.2805366516113281, -0.27323150634765625, -0.2659263610839844, -0.2586212158203125, -0.2513160705566406, -0.24401092529296875, -0.23670578002929688, -0.229400634765625, -0.22209548950195312, -0.21479034423828125, -0.20748519897460938, -0.2001800537109375, -0.19287490844726562, -0.18556976318359375, -0.17826461791992188, -0.17095947265625, -0.16365432739257812, -0.15634918212890625, -0.14904403686523438, -0.1417388916015625, -0.13443374633789062, -0.12712860107421875, -0.11982345581054688, -0.112518310546875, -0.10521316528320312, -0.09790802001953125, -0.09060287475585938, -0.0832977294921875, -0.07599258422851562, -0.06868743896484375, -0.061382293701171875, -0.0540771484375, -0.046772003173828125, -0.03946685791015625, -0.032161712646484375, -0.0248565673828125, -0.017551422119140625, -0.01024627685546875, -0.002941131591796875, 0.004364013671875, 0.011669158935546875, 0.01897430419921875, 0.026279449462890625, 0.0335845947265625, 0.040889739990234375, 0.04819488525390625, 0.055500030517578125, 0.06280517578125, 0.07011032104492188, 0.07741546630859375, 0.08472061157226562, 0.0920257568359375, 0.09933090209960938, 0.10663604736328125, 0.11394119262695312, 0.121246337890625, 0.12855148315429688, 0.13585662841796875, 0.14316177368164062, 0.1504669189453125, 0.15777206420898438, 0.16507720947265625, 0.17238235473632812, 0.1796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 7.0, 14.0, 27.0, 55.0, 108.0, 187.0, 259.0, 178.0, 94.0, 35.0, 20.0, 10.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.041380882263184, -7.856456756591797, -7.671533107757568, -7.486608982086182, -7.301685333251953, -7.116761207580566, -6.93183708190918, -6.746913433074951, -6.561989784240723, -6.377065658569336, -6.192142009735107, -6.007217884063721, -5.822294235229492, -5.6373701095581055, -5.452445983886719, -5.26752233505249, -5.0825982093811035, -4.897674083709717, -4.712750434875488, -4.527826309204102, -4.342902660369873, -4.157978534698486, -3.9730546474456787, -3.788130760192871, -3.6032068729400635, -3.418282985687256, -3.2333590984344482, -3.0484352111816406, -2.863511085510254, -2.6785874366760254, -2.4936633110046387, -2.308739423751831, -2.1238155364990234, -1.9388916492462158, -1.7539677619934082, -1.569043755531311, -1.3841198682785034, -1.1991959810256958, -1.0142719745635986, -0.829348087310791, -0.6444242000579834, -0.4595002830028534, -0.2745763659477234, -0.089652419090271, 0.09527146816253662, 0.28019535541534424, 0.4651193618774414, 0.650043249130249, 0.8349671363830566, 1.0198910236358643, 1.2048149108886719, 1.389738917350769, 1.5746628046035767, 1.7595866918563843, 1.9445106983184814, 2.129434585571289, 2.3143584728240967, 2.4992823600769043, 2.684206247329712, 2.8691301345825195, 3.0540542602539062, 3.2389779090881348, 3.4239020347595215, 3.608825922012329, 3.7937498092651367]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 8.0, 11.0, 3.0, 8.0, 17.0, 17.0, 15.0, 20.0, 26.0, 27.0, 32.0, 38.0, 33.0, 52.0, 48.0, 39.0, 34.0, 50.0, 38.0, 51.0, 46.0, 37.0, 38.0, 51.0, 21.0, 39.0, 28.0, 29.0, 18.0, 24.0, 21.0, 21.0, 11.0, 15.0, 8.0, 6.0, 5.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9336044788360596, -1.8666483163833618, -1.799692153930664, -1.7327361106872559, -1.665779948234558, -1.5988237857818604, -1.5318677425384521, -1.4649115800857544, -1.3979554176330566, -1.3309992551803589, -1.2640430927276611, -1.197087049484253, -1.1301308870315552, -1.0631747245788574, -0.9962186217308044, -0.9292625188827515, -0.8623063564300537, -0.795350193977356, -0.728394091129303, -0.66143798828125, -0.5944818258285522, -0.5275256633758545, -0.4605695605278015, -0.39361342787742615, -0.3266572952270508, -0.2597011625766754, -0.19274502992630005, -0.12578889727592468, -0.058832764625549316, 0.00812336802482605, 0.07507950067520142, 0.14203563332557678, 0.20899200439453125, 0.2759481370449066, 0.342904269695282, 0.40986040234565735, 0.4768165349960327, 0.5437726974487305, 0.6107288002967834, 0.6776849031448364, 0.7446410655975342, 0.8115972280502319, 0.8785533308982849, 0.9455094337463379, 1.0124655961990356, 1.0794217586517334, 1.1463778018951416, 1.2133339643478394, 1.280290126800537, 1.3472462892532349, 1.4142024517059326, 1.4811584949493408, 1.5481146574020386, 1.6150708198547363, 1.6820268630981445, 1.7489830255508423, 1.81593918800354, 1.8828953504562378, 1.9498515129089355, 2.0168075561523438, 2.083763599395752, 2.1507198810577393, 2.2176759243011475, 2.2846322059631348, 2.351588249206543]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 13.0, 20.0, 23.0, 24.0, 39.0, 70.0, 86.0, 135.0, 191.0, 243.0, 413.0, 592.0, 866.0, 1399.0, 2305.0, 3667.0, 6565.0, 12474.0, 26762.0, 67911.0, 212976.0, 744729.0, 1725034.0, 948948.0, 282813.0, 88244.0, 33912.0, 15121.0, 7674.0, 4390.0, 2445.0, 1446.0, 988.0, 610.0, 386.0, 247.0, 154.0, 117.0, 78.0, 41.0, 35.0, 32.0, 19.0, 14.0, 8.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31982421875, -0.3093757629394531, -0.29892730712890625, -0.2884788513183594, -0.2780303955078125, -0.2675819396972656, -0.25713348388671875, -0.24668502807617188, -0.236236572265625, -0.22578811645507812, -0.21533966064453125, -0.20489120483398438, -0.1944427490234375, -0.18399429321289062, -0.17354583740234375, -0.16309738159179688, -0.15264892578125, -0.14220046997070312, -0.13175201416015625, -0.12130355834960938, -0.1108551025390625, -0.10040664672851562, -0.08995819091796875, -0.07950973510742188, -0.069061279296875, -0.058612823486328125, -0.04816436767578125, -0.037715911865234375, -0.0272674560546875, -0.016819000244140625, -0.00637054443359375, 0.004077911376953125, 0.0145263671875, 0.024974822998046875, 0.03542327880859375, 0.045871734619140625, 0.0563201904296875, 0.06676864624023438, 0.07721710205078125, 0.08766555786132812, 0.098114013671875, 0.10856246948242188, 0.11901092529296875, 0.12945938110351562, 0.1399078369140625, 0.15035629272460938, 0.16080474853515625, 0.17125320434570312, 0.18170166015625, 0.19215011596679688, 0.20259857177734375, 0.21304702758789062, 0.2234954833984375, 0.23394393920898438, 0.24439239501953125, 0.2548408508300781, 0.265289306640625, 0.2757377624511719, 0.28618621826171875, 0.2966346740722656, 0.3070831298828125, 0.3175315856933594, 0.32798004150390625, 0.3384284973144531, 0.348876953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 5.0, 9.0, 9.0, 20.0, 18.0, 24.0, 23.0, 33.0, 34.0, 39.0, 50.0, 45.0, 60.0, 58.0, 54.0, 53.0, 61.0, 67.0, 45.0, 45.0, 37.0, 39.0, 21.0, 35.0, 20.0, 20.0, 21.0, 19.0, 7.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.38037109375, -0.3701362609863281, -0.35990142822265625, -0.3496665954589844, -0.3394317626953125, -0.3291969299316406, -0.31896209716796875, -0.3087272644042969, -0.298492431640625, -0.2882575988769531, -0.27802276611328125, -0.2677879333496094, -0.2575531005859375, -0.24731826782226562, -0.23708343505859375, -0.22684860229492188, -0.21661376953125, -0.20637893676757812, -0.19614410400390625, -0.18590927124023438, -0.1756744384765625, -0.16543960571289062, -0.15520477294921875, -0.14496994018554688, -0.134735107421875, -0.12450027465820312, -0.11426544189453125, -0.10403060913085938, -0.0937957763671875, -0.08356094360351562, -0.07332611083984375, -0.06309127807617188, -0.0528564453125, -0.042621612548828125, -0.03238677978515625, -0.022151947021484375, -0.0119171142578125, -0.001682281494140625, 0.00855255126953125, 0.018787384033203125, 0.029022216796875, 0.039257049560546875, 0.04949188232421875, 0.059726715087890625, 0.0699615478515625, 0.08019638061523438, 0.09043121337890625, 0.10066604614257812, 0.11090087890625, 0.12113571166992188, 0.13137054443359375, 0.14160537719726562, 0.1518402099609375, 0.16207504272460938, 0.17230987548828125, 0.18254470825195312, 0.192779541015625, 0.20301437377929688, 0.21324920654296875, 0.22348403930664062, 0.2337188720703125, 0.24395370483398438, 0.25418853759765625, 0.2644233703613281, 0.274658203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 10.0, 17.0, 20.0, 36.0, 29.0, 49.0, 78.0, 114.0, 192.0, 257.0, 399.0, 598.0, 973.0, 1487.0, 2499.0, 4443.0, 7929.0, 15164.0, 31958.0, 77233.0, 235976.0, 1114561.0, 2061252.0, 428551.0, 119566.0, 45688.0, 20812.0, 10407.0, 5570.0, 3186.0, 1912.0, 1157.0, 717.0, 492.0, 290.0, 202.0, 150.0, 95.0, 62.0, 51.0, 33.0, 21.0, 13.0, 7.0, 8.0, 7.0, 6.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.40087890625, -0.38843536376953125, -0.3759918212890625, -0.36354827880859375, -0.351104736328125, -0.33866119384765625, -0.3262176513671875, -0.31377410888671875, -0.30133056640625, -0.28888702392578125, -0.2764434814453125, -0.26399993896484375, -0.251556396484375, -0.23911285400390625, -0.2266693115234375, -0.21422576904296875, -0.2017822265625, -0.18933868408203125, -0.1768951416015625, -0.16445159912109375, -0.152008056640625, -0.13956451416015625, -0.1271209716796875, -0.11467742919921875, -0.10223388671875, -0.08979034423828125, -0.0773468017578125, -0.06490325927734375, -0.052459716796875, -0.04001617431640625, -0.0275726318359375, -0.01512908935546875, -0.002685546875, 0.00975799560546875, 0.0222015380859375, 0.03464508056640625, 0.047088623046875, 0.05953216552734375, 0.0719757080078125, 0.08441925048828125, 0.09686279296875, 0.10930633544921875, 0.1217498779296875, 0.13419342041015625, 0.146636962890625, 0.15908050537109375, 0.1715240478515625, 0.18396759033203125, 0.1964111328125, 0.20885467529296875, 0.2212982177734375, 0.23374176025390625, 0.246185302734375, 0.25862884521484375, 0.2710723876953125, 0.28351593017578125, 0.29595947265625, 0.30840301513671875, 0.3208465576171875, 0.33329010009765625, 0.345733642578125, 0.35817718505859375, 0.3706207275390625, 0.38306427001953125, 0.3955078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 12.0, 9.0, 16.0, 23.0, 17.0, 25.0, 34.0, 57.0, 60.0, 64.0, 118.0, 178.0, 256.0, 361.0, 544.0, 611.0, 461.0, 328.0, 233.0, 157.0, 123.0, 84.0, 63.0, 42.0, 43.0, 31.0, 16.0, 15.0, 12.0, 16.0, 12.0, 10.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.494384765625, -0.47953033447265625, -0.4646759033203125, -0.44982147216796875, -0.434967041015625, -0.42011260986328125, -0.4052581787109375, -0.39040374755859375, -0.37554931640625, -0.36069488525390625, -0.3458404541015625, -0.33098602294921875, -0.316131591796875, -0.30127716064453125, -0.2864227294921875, -0.27156829833984375, -0.2567138671875, -0.24185943603515625, -0.2270050048828125, -0.21215057373046875, -0.197296142578125, -0.18244171142578125, -0.1675872802734375, -0.15273284912109375, -0.13787841796875, -0.12302398681640625, -0.1081695556640625, -0.09331512451171875, -0.078460693359375, -0.06360626220703125, -0.0487518310546875, -0.03389739990234375, -0.01904296875, -0.00418853759765625, 0.0106658935546875, 0.02552032470703125, 0.040374755859375, 0.05522918701171875, 0.0700836181640625, 0.08493804931640625, 0.09979248046875, 0.11464691162109375, 0.1295013427734375, 0.14435577392578125, 0.159210205078125, 0.17406463623046875, 0.1889190673828125, 0.20377349853515625, 0.2186279296875, 0.23348236083984375, 0.2483367919921875, 0.26319122314453125, 0.278045654296875, 0.29290008544921875, 0.3077545166015625, 0.32260894775390625, 0.33746337890625, 0.35231781005859375, 0.3671722412109375, 0.38202667236328125, 0.396881103515625, 0.41173553466796875, 0.4265899658203125, 0.44144439697265625, 0.456298828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 5.0, 13.0, 16.0, 47.0, 70.0, 161.0, 176.0, 197.0, 149.0, 79.0, 44.0, 14.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.434116840362549, -3.2605223655700684, -3.086927890777588, -2.9133334159851074, -2.739738941192627, -2.5661444664001465, -2.392550230026245, -2.2189557552337646, -2.045361280441284, -1.8717668056488037, -1.6981723308563232, -1.5245779752731323, -1.3509835004806519, -1.1773890256881714, -1.0037946701049805, -0.8302001953125, -0.6566057205200195, -0.48301127552986145, -0.30941683053970337, -0.13582241535186768, 0.03777205944061279, 0.21136653423309326, 0.3849608898162842, 0.5585553646087646, 0.7321498394012451, 0.9057443141937256, 1.079338788986206, 1.252933144569397, 1.4265276193618774, 1.600122094154358, 1.7737164497375488, 1.9473109245300293, 2.1209049224853516, 2.294499397277832, 2.4680938720703125, 2.641688346862793, 2.8152828216552734, 2.988877296447754, 3.1624715328216553, 3.3360660076141357, 3.509660482406616, 3.6832549571990967, 3.856849431991577, 4.0304436683654785, 4.204038143157959, 4.3776326179504395, 4.55122709274292, 4.7248215675354, 4.898416042327881, 5.072010517120361, 5.245604991912842, 5.419199466705322, 5.592793941497803, 5.766388416290283, 5.9399824142456055, 6.113576889038086, 6.287171363830566, 6.460765838623047, 6.634360313415527, 6.807954788208008, 6.981549263000488, 7.155143737792969, 7.328738212585449, 7.50233268737793, 7.67592716217041]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 6.0, 5.0, 9.0, 8.0, 18.0, 7.0, 15.0, 22.0, 19.0, 31.0, 28.0, 20.0, 26.0, 32.0, 44.0, 37.0, 33.0, 34.0, 43.0, 41.0, 29.0, 48.0, 40.0, 46.0, 35.0, 24.0, 28.0, 37.0, 31.0, 21.0, 18.0, 22.0, 16.0, 18.0, 27.0, 11.0, 15.0, 6.0, 11.0, 10.0, 4.0, 6.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.296291470527649, -1.2492103576660156, -1.2021292448043823, -1.155048131942749, -1.1079670190811157, -1.0608859062194824, -1.0138047933578491, -0.9667236804962158, -0.9196425676345825, -0.8725614547729492, -0.8254803419113159, -0.7783992290496826, -0.7313181161880493, -0.684237003326416, -0.6371558904647827, -0.5900747776031494, -0.5429936647415161, -0.4959125518798828, -0.4488314390182495, -0.4017503261566162, -0.3546692132949829, -0.3075881004333496, -0.2605069875717163, -0.213425874710083, -0.1663447618484497, -0.1192636489868164, -0.0721825361251831, -0.025101423263549805, 0.021979689598083496, 0.0690608024597168, 0.1161419153213501, 0.1632230281829834, 0.21030402183532715, 0.25738513469696045, 0.30446624755859375, 0.35154736042022705, 0.39862847328186035, 0.44570958614349365, 0.49279069900512695, 0.5398718118667603, 0.5869529247283936, 0.6340340375900269, 0.6811151504516602, 0.7281962633132935, 0.7752773761749268, 0.8223584890365601, 0.8694396018981934, 0.9165207147598267, 0.96360182762146, 1.0106829404830933, 1.0577640533447266, 1.1048451662063599, 1.1519262790679932, 1.1990073919296265, 1.2460885047912598, 1.293169617652893, 1.3402507305145264, 1.3873318433761597, 1.434412956237793, 1.4814940690994263, 1.5285751819610596, 1.5756562948226929, 1.6227374076843262, 1.6698185205459595, 1.7168996334075928]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 24.0, 30.0, 42.0, 75.0, 97.0, 132.0, 208.0, 355.0, 479.0, 770.0, 1259.0, 2002.0, 3129.0, 4853.0, 7885.0, 13188.0, 22346.0, 38311.0, 64778.0, 106289.0, 157213.0, 185633.0, 161208.0, 111163.0, 67880.0, 39812.0, 23486.0, 13790.0, 8283.0, 5064.0, 3079.0, 1998.0, 1329.0, 800.0, 546.0, 322.0, 227.0, 148.0, 102.0, 77.0, 36.0, 30.0, 14.0, 13.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.2288818359375, -0.2213878631591797, -0.21389389038085938, -0.20639991760253906, -0.19890594482421875, -0.19141197204589844, -0.18391799926757812, -0.1764240264892578, -0.1689300537109375, -0.1614360809326172, -0.15394210815429688, -0.14644813537597656, -0.13895416259765625, -0.13146018981933594, -0.12396621704101562, -0.11647224426269531, -0.108978271484375, -0.10148429870605469, -0.09399032592773438, -0.08649635314941406, -0.07900238037109375, -0.07150840759277344, -0.06401443481445312, -0.05652046203613281, -0.0490264892578125, -0.04153251647949219, -0.034038543701171875, -0.026544570922851562, -0.01905059814453125, -0.011556625366210938, -0.004062652587890625, 0.0034313201904296875, 0.01092529296875, 0.018419265747070312, 0.025913238525390625, 0.03340721130371094, 0.04090118408203125, 0.04839515686035156, 0.055889129638671875, 0.06338310241699219, 0.0708770751953125, 0.07837104797363281, 0.08586502075195312, 0.09335899353027344, 0.10085296630859375, 0.10834693908691406, 0.11584091186523438, 0.12333488464355469, 0.130828857421875, 0.1383228302001953, 0.14581680297851562, 0.15331077575683594, 0.16080474853515625, 0.16829872131347656, 0.17579269409179688, 0.1832866668701172, 0.1907806396484375, 0.1982746124267578, 0.20576858520507812, 0.21326255798339844, 0.22075653076171875, 0.22825050354003906, 0.23574447631835938, 0.2432384490966797, 0.250732421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 20.0, 17.0, 24.0, 24.0, 28.0, 37.0, 30.0, 32.0, 33.0, 46.0, 32.0, 56.0, 41.0, 49.0, 40.0, 48.0, 44.0, 40.0, 45.0, 42.0, 35.0, 33.0, 30.0, 30.0, 27.0, 21.0, 19.0, 14.0, 7.0, 10.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 1.0], "bins": [-0.35498046875, -0.345184326171875, -0.33538818359375, -0.325592041015625, -0.3157958984375, -0.305999755859375, -0.29620361328125, -0.286407470703125, -0.276611328125, -0.266815185546875, -0.25701904296875, -0.247222900390625, -0.2374267578125, -0.227630615234375, -0.21783447265625, -0.208038330078125, -0.1982421875, -0.188446044921875, -0.17864990234375, -0.168853759765625, -0.1590576171875, -0.149261474609375, -0.13946533203125, -0.129669189453125, -0.119873046875, -0.110076904296875, -0.10028076171875, -0.090484619140625, -0.0806884765625, -0.070892333984375, -0.06109619140625, -0.051300048828125, -0.04150390625, -0.031707763671875, -0.02191162109375, -0.012115478515625, -0.0023193359375, 0.007476806640625, 0.01727294921875, 0.027069091796875, 0.036865234375, 0.046661376953125, 0.05645751953125, 0.066253662109375, 0.0760498046875, 0.085845947265625, 0.09564208984375, 0.105438232421875, 0.115234375, 0.125030517578125, 0.13482666015625, 0.144622802734375, 0.1544189453125, 0.164215087890625, 0.17401123046875, 0.183807373046875, 0.193603515625, 0.203399658203125, 0.21319580078125, 0.222991943359375, 0.2327880859375, 0.242584228515625, 0.25238037109375, 0.262176513671875, 0.27197265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 11.0, 13.0, 13.0, 17.0, 30.0, 48.0, 50.0, 81.0, 104.0, 167.0, 259.0, 413.0, 732.0, 1196.0, 2112.0, 3936.0, 7528.0, 14551.0, 30525.0, 66367.0, 145884.0, 296854.0, 247965.0, 121560.0, 55255.0, 25715.0, 12681.0, 6340.0, 3450.0, 1820.0, 1043.0, 665.0, 392.0, 280.0, 160.0, 110.0, 84.0, 48.0, 24.0, 23.0, 9.0, 13.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.37744140625, -0.3659629821777344, -0.35448455810546875, -0.3430061340332031, -0.3315277099609375, -0.3200492858886719, -0.30857086181640625, -0.2970924377441406, -0.285614013671875, -0.2741355895996094, -0.26265716552734375, -0.2511787414550781, -0.2397003173828125, -0.22822189331054688, -0.21674346923828125, -0.20526504516601562, -0.19378662109375, -0.18230819702148438, -0.17082977294921875, -0.15935134887695312, -0.1478729248046875, -0.13639450073242188, -0.12491607666015625, -0.11343765258789062, -0.101959228515625, -0.09048080444335938, -0.07900238037109375, -0.06752395629882812, -0.0560455322265625, -0.044567108154296875, -0.03308868408203125, -0.021610260009765625, -0.0101318359375, 0.001346588134765625, 0.01282501220703125, 0.024303436279296875, 0.0357818603515625, 0.047260284423828125, 0.05873870849609375, 0.07021713256835938, 0.081695556640625, 0.09317398071289062, 0.10465240478515625, 0.11613082885742188, 0.1276092529296875, 0.13908767700195312, 0.15056610107421875, 0.16204452514648438, 0.17352294921875, 0.18500137329101562, 0.19647979736328125, 0.20795822143554688, 0.2194366455078125, 0.23091506958007812, 0.24239349365234375, 0.2538719177246094, 0.265350341796875, 0.2768287658691406, 0.28830718994140625, 0.2997856140136719, 0.3112640380859375, 0.3227424621582031, 0.33422088623046875, 0.3456993103027344, 0.357177734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 8.0, 15.0, 9.0, 14.0, 25.0, 19.0, 22.0, 38.0, 44.0, 48.0, 38.0, 44.0, 53.0, 49.0, 59.0, 59.0, 43.0, 60.0, 46.0, 38.0, 42.0, 39.0, 33.0, 30.0, 25.0, 20.0, 18.0, 12.0, 10.0, 8.0, 7.0, 6.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0498046875, -1.0195846557617188, -0.9893646240234375, -0.9591445922851562, -0.928924560546875, -0.8987045288085938, -0.8684844970703125, -0.8382644653320312, -0.80804443359375, -0.7778244018554688, -0.7476043701171875, -0.7173843383789062, -0.687164306640625, -0.6569442749023438, -0.6267242431640625, -0.5965042114257812, -0.5662841796875, -0.5360641479492188, -0.5058441162109375, -0.47562408447265625, -0.445404052734375, -0.41518402099609375, -0.3849639892578125, -0.35474395751953125, -0.32452392578125, -0.29430389404296875, -0.2640838623046875, -0.23386383056640625, -0.203643798828125, -0.17342376708984375, -0.1432037353515625, -0.11298370361328125, -0.082763671875, -0.05254364013671875, -0.0223236083984375, 0.00789642333984375, 0.038116455078125, 0.06833648681640625, 0.0985565185546875, 0.12877655029296875, 0.15899658203125, 0.18921661376953125, 0.2194366455078125, 0.24965667724609375, 0.279876708984375, 0.31009674072265625, 0.3403167724609375, 0.37053680419921875, 0.4007568359375, 0.43097686767578125, 0.4611968994140625, 0.49141693115234375, 0.521636962890625, 0.5518569946289062, 0.5820770263671875, 0.6122970581054688, 0.64251708984375, 0.6727371215820312, 0.7029571533203125, 0.7331771850585938, 0.763397216796875, 0.7936172485351562, 0.8238372802734375, 0.8540573120117188, 0.88427734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 12.0, 22.0, 29.0, 57.0, 129.0, 205.0, 383.0, 754.0, 1629.0, 3361.0, 7963.0, 20186.0, 59145.0, 193342.0, 435844.0, 218840.0, 68007.0, 22485.0, 8838.0, 3723.0, 1741.0, 881.0, 440.0, 224.0, 131.0, 56.0, 33.0, 20.0, 27.0, 16.0, 9.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12459182739257812, -0.12064361572265625, -0.11669540405273438, -0.1127471923828125, -0.10879898071289062, -0.10485076904296875, -0.10090255737304688, -0.096954345703125, -0.09300613403320312, -0.08905792236328125, -0.08510971069335938, -0.0811614990234375, -0.07721328735351562, -0.07326507568359375, -0.06931686401367188, -0.06536865234375, -0.061420440673828125, -0.05747222900390625, -0.053524017333984375, -0.0495758056640625, -0.045627593994140625, -0.04167938232421875, -0.037731170654296875, -0.033782958984375, -0.029834747314453125, -0.02588653564453125, -0.021938323974609375, -0.0179901123046875, -0.014041900634765625, -0.01009368896484375, -0.006145477294921875, -0.002197265625, 0.001750946044921875, 0.00569915771484375, 0.009647369384765625, 0.0135955810546875, 0.017543792724609375, 0.02149200439453125, 0.025440216064453125, 0.029388427734375, 0.033336639404296875, 0.03728485107421875, 0.041233062744140625, 0.0451812744140625, 0.049129486083984375, 0.05307769775390625, 0.057025909423828125, 0.06097412109375, 0.06492233276367188, 0.06887054443359375, 0.07281875610351562, 0.0767669677734375, 0.08071517944335938, 0.08466339111328125, 0.08861160278320312, 0.092559814453125, 0.09650802612304688, 0.10045623779296875, 0.10440444946289062, 0.1083526611328125, 0.11230087280273438, 0.11624908447265625, 0.12019729614257812, 0.1241455078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 15.0, 9.0, 9.0, 17.0, 17.0, 22.0, 27.0, 48.0, 45.0, 74.0, 70.0, 73.0, 80.0, 96.0, 65.0, 64.0, 55.0, 37.0, 32.0, 28.0, 18.0, 22.0, 19.0, 18.0, 9.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.035234451293945e-05, -3.928225487470627e-05, -3.8212165236473083e-05, -3.71420755982399e-05, -3.6071985960006714e-05, -3.500189632177353e-05, -3.3931806683540344e-05, -3.286171704530716e-05, -3.1791627407073975e-05, -3.072153776884079e-05, -2.9651448130607605e-05, -2.858135849237442e-05, -2.7511268854141235e-05, -2.644117921590805e-05, -2.5371089577674866e-05, -2.430099993944168e-05, -2.3230910301208496e-05, -2.216082066297531e-05, -2.1090731024742126e-05, -2.002064138650894e-05, -1.8950551748275757e-05, -1.7880462110042572e-05, -1.6810372471809387e-05, -1.5740282833576202e-05, -1.4670193195343018e-05, -1.3600103557109833e-05, -1.2530013918876648e-05, -1.1459924280643463e-05, -1.0389834642410278e-05, -9.319745004177094e-06, -8.249655365943909e-06, -7.179565727710724e-06, -6.109476089477539e-06, -5.039386451244354e-06, -3.9692968130111694e-06, -2.8992071747779846e-06, -1.8291175365447998e-06, -7.59027898311615e-07, 3.110617399215698e-07, 1.3811513781547546e-06, 2.4512410163879395e-06, 3.5213306546211243e-06, 4.591420292854309e-06, 5.661509931087494e-06, 6.731599569320679e-06, 7.801689207553864e-06, 8.871778845787048e-06, 9.941868484020233e-06, 1.1011958122253418e-05, 1.2082047760486603e-05, 1.3152137398719788e-05, 1.4222227036952972e-05, 1.5292316675186157e-05, 1.6362406313419342e-05, 1.7432495951652527e-05, 1.850258558988571e-05, 1.9572675228118896e-05, 2.064276486635208e-05, 2.1712854504585266e-05, 2.278294414281845e-05, 2.3853033781051636e-05, 2.492312341928482e-05, 2.5993213057518005e-05, 2.706330269575119e-05, 2.8133392333984375e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 6.0, 10.0, 19.0, 28.0, 31.0, 53.0, 76.0, 110.0, 160.0, 244.0, 441.0, 766.0, 1234.0, 2185.0, 3985.0, 7962.0, 16201.0, 35283.0, 80668.0, 176615.0, 318670.0, 215016.0, 102844.0, 44757.0, 20334.0, 9810.0, 4785.0, 2537.0, 1448.0, 861.0, 515.0, 298.0, 205.0, 137.0, 86.0, 54.0, 39.0, 23.0, 13.0, 18.0, 7.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09808349609375, -0.0951681137084961, -0.09225273132324219, -0.08933734893798828, -0.08642196655273438, -0.08350658416748047, -0.08059120178222656, -0.07767581939697266, -0.07476043701171875, -0.07184505462646484, -0.06892967224121094, -0.06601428985595703, -0.06309890747070312, -0.06018352508544922, -0.05726814270019531, -0.054352760314941406, -0.0514373779296875, -0.048521995544433594, -0.04560661315917969, -0.04269123077392578, -0.039775848388671875, -0.03686046600341797, -0.03394508361816406, -0.031029701232910156, -0.02811431884765625, -0.025198936462402344, -0.022283554077148438, -0.01936817169189453, -0.016452789306640625, -0.013537406921386719, -0.010622024536132812, -0.007706642150878906, -0.004791259765625, -0.0018758773803710938, 0.0010395050048828125, 0.003954887390136719, 0.006870269775390625, 0.009785652160644531, 0.012701034545898438, 0.015616416931152344, 0.01853179931640625, 0.021447181701660156, 0.024362564086914062, 0.02727794647216797, 0.030193328857421875, 0.03310871124267578, 0.03602409362792969, 0.038939476013183594, 0.0418548583984375, 0.044770240783691406, 0.04768562316894531, 0.05060100555419922, 0.053516387939453125, 0.05643177032470703, 0.05934715270996094, 0.062262535095214844, 0.06517791748046875, 0.06809329986572266, 0.07100868225097656, 0.07392406463623047, 0.07683944702148438, 0.07975482940673828, 0.08267021179199219, 0.0855855941772461, 0.0885009765625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 13.0, 8.0, 9.0, 19.0, 13.0, 10.0, 15.0, 27.0, 27.0, 32.0, 34.0, 44.0, 43.0, 58.0, 57.0, 44.0, 46.0, 48.0, 62.0, 50.0, 37.0, 47.0, 40.0, 25.0, 33.0, 21.0, 33.0, 21.0, 16.0, 12.0, 10.0, 11.0, 11.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09948921203613281, -0.09601211547851562, -0.09253501892089844, -0.08905792236328125, -0.08558082580566406, -0.08210372924804688, -0.07862663269042969, -0.0751495361328125, -0.07167243957519531, -0.06819534301757812, -0.06471824645996094, -0.06124114990234375, -0.05776405334472656, -0.054286956787109375, -0.05080986022949219, -0.047332763671875, -0.04385566711425781, -0.040378570556640625, -0.03690147399902344, -0.03342437744140625, -0.029947280883789062, -0.026470184326171875, -0.022993087768554688, -0.0195159912109375, -0.016038894653320312, -0.012561798095703125, -0.009084701538085938, -0.00560760498046875, -0.0021305084228515625, 0.001346588134765625, 0.0048236846923828125, 0.00830078125, 0.011777877807617188, 0.015254974365234375, 0.018732070922851562, 0.02220916748046875, 0.025686264038085938, 0.029163360595703125, 0.03264045715332031, 0.0361175537109375, 0.03959465026855469, 0.043071746826171875, 0.04654884338378906, 0.05002593994140625, 0.05350303649902344, 0.056980133056640625, 0.06045722961425781, 0.063934326171875, 0.06741142272949219, 0.07088851928710938, 0.07436561584472656, 0.07784271240234375, 0.08131980895996094, 0.08479690551757812, 0.08827400207519531, 0.0917510986328125, 0.09522819519042969, 0.09870529174804688, 0.10218238830566406, 0.10565948486328125, 0.10913658142089844, 0.11261367797851562, 0.11609077453613281, 0.11956787109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 16.0, 22.0, 33.0, 45.0, 102.0, 134.0, 158.0, 155.0, 126.0, 98.0, 42.0, 28.0, 13.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.642482757568359, -5.514662265777588, -5.386841297149658, -5.259020805358887, -5.131199836730957, -5.0033793449401855, -4.875558376312256, -4.747737884521484, -4.619916915893555, -4.492096424102783, -4.3642754554748535, -4.236454963684082, -4.108633995056152, -3.980813503265381, -3.8529927730560303, -3.7251720428466797, -3.597351551055908, -3.4695308208465576, -3.341710090637207, -3.2138893604278564, -3.086068630218506, -2.9582481384277344, -2.830427408218384, -2.702606678009033, -2.5747859477996826, -2.446965217590332, -2.3191444873809814, -2.191323757171631, -2.0635032653808594, -1.9356824159622192, -1.8078618049621582, -1.6800410747528076, -1.5522198677062988, -1.4243991374969482, -1.2965784072875977, -1.1687577962875366, -1.040937066078186, -0.9131163358688354, -0.7852956652641296, -0.6574749946594238, -0.5296542644500732, -0.40183356404304504, -0.27401286363601685, -0.14619216322898865, -0.01837146282196045, 0.10944926738739014, 0.23726993799209595, 0.36509060859680176, 0.49291133880615234, 0.6207320690155029, 0.7485527396202087, 0.8763734102249146, 1.0041941404342651, 1.1320148706436157, 1.2598354816436768, 1.3876562118530273, 1.515476942062378, 1.6432976722717285, 1.771118402481079, 1.8989390134811401, 2.026759624481201, 2.154580593109131, 2.2824010848999023, 2.410221815109253, 2.5380425453186035]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 7.0, 6.0, 13.0, 8.0, 12.0, 16.0, 16.0, 15.0, 20.0, 25.0, 22.0, 27.0, 41.0, 41.0, 39.0, 42.0, 42.0, 47.0, 46.0, 44.0, 46.0, 34.0, 35.0, 35.0, 38.0, 33.0, 35.0, 28.0, 24.0, 20.0, 20.0, 16.0, 12.0, 19.0, 10.0, 14.0, 10.0, 4.0, 10.0, 3.0, 3.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.0175909996032715, -1.9490442276000977, -1.8804974555969238, -1.81195068359375, -1.7434039115905762, -1.6748571395874023, -1.6063103675842285, -1.5377635955810547, -1.4692168235778809, -1.400670051574707, -1.3321232795715332, -1.2635765075683594, -1.1950297355651855, -1.1264829635620117, -1.057936191558838, -0.9893894791603088, -0.9208427667617798, -0.852295994758606, -0.7837492227554321, -0.7152024507522583, -0.6466556787490845, -0.5781089067459106, -0.5095621943473816, -0.44101542234420776, -0.37246865034103394, -0.3039218783378601, -0.23537512123584747, -0.16682836413383484, -0.09828159213066101, -0.029734820127487183, 0.03881192207336426, 0.10735869407653809, 0.17590546607971191, 0.24445223808288574, 0.31299901008605957, 0.381545752286911, 0.45009252429008484, 0.518639326095581, 0.5871860384941101, 0.6557328104972839, 0.7242795825004578, 0.7928263545036316, 0.8613731265068054, 0.9299198389053345, 0.9984666109085083, 1.0670133829116821, 1.135560154914856, 1.2041069269180298, 1.2726536989212036, 1.3412004709243774, 1.4097472429275513, 1.478294014930725, 1.546840786933899, 1.6153875589370728, 1.683934211730957, 1.7524809837341309, 1.8210277557373047, 1.8895745277404785, 1.9581212997436523, 2.026668071746826, 2.09521484375, 2.163761615753174, 2.2323083877563477, 2.3008551597595215, 2.3694019317626953]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 6.0, 14.0, 15.0, 21.0, 24.0, 33.0, 44.0, 50.0, 82.0, 113.0, 164.0, 234.0, 391.0, 599.0, 1100.0, 1832.0, 3610.0, 7777.0, 20685.0, 70302.0, 284417.0, 976099.0, 1603817.0, 886769.0, 244238.0, 58898.0, 18485.0, 7033.0, 3203.0, 1631.0, 962.0, 543.0, 356.0, 207.0, 134.0, 114.0, 78.0, 49.0, 35.0, 26.0, 19.0, 19.0, 16.0, 7.0, 4.0, 5.0, 4.0, 3.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.36962890625, -0.3582344055175781, -0.34683990478515625, -0.3354454040527344, -0.3240509033203125, -0.3126564025878906, -0.30126190185546875, -0.2898674011230469, -0.278472900390625, -0.2670783996582031, -0.25568389892578125, -0.24428939819335938, -0.2328948974609375, -0.22150039672851562, -0.21010589599609375, -0.19871139526367188, -0.18731689453125, -0.17592239379882812, -0.16452789306640625, -0.15313339233398438, -0.1417388916015625, -0.13034439086914062, -0.11894989013671875, -0.10755538940429688, -0.096160888671875, -0.08476638793945312, -0.07337188720703125, -0.061977386474609375, -0.0505828857421875, -0.039188385009765625, -0.02779388427734375, -0.016399383544921875, -0.0050048828125, 0.006389617919921875, 0.01778411865234375, 0.029178619384765625, 0.0405731201171875, 0.051967620849609375, 0.06336212158203125, 0.07475662231445312, 0.086151123046875, 0.09754562377929688, 0.10894012451171875, 0.12033462524414062, 0.1317291259765625, 0.14312362670898438, 0.15451812744140625, 0.16591262817382812, 0.17730712890625, 0.18870162963867188, 0.20009613037109375, 0.21149063110351562, 0.2228851318359375, 0.23427963256835938, 0.24567413330078125, 0.2570686340332031, 0.268463134765625, 0.2798576354980469, 0.29125213623046875, 0.3026466369628906, 0.3140411376953125, 0.3254356384277344, 0.33683013916015625, 0.3482246398925781, 0.359619140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 9.0, 3.0, 10.0, 6.0, 7.0, 15.0, 15.0, 22.0, 26.0, 17.0, 27.0, 34.0, 42.0, 38.0, 44.0, 51.0, 51.0, 66.0, 62.0, 68.0, 44.0, 38.0, 55.0, 49.0, 44.0, 29.0, 24.0, 20.0, 22.0, 15.0, 14.0, 8.0, 8.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.351806640625, -0.34186553955078125, -0.3319244384765625, -0.32198333740234375, -0.312042236328125, -0.30210113525390625, -0.2921600341796875, -0.28221893310546875, -0.27227783203125, -0.26233673095703125, -0.2523956298828125, -0.24245452880859375, -0.232513427734375, -0.22257232666015625, -0.2126312255859375, -0.20269012451171875, -0.1927490234375, -0.18280792236328125, -0.1728668212890625, -0.16292572021484375, -0.152984619140625, -0.14304351806640625, -0.1331024169921875, -0.12316131591796875, -0.11322021484375, -0.10327911376953125, -0.0933380126953125, -0.08339691162109375, -0.073455810546875, -0.06351470947265625, -0.0535736083984375, -0.04363250732421875, -0.03369140625, -0.02375030517578125, -0.0138092041015625, -0.00386810302734375, 0.006072998046875, 0.01601409912109375, 0.0259552001953125, 0.03589630126953125, 0.04583740234375, 0.05577850341796875, 0.0657196044921875, 0.07566070556640625, 0.085601806640625, 0.09554290771484375, 0.1054840087890625, 0.11542510986328125, 0.1253662109375, 0.13530731201171875, 0.1452484130859375, 0.15518951416015625, 0.165130615234375, 0.17507171630859375, 0.1850128173828125, 0.19495391845703125, 0.20489501953125, 0.21483612060546875, 0.2247772216796875, 0.23471832275390625, 0.244659423828125, 0.25460052490234375, 0.2645416259765625, 0.27448272705078125, 0.284423828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 7.0, 8.0, 8.0, 14.0, 15.0, 23.0, 24.0, 41.0, 53.0, 75.0, 103.0, 146.0, 201.0, 333.0, 559.0, 995.0, 2154.0, 4679.0, 13124.0, 50633.0, 346399.0, 3135054.0, 546114.0, 66885.0, 16058.0, 5558.0, 2228.0, 1182.0, 607.0, 353.0, 215.0, 139.0, 84.0, 57.0, 38.0, 30.0, 29.0, 14.0, 7.0, 7.0, 10.0, 6.0, 5.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6409759521484375, -0.621307373046875, -0.6016387939453125, -0.58197021484375, -0.5623016357421875, -0.542633056640625, -0.5229644775390625, -0.5032958984375, -0.4836273193359375, -0.463958740234375, -0.4442901611328125, -0.42462158203125, -0.4049530029296875, -0.385284423828125, -0.3656158447265625, -0.345947265625, -0.3262786865234375, -0.306610107421875, -0.2869415283203125, -0.26727294921875, -0.2476043701171875, -0.227935791015625, -0.2082672119140625, -0.1885986328125, -0.1689300537109375, -0.149261474609375, -0.1295928955078125, -0.10992431640625, -0.0902557373046875, -0.070587158203125, -0.0509185791015625, -0.03125, -0.0115814208984375, 0.008087158203125, 0.0277557373046875, 0.04742431640625, 0.0670928955078125, 0.086761474609375, 0.1064300537109375, 0.1260986328125, 0.1457672119140625, 0.165435791015625, 0.1851043701171875, 0.20477294921875, 0.2244415283203125, 0.244110107421875, 0.2637786865234375, 0.283447265625, 0.3031158447265625, 0.322784423828125, 0.3424530029296875, 0.36212158203125, 0.3817901611328125, 0.401458740234375, 0.4211273193359375, 0.4407958984375, 0.4604644775390625, 0.480133056640625, 0.4998016357421875, 0.51947021484375, 0.5391387939453125, 0.558807373046875, 0.5784759521484375, 0.59814453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 14.0, 11.0, 13.0, 18.0, 26.0, 35.0, 66.0, 65.0, 90.0, 129.0, 187.0, 279.0, 417.0, 564.0, 562.0, 446.0, 351.0, 244.0, 152.0, 122.0, 73.0, 39.0, 39.0, 34.0, 19.0, 16.0, 17.0, 10.0, 7.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6401519775390625, -0.619659423828125, -0.5991668701171875, -0.57867431640625, -0.5581817626953125, -0.537689208984375, -0.5171966552734375, -0.4967041015625, -0.4762115478515625, -0.455718994140625, -0.4352264404296875, -0.41473388671875, -0.3942413330078125, -0.373748779296875, -0.3532562255859375, -0.332763671875, -0.3122711181640625, -0.291778564453125, -0.2712860107421875, -0.25079345703125, -0.2303009033203125, -0.209808349609375, -0.1893157958984375, -0.1688232421875, -0.1483306884765625, -0.127838134765625, -0.1073455810546875, -0.08685302734375, -0.0663604736328125, -0.045867919921875, -0.0253753662109375, -0.0048828125, 0.0156097412109375, 0.036102294921875, 0.0565948486328125, 0.07708740234375, 0.0975799560546875, 0.118072509765625, 0.1385650634765625, 0.1590576171875, 0.1795501708984375, 0.200042724609375, 0.2205352783203125, 0.24102783203125, 0.2615203857421875, 0.282012939453125, 0.3025054931640625, 0.322998046875, 0.3434906005859375, 0.363983154296875, 0.3844757080078125, 0.40496826171875, 0.4254608154296875, 0.445953369140625, 0.4664459228515625, 0.4869384765625, 0.5074310302734375, 0.527923583984375, 0.5484161376953125, 0.56890869140625, 0.5894012451171875, 0.609893798828125, 0.6303863525390625, 0.65087890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 12.0, 14.0, 27.0, 31.0, 50.0, 76.0, 87.0, 107.0, 129.0, 124.0, 102.0, 73.0, 47.0, 35.0, 19.0, 14.0, 10.0, 9.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.100054740905762, -5.912721157073975, -5.725387096405029, -5.538053512573242, -5.350719928741455, -5.163386344909668, -4.976052284240723, -4.7887187004089355, -4.601385116577148, -4.414051532745361, -4.226717472076416, -4.039383888244629, -3.852050304412842, -3.6647164821624756, -3.4773826599121094, -3.2900490760803223, -3.102715015411377, -2.9153811931610107, -2.7280476093292236, -2.5407137870788574, -2.3533802032470703, -2.166046380996704, -1.978712558746338, -1.7913788557052612, -1.6040451526641846, -1.416711449623108, -1.2293777465820312, -1.042043924331665, -0.8547102212905884, -0.6673765182495117, -0.4800426959991455, -0.29270899295806885, -0.10537528991699219, 0.08195844292640686, 0.2692921757698059, 0.45662593841552734, 0.643959641456604, 0.8312933444976807, 1.0186271667480469, 1.2059608697891235, 1.3932945728302002, 1.5806282758712769, 1.7679619789123535, 1.9552958011627197, 2.142629623413086, 2.329963207244873, 2.5172970294952393, 2.7046308517456055, 2.8919644355773926, 3.079298257827759, 3.266631841659546, 3.453965663909912, 3.641299247741699, 3.8286330699920654, 4.015966892242432, 4.203300476074219, 4.390634536743164, 4.577968120574951, 4.7653021812438965, 4.952635765075684, 5.139969348907471, 5.327302932739258, 5.514636993408203, 5.70197057723999, 5.889304161071777]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 12.0, 3.0, 11.0, 21.0, 17.0, 24.0, 20.0, 26.0, 36.0, 34.0, 41.0, 44.0, 46.0, 37.0, 38.0, 48.0, 50.0, 47.0, 43.0, 52.0, 45.0, 42.0, 39.0, 35.0, 26.0, 26.0, 18.0, 23.0, 14.0, 17.0, 10.0, 9.0, 6.0, 6.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0], "bins": [-3.531543254852295, -3.44130802154541, -3.3510727882385254, -3.2608375549316406, -3.170602560043335, -3.08036732673645, -2.9901320934295654, -2.8998968601226807, -2.809661865234375, -2.7194266319274902, -2.6291913986206055, -2.5389561653137207, -2.448721170425415, -2.3584859371185303, -2.2682507038116455, -2.1780154705047607, -2.087780237197876, -1.9975450038909912, -1.907309889793396, -1.8170746564865112, -1.726839542388916, -1.6366043090820312, -1.5463690757751465, -1.4561338424682617, -1.3658987283706665, -1.2756634950637817, -1.1854283809661865, -1.0951931476593018, -1.004957914352417, -0.9147228002548218, -0.824487566947937, -0.734252393245697, -0.644017219543457, -0.553782045841217, -0.46354684233665466, -0.3733116388320923, -0.2830764651298523, -0.1928412914276123, -0.10260605812072754, -0.012370884418487549, 0.07786428928375244, 0.16809947788715363, 0.2583346664905548, 0.3485698699951172, 0.4388050436973572, 0.5290402173995972, 0.6192754507064819, 0.7095106244087219, 0.7997457981109619, 0.8899809718132019, 0.9802161455154419, 1.0704513788223267, 1.1606864929199219, 1.2509217262268066, 1.3411569595336914, 1.4313921928405762, 1.5216273069381714, 1.6118625402450562, 1.7020976543426514, 1.7923328876495361, 1.882568120956421, 1.9728032350540161, 2.0630383491516113, 2.153273582458496, 2.243508815765381]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 14.0, 32.0, 42.0, 75.0, 112.0, 158.0, 227.0, 421.0, 639.0, 1149.0, 1930.0, 3359.0, 6201.0, 12453.0, 25883.0, 59898.0, 146274.0, 308306.0, 270309.0, 118324.0, 48634.0, 21495.0, 10216.0, 5201.0, 2857.0, 1642.0, 1015.0, 603.0, 370.0, 233.0, 175.0, 105.0, 64.0, 41.0, 29.0, 20.0, 8.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.273681640625, -0.26535797119140625, -0.2570343017578125, -0.24871063232421875, -0.240386962890625, -0.23206329345703125, -0.2237396240234375, -0.21541595458984375, -0.20709228515625, -0.19876861572265625, -0.1904449462890625, -0.18212127685546875, -0.173797607421875, -0.16547393798828125, -0.1571502685546875, -0.14882659912109375, -0.1405029296875, -0.13217926025390625, -0.1238555908203125, -0.11553192138671875, -0.107208251953125, -0.09888458251953125, -0.0905609130859375, -0.08223724365234375, -0.07391357421875, -0.06558990478515625, -0.0572662353515625, -0.04894256591796875, -0.040618896484375, -0.03229522705078125, -0.0239715576171875, -0.01564788818359375, -0.00732421875, 0.00099945068359375, 0.0093231201171875, 0.01764678955078125, 0.025970458984375, 0.03429412841796875, 0.0426177978515625, 0.05094146728515625, 0.05926513671875, 0.06758880615234375, 0.0759124755859375, 0.08423614501953125, 0.092559814453125, 0.10088348388671875, 0.1092071533203125, 0.11753082275390625, 0.1258544921875, 0.13417816162109375, 0.1425018310546875, 0.15082550048828125, 0.159149169921875, 0.16747283935546875, 0.1757965087890625, 0.18412017822265625, 0.19244384765625, 0.20076751708984375, 0.2090911865234375, 0.21741485595703125, 0.225738525390625, 0.23406219482421875, 0.2423858642578125, 0.25070953369140625, 0.259033203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 13.0, 5.0, 13.0, 14.0, 21.0, 30.0, 33.0, 27.0, 36.0, 41.0, 47.0, 62.0, 50.0, 66.0, 67.0, 51.0, 66.0, 49.0, 57.0, 45.0, 42.0, 39.0, 31.0, 25.0, 15.0, 15.0, 8.0, 5.0, 8.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5009765625, -0.4879570007324219, -0.47493743896484375, -0.4619178771972656, -0.4488983154296875, -0.4358787536621094, -0.42285919189453125, -0.4098396301269531, -0.396820068359375, -0.3838005065917969, -0.37078094482421875, -0.3577613830566406, -0.3447418212890625, -0.3317222595214844, -0.31870269775390625, -0.3056831359863281, -0.29266357421875, -0.2796440124511719, -0.26662445068359375, -0.2536048889160156, -0.2405853271484375, -0.22756576538085938, -0.21454620361328125, -0.20152664184570312, -0.188507080078125, -0.17548751831054688, -0.16246795654296875, -0.14944839477539062, -0.1364288330078125, -0.12340927124023438, -0.11038970947265625, -0.09737014770507812, -0.0843505859375, -0.07133102416992188, -0.05831146240234375, -0.045291900634765625, -0.0322723388671875, -0.019252777099609375, -0.00623321533203125, 0.006786346435546875, 0.019805908203125, 0.032825469970703125, 0.04584503173828125, 0.058864593505859375, 0.0718841552734375, 0.08490371704101562, 0.09792327880859375, 0.11094284057617188, 0.12396240234375, 0.13698196411132812, 0.15000152587890625, 0.16302108764648438, 0.1760406494140625, 0.18906021118164062, 0.20207977294921875, 0.21509933471679688, 0.228118896484375, 0.24113845825195312, 0.25415802001953125, 0.2671775817871094, 0.2801971435546875, 0.2932167053222656, 0.30623626708984375, 0.3192558288574219, 0.332275390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 18.0, 18.0, 25.0, 28.0, 59.0, 86.0, 148.0, 262.0, 514.0, 1252.0, 3948.0, 17911.0, 155874.0, 763362.0, 87806.0, 12343.0, 2876.0, 1003.0, 469.0, 207.0, 123.0, 74.0, 42.0, 34.0, 26.0, 9.0, 7.0, 8.0, 10.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.7119140625, -0.6933670043945312, -0.6748199462890625, -0.6562728881835938, -0.637725830078125, -0.6191787719726562, -0.6006317138671875, -0.5820846557617188, -0.56353759765625, -0.5449905395507812, -0.5264434814453125, -0.5078964233398438, -0.489349365234375, -0.47080230712890625, -0.4522552490234375, -0.43370819091796875, -0.4151611328125, -0.39661407470703125, -0.3780670166015625, -0.35951995849609375, -0.340972900390625, -0.32242584228515625, -0.3038787841796875, -0.28533172607421875, -0.26678466796875, -0.24823760986328125, -0.2296905517578125, -0.21114349365234375, -0.192596435546875, -0.17404937744140625, -0.1555023193359375, -0.13695526123046875, -0.118408203125, -0.09986114501953125, -0.0813140869140625, -0.06276702880859375, -0.044219970703125, -0.02567291259765625, -0.0071258544921875, 0.01142120361328125, 0.02996826171875, 0.04851531982421875, 0.0670623779296875, 0.08560943603515625, 0.104156494140625, 0.12270355224609375, 0.1412506103515625, 0.15979766845703125, 0.1783447265625, 0.19689178466796875, 0.2154388427734375, 0.23398590087890625, 0.252532958984375, 0.27108001708984375, 0.2896270751953125, 0.30817413330078125, 0.32672119140625, 0.34526824951171875, 0.3638153076171875, 0.38236236572265625, 0.400909423828125, 0.41945648193359375, 0.4380035400390625, 0.45655059814453125, 0.47509765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 19.0, 18.0, 26.0, 51.0, 76.0, 82.0, 100.0, 106.0, 110.0, 109.0, 75.0, 75.0, 55.0, 34.0, 21.0, 18.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.216217041015625, -2.15509033203125, -2.093963623046875, -2.0328369140625, -1.971710205078125, -1.91058349609375, -1.849456787109375, -1.788330078125, -1.727203369140625, -1.66607666015625, -1.604949951171875, -1.5438232421875, -1.482696533203125, -1.42156982421875, -1.360443115234375, -1.29931640625, -1.238189697265625, -1.17706298828125, -1.115936279296875, -1.0548095703125, -0.993682861328125, -0.93255615234375, -0.871429443359375, -0.810302734375, -0.749176025390625, -0.68804931640625, -0.626922607421875, -0.5657958984375, -0.504669189453125, -0.44354248046875, -0.382415771484375, -0.3212890625, -0.260162353515625, -0.19903564453125, -0.137908935546875, -0.0767822265625, -0.015655517578125, 0.04547119140625, 0.106597900390625, 0.167724609375, 0.228851318359375, 0.28997802734375, 0.351104736328125, 0.4122314453125, 0.473358154296875, 0.53448486328125, 0.595611572265625, 0.65673828125, 0.717864990234375, 0.77899169921875, 0.840118408203125, 0.9012451171875, 0.962371826171875, 1.02349853515625, 1.084625244140625, 1.145751953125, 1.206878662109375, 1.26800537109375, 1.329132080078125, 1.3902587890625, 1.451385498046875, 1.51251220703125, 1.573638916015625, 1.634765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 11.0, 22.0, 69.0, 330.0, 4135.0, 1038813.0, 4617.0, 394.0, 108.0, 22.0, 10.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.3251953125, -1.28564453125, -1.24609375, -1.20654296875, -1.1669921875, -1.12744140625, -1.087890625, -1.04833984375, -1.0087890625, -0.96923828125, -0.9296875, -0.89013671875, -0.8505859375, -0.81103515625, -0.771484375, -0.73193359375, -0.6923828125, -0.65283203125, -0.61328125, -0.57373046875, -0.5341796875, -0.49462890625, -0.455078125, -0.41552734375, -0.3759765625, -0.33642578125, -0.296875, -0.25732421875, -0.2177734375, -0.17822265625, -0.138671875, -0.09912109375, -0.0595703125, -0.02001953125, 0.01953125, 0.05908203125, 0.0986328125, 0.13818359375, 0.177734375, 0.21728515625, 0.2568359375, 0.29638671875, 0.3359375, 0.37548828125, 0.4150390625, 0.45458984375, 0.494140625, 0.53369140625, 0.5732421875, 0.61279296875, 0.65234375, 0.69189453125, 0.7314453125, 0.77099609375, 0.810546875, 0.85009765625, 0.8896484375, 0.92919921875, 0.96875, 1.00830078125, 1.0478515625, 1.08740234375, 1.126953125, 1.16650390625, 1.2060546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 3.0, 3.0, 5.0, 9.0, 11.0, 15.0, 15.0, 21.0, 34.0, 27.0, 34.0, 59.0, 93.0, 79.0, 89.0, 90.0, 94.0, 67.0, 61.0, 43.0, 30.0, 29.0, 26.0, 17.0, 11.0, 15.0, 6.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3663043975830078e-05, -2.2748485207557678e-05, -2.183392643928528e-05, -2.091936767101288e-05, -2.000480890274048e-05, -1.909025013446808e-05, -1.817569136619568e-05, -1.726113259792328e-05, -1.634657382965088e-05, -1.543201506137848e-05, -1.4517456293106079e-05, -1.360289752483368e-05, -1.268833875656128e-05, -1.177377998828888e-05, -1.085922122001648e-05, -9.94466245174408e-06, -9.03010368347168e-06, -8.11554491519928e-06, -7.20098614692688e-06, -6.28642737865448e-06, -5.37186861038208e-06, -4.45730984210968e-06, -3.5427510738372803e-06, -2.6281923055648804e-06, -1.7136335372924805e-06, -7.990747690200806e-07, 1.1548399925231934e-07, 1.0300427675247192e-06, 1.944601535797119e-06, 2.859160304069519e-06, 3.773719072341919e-06, 4.688277840614319e-06, 5.602836608886719e-06, 6.517395377159119e-06, 7.4319541454315186e-06, 8.346512913703918e-06, 9.261071681976318e-06, 1.0175630450248718e-05, 1.1090189218521118e-05, 1.2004747986793518e-05, 1.2919306755065918e-05, 1.3833865523338318e-05, 1.4748424291610718e-05, 1.5662983059883118e-05, 1.6577541828155518e-05, 1.7492100596427917e-05, 1.8406659364700317e-05, 1.9321218132972717e-05, 2.0235776901245117e-05, 2.1150335669517517e-05, 2.2064894437789917e-05, 2.2979453206062317e-05, 2.3894011974334717e-05, 2.4808570742607117e-05, 2.5723129510879517e-05, 2.6637688279151917e-05, 2.7552247047424316e-05, 2.8466805815696716e-05, 2.9381364583969116e-05, 3.0295923352241516e-05, 3.1210482120513916e-05, 3.2125040888786316e-05, 3.3039599657058716e-05, 3.3954158425331116e-05, 3.4868717193603516e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 12.0, 8.0, 9.0, 21.0, 38.0, 44.0, 50.0, 63.0, 134.0, 181.0, 303.0, 617.0, 1176.0, 2752.0, 7769.0, 30553.0, 227455.0, 675970.0, 77489.0, 15286.0, 4704.0, 1831.0, 870.0, 457.0, 285.0, 141.0, 83.0, 73.0, 43.0, 33.0, 17.0, 18.0, 17.0, 10.0, 12.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1380615234375, -0.13259506225585938, -0.12712860107421875, -0.12166213989257812, -0.1161956787109375, -0.11072921752929688, -0.10526275634765625, -0.09979629516601562, -0.094329833984375, -0.08886337280273438, -0.08339691162109375, -0.07793045043945312, -0.0724639892578125, -0.06699752807617188, -0.06153106689453125, -0.056064605712890625, -0.05059814453125, -0.045131683349609375, -0.03966522216796875, -0.034198760986328125, -0.0287322998046875, -0.023265838623046875, -0.01779937744140625, -0.012332916259765625, -0.006866455078125, -0.001399993896484375, 0.00406646728515625, 0.009532928466796875, 0.0149993896484375, 0.020465850830078125, 0.02593231201171875, 0.031398773193359375, 0.036865234375, 0.042331695556640625, 0.04779815673828125, 0.053264617919921875, 0.0587310791015625, 0.06419754028320312, 0.06966400146484375, 0.07513046264648438, 0.080596923828125, 0.08606338500976562, 0.09152984619140625, 0.09699630737304688, 0.1024627685546875, 0.10792922973632812, 0.11339569091796875, 0.11886215209960938, 0.12432861328125, 0.12979507446289062, 0.13526153564453125, 0.14072799682617188, 0.1461944580078125, 0.15166091918945312, 0.15712738037109375, 0.16259384155273438, 0.168060302734375, 0.17352676391601562, 0.17899322509765625, 0.18445968627929688, 0.1899261474609375, 0.19539260864257812, 0.20085906982421875, 0.20632553100585938, 0.2117919921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 10.0, 23.0, 49.0, 87.0, 178.0, 259.0, 161.0, 83.0, 43.0, 15.0, 18.0, 11.0, 9.0, 4.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3369140625, -0.32363128662109375, -0.3103485107421875, -0.29706573486328125, -0.283782958984375, -0.27050018310546875, -0.2572174072265625, -0.24393463134765625, -0.23065185546875, -0.21736907958984375, -0.2040863037109375, -0.19080352783203125, -0.177520751953125, -0.16423797607421875, -0.1509552001953125, -0.13767242431640625, -0.1243896484375, -0.11110687255859375, -0.0978240966796875, -0.08454132080078125, -0.071258544921875, -0.05797576904296875, -0.0446929931640625, -0.03141021728515625, -0.01812744140625, -0.00484466552734375, 0.0084381103515625, 0.02172088623046875, 0.035003662109375, 0.04828643798828125, 0.0615692138671875, 0.07485198974609375, 0.088134765625, 0.10141754150390625, 0.1147003173828125, 0.12798309326171875, 0.141265869140625, 0.15454864501953125, 0.1678314208984375, 0.18111419677734375, 0.19439697265625, 0.20767974853515625, 0.2209625244140625, 0.23424530029296875, 0.247528076171875, 0.26081085205078125, 0.2740936279296875, 0.28737640380859375, 0.3006591796875, 0.31394195556640625, 0.3272247314453125, 0.34050750732421875, 0.353790283203125, 0.36707305908203125, 0.3803558349609375, 0.39363861083984375, 0.40692138671875, 0.42020416259765625, 0.4334869384765625, 0.44676971435546875, 0.460052490234375, 0.47333526611328125, 0.4866180419921875, 0.49990081787109375, 0.51318359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 14.0, 19.0, 80.0, 180.0, 322.0, 207.0, 87.0, 42.0, 19.0, 8.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.031712532043457, -10.790215492248535, -10.548717498779297, -10.307220458984375, -10.065723419189453, -9.824225425720215, -9.582728385925293, -9.341230392456055, -9.099733352661133, -8.858236312866211, -8.616738319396973, -8.37524127960205, -8.133744239807129, -7.892246246337891, -7.650749206542969, -7.409251689910889, -7.167754173278809, -6.9262566566467285, -6.684759616851807, -6.443262100219727, -6.2017645835876465, -5.960267066955566, -5.7187700271606445, -5.4772725105285645, -5.235775470733643, -4.9942779541015625, -4.752780914306641, -4.5112833976745605, -4.2697858810424805, -4.028288841247559, -3.7867913246154785, -3.5452938079833984, -3.3037962913513184, -3.0622990131378174, -2.8208014965057373, -2.5793042182922363, -2.3378067016601562, -2.0963094234466553, -1.8548120260238647, -1.6133146286010742, -1.3718172311782837, -1.1303198337554932, -0.8888224363327026, -0.6473250985145569, -0.40582770109176636, -0.1643303632736206, 0.07716703414916992, 0.31866443157196045, 0.560161828994751, 0.8016592264175415, 1.043156623840332, 1.284653902053833, 1.526151418685913, 1.767648696899414, 2.009146213531494, 2.250643491744995, 2.492140769958496, 2.733638048171997, 2.975135564804077, 3.216632843017578, 3.458130359649658, 3.699627637863159, 3.94112491607666, 4.18262243270874, 4.42411994934082]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 23.0, 45.0, 102.0, 143.0, 229.0, 212.0, 110.0, 56.0, 47.0, 22.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.594009399414062, -15.260812759399414, -14.927616119384766, -14.5944185256958, -14.261221885681152, -13.928025245666504, -13.594827651977539, -13.26163101196289, -12.928434371948242, -12.595237731933594, -12.262041091918945, -11.92884349822998, -11.595646858215332, -11.262450218200684, -10.929252624511719, -10.59605598449707, -10.262859344482422, -9.929662704467773, -9.596466064453125, -9.26326847076416, -8.930071830749512, -8.596875190734863, -8.263677597045898, -7.93048095703125, -7.597284317016602, -7.264087677001953, -6.9308905601501465, -6.59769344329834, -6.264496803283691, -5.931300163269043, -5.598103046417236, -5.26490592956543, -4.931708335876465, -4.598511695861816, -4.26531457901001, -3.9321177005767822, -3.5989208221435547, -3.265723943710327, -2.9325270652770996, -2.599330186843872, -2.2661333084106445, -1.932936429977417, -1.5997395515441895, -1.266542673110962, -0.9333457946777344, -0.6001489162445068, -0.2669520378112793, 0.06624484062194824, 0.3994417190551758, 0.7326385974884033, 1.0658354759216309, 1.3990323543548584, 1.732229232788086, 2.0654261112213135, 2.398622989654541, 2.7318198680877686, 3.065016746520996, 3.3982136249542236, 3.731410503387451, 4.064607620239258, 4.397804260253906, 4.731000900268555, 5.064198017120361, 5.397395133972168, 5.730591773986816]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 15.0, 24.0, 30.0, 70.0, 202.0, 415.0, 94.0, 59.0, 48.0, 18.0, 14.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.677734375, -1.6421661376953125, -1.606597900390625, -1.5710296630859375, -1.53546142578125, -1.4998931884765625, -1.464324951171875, -1.4287567138671875, -1.3931884765625, -1.3576202392578125, -1.322052001953125, -1.2864837646484375, -1.25091552734375, -1.2153472900390625, -1.179779052734375, -1.1442108154296875, -1.108642578125, -1.0730743408203125, -1.037506103515625, -1.0019378662109375, -0.96636962890625, -0.9308013916015625, -0.895233154296875, -0.8596649169921875, -0.8240966796875, -0.7885284423828125, -0.752960205078125, -0.7173919677734375, -0.68182373046875, -0.6462554931640625, -0.610687255859375, -0.5751190185546875, -0.53955078125, -0.5039825439453125, -0.468414306640625, -0.4328460693359375, -0.39727783203125, -0.3617095947265625, -0.326141357421875, -0.2905731201171875, -0.2550048828125, -0.2194366455078125, -0.183868408203125, -0.1483001708984375, -0.11273193359375, -0.0771636962890625, -0.041595458984375, -0.0060272216796875, 0.029541015625, 0.0651092529296875, 0.100677490234375, 0.1362457275390625, 0.17181396484375, 0.2073822021484375, 0.242950439453125, 0.2785186767578125, 0.3140869140625, 0.3496551513671875, 0.385223388671875, 0.4207916259765625, 0.45635986328125, 0.4919281005859375, 0.527496337890625, 0.5630645751953125, 0.5986328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 11.0, 7.0, 9.0, 15.0, 27.0, 35.0, 60.0, 78.0, 132.0, 222.0, 374.0, 893.0, 3102.0, 15186.0, 8280971.0, 77865.0, 6677.0, 1694.0, 600.0, 275.0, 132.0, 74.0, 41.0, 26.0, 23.0, 12.0, 8.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5169224739074707, -2.4445338249206543, -2.372144937515259, -2.2997562885284424, -2.227367401123047, -2.1549787521362305, -2.082590103149414, -2.0102014541625977, -1.9378125667572021, -1.8654237985610962, -1.7930350303649902, -1.7206463813781738, -1.6482576131820679, -1.575868844985962, -1.5034801959991455, -1.4310914278030396, -1.3587026596069336, -1.2863138914108276, -1.2139251232147217, -1.1415364742279053, -1.0691477060317993, -0.9967589378356934, -0.9243702292442322, -0.851981520652771, -0.779592752456665, -0.7072039842605591, -0.6348152756690979, -0.5624265670776367, -0.49003779888153076, -0.4176490604877472, -0.3452603220939636, -0.27287161350250244, -0.20048260688781738, -0.1280938684940338, -0.055705130100250244, 0.016683608293533325, 0.0890723466873169, 0.16146108508110046, 0.23384982347488403, 0.3062385320663452, 0.37862730026245117, 0.45101603865623474, 0.5234047770500183, 0.5957934856414795, 0.6681822538375854, 0.7405710220336914, 0.8129597306251526, 0.8853484392166138, 0.9577372074127197, 1.0301259756088257, 1.1025147438049316, 1.174903392791748, 1.247292160987854, 1.31968092918396, 1.3920695781707764, 1.4644583463668823, 1.5368471145629883, 1.6092358827590942, 1.6816246509552002, 1.7540132999420166, 1.8264020681381226, 1.8987908363342285, 1.971179485321045, 2.0435681343078613, 2.115957021713257]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6380681991577148, -1.5474196672439575, -1.4567710161209106, -1.3661224842071533, -1.2754738330841064, -1.1848253011703491, -1.0941767692565918, -1.003528118133545, -0.9128795862197876, -0.8222309947013855, -0.7315824031829834, -0.6409338712692261, -0.550285279750824, -0.4596366882324219, -0.36898815631866455, -0.27833956480026245, -0.18769097328186035, -0.09704239666461945, -0.00639382004737854, 0.08425474166870117, 0.17490333318710327, 0.26555192470550537, 0.3562004566192627, 0.4468490481376648, 0.5374976396560669, 0.628146231174469, 0.7187948226928711, 0.8094433546066284, 0.9000919461250305, 0.9907405376434326, 1.08138906955719, 1.1720376014709473, 1.2626862525939941, 1.3533347845077515, 1.4439834356307983, 1.5346319675445557, 1.6252806186676025, 1.7159291505813599, 1.8065776824951172, 1.897226333618164, 1.9878748655319214, 2.0785233974456787, 2.1691720485687256, 2.2598204612731934, 2.3504691123962402, 2.441117763519287, 2.531766414642334, 2.6224148273468018, 2.7130634784698486, 2.8037121295928955, 2.8943605422973633, 2.98500919342041, 3.075657844543457, 3.166306495666504, 3.2569549083709717, 3.3476035594940186, 3.4382519721984863, 3.528900623321533, 3.619549036026001, 3.710197687149048, 3.8008463382720947, 3.8914947509765625, 3.9821434020996094, 4.072792053222656, 4.163440704345703]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 1.0, 10.0, 10.0, 16.0, 14.0, 18.0, 29.0, 29.0, 28.0, 46.0, 47.0, 50.0, 54.0, 69.0, 58.0, 57.0, 58.0, 60.0, 43.0, 45.0, 46.0, 42.0, 35.0, 31.0, 25.0, 20.0, 25.0, 7.0, 6.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17822265625, -0.1723461151123047, -0.16646957397460938, -0.16059303283691406, -0.15471649169921875, -0.14883995056152344, -0.14296340942382812, -0.1370868682861328, -0.1312103271484375, -0.1253337860107422, -0.11945724487304688, -0.11358070373535156, -0.10770416259765625, -0.10182762145996094, -0.09595108032226562, -0.09007453918457031, -0.084197998046875, -0.07832145690917969, -0.07244491577148438, -0.06656837463378906, -0.06069183349609375, -0.05481529235839844, -0.048938751220703125, -0.04306221008300781, -0.0371856689453125, -0.03130912780761719, -0.025432586669921875, -0.019556045532226562, -0.01367950439453125, -0.0078029632568359375, -0.001926422119140625, 0.0039501190185546875, 0.00982666015625, 0.015703201293945312, 0.021579742431640625, 0.027456283569335938, 0.03333282470703125, 0.03920936584472656, 0.045085906982421875, 0.05096244812011719, 0.0568389892578125, 0.06271553039550781, 0.06859207153320312, 0.07446861267089844, 0.08034515380859375, 0.08622169494628906, 0.09209823608398438, 0.09797477722167969, 0.103851318359375, 0.10972785949707031, 0.11560440063476562, 0.12148094177246094, 0.12735748291015625, 0.13323402404785156, 0.13911056518554688, 0.1449871063232422, 0.1508636474609375, 0.1567401885986328, 0.16261672973632812, 0.16849327087402344, 0.17436981201171875, 0.18024635314941406, 0.18612289428710938, 0.1919994354248047, 0.1978759765625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 8.0, 13.0, 30.0, 34.0, 40.0, 71.0, 126.0, 215.0, 317.0, 566.0, 1083.0, 2263.0, 5575.0, 17512.0, 82091.0, 306176.0, 80806.0, 17272.0, 5464.0, 2193.0, 1057.0, 588.0, 314.0, 169.0, 99.0, 63.0, 55.0, 21.0, 12.0, 16.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-6.71484375, -6.553009033203125, -6.39117431640625, -6.229339599609375, -6.0675048828125, -5.905670166015625, -5.74383544921875, -5.582000732421875, -5.420166015625, -5.258331298828125, -5.09649658203125, -4.934661865234375, -4.7728271484375, -4.610992431640625, -4.44915771484375, -4.287322998046875, -4.12548828125, -3.963653564453125, -3.80181884765625, -3.639984130859375, -3.4781494140625, -3.316314697265625, -3.15447998046875, -2.992645263671875, -2.830810546875, -2.668975830078125, -2.50714111328125, -2.345306396484375, -2.1834716796875, -2.021636962890625, -1.85980224609375, -1.697967529296875, -1.5361328125, -1.374298095703125, -1.21246337890625, -1.050628662109375, -0.8887939453125, -0.726959228515625, -0.56512451171875, -0.403289794921875, -0.241455078125, -0.079620361328125, 0.08221435546875, 0.244049072265625, 0.4058837890625, 0.567718505859375, 0.72955322265625, 0.891387939453125, 1.05322265625, 1.215057373046875, 1.37689208984375, 1.538726806640625, 1.7005615234375, 1.862396240234375, 2.02423095703125, 2.186065673828125, 2.347900390625, 2.509735107421875, 2.67156982421875, 2.833404541015625, 2.9952392578125, 3.157073974609375, 3.31890869140625, 3.480743408203125, 3.642578125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 17.0, 39.0, 53.0, 77.0, 102.0, 117.0, 144.0, 128.0, 118.0, 80.0, 51.0, 36.0, 19.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3017578125, -1.2742881774902344, -1.2468185424804688, -1.2193489074707031, -1.1918792724609375, -1.1644096374511719, -1.1369400024414062, -1.1094703674316406, -1.082000732421875, -1.0545310974121094, -1.0270614624023438, -0.9995918273925781, -0.9721221923828125, -0.9446525573730469, -0.9171829223632812, -0.8897132873535156, -0.86224365234375, -0.8347740173339844, -0.8073043823242188, -0.7798347473144531, -0.7523651123046875, -0.7248954772949219, -0.6974258422851562, -0.6699562072753906, -0.642486572265625, -0.6150169372558594, -0.5875473022460938, -0.5600776672363281, -0.5326080322265625, -0.5051383972167969, -0.47766876220703125, -0.4501991271972656, -0.4227294921875, -0.3952598571777344, -0.36779022216796875, -0.3403205871582031, -0.3128509521484375, -0.2853813171386719, -0.25791168212890625, -0.23044204711914062, -0.202972412109375, -0.17550277709960938, -0.14803314208984375, -0.12056350708007812, -0.0930938720703125, -0.06562423706054688, -0.03815460205078125, -0.010684967041015625, 0.01678466796875, 0.044254302978515625, 0.07172393798828125, 0.09919357299804688, 0.1266632080078125, 0.15413284301757812, 0.18160247802734375, 0.20907211303710938, 0.236541748046875, 0.2640113830566406, 0.29148101806640625, 0.3189506530761719, 0.3464202880859375, 0.3738899230957031, 0.40135955810546875, 0.4288291931152344, 0.456298828125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 6.0, 15.0, 44.0, 80.0, 77.0, 78.0, 52.0, 39.0, 27.0, 20.0, 14.0, 8.0, 3.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6714954376220703, -1.6122031211853027, -1.5529106855392456, -1.493618369102478, -1.434325933456421, -1.3750336170196533, -1.3157413005828857, -1.2564488649368286, -1.1971564292907715, -1.137864112854004, -1.0785716772079468, -1.0192793607711792, -0.9599869251251221, -0.9006946086883545, -0.8414022326469421, -0.7821098566055298, -0.7228175401687622, -0.6635251641273499, -0.6042327880859375, -0.5449404716491699, -0.4856480658054352, -0.4263556897640228, -0.36706334352493286, -0.3077709674835205, -0.24847859144210815, -0.1891862154006958, -0.12989385426044464, -0.07060149312019348, -0.011309117078781128, 0.047983258962631226, 0.10727560520172119, 0.16656798124313354, 0.2258603572845459, 0.28515273332595825, 0.3444451093673706, 0.40373745560646057, 0.4630298316478729, 0.5223221778869629, 0.5816145539283752, 0.6409069299697876, 0.7001993060112, 0.7594916820526123, 0.8187840580940247, 0.878076434135437, 0.9373687505722046, 0.9966611862182617, 1.0559535026550293, 1.1152458190917969, 1.174538254737854, 1.2338305711746216, 1.2931230068206787, 1.3524153232574463, 1.4117077589035034, 1.471000075340271, 1.5302925109863281, 1.5895848274230957, 1.6488771438598633, 1.7081694602966309, 1.767461895942688, 1.8267542123794556, 1.8860466480255127, 1.9453389644622803, 2.004631280899048, 2.0639238357543945, 2.123216152191162]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 9.0, 7.0, 6.0, 8.0, 9.0, 13.0, 29.0, 44.0, 56.0, 84.0, 61.0, 42.0, 35.0, 19.0, 8.0, 12.0, 7.0, 6.0, 3.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1091551780700684, -2.0538675785064697, -1.9985800981521606, -1.9432926177978516, -1.8880051374435425, -1.8327176570892334, -1.7774300575256348, -1.7221425771713257, -1.6668550968170166, -1.6115676164627075, -1.5562800168991089, -1.5009925365447998, -1.4457050561904907, -1.3904175758361816, -1.335129976272583, -1.279842495918274, -1.2245548963546753, -1.1692674160003662, -1.1139798164367676, -1.0586923360824585, -1.0034048557281494, -0.9481173157691956, -0.8928297758102417, -0.8375422954559326, -0.7822547554969788, -0.7269672155380249, -0.6716797351837158, -0.616392195224762, -0.5611046552658081, -0.505817174911499, -0.45052963495254517, -0.3952421247959137, -0.3399546146392822, -0.28466710448265076, -0.2293795794248581, -0.17409205436706543, -0.11880454421043396, -0.06351703405380249, -0.008229494094848633, 0.04705801606178284, 0.1023455262184143, 0.15763303637504578, 0.21292056143283844, 0.2682080864906311, 0.3234955966472626, 0.37878310680389404, 0.4340706467628479, 0.48935815691947937, 0.5446456670761108, 0.5999332070350647, 0.6552206873893738, 0.7105082273483276, 0.7657957077026367, 0.8210832476615906, 0.8763707876205444, 0.9316582679748535, 0.9869458079338074, 1.0422333478927612, 1.0975208282470703, 1.152808427810669, 1.208095908164978, 1.263383388519287, 1.3186709880828857, 1.3739584684371948, 1.429245948791504]}, "eval/loss": 3.0510671138763428, "eval/bleu": 1.5827445667544166e-18, "eval/runtime": 2619.9089, "eval/samples_per_second": 5.634, "eval/steps_per_second": 0.704} \ No newline at end of file +{"train/loss": 0.9251, "train/learning_rate": 3.2066153313506185e-07, "train/epoch": 3.0, "train/global_step": 9720, "_runtime": 93795, "_timestamp": 1651767884, "_step": 9739, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 41.0, 232.0, 466.0, 211.0, 43.0, 14.0, 1.0], "bins": [-22.81093406677246, -22.4266300201416, -22.042327880859375, -21.658023834228516, -21.27372169494629, -20.88941764831543, -20.505115509033203, -20.120811462402344, -19.736509323120117, -19.352205276489258, -18.96790313720703, -18.583599090576172, -18.199296951293945, -17.814992904663086, -17.43069076538086, -17.04638671875, -16.66208267211914, -16.27777862548828, -15.893476486206055, -15.509173393249512, -15.124870300292969, -14.740567207336426, -14.356264114379883, -13.971960067749023, -13.587657928466797, -13.203354835510254, -12.819051742553711, -12.434748649597168, -12.050445556640625, -11.666142463684082, -11.281839370727539, -10.89753532409668, -10.513232231140137, -10.128929138183594, -9.74462604522705, -9.360322952270508, -8.976019859313965, -8.591716766357422, -8.207412719726562, -7.823110103607178, -7.438807487487793, -7.05450439453125, -6.670201301574707, -6.285898208618164, -5.901595115661621, -5.517292022705078, -5.132988452911377, -4.748685359954834, -4.364382266998291, -3.980079174041748, -3.595776081085205, -3.211472749710083, -2.82716965675354, -2.442866563796997, -2.058563232421875, -1.674260139465332, -1.2899569272994995, -0.9056537747383118, -0.521350622177124, -0.1370474100112915, 0.24725568294525146, 0.6315587759017944, 1.0158621072769165, 1.4001652002334595, 1.7844682931900024]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 3.0, 8.0, 13.0, 11.0, 13.0, 15.0, 16.0, 22.0, 21.0, 24.0, 29.0, 26.0, 28.0, 39.0, 33.0, 41.0, 34.0, 32.0, 33.0, 47.0, 38.0, 41.0, 30.0, 35.0, 35.0, 43.0, 38.0, 31.0, 30.0, 23.0, 33.0, 16.0, 25.0, 16.0, 12.0, 19.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.0006556510925293, -1.933129072189331, -1.8656026124954224, -1.7980761528015137, -1.7305495738983154, -1.6630229949951172, -1.5954965353012085, -1.5279700756072998, -1.4604434967041016, -1.3929169178009033, -1.3253904581069946, -1.257863998413086, -1.1903374195098877, -1.1228108406066895, -1.0552843809127808, -0.9877578616142273, -0.9202313423156738, -0.8527048230171204, -0.7851783037185669, -0.7176517844200134, -0.65012526512146, -0.5825987458229065, -0.515072226524353, -0.44754570722579956, -0.3800191879272461, -0.3124926686286926, -0.24496614933013916, -0.1774396300315857, -0.10991311073303223, -0.04238659143447876, 0.025139927864074707, 0.09266644716262817, 0.16019272804260254, 0.227719247341156, 0.2952457666397095, 0.36277228593826294, 0.4302988052368164, 0.4978253245353699, 0.5653518438339233, 0.6328783631324768, 0.7004048824310303, 0.7679314017295837, 0.8354579210281372, 0.9029844403266907, 0.9705109596252441, 1.0380375385284424, 1.105563998222351, 1.1730904579162598, 1.240617036819458, 1.3081436157226562, 1.375670075416565, 1.4431965351104736, 1.5107231140136719, 1.5782496929168701, 1.6457761526107788, 1.7133026123046875, 1.7808291912078857, 1.848355770111084, 1.9158822298049927, 1.9834086894989014, 2.0509352684020996, 2.118461847305298, 2.185988426208496, 2.2535147666931152, 2.3210413455963135]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 8.0, 9.0, 10.0, 20.0, 21.0, 38.0, 62.0, 83.0, 124.0, 179.0, 285.0, 389.0, 552.0, 796.0, 1204.0, 1853.0, 3058.0, 5427.0, 9892.0, 19022.0, 38094.0, 82406.0, 219508.0, 868829.0, 2214707.0, 462620.0, 142770.0, 60228.0, 28659.0, 14034.0, 7695.0, 4267.0, 2619.0, 1648.0, 1032.0, 694.0, 471.0, 298.0, 220.0, 151.0, 92.0, 76.0, 41.0, 29.0, 27.0, 10.0, 8.0, 6.0, 5.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.96484375, -1.899993896484375, -1.83514404296875, -1.770294189453125, -1.7054443359375, -1.640594482421875, -1.57574462890625, -1.510894775390625, -1.446044921875, -1.381195068359375, -1.31634521484375, -1.251495361328125, -1.1866455078125, -1.121795654296875, -1.05694580078125, -0.992095947265625, -0.92724609375, -0.862396240234375, -0.79754638671875, -0.732696533203125, -0.6678466796875, -0.602996826171875, -0.53814697265625, -0.473297119140625, -0.408447265625, -0.343597412109375, -0.27874755859375, -0.213897705078125, -0.1490478515625, -0.084197998046875, -0.01934814453125, 0.045501708984375, 0.1103515625, 0.175201416015625, 0.24005126953125, 0.304901123046875, 0.3697509765625, 0.434600830078125, 0.49945068359375, 0.564300537109375, 0.629150390625, 0.694000244140625, 0.75885009765625, 0.823699951171875, 0.8885498046875, 0.953399658203125, 1.01824951171875, 1.083099365234375, 1.14794921875, 1.212799072265625, 1.27764892578125, 1.342498779296875, 1.4073486328125, 1.472198486328125, 1.53704833984375, 1.601898193359375, 1.666748046875, 1.731597900390625, 1.79644775390625, 1.861297607421875, 1.9261474609375, 1.990997314453125, 2.05584716796875, 2.120697021484375, 2.185546875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 10.0, 4.0, 9.0, 9.0, 13.0, 11.0, 14.0, 25.0, 22.0, 30.0, 15.0, 32.0, 40.0, 40.0, 37.0, 45.0, 26.0, 51.0, 47.0, 53.0, 48.0, 48.0, 44.0, 29.0, 52.0, 41.0, 29.0, 32.0, 21.0, 23.0, 21.0, 22.0, 14.0, 10.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.538665771484375, -3.42108154296875, -3.303497314453125, -3.1859130859375, -3.068328857421875, -2.95074462890625, -2.833160400390625, -2.715576171875, -2.597991943359375, -2.48040771484375, -2.362823486328125, -2.2452392578125, -2.127655029296875, -2.01007080078125, -1.892486572265625, -1.77490234375, -1.657318115234375, -1.53973388671875, -1.422149658203125, -1.3045654296875, -1.186981201171875, -1.06939697265625, -0.951812744140625, -0.834228515625, -0.716644287109375, -0.59906005859375, -0.481475830078125, -0.3638916015625, -0.246307373046875, -0.12872314453125, -0.011138916015625, 0.1064453125, 0.224029541015625, 0.34161376953125, 0.459197998046875, 0.5767822265625, 0.694366455078125, 0.81195068359375, 0.929534912109375, 1.047119140625, 1.164703369140625, 1.28228759765625, 1.399871826171875, 1.5174560546875, 1.635040283203125, 1.75262451171875, 1.870208740234375, 1.98779296875, 2.105377197265625, 2.22296142578125, 2.340545654296875, 2.4581298828125, 2.575714111328125, 2.69329833984375, 2.810882568359375, 2.928466796875, 3.046051025390625, 3.16363525390625, 3.281219482421875, 3.3988037109375, 3.516387939453125, 3.63397216796875, 3.751556396484375, 3.869140625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 3.0, 6.0, 7.0, 11.0, 11.0, 21.0, 35.0, 58.0, 86.0, 172.0, 1069.0, 4186925.0, 5374.0, 249.0, 95.0, 60.0, 26.0, 22.0, 30.0, 13.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-65.5625, -63.6708984375, -61.779296875, -59.8876953125, -57.99609375, -56.1044921875, -54.212890625, -52.3212890625, -50.4296875, -48.5380859375, -46.646484375, -44.7548828125, -42.86328125, -40.9716796875, -39.080078125, -37.1884765625, -35.296875, -33.4052734375, -31.513671875, -29.6220703125, -27.73046875, -25.8388671875, -23.947265625, -22.0556640625, -20.1640625, -18.2724609375, -16.380859375, -14.4892578125, -12.59765625, -10.7060546875, -8.814453125, -6.9228515625, -5.03125, -3.1396484375, -1.248046875, 0.6435546875, 2.53515625, 4.4267578125, 6.318359375, 8.2099609375, 10.1015625, 11.9931640625, 13.884765625, 15.7763671875, 17.66796875, 19.5595703125, 21.451171875, 23.3427734375, 25.234375, 27.1259765625, 29.017578125, 30.9091796875, 32.80078125, 34.6923828125, 36.583984375, 38.4755859375, 40.3671875, 42.2587890625, 44.150390625, 46.0419921875, 47.93359375, 49.8251953125, 51.716796875, 53.6083984375, 55.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 6.0, 6.0, 15.0, 18.0, 24.0, 26.0, 66.0, 92.0, 157.0, 682.0, 2059.0, 554.0, 142.0, 84.0, 49.0, 29.0, 22.0, 13.0, 13.0, 11.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.216796875, -2.14630126953125, -2.0758056640625, -2.00531005859375, -1.934814453125, -1.86431884765625, -1.7938232421875, -1.72332763671875, -1.65283203125, -1.58233642578125, -1.5118408203125, -1.44134521484375, -1.370849609375, -1.30035400390625, -1.2298583984375, -1.15936279296875, -1.0888671875, -1.01837158203125, -0.9478759765625, -0.87738037109375, -0.806884765625, -0.73638916015625, -0.6658935546875, -0.59539794921875, -0.52490234375, -0.45440673828125, -0.3839111328125, -0.31341552734375, -0.242919921875, -0.17242431640625, -0.1019287109375, -0.03143310546875, 0.0390625, 0.10955810546875, 0.1800537109375, 0.25054931640625, 0.321044921875, 0.39154052734375, 0.4620361328125, 0.53253173828125, 0.60302734375, 0.67352294921875, 0.7440185546875, 0.81451416015625, 0.885009765625, 0.95550537109375, 1.0260009765625, 1.09649658203125, 1.1669921875, 1.23748779296875, 1.3079833984375, 1.37847900390625, 1.448974609375, 1.51947021484375, 1.5899658203125, 1.66046142578125, 1.73095703125, 1.80145263671875, 1.8719482421875, 1.94244384765625, 2.012939453125, 2.08343505859375, 2.1539306640625, 2.22442626953125, 2.294921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 13.0, 26.0, 31.0, 35.0, 72.0, 82.0, 131.0, 130.0, 138.0, 111.0, 78.0, 52.0, 37.0, 24.0, 12.0, 9.0, 5.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-12.560930252075195, -12.301332473754883, -12.04173469543457, -11.782137870788574, -11.522540092468262, -11.26294231414795, -11.003345489501953, -10.74374771118164, -10.484149932861328, -10.224552154541016, -9.964954376220703, -9.705357551574707, -9.445759773254395, -9.186161994934082, -8.926565170288086, -8.666967391967773, -8.407369613647461, -8.147771835327148, -7.888174533843994, -7.62857723236084, -7.368979454040527, -7.109381675720215, -6.8497843742370605, -6.590187072753906, -6.330589294433594, -6.070991516113281, -5.811394214630127, -5.551796913146973, -5.29219913482666, -5.032601356506348, -4.773004055023193, -4.513406753540039, -4.253809928894043, -3.9942123889923096, -3.734614849090576, -3.4750173091888428, -3.2154197692871094, -2.955822229385376, -2.6962246894836426, -2.436627149581909, -2.177029609680176, -1.9174320697784424, -1.657834529876709, -1.3982369899749756, -1.1386394500732422, -0.8790419101715088, -0.6194443702697754, -0.359846830368042, -0.1002492904663086, 0.1593482494354248, 0.4189457893371582, 0.6785433292388916, 0.938140869140625, 1.1977384090423584, 1.4573359489440918, 1.7169334888458252, 1.9765310287475586, 2.236128568649292, 2.4957261085510254, 2.755323648452759, 3.014921188354492, 3.2745187282562256, 3.534116268157959, 3.7937138080596924, 4.053311347961426]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 10.0, 11.0, 16.0, 14.0, 16.0, 19.0, 18.0, 17.0, 29.0, 28.0, 34.0, 48.0, 40.0, 34.0, 31.0, 49.0, 33.0, 45.0, 38.0, 36.0, 44.0, 42.0, 32.0, 32.0, 29.0, 32.0, 32.0, 24.0, 27.0, 15.0, 20.0, 23.0, 11.0, 17.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.888427495956421, -2.7885069847106934, -2.688586711883545, -2.5886662006378174, -2.488745927810669, -2.3888254165649414, -2.288905143737793, -2.1889846324920654, -2.089064121246338, -1.9891437292099, -1.889223337173462, -1.7893028259277344, -1.689382553100586, -1.5894620418548584, -1.4895416498184204, -1.3896212577819824, -1.289700984954834, -1.189780592918396, -1.089860200881958, -0.9899397492408752, -0.8900193572044373, -0.7900989651679993, -0.6901785135269165, -0.5902581214904785, -0.4903377294540405, -0.39041733741760254, -0.29049691557884216, -0.1905764937400818, -0.0906561017036438, 0.00926429033279419, 0.10918474197387695, 0.20910513401031494, 0.30902528762817383, 0.4089456796646118, 0.5088660717010498, 0.6087865233421326, 0.7087069153785706, 0.8086273074150085, 0.9085477590560913, 1.0084681510925293, 1.1083885431289673, 1.2083089351654053, 1.3082293272018433, 1.4081497192382812, 1.5080702304840088, 1.6079905033111572, 1.7079110145568848, 1.8078314065933228, 1.9077517986297607, 2.0076723098754883, 2.1075925827026367, 2.2075130939483643, 2.3074333667755127, 2.4073538780212402, 2.5072741508483887, 2.607194662094116, 2.7071151733398438, 2.8070356845855713, 2.9069559574127197, 3.0068764686584473, 3.1067967414855957, 3.2067172527313232, 3.306637763977051, 3.406558036804199, 3.5064783096313477]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 8.0, 16.0, 31.0, 47.0, 88.0, 148.0, 271.0, 435.0, 753.0, 1359.0, 2627.0, 5296.0, 11371.0, 26243.0, 65216.0, 173036.0, 349536.0, 248225.0, 96093.0, 37240.0, 15846.0, 7179.0, 3501.0, 1695.0, 932.0, 565.0, 317.0, 188.0, 131.0, 56.0, 20.0, 24.0, 13.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.291015625, -1.24603271484375, -1.2010498046875, -1.15606689453125, -1.111083984375, -1.06610107421875, -1.0211181640625, -0.97613525390625, -0.93115234375, -0.88616943359375, -0.8411865234375, -0.79620361328125, -0.751220703125, -0.70623779296875, -0.6612548828125, -0.61627197265625, -0.5712890625, -0.52630615234375, -0.4813232421875, -0.43634033203125, -0.391357421875, -0.34637451171875, -0.3013916015625, -0.25640869140625, -0.21142578125, -0.16644287109375, -0.1214599609375, -0.07647705078125, -0.031494140625, 0.01348876953125, 0.0584716796875, 0.10345458984375, 0.1484375, 0.19342041015625, 0.2384033203125, 0.28338623046875, 0.328369140625, 0.37335205078125, 0.4183349609375, 0.46331787109375, 0.50830078125, 0.55328369140625, 0.5982666015625, 0.64324951171875, 0.688232421875, 0.73321533203125, 0.7781982421875, 0.82318115234375, 0.8681640625, 0.91314697265625, 0.9581298828125, 1.00311279296875, 1.048095703125, 1.09307861328125, 1.1380615234375, 1.18304443359375, 1.22802734375, 1.27301025390625, 1.3179931640625, 1.36297607421875, 1.407958984375, 1.45294189453125, 1.4979248046875, 1.54290771484375, 1.587890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 12.0, 9.0, 14.0, 19.0, 27.0, 19.0, 30.0, 32.0, 37.0, 41.0, 47.0, 64.0, 63.0, 50.0, 65.0, 54.0, 59.0, 55.0, 52.0, 56.0, 37.0, 42.0, 28.0, 25.0, 14.0, 9.0, 15.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.1015625, -3.98828125, -3.875, -3.76171875, -3.6484375, -3.53515625, -3.421875, -3.30859375, -3.1953125, -3.08203125, -2.96875, -2.85546875, -2.7421875, -2.62890625, -2.515625, -2.40234375, -2.2890625, -2.17578125, -2.0625, -1.94921875, -1.8359375, -1.72265625, -1.609375, -1.49609375, -1.3828125, -1.26953125, -1.15625, -1.04296875, -0.9296875, -0.81640625, -0.703125, -0.58984375, -0.4765625, -0.36328125, -0.25, -0.13671875, -0.0234375, 0.08984375, 0.203125, 0.31640625, 0.4296875, 0.54296875, 0.65625, 0.76953125, 0.8828125, 0.99609375, 1.109375, 1.22265625, 1.3359375, 1.44921875, 1.5625, 1.67578125, 1.7890625, 1.90234375, 2.015625, 2.12890625, 2.2421875, 2.35546875, 2.46875, 2.58203125, 2.6953125, 2.80859375, 2.921875, 3.03515625, 3.1484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 3.0, 11.0, 17.0, 21.0, 30.0, 42.0, 76.0, 101.0, 183.0, 418.0, 634.0, 1361.0, 3222.0, 8430.0, 25532.0, 94036.0, 378079.0, 394984.0, 99770.0, 26703.0, 8597.0, 3250.0, 1409.0, 724.0, 355.0, 188.0, 127.0, 78.0, 48.0, 36.0, 18.0, 21.0, 10.0, 9.0, 5.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8125, -1.7607421875, -1.708984375, -1.6572265625, -1.60546875, -1.5537109375, -1.501953125, -1.4501953125, -1.3984375, -1.3466796875, -1.294921875, -1.2431640625, -1.19140625, -1.1396484375, -1.087890625, -1.0361328125, -0.984375, -0.9326171875, -0.880859375, -0.8291015625, -0.77734375, -0.7255859375, -0.673828125, -0.6220703125, -0.5703125, -0.5185546875, -0.466796875, -0.4150390625, -0.36328125, -0.3115234375, -0.259765625, -0.2080078125, -0.15625, -0.1044921875, -0.052734375, -0.0009765625, 0.05078125, 0.1025390625, 0.154296875, 0.2060546875, 0.2578125, 0.3095703125, 0.361328125, 0.4130859375, 0.46484375, 0.5166015625, 0.568359375, 0.6201171875, 0.671875, 0.7236328125, 0.775390625, 0.8271484375, 0.87890625, 0.9306640625, 0.982421875, 1.0341796875, 1.0859375, 1.1376953125, 1.189453125, 1.2412109375, 1.29296875, 1.3447265625, 1.396484375, 1.4482421875, 1.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 4.0, 7.0, 9.0, 11.0, 10.0, 15.0, 8.0, 24.0, 28.0, 30.0, 38.0, 33.0, 28.0, 38.0, 32.0, 41.0, 34.0, 45.0, 37.0, 47.0, 44.0, 54.0, 44.0, 41.0, 36.0, 25.0, 35.0, 34.0, 25.0, 17.0, 17.0, 13.0, 19.0, 13.0, 11.0, 8.0, 10.0, 12.0, 12.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.43597412109375, -5.2625732421875, -5.08917236328125, -4.915771484375, -4.74237060546875, -4.5689697265625, -4.39556884765625, -4.22216796875, -4.04876708984375, -3.8753662109375, -3.70196533203125, -3.528564453125, -3.35516357421875, -3.1817626953125, -3.00836181640625, -2.8349609375, -2.66156005859375, -2.4881591796875, -2.31475830078125, -2.141357421875, -1.96795654296875, -1.7945556640625, -1.62115478515625, -1.44775390625, -1.27435302734375, -1.1009521484375, -0.92755126953125, -0.754150390625, -0.58074951171875, -0.4073486328125, -0.23394775390625, -0.060546875, 0.11285400390625, 0.2862548828125, 0.45965576171875, 0.633056640625, 0.80645751953125, 0.9798583984375, 1.15325927734375, 1.32666015625, 1.50006103515625, 1.6734619140625, 1.84686279296875, 2.020263671875, 2.19366455078125, 2.3670654296875, 2.54046630859375, 2.7138671875, 2.88726806640625, 3.0606689453125, 3.23406982421875, 3.407470703125, 3.58087158203125, 3.7542724609375, 3.92767333984375, 4.10107421875, 4.27447509765625, 4.4478759765625, 4.62127685546875, 4.794677734375, 4.96807861328125, 5.1414794921875, 5.31488037109375, 5.48828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 2.0, 7.0, 14.0, 26.0, 37.0, 37.0, 57.0, 85.0, 121.0, 227.0, 306.0, 540.0, 838.0, 1482.0, 2504.0, 4760.0, 9445.0, 21136.0, 53814.0, 170990.0, 420848.0, 237123.0, 73071.0, 26541.0, 11585.0, 5552.0, 3031.0, 1710.0, 1020.0, 557.0, 346.0, 239.0, 154.0, 103.0, 67.0, 48.0, 45.0, 22.0, 20.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.373779296875, -0.3619651794433594, -0.35015106201171875, -0.3383369445800781, -0.3265228271484375, -0.3147087097167969, -0.30289459228515625, -0.2910804748535156, -0.279266357421875, -0.2674522399902344, -0.25563812255859375, -0.24382400512695312, -0.2320098876953125, -0.22019577026367188, -0.20838165283203125, -0.19656753540039062, -0.18475341796875, -0.17293930053710938, -0.16112518310546875, -0.14931106567382812, -0.1374969482421875, -0.12568283081054688, -0.11386871337890625, -0.10205459594726562, -0.090240478515625, -0.07842636108398438, -0.06661224365234375, -0.054798126220703125, -0.0429840087890625, -0.031169891357421875, -0.01935577392578125, -0.007541656494140625, 0.0042724609375, 0.016086578369140625, 0.02790069580078125, 0.039714813232421875, 0.0515289306640625, 0.06334304809570312, 0.07515716552734375, 0.08697128295898438, 0.098785400390625, 0.11059951782226562, 0.12241363525390625, 0.13422775268554688, 0.1460418701171875, 0.15785598754882812, 0.16967010498046875, 0.18148422241210938, 0.19329833984375, 0.20511245727539062, 0.21692657470703125, 0.22874069213867188, 0.2405548095703125, 0.2523689270019531, 0.26418304443359375, 0.2759971618652344, 0.287811279296875, 0.2996253967285156, 0.31143951416015625, 0.3232536315917969, 0.3350677490234375, 0.3468818664550781, 0.35869598388671875, 0.3705101013183594, 0.38232421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 12.0, 14.0, 28.0, 20.0, 40.0, 66.0, 81.0, 106.0, 125.0, 142.0, 102.0, 76.0, 54.0, 28.0, 32.0, 21.0, 11.0, 10.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037741661071777344, -0.00036386027932167053, -0.0003503039479255676, -0.0003367476165294647, -0.0003231912851333618, -0.0003096349537372589, -0.000296078622341156, -0.0002825222909450531, -0.0002689659595489502, -0.0002554096281528473, -0.00024185329675674438, -0.00022829696536064148, -0.00021474063396453857, -0.00020118430256843567, -0.00018762797117233276, -0.00017407163977622986, -0.00016051530838012695, -0.00014695897698402405, -0.00013340264558792114, -0.00011984631419181824, -0.00010628998279571533, -9.273365139961243e-05, -7.917732000350952e-05, -6.562098860740662e-05, -5.206465721130371e-05, -3.8508325815200806e-05, -2.49519944190979e-05, -1.1395663022994995e-05, 2.16066837310791e-06, 1.5716999769210815e-05, 2.927333116531372e-05, 4.2829662561416626e-05, 5.638599395751953e-05, 6.994232535362244e-05, 8.349865674972534e-05, 9.705498814582825e-05, 0.00011061131954193115, 0.00012416765093803406, 0.00013772398233413696, 0.00015128031373023987, 0.00016483664512634277, 0.00017839297652244568, 0.00019194930791854858, 0.0002055056393146515, 0.0002190619707107544, 0.0002326183021068573, 0.0002461746335029602, 0.0002597309648990631, 0.000273287296295166, 0.0002868436276912689, 0.0003003999590873718, 0.00031395629048347473, 0.00032751262187957764, 0.00034106895327568054, 0.00035462528467178345, 0.00036818161606788635, 0.00038173794746398926, 0.00039529427886009216, 0.00040885061025619507, 0.000422406941652298, 0.0004359632730484009, 0.0004495196044445038, 0.0004630759358406067, 0.0004766322672367096, 0.0004901885986328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 14.0, 11.0, 11.0, 35.0, 40.0, 66.0, 108.0, 229.0, 976.0, 6056.0, 71367.0, 832968.0, 125746.0, 8947.0, 1273.0, 305.0, 124.0, 91.0, 50.0, 24.0, 19.0, 19.0, 9.0, 8.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.331939697265625, -1.28692626953125, -1.241912841796875, -1.1968994140625, -1.151885986328125, -1.10687255859375, -1.061859130859375, -1.016845703125, -0.971832275390625, -0.92681884765625, -0.881805419921875, -0.8367919921875, -0.791778564453125, -0.74676513671875, -0.701751708984375, -0.65673828125, -0.611724853515625, -0.56671142578125, -0.521697998046875, -0.4766845703125, -0.431671142578125, -0.38665771484375, -0.341644287109375, -0.296630859375, -0.251617431640625, -0.20660400390625, -0.161590576171875, -0.1165771484375, -0.071563720703125, -0.02655029296875, 0.018463134765625, 0.0634765625, 0.108489990234375, 0.15350341796875, 0.198516845703125, 0.2435302734375, 0.288543701171875, 0.33355712890625, 0.378570556640625, 0.423583984375, 0.468597412109375, 0.51361083984375, 0.558624267578125, 0.6036376953125, 0.648651123046875, 0.69366455078125, 0.738677978515625, 0.78369140625, 0.828704833984375, 0.87371826171875, 0.918731689453125, 0.9637451171875, 1.008758544921875, 1.05377197265625, 1.098785400390625, 1.143798828125, 1.188812255859375, 1.23382568359375, 1.278839111328125, 1.3238525390625, 1.368865966796875, 1.41387939453125, 1.458892822265625, 1.50390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 5.0, 1.0, 8.0, 4.0, 5.0, 17.0, 15.0, 16.0, 20.0, 29.0, 33.0, 42.0, 40.0, 50.0, 54.0, 68.0, 70.0, 59.0, 63.0, 69.0, 60.0, 46.0, 56.0, 27.0, 40.0, 30.0, 16.0, 17.0, 8.0, 12.0, 9.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1416015625, -0.1370220184326172, -0.13244247436523438, -0.12786293029785156, -0.12328338623046875, -0.11870384216308594, -0.11412429809570312, -0.10954475402832031, -0.1049652099609375, -0.10038566589355469, -0.09580612182617188, -0.09122657775878906, -0.08664703369140625, -0.08206748962402344, -0.07748794555664062, -0.07290840148925781, -0.068328857421875, -0.06374931335449219, -0.059169769287109375, -0.05459022521972656, -0.05001068115234375, -0.04543113708496094, -0.040851593017578125, -0.03627204895019531, -0.0316925048828125, -0.027112960815429688, -0.022533416748046875, -0.017953872680664062, -0.01337432861328125, -0.008794784545898438, -0.004215240478515625, 0.0003643035888671875, 0.00494384765625, 0.009523391723632812, 0.014102935791015625, 0.018682479858398438, 0.02326202392578125, 0.027841567993164062, 0.032421112060546875, 0.03700065612792969, 0.0415802001953125, 0.04615974426269531, 0.050739288330078125, 0.05531883239746094, 0.05989837646484375, 0.06447792053222656, 0.06905746459960938, 0.07363700866699219, 0.078216552734375, 0.08279609680175781, 0.08737564086914062, 0.09195518493652344, 0.09653472900390625, 0.10111427307128906, 0.10569381713867188, 0.11027336120605469, 0.1148529052734375, 0.11943244934082031, 0.12401199340820312, 0.12859153747558594, 0.13317108154296875, 0.13775062561035156, 0.14233016967773438, 0.1469097137451172, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 33.0, 121.0, 350.0, 322.0, 110.0, 40.0, 15.0, 3.0, 1.0, 3.0], "bins": [-31.517847061157227, -30.963668823242188, -30.40949058532715, -29.855310440063477, -29.301132202148438, -28.7469539642334, -28.19277572631836, -27.63859748840332, -27.08441925048828, -26.530241012573242, -25.976062774658203, -25.42188262939453, -24.867704391479492, -24.313526153564453, -23.759347915649414, -23.205169677734375, -22.650989532470703, -22.096811294555664, -21.542633056640625, -20.988452911376953, -20.434274673461914, -19.880096435546875, -19.325918197631836, -18.771739959716797, -18.217559814453125, -17.663381576538086, -17.109203338623047, -16.555023193359375, -16.000844955444336, -15.446666717529297, -14.892488479614258, -14.338310241699219, -13.784130096435547, -13.229951858520508, -12.675772666931152, -12.121594429016113, -11.567415237426758, -11.013236999511719, -10.45905876159668, -9.90488052368164, -9.350701332092285, -8.796523094177246, -8.24234390258789, -7.688165664672852, -7.133986949920654, -6.579808235168457, -6.025629997253418, -5.471451282501221, -4.917272567749023, -4.363093852996826, -3.808915376663208, -3.25473690032959, -2.7005581855773926, -2.1463794708251953, -1.5922009944915771, -1.038022518157959, -0.4838438034057617, 0.070334792137146, 0.6245133876800537, 1.1786919832229614, 1.7328705787658691, 2.2870492935180664, 2.8412277698516846, 3.3954062461853027, 3.9495849609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 10.0, 17.0, 23.0, 28.0, 29.0, 25.0, 41.0, 35.0, 65.0, 64.0, 65.0, 64.0, 56.0, 69.0, 60.0, 52.0, 54.0, 44.0, 49.0, 42.0, 26.0, 25.0, 15.0, 9.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.441911697387695, -4.322793006896973, -4.203674793243408, -4.0845561027526855, -3.965437889099121, -3.8463194370269775, -3.727200984954834, -3.6080825328826904, -3.488964080810547, -3.3698456287384033, -3.2507271766662598, -3.131608724594116, -3.0124902725219727, -2.893371820449829, -2.7742533683776855, -2.655134916305542, -2.5360164642333984, -2.416898012161255, -2.2977795600891113, -2.1786611080169678, -2.059542655944824, -1.9404242038726807, -1.821305751800537, -1.7021872997283936, -1.583068609237671, -1.4639501571655273, -1.3448317050933838, -1.2257132530212402, -1.1065948009490967, -0.9874762892723083, -0.8683578372001648, -0.7492393851280212, -0.6301209926605225, -0.5110025405883789, -0.39188408851623535, -0.2727656066417694, -0.15364715456962585, -0.03452867269515991, 0.08458977937698364, 0.2037082314491272, 0.32282668352127075, 0.4419451355934143, 0.5610635876655579, 0.6801820993423462, 0.7993005514144897, 0.9184190034866333, 1.0375374555587769, 1.1566559076309204, 1.275774359703064, 1.3948928117752075, 1.514011263847351, 1.6331297159194946, 1.7522481679916382, 1.8713667392730713, 1.9904851913452148, 2.1096036434173584, 2.228722095489502, 2.3478405475616455, 2.466958999633789, 2.5860774517059326, 2.705195903778076, 2.8243143558502197, 2.9434328079223633, 3.062551259994507, 3.1816697120666504]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 17.0, 26.0, 34.0, 74.0, 129.0, 257.0, 594.0, 1410.0, 3652.0, 10241.0, 35789.0, 192897.0, 631025.0, 131685.0, 27353.0, 8093.0, 2947.0, 1208.0, 529.0, 257.0, 131.0, 79.0, 47.0, 19.0, 13.0, 12.0, 11.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.174560546875, -2.08544921875, -1.996337890625, -1.9072265625, -1.818115234375, -1.72900390625, -1.639892578125, -1.55078125, -1.461669921875, -1.37255859375, -1.283447265625, -1.1943359375, -1.105224609375, -1.01611328125, -0.927001953125, -0.837890625, -0.748779296875, -0.65966796875, -0.570556640625, -0.4814453125, -0.392333984375, -0.30322265625, -0.214111328125, -0.125, -0.035888671875, 0.05322265625, 0.142333984375, 0.2314453125, 0.320556640625, 0.40966796875, 0.498779296875, 0.587890625, 0.677001953125, 0.76611328125, 0.855224609375, 0.9443359375, 1.033447265625, 1.12255859375, 1.211669921875, 1.30078125, 1.389892578125, 1.47900390625, 1.568115234375, 1.6572265625, 1.746337890625, 1.83544921875, 1.924560546875, 2.013671875, 2.102783203125, 2.19189453125, 2.281005859375, 2.3701171875, 2.459228515625, 2.54833984375, 2.637451171875, 2.7265625, 2.815673828125, 2.90478515625, 2.993896484375, 3.0830078125, 3.172119140625, 3.26123046875, 3.350341796875, 3.439453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 8.0, 5.0, 14.0, 24.0, 18.0, 20.0, 23.0, 24.0, 33.0, 30.0, 29.0, 42.0, 39.0, 43.0, 43.0, 46.0, 44.0, 32.0, 39.0, 42.0, 43.0, 44.0, 32.0, 31.0, 30.0, 27.0, 27.0, 21.0, 18.0, 16.0, 17.0, 17.0, 10.0, 10.0, 4.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.140625, -7.91253662109375, -7.6844482421875, -7.45635986328125, -7.228271484375, -7.00018310546875, -6.7720947265625, -6.54400634765625, -6.31591796875, -6.08782958984375, -5.8597412109375, -5.63165283203125, -5.403564453125, -5.17547607421875, -4.9473876953125, -4.71929931640625, -4.4912109375, -4.26312255859375, -4.0350341796875, -3.80694580078125, -3.578857421875, -3.35076904296875, -3.1226806640625, -2.89459228515625, -2.66650390625, -2.43841552734375, -2.2103271484375, -1.98223876953125, -1.754150390625, -1.52606201171875, -1.2979736328125, -1.06988525390625, -0.841796875, -0.61370849609375, -0.3856201171875, -0.15753173828125, 0.070556640625, 0.29864501953125, 0.5267333984375, 0.75482177734375, 0.98291015625, 1.21099853515625, 1.4390869140625, 1.66717529296875, 1.895263671875, 2.12335205078125, 2.3514404296875, 2.57952880859375, 2.8076171875, 3.03570556640625, 3.2637939453125, 3.49188232421875, 3.719970703125, 3.94805908203125, 4.1761474609375, 4.40423583984375, 4.63232421875, 4.86041259765625, 5.0885009765625, 5.31658935546875, 5.544677734375, 5.77276611328125, 6.0008544921875, 6.22894287109375, 6.45703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 12.0, 12.0, 12.0, 25.0, 31.0, 42.0, 56.0, 71.0, 102.0, 132.0, 222.0, 432.0, 1308.0, 10681.0, 573857.0, 449960.0, 9307.0, 1126.0, 394.0, 209.0, 144.0, 92.0, 65.0, 47.0, 44.0, 36.0, 21.0, 28.0, 8.0, 13.0, 8.0, 2.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.34765625, -7.12481689453125, -6.9019775390625, -6.67913818359375, -6.456298828125, -6.23345947265625, -6.0106201171875, -5.78778076171875, -5.56494140625, -5.34210205078125, -5.1192626953125, -4.89642333984375, -4.673583984375, -4.45074462890625, -4.2279052734375, -4.00506591796875, -3.7822265625, -3.55938720703125, -3.3365478515625, -3.11370849609375, -2.890869140625, -2.66802978515625, -2.4451904296875, -2.22235107421875, -1.99951171875, -1.77667236328125, -1.5538330078125, -1.33099365234375, -1.108154296875, -0.88531494140625, -0.6624755859375, -0.43963623046875, -0.216796875, 0.00604248046875, 0.2288818359375, 0.45172119140625, 0.674560546875, 0.89739990234375, 1.1202392578125, 1.34307861328125, 1.56591796875, 1.78875732421875, 2.0115966796875, 2.23443603515625, 2.457275390625, 2.68011474609375, 2.9029541015625, 3.12579345703125, 3.3486328125, 3.57147216796875, 3.7943115234375, 4.01715087890625, 4.239990234375, 4.46282958984375, 4.6856689453125, 4.90850830078125, 5.13134765625, 5.35418701171875, 5.5770263671875, 5.79986572265625, 6.022705078125, 6.24554443359375, 6.4683837890625, 6.69122314453125, 6.9140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 9.0, 6.0, 5.0, 11.0, 12.0, 13.0, 16.0, 18.0, 21.0, 25.0, 28.0, 19.0, 39.0, 34.0, 29.0, 38.0, 26.0, 44.0, 35.0, 41.0, 54.0, 45.0, 41.0, 27.0, 42.0, 33.0, 29.0, 31.0, 30.0, 27.0, 24.0, 17.0, 16.0, 21.0, 16.0, 17.0, 12.0, 7.0, 9.0, 1.0, 6.0, 1.0, 6.0, 5.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3046875, -7.06494140625, -6.8251953125, -6.58544921875, -6.345703125, -6.10595703125, -5.8662109375, -5.62646484375, -5.38671875, -5.14697265625, -4.9072265625, -4.66748046875, -4.427734375, -4.18798828125, -3.9482421875, -3.70849609375, -3.46875, -3.22900390625, -2.9892578125, -2.74951171875, -2.509765625, -2.27001953125, -2.0302734375, -1.79052734375, -1.55078125, -1.31103515625, -1.0712890625, -0.83154296875, -0.591796875, -0.35205078125, -0.1123046875, 0.12744140625, 0.3671875, 0.60693359375, 0.8466796875, 1.08642578125, 1.326171875, 1.56591796875, 1.8056640625, 2.04541015625, 2.28515625, 2.52490234375, 2.7646484375, 3.00439453125, 3.244140625, 3.48388671875, 3.7236328125, 3.96337890625, 4.203125, 4.44287109375, 4.6826171875, 4.92236328125, 5.162109375, 5.40185546875, 5.6416015625, 5.88134765625, 6.12109375, 6.36083984375, 6.6005859375, 6.84033203125, 7.080078125, 7.31982421875, 7.5595703125, 7.79931640625, 8.0390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 11.0, 29.0, 39.0, 54.0, 119.0, 214.0, 420.0, 1152.0, 3624.0, 16163.0, 129794.0, 815705.0, 66841.0, 10125.0, 2531.0, 913.0, 365.0, 178.0, 103.0, 50.0, 26.0, 27.0, 21.0, 13.0, 8.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.818359375, -0.7904891967773438, -0.7626190185546875, -0.7347488403320312, -0.706878662109375, -0.6790084838867188, -0.6511383056640625, -0.6232681274414062, -0.59539794921875, -0.5675277709960938, -0.5396575927734375, -0.5117874145507812, -0.483917236328125, -0.45604705810546875, -0.4281768798828125, -0.40030670166015625, -0.3724365234375, -0.34456634521484375, -0.3166961669921875, -0.28882598876953125, -0.260955810546875, -0.23308563232421875, -0.2052154541015625, -0.17734527587890625, -0.14947509765625, -0.12160491943359375, -0.0937347412109375, -0.06586456298828125, -0.037994384765625, -0.01012420654296875, 0.0177459716796875, 0.04561614990234375, 0.073486328125, 0.10135650634765625, 0.1292266845703125, 0.15709686279296875, 0.184967041015625, 0.21283721923828125, 0.2407073974609375, 0.26857757568359375, 0.29644775390625, 0.32431793212890625, 0.3521881103515625, 0.38005828857421875, 0.407928466796875, 0.43579864501953125, 0.4636688232421875, 0.49153900146484375, 0.5194091796875, 0.5472793579101562, 0.5751495361328125, 0.6030197143554688, 0.630889892578125, 0.6587600708007812, 0.6866302490234375, 0.7145004272460938, 0.74237060546875, 0.7702407836914062, 0.7981109619140625, 0.8259811401367188, 0.853851318359375, 0.8817214965820312, 0.9095916748046875, 0.9374618530273438, 0.96533203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 10.0, 3.0, 6.0, 23.0, 42.0, 41.0, 66.0, 121.0, 150.0, 182.0, 101.0, 77.0, 47.0, 30.0, 21.0, 14.0, 13.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011426210403442383, -0.00011033471673727036, -0.00010640732944011688, -0.00010247994214296341, -9.855255484580994e-05, -9.462516754865646e-05, -9.069778025150299e-05, -8.677039295434952e-05, -8.284300565719604e-05, -7.891561836004257e-05, -7.49882310628891e-05, -7.106084376573563e-05, -6.713345646858215e-05, -6.320606917142868e-05, -5.927868187427521e-05, -5.5351294577121735e-05, -5.142390727996826e-05, -4.749651998281479e-05, -4.3569132685661316e-05, -3.964174538850784e-05, -3.571435809135437e-05, -3.17869707942009e-05, -2.7859583497047424e-05, -2.393219619989395e-05, -2.000480890274048e-05, -1.6077421605587006e-05, -1.2150034308433533e-05, -8.22264701128006e-06, -4.295259714126587e-06, -3.67872416973114e-07, 3.559514880180359e-06, 7.486902177333832e-06, 1.1414289474487305e-05, 1.5341676771640778e-05, 1.926906406879425e-05, 2.3196451365947723e-05, 2.7123838663101196e-05, 3.105122596025467e-05, 3.497861325740814e-05, 3.8906000554561615e-05, 4.283338785171509e-05, 4.676077514886856e-05, 5.0688162446022034e-05, 5.4615549743175507e-05, 5.854293704032898e-05, 6.247032433748245e-05, 6.639771163463593e-05, 7.03250989317894e-05, 7.425248622894287e-05, 7.817987352609634e-05, 8.210726082324982e-05, 8.603464812040329e-05, 8.996203541755676e-05, 9.388942271471024e-05, 9.781681001186371e-05, 0.00010174419730901718, 0.00010567158460617065, 0.00010959897190332413, 0.0001135263592004776, 0.00011745374649763107, 0.00012138113379478455, 0.00012530852109193802, 0.0001292359083890915, 0.00013316329568624496, 0.00013709068298339844]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 8.0, 7.0, 15.0, 13.0, 25.0, 46.0, 56.0, 109.0, 204.0, 300.0, 692.0, 1510.0, 4056.0, 12234.0, 49897.0, 519401.0, 394488.0, 47036.0, 11734.0, 3774.0, 1459.0, 685.0, 315.0, 194.0, 106.0, 67.0, 34.0, 21.0, 20.0, 7.0, 10.0, 9.0, 3.0, 1.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65283203125, -0.6317596435546875, -0.610687255859375, -0.5896148681640625, -0.56854248046875, -0.5474700927734375, -0.526397705078125, -0.5053253173828125, -0.4842529296875, -0.4631805419921875, -0.442108154296875, -0.4210357666015625, -0.39996337890625, -0.3788909912109375, -0.357818603515625, -0.3367462158203125, -0.315673828125, -0.2946014404296875, -0.273529052734375, -0.2524566650390625, -0.23138427734375, -0.2103118896484375, -0.189239501953125, -0.1681671142578125, -0.1470947265625, -0.1260223388671875, -0.104949951171875, -0.0838775634765625, -0.06280517578125, -0.0417327880859375, -0.020660400390625, 0.0004119873046875, 0.021484375, 0.0425567626953125, 0.063629150390625, 0.0847015380859375, 0.10577392578125, 0.1268463134765625, 0.147918701171875, 0.1689910888671875, 0.1900634765625, 0.2111358642578125, 0.232208251953125, 0.2532806396484375, 0.27435302734375, 0.2954254150390625, 0.316497802734375, 0.3375701904296875, 0.358642578125, 0.3797149658203125, 0.400787353515625, 0.4218597412109375, 0.44293212890625, 0.4640045166015625, 0.485076904296875, 0.5061492919921875, 0.5272216796875, 0.5482940673828125, 0.569366455078125, 0.5904388427734375, 0.61151123046875, 0.6325836181640625, 0.653656005859375, 0.6747283935546875, 0.69580078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 6.0, 8.0, 10.0, 10.0, 6.0, 11.0, 21.0, 35.0, 43.0, 51.0, 46.0, 105.0, 175.0, 120.0, 71.0, 49.0, 52.0, 28.0, 21.0, 18.0, 21.0, 19.0, 6.0, 5.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.264404296875, -0.2572002410888672, -0.24999618530273438, -0.24279212951660156, -0.23558807373046875, -0.22838401794433594, -0.22117996215820312, -0.2139759063720703, -0.2067718505859375, -0.1995677947998047, -0.19236373901367188, -0.18515968322753906, -0.17795562744140625, -0.17075157165527344, -0.16354751586914062, -0.1563434600830078, -0.149139404296875, -0.1419353485107422, -0.13473129272460938, -0.12752723693847656, -0.12032318115234375, -0.11311912536621094, -0.10591506958007812, -0.09871101379394531, -0.0915069580078125, -0.08430290222167969, -0.07709884643554688, -0.06989479064941406, -0.06269073486328125, -0.05548667907714844, -0.048282623291015625, -0.04107856750488281, -0.03387451171875, -0.026670455932617188, -0.019466400146484375, -0.012262344360351562, -0.00505828857421875, 0.0021457672119140625, 0.009349822998046875, 0.016553878784179688, 0.0237579345703125, 0.030961990356445312, 0.038166046142578125, 0.04537010192871094, 0.05257415771484375, 0.05977821350097656, 0.06698226928710938, 0.07418632507324219, 0.081390380859375, 0.08859443664550781, 0.09579849243164062, 0.10300254821777344, 0.11020660400390625, 0.11741065979003906, 0.12461471557617188, 0.1318187713623047, 0.1390228271484375, 0.1462268829345703, 0.15343093872070312, 0.16063499450683594, 0.16783905029296875, 0.17504310607910156, 0.18224716186523438, 0.1894512176513672, 0.1966552734375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 61.0, 320.0, 473.0, 126.0, 25.0, 6.0, 2.0], "bins": [-75.66742706298828, -74.3896484375, -73.11187744140625, -71.8341064453125, -70.55632781982422, -69.27854919433594, -68.00077819824219, -66.72300720214844, -65.44522857666016, -64.16744995117188, -62.889678955078125, -61.61190414428711, -60.334129333496094, -59.05635452270508, -57.77857971191406, -56.50080490112305, -55.22303009033203, -53.945255279541016, -52.66748046875, -51.389705657958984, -50.11193084716797, -48.83415603637695, -47.55638122558594, -46.27860641479492, -45.000831604003906, -43.72305679321289, -42.445281982421875, -41.16750717163086, -39.889732360839844, -38.61195755004883, -37.33418273925781, -36.0564079284668, -34.77863693237305, -33.50086212158203, -32.223087310791016, -30.9453125, -29.667537689208984, -28.38976287841797, -27.111988067626953, -25.834213256835938, -24.55643653869629, -23.278661727905273, -22.000886917114258, -20.723112106323242, -19.445337295532227, -18.16756248474121, -16.889787673950195, -15.61201286315918, -14.334238052368164, -13.056463241577148, -11.778688430786133, -10.500913619995117, -9.223138809204102, -7.945363998413086, -6.66758918762207, -5.389814376831055, -4.112040042877197, -2.8342652320861816, -1.556490421295166, -0.2787156105041504, 0.9990592002868652, 2.276834011077881, 3.5546088218688965, 4.832383632659912, 6.110158443450928]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 13.0, 9.0, 9.0, 11.0, 14.0, 16.0, 19.0, 30.0, 21.0, 18.0, 34.0, 27.0, 41.0, 29.0, 23.0, 42.0, 42.0, 30.0, 41.0, 34.0, 45.0, 39.0, 37.0, 32.0, 27.0, 38.0, 27.0, 28.0, 32.0, 20.0, 24.0, 29.0, 24.0, 16.0, 11.0, 10.0, 11.0, 9.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.042387962341309, -10.688484191894531, -10.334579467773438, -9.98067569732666, -9.626770973205566, -9.272867202758789, -8.918962478637695, -8.565058708190918, -8.21115493774414, -7.857250690460205, -7.5033464431762695, -7.149442672729492, -6.795538425445557, -6.441634178161621, -6.0877299308776855, -5.73382568359375, -5.3799214363098145, -5.026017189025879, -4.672112941741943, -4.318208694458008, -3.9643049240112305, -3.610400676727295, -3.2564964294433594, -2.902592420578003, -2.5486881732940674, -2.194783926010132, -1.8408799171447754, -1.4869756698608398, -1.1330715417861938, -0.7791674137115479, -0.4252631664276123, -0.07135915756225586, 0.2825450897216797, 0.6364492177963257, 0.9903534054756165, 1.3442575931549072, 1.6981617212295532, 2.052065849304199, 2.4059700965881348, 2.759874105453491, 3.1137783527374268, 3.4676826000213623, 3.8215866088867188, 4.175490856170654, 4.52939510345459, 4.883298873901367, 5.237203598022461, 5.591107368469238, 5.945011615753174, 6.298915863037109, 6.652820110321045, 7.0067243576049805, 7.360628128051758, 7.714532375335693, 8.068436622619629, 8.422340393066406, 8.7762451171875, 9.130148887634277, 9.484053611755371, 9.837957382202148, 10.191862106323242, 10.54576587677002, 10.899669647216797, 11.25357437133789, 11.607478141784668]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 6.0, 8.0, 25.0, 27.0, 45.0, 69.0, 119.0, 214.0, 394.0, 828.0, 1715.0, 4468.0, 12219.0, 42664.0, 295240.0, 3206520.0, 542674.0, 61423.0, 15583.0, 5547.0, 2299.0, 1073.0, 520.0, 290.0, 129.0, 80.0, 37.0, 18.0, 15.0, 9.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4765625, -5.3309326171875, -5.185302734375, -5.0396728515625, -4.89404296875, -4.7484130859375, -4.602783203125, -4.4571533203125, -4.3115234375, -4.1658935546875, -4.020263671875, -3.8746337890625, -3.72900390625, -3.5833740234375, -3.437744140625, -3.2921142578125, -3.146484375, -3.0008544921875, -2.855224609375, -2.7095947265625, -2.56396484375, -2.4183349609375, -2.272705078125, -2.1270751953125, -1.9814453125, -1.8358154296875, -1.690185546875, -1.5445556640625, -1.39892578125, -1.2532958984375, -1.107666015625, -0.9620361328125, -0.81640625, -0.6707763671875, -0.525146484375, -0.3795166015625, -0.23388671875, -0.0882568359375, 0.057373046875, 0.2030029296875, 0.3486328125, 0.4942626953125, 0.639892578125, 0.7855224609375, 0.93115234375, 1.0767822265625, 1.222412109375, 1.3680419921875, 1.513671875, 1.6593017578125, 1.804931640625, 1.9505615234375, 2.09619140625, 2.2418212890625, 2.387451171875, 2.5330810546875, 2.6787109375, 2.8243408203125, 2.969970703125, 3.1156005859375, 3.26123046875, 3.4068603515625, 3.552490234375, 3.6981201171875, 3.84375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 14.0, 17.0, 26.0, 57.0, 51.0, 71.0, 69.0, 84.0, 94.0, 112.0, 91.0, 79.0, 75.0, 55.0, 33.0, 29.0, 15.0, 12.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.171875, -7.9898681640625, -7.807861328125, -7.6258544921875, -7.44384765625, -7.2618408203125, -7.079833984375, -6.8978271484375, -6.7158203125, -6.5338134765625, -6.351806640625, -6.1697998046875, -5.98779296875, -5.8057861328125, -5.623779296875, -5.4417724609375, -5.259765625, -5.0777587890625, -4.895751953125, -4.7137451171875, -4.53173828125, -4.3497314453125, -4.167724609375, -3.9857177734375, -3.8037109375, -3.6217041015625, -3.439697265625, -3.2576904296875, -3.07568359375, -2.8936767578125, -2.711669921875, -2.5296630859375, -2.34765625, -2.1656494140625, -1.983642578125, -1.8016357421875, -1.61962890625, -1.4376220703125, -1.255615234375, -1.0736083984375, -0.8916015625, -0.7095947265625, -0.527587890625, -0.3455810546875, -0.16357421875, 0.0184326171875, 0.200439453125, 0.3824462890625, 0.564453125, 0.7464599609375, 0.928466796875, 1.1104736328125, 1.29248046875, 1.4744873046875, 1.656494140625, 1.8385009765625, 2.0205078125, 2.2025146484375, 2.384521484375, 2.5665283203125, 2.74853515625, 2.9305419921875, 3.112548828125, 3.2945556640625, 3.4765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 12.0, 28.0, 57.0, 145.0, 999.0, 4190117.0, 2634.0, 185.0, 63.0, 17.0, 12.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-87.5, -85.661865234375, -83.82373046875, -81.985595703125, -80.1474609375, -78.309326171875, -76.47119140625, -74.633056640625, -72.794921875, -70.956787109375, -69.11865234375, -67.280517578125, -65.4423828125, -63.604248046875, -61.76611328125, -59.927978515625, -58.08984375, -56.251708984375, -54.41357421875, -52.575439453125, -50.7373046875, -48.899169921875, -47.06103515625, -45.222900390625, -43.384765625, -41.546630859375, -39.70849609375, -37.870361328125, -36.0322265625, -34.194091796875, -32.35595703125, -30.517822265625, -28.6796875, -26.841552734375, -25.00341796875, -23.165283203125, -21.3271484375, -19.489013671875, -17.65087890625, -15.812744140625, -13.974609375, -12.136474609375, -10.29833984375, -8.460205078125, -6.6220703125, -4.783935546875, -2.94580078125, -1.107666015625, 0.73046875, 2.568603515625, 4.40673828125, 6.244873046875, 8.0830078125, 9.921142578125, 11.75927734375, 13.597412109375, 15.435546875, 17.273681640625, 19.11181640625, 20.949951171875, 22.7880859375, 24.626220703125, 26.46435546875, 28.302490234375, 30.140625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 2.0, 11.0, 25.0, 31.0, 35.0, 49.0, 99.0, 145.0, 307.0, 674.0, 1305.0, 684.0, 302.0, 145.0, 89.0, 67.0, 38.0, 19.0, 14.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.59130859375, -1.5390625, -1.48681640625, -1.4345703125, -1.38232421875, -1.330078125, -1.27783203125, -1.2255859375, -1.17333984375, -1.12109375, -1.06884765625, -1.0166015625, -0.96435546875, -0.912109375, -0.85986328125, -0.8076171875, -0.75537109375, -0.703125, -0.65087890625, -0.5986328125, -0.54638671875, -0.494140625, -0.44189453125, -0.3896484375, -0.33740234375, -0.28515625, -0.23291015625, -0.1806640625, -0.12841796875, -0.076171875, -0.02392578125, 0.0283203125, 0.08056640625, 0.1328125, 0.18505859375, 0.2373046875, 0.28955078125, 0.341796875, 0.39404296875, 0.4462890625, 0.49853515625, 0.55078125, 0.60302734375, 0.6552734375, 0.70751953125, 0.759765625, 0.81201171875, 0.8642578125, 0.91650390625, 0.96875, 1.02099609375, 1.0732421875, 1.12548828125, 1.177734375, 1.22998046875, 1.2822265625, 1.33447265625, 1.38671875, 1.43896484375, 1.4912109375, 1.54345703125, 1.595703125, 1.64794921875, 1.7001953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 13.0, 21.0, 29.0, 68.0, 119.0, 195.0, 178.0, 178.0, 101.0, 54.0, 28.0, 9.0, 11.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.76431655883789, -15.431965827941895, -15.099614143371582, -14.767263412475586, -14.434911727905273, -14.102560997009277, -13.770210266113281, -13.437858581542969, -13.105507850646973, -12.773157119750977, -12.440805435180664, -12.108454704284668, -11.776103973388672, -11.44375228881836, -11.111401557922363, -10.779050827026367, -10.446699142456055, -10.114348411560059, -9.781996726989746, -9.44964599609375, -9.117294311523438, -8.784943580627441, -8.452592849731445, -8.120241165161133, -7.787890434265137, -7.455539226531982, -7.123188018798828, -6.790837287902832, -6.458486080169678, -6.126134872436523, -5.793784141540527, -5.461432933807373, -5.129082679748535, -4.796731472015381, -4.464380264282227, -4.1320295333862305, -3.799678325653076, -3.467327117919922, -3.1349761486053467, -2.8026251792907715, -2.470273971557617, -2.137922763824463, -1.8055717945098877, -1.473220705986023, -1.1408696174621582, -0.8085185289382935, -0.4761674404144287, -0.14381647109985352, 0.18853473663330078, 0.5208858251571655, 0.8532369136810303, 1.185588002204895, 1.5179390907287598, 1.8502901792526245, 2.1826412677764893, 2.5149922370910645, 2.8473434448242188, 3.179694652557373, 3.5120456218719482, 3.8443965911865234, 4.176747798919678, 4.509099006652832, 4.841449737548828, 5.173800945281982, 5.506152153015137]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 5.0, 6.0, 6.0, 18.0, 15.0, 25.0, 26.0, 47.0, 32.0, 46.0, 40.0, 59.0, 54.0, 62.0, 69.0, 60.0, 67.0, 62.0, 61.0, 53.0, 54.0, 30.0, 23.0, 18.0, 18.0, 13.0, 10.0, 4.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.992746829986572, -4.8575592041015625, -4.722371578216553, -4.587183475494385, -4.451995849609375, -4.316808223724365, -4.1816205978393555, -4.046432971954346, -3.911245107650757, -3.776057481765747, -3.640869617462158, -3.5056819915771484, -3.3704943656921387, -3.23530650138855, -3.10011887550354, -2.964931011199951, -2.8297433853149414, -2.6945557594299316, -2.5593678951263428, -2.424180269241333, -2.288992404937744, -2.1538047790527344, -2.0186171531677246, -1.8834294080734253, -1.748241662979126, -1.6130539178848267, -1.4778661727905273, -1.3426785469055176, -1.2074908018112183, -1.072303056716919, -0.9371153712272644, -0.8019276857376099, -0.6667399406433105, -0.5315521955490112, -0.3963645100593567, -0.26117679476737976, -0.12598907947540283, 0.009198665618896484, 0.14438635110855103, 0.27957403659820557, 0.4147617816925049, 0.5499495267868042, 0.6851372122764587, 0.8203248977661133, 0.9555126428604126, 1.090700387954712, 1.2258880138397217, 1.361075758934021, 1.4962635040283203, 1.6314512491226196, 1.766638994216919, 1.9018266201019287, 2.0370144844055176, 2.1722021102905273, 2.307389736175537, 2.442577362060547, 2.5777652263641357, 2.7129528522491455, 2.8481407165527344, 2.983328342437744, 3.118515968322754, 3.2537038326263428, 3.3888914585113525, 3.5240793228149414, 3.659266948699951]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 8.0, 10.0, 18.0, 25.0, 39.0, 40.0, 72.0, 108.0, 149.0, 260.0, 467.0, 679.0, 1155.0, 1990.0, 3574.0, 6718.0, 14377.0, 36318.0, 114518.0, 378253.0, 333452.0, 97491.0, 31672.0, 12803.0, 6281.0, 3305.0, 1877.0, 1102.0, 657.0, 407.0, 258.0, 171.0, 99.0, 61.0, 40.0, 28.0, 29.0, 9.0, 12.0, 2.0, 5.0, 0.0, 3.0, 5.0, 1.0, 1.0, 5.0], "bins": [-1.2734375, -1.2389602661132812, -1.2044830322265625, -1.1700057983398438, -1.135528564453125, -1.1010513305664062, -1.0665740966796875, -1.0320968627929688, -0.99761962890625, -0.9631423950195312, -0.9286651611328125, -0.8941879272460938, -0.859710693359375, -0.8252334594726562, -0.7907562255859375, -0.7562789916992188, -0.7218017578125, -0.6873245239257812, -0.6528472900390625, -0.6183700561523438, -0.583892822265625, -0.5494155883789062, -0.5149383544921875, -0.48046112060546875, -0.44598388671875, -0.41150665283203125, -0.3770294189453125, -0.34255218505859375, -0.308074951171875, -0.27359771728515625, -0.2391204833984375, -0.20464324951171875, -0.170166015625, -0.13568878173828125, -0.1012115478515625, -0.06673431396484375, -0.032257080078125, 0.00222015380859375, 0.0366973876953125, 0.07117462158203125, 0.10565185546875, 0.14012908935546875, 0.1746063232421875, 0.20908355712890625, 0.243560791015625, 0.27803802490234375, 0.3125152587890625, 0.34699249267578125, 0.3814697265625, 0.41594696044921875, 0.4504241943359375, 0.48490142822265625, 0.519378662109375, 0.5538558959960938, 0.5883331298828125, 0.6228103637695312, 0.65728759765625, 0.6917648315429688, 0.7262420654296875, 0.7607192993164062, 0.795196533203125, 0.8296737670898438, 0.8641510009765625, 0.8986282348632812, 0.93310546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 4.0, 11.0, 12.0, 18.0, 39.0, 24.0, 41.0, 55.0, 60.0, 77.0, 70.0, 82.0, 88.0, 79.0, 66.0, 82.0, 60.0, 40.0, 29.0, 21.0, 13.0, 11.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.46484375, -4.346405029296875, -4.22796630859375, -4.109527587890625, -3.9910888671875, -3.872650146484375, -3.75421142578125, -3.635772705078125, -3.517333984375, -3.398895263671875, -3.28045654296875, -3.162017822265625, -3.0435791015625, -2.925140380859375, -2.80670166015625, -2.688262939453125, -2.56982421875, -2.451385498046875, -2.33294677734375, -2.214508056640625, -2.0960693359375, -1.977630615234375, -1.85919189453125, -1.740753173828125, -1.622314453125, -1.503875732421875, -1.38543701171875, -1.266998291015625, -1.1485595703125, -1.030120849609375, -0.91168212890625, -0.793243408203125, -0.6748046875, -0.556365966796875, -0.43792724609375, -0.319488525390625, -0.2010498046875, -0.082611083984375, 0.03582763671875, 0.154266357421875, 0.272705078125, 0.391143798828125, 0.50958251953125, 0.628021240234375, 0.7464599609375, 0.864898681640625, 0.98333740234375, 1.101776123046875, 1.22021484375, 1.338653564453125, 1.45709228515625, 1.575531005859375, 1.6939697265625, 1.812408447265625, 1.93084716796875, 2.049285888671875, 2.167724609375, 2.286163330078125, 2.40460205078125, 2.523040771484375, 2.6414794921875, 2.759918212890625, 2.87835693359375, 2.996795654296875, 3.115234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 8.0, 6.0, 6.0, 7.0, 11.0, 11.0, 20.0, 16.0, 33.0, 57.0, 65.0, 122.0, 162.0, 261.0, 454.0, 770.0, 1418.0, 2752.0, 5952.0, 13823.0, 40045.0, 147418.0, 470631.0, 260065.0, 66986.0, 21064.0, 8371.0, 3673.0, 1810.0, 991.0, 565.0, 312.0, 213.0, 134.0, 98.0, 53.0, 40.0, 38.0, 29.0, 18.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.9599609375, -0.9306106567382812, -0.9012603759765625, -0.8719100952148438, -0.842559814453125, -0.8132095336914062, -0.7838592529296875, -0.7545089721679688, -0.72515869140625, -0.6958084106445312, -0.6664581298828125, -0.6371078491210938, -0.607757568359375, -0.5784072875976562, -0.5490570068359375, -0.5197067260742188, -0.4903564453125, -0.46100616455078125, -0.4316558837890625, -0.40230560302734375, -0.372955322265625, -0.34360504150390625, -0.3142547607421875, -0.28490447998046875, -0.25555419921875, -0.22620391845703125, -0.1968536376953125, -0.16750335693359375, -0.138153076171875, -0.10880279541015625, -0.0794525146484375, -0.05010223388671875, -0.020751953125, 0.00859832763671875, 0.0379486083984375, 0.06729888916015625, 0.096649169921875, 0.12599945068359375, 0.1553497314453125, 0.18470001220703125, 0.21405029296875, 0.24340057373046875, 0.2727508544921875, 0.30210113525390625, 0.331451416015625, 0.36080169677734375, 0.3901519775390625, 0.41950225830078125, 0.4488525390625, 0.47820281982421875, 0.5075531005859375, 0.5369033813476562, 0.566253662109375, 0.5956039428710938, 0.6249542236328125, 0.6543045043945312, 0.68365478515625, 0.7130050659179688, 0.7423553466796875, 0.7717056274414062, 0.801055908203125, 0.8304061889648438, 0.8597564697265625, 0.8891067504882812, 0.91845703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 8.0, 7.0, 6.0, 8.0, 12.0, 15.0, 15.0, 19.0, 20.0, 29.0, 28.0, 29.0, 35.0, 42.0, 31.0, 38.0, 45.0, 38.0, 46.0, 32.0, 46.0, 49.0, 41.0, 38.0, 40.0, 34.0, 30.0, 26.0, 23.0, 27.0, 18.0, 14.0, 10.0, 11.0, 11.0, 13.0, 13.0, 12.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.4140625, -3.30328369140625, -3.1925048828125, -3.08172607421875, -2.970947265625, -2.86016845703125, -2.7493896484375, -2.63861083984375, -2.52783203125, -2.41705322265625, -2.3062744140625, -2.19549560546875, -2.084716796875, -1.97393798828125, -1.8631591796875, -1.75238037109375, -1.6416015625, -1.53082275390625, -1.4200439453125, -1.30926513671875, -1.198486328125, -1.08770751953125, -0.9769287109375, -0.86614990234375, -0.75537109375, -0.64459228515625, -0.5338134765625, -0.42303466796875, -0.312255859375, -0.20147705078125, -0.0906982421875, 0.02008056640625, 0.130859375, 0.24163818359375, 0.3524169921875, 0.46319580078125, 0.573974609375, 0.68475341796875, 0.7955322265625, 0.90631103515625, 1.01708984375, 1.12786865234375, 1.2386474609375, 1.34942626953125, 1.460205078125, 1.57098388671875, 1.6817626953125, 1.79254150390625, 1.9033203125, 2.01409912109375, 2.1248779296875, 2.23565673828125, 2.346435546875, 2.45721435546875, 2.5679931640625, 2.67877197265625, 2.78955078125, 2.90032958984375, 3.0111083984375, 3.12188720703125, 3.232666015625, 3.34344482421875, 3.4542236328125, 3.56500244140625, 3.67578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 18.0, 14.0, 26.0, 39.0, 71.0, 136.0, 160.0, 290.0, 474.0, 831.0, 1614.0, 3300.0, 7315.0, 18005.0, 56233.0, 257369.0, 532304.0, 117515.0, 31218.0, 11637.0, 4852.0, 2283.0, 1221.0, 693.0, 347.0, 219.0, 130.0, 74.0, 50.0, 35.0, 26.0, 15.0, 7.0, 4.0, 9.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35498046875, -0.34430694580078125, -0.3336334228515625, -0.32295989990234375, -0.312286376953125, -0.30161285400390625, -0.2909393310546875, -0.28026580810546875, -0.26959228515625, -0.25891876220703125, -0.2482452392578125, -0.23757171630859375, -0.226898193359375, -0.21622467041015625, -0.2055511474609375, -0.19487762451171875, -0.1842041015625, -0.17353057861328125, -0.1628570556640625, -0.15218353271484375, -0.141510009765625, -0.13083648681640625, -0.1201629638671875, -0.10948944091796875, -0.09881591796875, -0.08814239501953125, -0.0774688720703125, -0.06679534912109375, -0.056121826171875, -0.04544830322265625, -0.0347747802734375, -0.02410125732421875, -0.013427734375, -0.00275421142578125, 0.0079193115234375, 0.01859283447265625, 0.029266357421875, 0.03993988037109375, 0.0506134033203125, 0.06128692626953125, 0.07196044921875, 0.08263397216796875, 0.0933074951171875, 0.10398101806640625, 0.114654541015625, 0.12532806396484375, 0.1360015869140625, 0.14667510986328125, 0.1573486328125, 0.16802215576171875, 0.1786956787109375, 0.18936920166015625, 0.200042724609375, 0.21071624755859375, 0.2213897705078125, 0.23206329345703125, 0.24273681640625, 0.25341033935546875, 0.2640838623046875, 0.27475738525390625, 0.285430908203125, 0.29610443115234375, 0.3067779541015625, 0.31745147705078125, 0.328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 4.0, 7.0, 12.0, 30.0, 25.0, 51.0, 91.0, 123.0, 155.0, 153.0, 112.0, 63.0, 43.0, 38.0, 17.0, 16.0, 12.0, 7.0, 8.0, 7.0, 7.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002105236053466797, -0.00019943341612815857, -0.00018834322690963745, -0.00017725303769111633, -0.00016616284847259521, -0.0001550726592540741, -0.00014398247003555298, -0.00013289228081703186, -0.00012180209159851074, -0.00011071190237998962, -9.96217131614685e-05, -8.853152394294739e-05, -7.744133472442627e-05, -6.635114550590515e-05, -5.526095628738403e-05, -4.4170767068862915e-05, -3.30805778503418e-05, -2.199038863182068e-05, -1.090019941329956e-05, 1.8998980522155762e-07, 1.1280179023742676e-05, 2.2370368242263794e-05, 3.346055746078491e-05, 4.455074667930603e-05, 5.564093589782715e-05, 6.673112511634827e-05, 7.782131433486938e-05, 8.89115035533905e-05, 0.00010000169277191162, 0.00011109188199043274, 0.00012218207120895386, 0.00013327226042747498, 0.0001443624496459961, 0.0001554526388645172, 0.00016654282808303833, 0.00017763301730155945, 0.00018872320652008057, 0.00019981339573860168, 0.0002109035849571228, 0.00022199377417564392, 0.00023308396339416504, 0.00024417415261268616, 0.0002552643418312073, 0.0002663545310497284, 0.0002774447202682495, 0.00028853490948677063, 0.00029962509870529175, 0.00031071528792381287, 0.000321805477142334, 0.0003328956663608551, 0.0003439858555793762, 0.00035507604479789734, 0.00036616623401641846, 0.0003772564232349396, 0.0003883466124534607, 0.0003994368016719818, 0.00041052699089050293, 0.00042161718010902405, 0.00043270736932754517, 0.0004437975585460663, 0.0004548877477645874, 0.0004659779369831085, 0.00047706812620162964, 0.00048815831542015076, 0.0004992485046386719]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 11.0, 17.0, 10.0, 22.0, 14.0, 32.0, 51.0, 62.0, 99.0, 210.0, 426.0, 978.0, 2767.0, 10401.0, 98433.0, 860371.0, 62425.0, 8180.0, 2253.0, 853.0, 413.0, 186.0, 100.0, 59.0, 38.0, 31.0, 22.0, 10.0, 10.0, 11.0, 12.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8740234375, -0.8470687866210938, -0.8201141357421875, -0.7931594848632812, -0.766204833984375, -0.7392501831054688, -0.7122955322265625, -0.6853408813476562, -0.65838623046875, -0.6314315795898438, -0.6044769287109375, -0.5775222778320312, -0.550567626953125, -0.5236129760742188, -0.4966583251953125, -0.46970367431640625, -0.4427490234375, -0.41579437255859375, -0.3888397216796875, -0.36188507080078125, -0.334930419921875, -0.30797576904296875, -0.2810211181640625, -0.25406646728515625, -0.22711181640625, -0.20015716552734375, -0.1732025146484375, -0.14624786376953125, -0.119293212890625, -0.09233856201171875, -0.0653839111328125, -0.03842926025390625, -0.011474609375, 0.01548004150390625, 0.0424346923828125, 0.06938934326171875, 0.096343994140625, 0.12329864501953125, 0.1502532958984375, 0.17720794677734375, 0.20416259765625, 0.23111724853515625, 0.2580718994140625, 0.28502655029296875, 0.311981201171875, 0.33893585205078125, 0.3658905029296875, 0.39284515380859375, 0.4197998046875, 0.44675445556640625, 0.4737091064453125, 0.5006637573242188, 0.527618408203125, 0.5545730590820312, 0.5815277099609375, 0.6084823608398438, 0.63543701171875, 0.6623916625976562, 0.6893463134765625, 0.7163009643554688, 0.743255615234375, 0.7702102661132812, 0.7971649169921875, 0.8241195678710938, 0.85107421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 9.0, 9.0, 22.0, 12.0, 17.0, 23.0, 42.0, 40.0, 49.0, 67.0, 72.0, 70.0, 105.0, 80.0, 79.0, 56.0, 49.0, 37.0, 31.0, 28.0, 21.0, 13.0, 9.0, 9.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08489990234375, -0.08214282989501953, -0.07938575744628906, -0.0766286849975586, -0.07387161254882812, -0.07111454010009766, -0.06835746765136719, -0.06560039520263672, -0.06284332275390625, -0.06008625030517578, -0.05732917785644531, -0.054572105407714844, -0.051815032958984375, -0.049057960510253906, -0.04630088806152344, -0.04354381561279297, -0.0407867431640625, -0.03802967071533203, -0.03527259826660156, -0.032515525817871094, -0.029758453369140625, -0.027001380920410156, -0.024244308471679688, -0.02148723602294922, -0.01873016357421875, -0.01597309112548828, -0.013216018676757812, -0.010458946228027344, -0.007701873779296875, -0.004944801330566406, -0.0021877288818359375, 0.0005693435668945312, 0.003326416015625, 0.006083488464355469, 0.008840560913085938, 0.011597633361816406, 0.014354705810546875, 0.017111778259277344, 0.019868850708007812, 0.02262592315673828, 0.02538299560546875, 0.02814006805419922, 0.030897140502929688, 0.033654212951660156, 0.036411285400390625, 0.039168357849121094, 0.04192543029785156, 0.04468250274658203, 0.0474395751953125, 0.05019664764404297, 0.05295372009277344, 0.055710792541503906, 0.058467864990234375, 0.061224937438964844, 0.06398200988769531, 0.06673908233642578, 0.06949615478515625, 0.07225322723388672, 0.07501029968261719, 0.07776737213134766, 0.08052444458007812, 0.0832815170288086, 0.08603858947753906, 0.08879566192626953, 0.091552734375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 32.0, 44.0, 103.0, 234.0, 246.0, 189.0, 62.0, 46.0, 22.0, 7.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.347467422485352, -12.080865859985352, -11.814263343811035, -11.547661781311035, -11.281060218811035, -11.014457702636719, -10.747856140136719, -10.481254577636719, -10.214653015136719, -9.948051452636719, -9.681448936462402, -9.414847373962402, -9.148245811462402, -8.881643295288086, -8.615041732788086, -8.348440170288086, -8.08183765411377, -7.815235614776611, -7.548634052276611, -7.282032012939453, -7.015430450439453, -6.748828411102295, -6.482226371765137, -6.215624809265137, -5.9490227699279785, -5.68242073059082, -5.41581916809082, -5.149217128753662, -4.882615089416504, -4.616013526916504, -4.349411487579346, -4.0828094482421875, -3.8162078857421875, -3.5496060848236084, -3.2830042839050293, -3.016402244567871, -2.749800443649292, -2.483198642730713, -2.2165966033935547, -1.9499948024749756, -1.6833930015563965, -1.4167912006378174, -1.1501892805099487, -0.8835874199867249, -0.616985559463501, -0.3503837585449219, -0.08378183841705322, 0.18282008171081543, 0.44942188262939453, 0.7160237431526184, 0.9826256036758423, 1.249227523803711, 1.51582932472229, 1.7824311256408691, 2.0490331649780273, 2.3156349658966064, 2.5822367668151855, 2.8488385677337646, 3.1154403686523438, 3.382042407989502, 3.648644208908081, 3.91524600982666, 4.181848049163818, 4.448450088500977, 4.715051651000977]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 5.0, 7.0, 19.0, 23.0, 29.0, 43.0, 61.0, 45.0, 60.0, 80.0, 74.0, 91.0, 91.0, 74.0, 75.0, 66.0, 47.0, 22.0, 32.0, 15.0, 13.0, 8.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.14798641204834, -4.033320426940918, -3.918654203414917, -3.803987979888916, -3.689321994781494, -3.574655771255493, -3.459989547729492, -3.3453235626220703, -3.2306575775146484, -3.1159913539886475, -3.0013253688812256, -2.8866591453552246, -2.7719931602478027, -2.6573269367218018, -2.542660713195801, -2.427994728088379, -2.313328504562378, -2.198662281036377, -2.083996295928955, -1.969330072402954, -1.8546640872955322, -1.7399978637695312, -1.6253317594528198, -1.5106656551361084, -1.395999550819397, -1.2813334465026855, -1.1666673421859741, -1.0520012378692627, -0.9373350739479065, -0.8226689696311951, -0.7080028057098389, -0.5933367013931274, -0.4786708354949951, -0.3640047311782837, -0.24933859705924988, -0.13467246294021606, -0.02000635862350464, 0.09465974569320679, 0.209325909614563, 0.3239920139312744, 0.43865811824798584, 0.5533242225646973, 0.6679903268814087, 0.7826564908027649, 0.8973225951194763, 1.011988639831543, 1.126654863357544, 1.2413209676742554, 1.3559870719909668, 1.4706531763076782, 1.5853192806243896, 1.6999855041503906, 1.8146514892578125, 1.9293177127838135, 2.0439839363098145, 2.1586499214172363, 2.273315906524658, 2.387982130050659, 2.502648115158081, 2.617314338684082, 2.731980323791504, 2.846646547317505, 2.961312770843506, 3.0759787559509277, 3.1906449794769287]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 12.0, 8.0, 19.0, 24.0, 30.0, 48.0, 94.0, 124.0, 210.0, 366.0, 604.0, 991.0, 1683.0, 3011.0, 5455.0, 10718.0, 22240.0, 60584.0, 360490.0, 459299.0, 72454.0, 24917.0, 11353.0, 5982.0, 3225.0, 1883.0, 1032.0, 636.0, 382.0, 246.0, 131.0, 111.0, 60.0, 51.0, 27.0, 18.0, 4.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-2.4140625, -2.34521484375, -2.2763671875, -2.20751953125, -2.138671875, -2.06982421875, -2.0009765625, -1.93212890625, -1.86328125, -1.79443359375, -1.7255859375, -1.65673828125, -1.587890625, -1.51904296875, -1.4501953125, -1.38134765625, -1.3125, -1.24365234375, -1.1748046875, -1.10595703125, -1.037109375, -0.96826171875, -0.8994140625, -0.83056640625, -0.76171875, -0.69287109375, -0.6240234375, -0.55517578125, -0.486328125, -0.41748046875, -0.3486328125, -0.27978515625, -0.2109375, -0.14208984375, -0.0732421875, -0.00439453125, 0.064453125, 0.13330078125, 0.2021484375, 0.27099609375, 0.33984375, 0.40869140625, 0.4775390625, 0.54638671875, 0.615234375, 0.68408203125, 0.7529296875, 0.82177734375, 0.890625, 0.95947265625, 1.0283203125, 1.09716796875, 1.166015625, 1.23486328125, 1.3037109375, 1.37255859375, 1.44140625, 1.51025390625, 1.5791015625, 1.64794921875, 1.716796875, 1.78564453125, 1.8544921875, 1.92333984375, 1.9921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 13.0, 12.0, 16.0, 20.0, 15.0, 29.0, 23.0, 34.0, 49.0, 25.0, 46.0, 52.0, 42.0, 61.0, 40.0, 47.0, 42.0, 52.0, 46.0, 45.0, 29.0, 39.0, 23.0, 34.0, 22.0, 17.0, 18.0, 10.0, 15.0, 7.0, 13.0, 9.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.63671875, -5.4742431640625, -5.311767578125, -5.1492919921875, -4.98681640625, -4.8243408203125, -4.661865234375, -4.4993896484375, -4.3369140625, -4.1744384765625, -4.011962890625, -3.8494873046875, -3.68701171875, -3.5245361328125, -3.362060546875, -3.1995849609375, -3.037109375, -2.8746337890625, -2.712158203125, -2.5496826171875, -2.38720703125, -2.2247314453125, -2.062255859375, -1.8997802734375, -1.7373046875, -1.5748291015625, -1.412353515625, -1.2498779296875, -1.08740234375, -0.9249267578125, -0.762451171875, -0.5999755859375, -0.4375, -0.2750244140625, -0.112548828125, 0.0499267578125, 0.21240234375, 0.3748779296875, 0.537353515625, 0.6998291015625, 0.8623046875, 1.0247802734375, 1.187255859375, 1.3497314453125, 1.51220703125, 1.6746826171875, 1.837158203125, 1.9996337890625, 2.162109375, 2.3245849609375, 2.487060546875, 2.6495361328125, 2.81201171875, 2.9744873046875, 3.136962890625, 3.2994384765625, 3.4619140625, 3.6243896484375, 3.786865234375, 3.9493408203125, 4.11181640625, 4.2742919921875, 4.436767578125, 4.5992431640625, 4.76171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 1.0, 9.0, 8.0, 6.0, 15.0, 16.0, 19.0, 15.0, 27.0, 32.0, 30.0, 29.0, 47.0, 46.0, 68.0, 78.0, 331.0, 8335.0, 1032146.0, 6557.0, 277.0, 95.0, 57.0, 38.0, 38.0, 46.0, 17.0, 27.0, 25.0, 20.0, 19.0, 22.0, 10.0, 7.0, 4.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.5625, -18.0535888671875, -17.544677734375, -17.0357666015625, -16.52685546875, -16.0179443359375, -15.509033203125, -15.0001220703125, -14.4912109375, -13.9822998046875, -13.473388671875, -12.9644775390625, -12.45556640625, -11.9466552734375, -11.437744140625, -10.9288330078125, -10.419921875, -9.9110107421875, -9.402099609375, -8.8931884765625, -8.38427734375, -7.8753662109375, -7.366455078125, -6.8575439453125, -6.3486328125, -5.8397216796875, -5.330810546875, -4.8218994140625, -4.31298828125, -3.8040771484375, -3.295166015625, -2.7862548828125, -2.27734375, -1.7684326171875, -1.259521484375, -0.7506103515625, -0.24169921875, 0.2672119140625, 0.776123046875, 1.2850341796875, 1.7939453125, 2.3028564453125, 2.811767578125, 3.3206787109375, 3.82958984375, 4.3385009765625, 4.847412109375, 5.3563232421875, 5.865234375, 6.3741455078125, 6.883056640625, 7.3919677734375, 7.90087890625, 8.4097900390625, 8.918701171875, 9.4276123046875, 9.9365234375, 10.4454345703125, 10.954345703125, 11.4632568359375, 11.97216796875, 12.4810791015625, 12.989990234375, 13.4989013671875, 14.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 3.0, 8.0, 14.0, 5.0, 11.0, 16.0, 19.0, 19.0, 33.0, 25.0, 33.0, 23.0, 39.0, 35.0, 51.0, 48.0, 51.0, 54.0, 37.0, 38.0, 41.0, 51.0, 36.0, 35.0, 46.0, 34.0, 18.0, 29.0, 23.0, 18.0, 22.0, 20.0, 12.0, 11.0, 5.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.6875, -6.50421142578125, -6.3209228515625, -6.13763427734375, -5.954345703125, -5.77105712890625, -5.5877685546875, -5.40447998046875, -5.22119140625, -5.03790283203125, -4.8546142578125, -4.67132568359375, -4.488037109375, -4.30474853515625, -4.1214599609375, -3.93817138671875, -3.7548828125, -3.57159423828125, -3.3883056640625, -3.20501708984375, -3.021728515625, -2.83843994140625, -2.6551513671875, -2.47186279296875, -2.28857421875, -2.10528564453125, -1.9219970703125, -1.73870849609375, -1.555419921875, -1.37213134765625, -1.1888427734375, -1.00555419921875, -0.822265625, -0.63897705078125, -0.4556884765625, -0.27239990234375, -0.089111328125, 0.09417724609375, 0.2774658203125, 0.46075439453125, 0.64404296875, 0.82733154296875, 1.0106201171875, 1.19390869140625, 1.377197265625, 1.56048583984375, 1.7437744140625, 1.92706298828125, 2.1103515625, 2.29364013671875, 2.4769287109375, 2.66021728515625, 2.843505859375, 3.02679443359375, 3.2100830078125, 3.39337158203125, 3.57666015625, 3.75994873046875, 3.9432373046875, 4.12652587890625, 4.309814453125, 4.49310302734375, 4.6763916015625, 4.85968017578125, 5.04296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 7.0, 13.0, 8.0, 20.0, 25.0, 37.0, 59.0, 93.0, 139.0, 222.0, 365.0, 657.0, 1382.0, 3288.0, 9069.0, 32897.0, 703880.0, 254593.0, 27883.0, 8064.0, 2946.0, 1283.0, 632.0, 351.0, 217.0, 134.0, 83.0, 60.0, 40.0, 20.0, 23.0, 13.0, 6.0, 11.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2958984375, -1.256561279296875, -1.21722412109375, -1.177886962890625, -1.1385498046875, -1.099212646484375, -1.05987548828125, -1.020538330078125, -0.981201171875, -0.941864013671875, -0.90252685546875, -0.863189697265625, -0.8238525390625, -0.784515380859375, -0.74517822265625, -0.705841064453125, -0.66650390625, -0.627166748046875, -0.58782958984375, -0.548492431640625, -0.5091552734375, -0.469818115234375, -0.43048095703125, -0.391143798828125, -0.351806640625, -0.312469482421875, -0.27313232421875, -0.233795166015625, -0.1944580078125, -0.155120849609375, -0.11578369140625, -0.076446533203125, -0.037109375, 0.002227783203125, 0.04156494140625, 0.080902099609375, 0.1202392578125, 0.159576416015625, 0.19891357421875, 0.238250732421875, 0.277587890625, 0.316925048828125, 0.35626220703125, 0.395599365234375, 0.4349365234375, 0.474273681640625, 0.51361083984375, 0.552947998046875, 0.59228515625, 0.631622314453125, 0.67095947265625, 0.710296630859375, 0.7496337890625, 0.788970947265625, 0.82830810546875, 0.867645263671875, 0.906982421875, 0.946319580078125, 0.98565673828125, 1.024993896484375, 1.0643310546875, 1.103668212890625, 1.14300537109375, 1.182342529296875, 1.2216796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 5.0, 8.0, 22.0, 16.0, 23.0, 30.0, 55.0, 114.0, 236.0, 226.0, 83.0, 65.0, 25.0, 19.0, 13.0, 5.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016188621520996094, -0.0001572445034980774, -0.00015260279178619385, -0.0001479610800743103, -0.00014331936836242676, -0.0001386776566505432, -0.00013403594493865967, -0.00012939423322677612, -0.00012475252151489258, -0.00012011080980300903, -0.00011546909809112549, -0.00011082738637924194, -0.0001061856746673584, -0.00010154396295547485, -9.690225124359131e-05, -9.226053953170776e-05, -8.761882781982422e-05, -8.297711610794067e-05, -7.833540439605713e-05, -7.369369268417358e-05, -6.905198097229004e-05, -6.44102692604065e-05, -5.976855754852295e-05, -5.5126845836639404e-05, -5.048513412475586e-05, -4.5843422412872314e-05, -4.120171070098877e-05, -3.6559998989105225e-05, -3.191828727722168e-05, -2.7276575565338135e-05, -2.263486385345459e-05, -1.7993152141571045e-05, -1.33514404296875e-05, -8.709728717803955e-06, -4.06801700592041e-06, 5.736947059631348e-07, 5.21540641784668e-06, 9.857118129730225e-06, 1.449882984161377e-05, 1.9140541553497314e-05, 2.378225326538086e-05, 2.8423964977264404e-05, 3.306567668914795e-05, 3.7707388401031494e-05, 4.234910011291504e-05, 4.6990811824798584e-05, 5.163252353668213e-05, 5.6274235248565674e-05, 6.091594696044922e-05, 6.555765867233276e-05, 7.019937038421631e-05, 7.484108209609985e-05, 7.94827938079834e-05, 8.412450551986694e-05, 8.876621723175049e-05, 9.340792894363403e-05, 9.804964065551758e-05, 0.00010269135236740112, 0.00010733306407928467, 0.00011197477579116821, 0.00011661648750305176, 0.0001212581992149353, 0.00012589991092681885, 0.0001305416226387024, 0.00013518333435058594]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 1.0, 6.0, 12.0, 13.0, 12.0, 19.0, 25.0, 56.0, 56.0, 85.0, 92.0, 167.0, 301.0, 444.0, 869.0, 1661.0, 3638.0, 9532.0, 32619.0, 288354.0, 655372.0, 36902.0, 10306.0, 3903.0, 1795.0, 905.0, 555.0, 294.0, 197.0, 119.0, 82.0, 55.0, 30.0, 19.0, 17.0, 12.0, 5.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.028076171875, -0.99267578125, -0.957275390625, -0.921875, -0.886474609375, -0.85107421875, -0.815673828125, -0.7802734375, -0.744873046875, -0.70947265625, -0.674072265625, -0.638671875, -0.603271484375, -0.56787109375, -0.532470703125, -0.4970703125, -0.461669921875, -0.42626953125, -0.390869140625, -0.35546875, -0.320068359375, -0.28466796875, -0.249267578125, -0.2138671875, -0.178466796875, -0.14306640625, -0.107666015625, -0.072265625, -0.036865234375, -0.00146484375, 0.033935546875, 0.0693359375, 0.104736328125, 0.14013671875, 0.175537109375, 0.2109375, 0.246337890625, 0.28173828125, 0.317138671875, 0.3525390625, 0.387939453125, 0.42333984375, 0.458740234375, 0.494140625, 0.529541015625, 0.56494140625, 0.600341796875, 0.6357421875, 0.671142578125, 0.70654296875, 0.741943359375, 0.77734375, 0.812744140625, 0.84814453125, 0.883544921875, 0.9189453125, 0.954345703125, 0.98974609375, 1.025146484375, 1.060546875, 1.095947265625, 1.13134765625, 1.166748046875, 1.2021484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 4.0, 9.0, 16.0, 14.0, 13.0, 20.0, 30.0, 44.0, 88.0, 400.0, 142.0, 55.0, 37.0, 35.0, 21.0, 10.0, 15.0, 8.0, 6.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5880203247070312, -0.5715484619140625, -0.5550765991210938, -0.538604736328125, -0.5221328735351562, -0.5056610107421875, -0.48918914794921875, -0.47271728515625, -0.45624542236328125, -0.4397735595703125, -0.42330169677734375, -0.406829833984375, -0.39035797119140625, -0.3738861083984375, -0.35741424560546875, -0.3409423828125, -0.32447052001953125, -0.3079986572265625, -0.29152679443359375, -0.275054931640625, -0.25858306884765625, -0.2421112060546875, -0.22563934326171875, -0.20916748046875, -0.19269561767578125, -0.1762237548828125, -0.15975189208984375, -0.143280029296875, -0.12680816650390625, -0.1103363037109375, -0.09386444091796875, -0.077392578125, -0.06092071533203125, -0.0444488525390625, -0.02797698974609375, -0.011505126953125, 0.00496673583984375, 0.0214385986328125, 0.03791046142578125, 0.05438232421875, 0.07085418701171875, 0.0873260498046875, 0.10379791259765625, 0.120269775390625, 0.13674163818359375, 0.1532135009765625, 0.16968536376953125, 0.1861572265625, 0.20262908935546875, 0.2191009521484375, 0.23557281494140625, 0.252044677734375, 0.26851654052734375, 0.2849884033203125, 0.30146026611328125, 0.31793212890625, 0.33440399169921875, 0.3508758544921875, 0.36734771728515625, 0.383819580078125, 0.40029144287109375, 0.4167633056640625, 0.43323516845703125, 0.44970703125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 9.0, 26.0, 58.0, 167.0, 315.0, 254.0, 106.0, 41.0, 15.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.3998908996582, -32.76668167114258, -32.13346862792969, -31.500259399414062, -30.867048263549805, -30.233837127685547, -29.60062599182129, -28.96741485595703, -28.334205627441406, -27.70099449157715, -27.06778335571289, -26.434574127197266, -25.801362991333008, -25.16815185546875, -24.534940719604492, -23.901729583740234, -23.26852035522461, -22.63530921936035, -22.002098083496094, -21.36888885498047, -20.73567771911621, -20.102466583251953, -19.469255447387695, -18.836044311523438, -18.20283317565918, -17.569622039794922, -16.936410903930664, -16.30320167541504, -15.669990539550781, -15.036779403686523, -14.403568267822266, -13.770358085632324, -13.1371488571167, -12.503937721252441, -11.8707275390625, -11.237516403198242, -10.6043062210083, -9.971095085144043, -9.337884902954102, -8.704673767089844, -8.071462631225586, -7.438251972198486, -6.805041313171387, -6.171830177307129, -5.5386199951171875, -4.90540885925293, -4.27219820022583, -3.6389875411987305, -3.005777359008789, -2.3725666999816895, -1.7393559217453003, -1.1061451435089111, -0.4729344844818115, 0.16027617454528809, 0.7934870719909668, 1.4266977310180664, 2.059908390045166, 2.6931190490722656, 3.3263297080993652, 3.959540605545044, 4.592751502990723, 5.225961685180664, 5.859172821044922, 6.4923834800720215, 7.125594139099121]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 11.0, 14.0, 17.0, 17.0, 14.0, 17.0, 28.0, 24.0, 31.0, 41.0, 33.0, 36.0, 45.0, 52.0, 47.0, 48.0, 43.0, 53.0, 49.0, 47.0, 31.0, 47.0, 35.0, 35.0, 27.0, 29.0, 28.0, 15.0, 12.0, 16.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.205902099609375, -9.90009593963623, -9.594289779663086, -9.288483619689941, -8.982677459716797, -8.676871299743652, -8.371065139770508, -8.065258979797363, -7.759452819824219, -7.453646659851074, -7.14784049987793, -6.842034339904785, -6.536228179931641, -6.230422019958496, -5.924615859985352, -5.618809700012207, -5.3130035400390625, -5.007197380065918, -4.701391220092773, -4.395585060119629, -4.089778900146484, -3.78397274017334, -3.4781665802001953, -3.172360420227051, -2.8665542602539062, -2.5607481002807617, -2.254941940307617, -1.9491357803344727, -1.6433296203613281, -1.3375234603881836, -1.031717300415039, -0.7259111404418945, -0.42010498046875, -0.11429882049560547, 0.19150733947753906, 0.4973134994506836, 0.8031196594238281, 1.1089258193969727, 1.4147319793701172, 1.7205381393432617, 2.0263442993164062, 2.332150459289551, 2.6379566192626953, 2.94376277923584, 3.2495689392089844, 3.555375099182129, 3.8611812591552734, 4.166987419128418, 4.4727935791015625, 4.778599739074707, 5.084405899047852, 5.390212059020996, 5.696018218994141, 6.001824378967285, 6.30763053894043, 6.613436698913574, 6.919242858886719, 7.225049018859863, 7.530855178833008, 7.836661338806152, 8.142467498779297, 8.448273658752441, 8.754079818725586, 9.05988597869873, 9.365692138671875]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 10.0, 17.0, 9.0, 13.0, 25.0, 38.0, 34.0, 63.0, 113.0, 199.0, 330.0, 718.0, 1531.0, 4072.0, 13613.0, 70164.0, 1661647.0, 2336200.0, 82939.0, 14835.0, 4480.0, 1664.0, 701.0, 348.0, 171.0, 103.0, 81.0, 42.0, 32.0, 21.0, 13.0, 10.0, 5.0, 6.0, 12.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.52886962890625, -5.3507080078125, -5.17254638671875, -4.994384765625, -4.81622314453125, -4.6380615234375, -4.45989990234375, -4.28173828125, -4.10357666015625, -3.9254150390625, -3.74725341796875, -3.569091796875, -3.39093017578125, -3.2127685546875, -3.03460693359375, -2.8564453125, -2.67828369140625, -2.5001220703125, -2.32196044921875, -2.143798828125, -1.96563720703125, -1.7874755859375, -1.60931396484375, -1.43115234375, -1.25299072265625, -1.0748291015625, -0.89666748046875, -0.718505859375, -0.54034423828125, -0.3621826171875, -0.18402099609375, -0.005859375, 0.17230224609375, 0.3504638671875, 0.52862548828125, 0.706787109375, 0.88494873046875, 1.0631103515625, 1.24127197265625, 1.41943359375, 1.59759521484375, 1.7757568359375, 1.95391845703125, 2.132080078125, 2.31024169921875, 2.4884033203125, 2.66656494140625, 2.8447265625, 3.02288818359375, 3.2010498046875, 3.37921142578125, 3.557373046875, 3.73553466796875, 3.9136962890625, 4.09185791015625, 4.27001953125, 4.44818115234375, 4.6263427734375, 4.80450439453125, 4.982666015625, 5.16082763671875, 5.3389892578125, 5.51715087890625, 5.6953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 4.0, 24.0, 24.0, 30.0, 35.0, 55.0, 60.0, 72.0, 81.0, 88.0, 87.0, 77.0, 110.0, 69.0, 49.0, 41.0, 20.0, 22.0, 14.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.073486328125, -4.93603515625, -4.798583984375, -4.6611328125, -4.523681640625, -4.38623046875, -4.248779296875, -4.111328125, -3.973876953125, -3.83642578125, -3.698974609375, -3.5615234375, -3.424072265625, -3.28662109375, -3.149169921875, -3.01171875, -2.874267578125, -2.73681640625, -2.599365234375, -2.4619140625, -2.324462890625, -2.18701171875, -2.049560546875, -1.912109375, -1.774658203125, -1.63720703125, -1.499755859375, -1.3623046875, -1.224853515625, -1.08740234375, -0.949951171875, -0.8125, -0.675048828125, -0.53759765625, -0.400146484375, -0.2626953125, -0.125244140625, 0.01220703125, 0.149658203125, 0.287109375, 0.424560546875, 0.56201171875, 0.699462890625, 0.8369140625, 0.974365234375, 1.11181640625, 1.249267578125, 1.38671875, 1.524169921875, 1.66162109375, 1.799072265625, 1.9365234375, 2.073974609375, 2.21142578125, 2.348876953125, 2.486328125, 2.623779296875, 2.76123046875, 2.898681640625, 3.0361328125, 3.173583984375, 3.31103515625, 3.448486328125, 3.5859375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 16.0, 50.0, 280.0, 18906.0, 4173348.0, 1513.0, 128.0, 27.0, 8.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.046875, -22.967529296875, -21.88818359375, -20.808837890625, -19.7294921875, -18.650146484375, -17.57080078125, -16.491455078125, -15.412109375, -14.332763671875, -13.25341796875, -12.174072265625, -11.0947265625, -10.015380859375, -8.93603515625, -7.856689453125, -6.77734375, -5.697998046875, -4.61865234375, -3.539306640625, -2.4599609375, -1.380615234375, -0.30126953125, 0.778076171875, 1.857421875, 2.936767578125, 4.01611328125, 5.095458984375, 6.1748046875, 7.254150390625, 8.33349609375, 9.412841796875, 10.4921875, 11.571533203125, 12.65087890625, 13.730224609375, 14.8095703125, 15.888916015625, 16.96826171875, 18.047607421875, 19.126953125, 20.206298828125, 21.28564453125, 22.364990234375, 23.4443359375, 24.523681640625, 25.60302734375, 26.682373046875, 27.76171875, 28.841064453125, 29.92041015625, 30.999755859375, 32.0791015625, 33.158447265625, 34.23779296875, 35.317138671875, 36.396484375, 37.475830078125, 38.55517578125, 39.634521484375, 40.7138671875, 41.793212890625, 42.87255859375, 43.951904296875, 45.03125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 4.0, 7.0, 11.0, 12.0, 24.0, 34.0, 33.0, 44.0, 60.0, 121.0, 172.0, 305.0, 521.0, 1050.0, 669.0, 338.0, 206.0, 138.0, 99.0, 68.0, 27.0, 30.0, 22.0, 13.0, 12.0, 9.0, 9.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.2490997314453125, -1.214019775390625, -1.1789398193359375, -1.14385986328125, -1.1087799072265625, -1.073699951171875, -1.0386199951171875, -1.0035400390625, -0.9684600830078125, -0.933380126953125, -0.8983001708984375, -0.86322021484375, -0.8281402587890625, -0.793060302734375, -0.7579803466796875, -0.722900390625, -0.6878204345703125, -0.652740478515625, -0.6176605224609375, -0.58258056640625, -0.5475006103515625, -0.512420654296875, -0.4773406982421875, -0.4422607421875, -0.4071807861328125, -0.372100830078125, -0.3370208740234375, -0.30194091796875, -0.2668609619140625, -0.231781005859375, -0.1967010498046875, -0.16162109375, -0.1265411376953125, -0.091461181640625, -0.0563812255859375, -0.02130126953125, 0.0137786865234375, 0.048858642578125, 0.0839385986328125, 0.1190185546875, 0.1540985107421875, 0.189178466796875, 0.2242584228515625, 0.25933837890625, 0.2944183349609375, 0.329498291015625, 0.3645782470703125, 0.399658203125, 0.4347381591796875, 0.469818115234375, 0.5048980712890625, 0.53997802734375, 0.5750579833984375, 0.610137939453125, 0.6452178955078125, 0.6802978515625, 0.7153778076171875, 0.750457763671875, 0.7855377197265625, 0.82061767578125, 0.8556976318359375, 0.890777587890625, 0.9258575439453125, 0.9609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 11.0, 18.0, 30.0, 33.0, 62.0, 75.0, 121.0, 146.0, 135.0, 114.0, 85.0, 52.0, 46.0, 18.0, 9.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.353464126586914, -7.154359817504883, -6.955255508422852, -6.75615119934082, -6.557046890258789, -6.357943058013916, -6.158838748931885, -5.9597344398498535, -5.760630130767822, -5.561525821685791, -5.36242151260376, -5.1633172035217285, -4.9642133712768555, -4.765109062194824, -4.566004753112793, -4.366900444030762, -4.1677961349487305, -3.968691825866699, -3.769587516784668, -3.570483446121216, -3.3713791370391846, -3.1722748279571533, -2.973170757293701, -2.77406644821167, -2.5749621391296387, -2.3758578300476074, -2.176753520965576, -1.977649450302124, -1.7785451412200928, -1.5794408321380615, -1.3803366422653198, -1.1812324523925781, -0.9821276664733887, -0.7830234169960022, -0.5839191675186157, -0.38481491804122925, -0.18571066856384277, 0.013393580913543701, 0.21249783039093018, 0.4116020202636719, 0.6107063293457031, 0.8098105788230896, 1.008914828300476, 1.2080190181732178, 1.407123327255249, 1.6062276363372803, 1.805331826210022, 2.0044360160827637, 2.203540325164795, 2.402644634246826, 2.6017489433288574, 2.8008530139923096, 2.999957323074341, 3.199061632156372, 3.398165702819824, 3.5972700119018555, 3.7963743209838867, 3.995478630065918, 4.194582939147949, 4.3936872482299805, 4.592791557312012, 4.791895389556885, 4.990999698638916, 5.190104007720947, 5.3892083168029785]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 4.0, 3.0, 13.0, 10.0, 14.0, 12.0, 25.0, 27.0, 39.0, 37.0, 37.0, 45.0, 46.0, 52.0, 70.0, 69.0, 61.0, 57.0, 51.0, 54.0, 45.0, 41.0, 41.0, 26.0, 28.0, 22.0, 18.0, 19.0, 10.0, 6.0, 4.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.372010707855225, -4.262429714202881, -4.152849197387695, -4.043268203735352, -3.933687448501587, -3.8241066932678223, -3.7145259380340576, -3.604945182800293, -3.4953644275665283, -3.3857836723327637, -3.276202917098999, -3.1666221618652344, -3.0570411682128906, -2.947460412979126, -2.8378796577453613, -2.7282989025115967, -2.618718147277832, -2.5091373920440674, -2.3995566368103027, -2.289975643157959, -2.1803948879241943, -2.0708141326904297, -1.961233377456665, -1.8516526222229004, -1.7420716285705566, -1.632490873336792, -1.5229099988937378, -1.4133292436599731, -1.3037484884262085, -1.1941676139831543, -1.0845868587493896, -0.975006103515625, -0.8654253482818604, -0.7558445334434509, -0.6462637782096863, -0.5366829633712769, -0.4271021783351898, -0.3175213932991028, -0.20794057846069336, -0.09835982322692871, 0.011220991611480713, 0.12080178409814835, 0.23038257658481598, 0.3399633765220642, 0.44954416155815125, 0.5591249465942383, 0.6687057614326477, 0.7782865166664124, 0.8878673315048218, 0.9974481463432312, 1.1070289611816406, 1.2166097164154053, 1.32619047164917, 1.4357712268829346, 1.5453521013259888, 1.6549328565597534, 1.7645137310028076, 1.8740944862365723, 1.9836753606796265, 2.0932559967041016, 2.2028369903564453, 2.31241774559021, 2.4219985008239746, 2.5315792560577393, 2.641160011291504]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 10.0, 18.0, 17.0, 29.0, 52.0, 104.0, 231.0, 540.0, 1607.0, 5843.0, 32101.0, 465609.0, 498980.0, 34519.0, 6094.0, 1707.0, 635.0, 229.0, 98.0, 52.0, 23.0, 15.0, 10.0, 5.0, 4.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.224609375, -1.182403564453125, -1.14019775390625, -1.097991943359375, -1.0557861328125, -1.013580322265625, -0.97137451171875, -0.929168701171875, -0.886962890625, -0.844757080078125, -0.80255126953125, -0.760345458984375, -0.7181396484375, -0.675933837890625, -0.63372802734375, -0.591522216796875, -0.54931640625, -0.507110595703125, -0.46490478515625, -0.422698974609375, -0.3804931640625, -0.338287353515625, -0.29608154296875, -0.253875732421875, -0.211669921875, -0.169464111328125, -0.12725830078125, -0.085052490234375, -0.0428466796875, -0.000640869140625, 0.04156494140625, 0.083770751953125, 0.1259765625, 0.168182373046875, 0.21038818359375, 0.252593994140625, 0.2947998046875, 0.337005615234375, 0.37921142578125, 0.421417236328125, 0.463623046875, 0.505828857421875, 0.54803466796875, 0.590240478515625, 0.6324462890625, 0.674652099609375, 0.71685791015625, 0.759063720703125, 0.80126953125, 0.843475341796875, 0.88568115234375, 0.927886962890625, 0.9700927734375, 1.012298583984375, 1.05450439453125, 1.096710205078125, 1.138916015625, 1.181121826171875, 1.22332763671875, 1.265533447265625, 1.3077392578125, 1.349945068359375, 1.39215087890625, 1.434356689453125, 1.4765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 14.0, 15.0, 25.0, 42.0, 33.0, 59.0, 79.0, 69.0, 88.0, 97.0, 93.0, 87.0, 75.0, 57.0, 57.0, 24.0, 26.0, 18.0, 10.0, 6.0, 6.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.277313232421875, -4.17181396484375, -4.066314697265625, -3.9608154296875, -3.855316162109375, -3.74981689453125, -3.644317626953125, -3.538818359375, -3.433319091796875, -3.32781982421875, -3.222320556640625, -3.1168212890625, -3.011322021484375, -2.90582275390625, -2.800323486328125, -2.69482421875, -2.589324951171875, -2.48382568359375, -2.378326416015625, -2.2728271484375, -2.167327880859375, -2.06182861328125, -1.956329345703125, -1.850830078125, -1.745330810546875, -1.63983154296875, -1.534332275390625, -1.4288330078125, -1.323333740234375, -1.21783447265625, -1.112335205078125, -1.0068359375, -0.901336669921875, -0.79583740234375, -0.690338134765625, -0.5848388671875, -0.479339599609375, -0.37384033203125, -0.268341064453125, -0.162841796875, -0.057342529296875, 0.04815673828125, 0.153656005859375, 0.2591552734375, 0.364654541015625, 0.47015380859375, 0.575653076171875, 0.68115234375, 0.786651611328125, 0.89215087890625, 0.997650146484375, 1.1031494140625, 1.208648681640625, 1.31414794921875, 1.419647216796875, 1.525146484375, 1.630645751953125, 1.73614501953125, 1.841644287109375, 1.9471435546875, 2.052642822265625, 2.15814208984375, 2.263641357421875, 2.369140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 9.0, 9.0, 23.0, 33.0, 57.0, 84.0, 127.0, 228.0, 430.0, 881.0, 2146.0, 5343.0, 15867.0, 63566.0, 343031.0, 482565.0, 99776.0, 22375.0, 6983.0, 2690.0, 1174.0, 516.0, 255.0, 148.0, 104.0, 46.0, 21.0, 20.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6122970581054688, -0.5932464599609375, -0.5741958618164062, -0.555145263671875, -0.5360946655273438, -0.5170440673828125, -0.49799346923828125, -0.47894287109375, -0.45989227294921875, -0.4408416748046875, -0.42179107666015625, -0.402740478515625, -0.38368988037109375, -0.3646392822265625, -0.34558868408203125, -0.3265380859375, -0.30748748779296875, -0.2884368896484375, -0.26938629150390625, -0.250335693359375, -0.23128509521484375, -0.2122344970703125, -0.19318389892578125, -0.17413330078125, -0.15508270263671875, -0.1360321044921875, -0.11698150634765625, -0.097930908203125, -0.07888031005859375, -0.0598297119140625, -0.04077911376953125, -0.021728515625, -0.00267791748046875, 0.0163726806640625, 0.03542327880859375, 0.054473876953125, 0.07352447509765625, 0.0925750732421875, 0.11162567138671875, 0.13067626953125, 0.14972686767578125, 0.1687774658203125, 0.18782806396484375, 0.206878662109375, 0.22592926025390625, 0.2449798583984375, 0.26403045654296875, 0.2830810546875, 0.30213165283203125, 0.3211822509765625, 0.34023284912109375, 0.359283447265625, 0.37833404541015625, 0.3973846435546875, 0.41643524169921875, 0.43548583984375, 0.45453643798828125, 0.4735870361328125, 0.49263763427734375, 0.511688232421875, 0.5307388305664062, 0.5497894287109375, 0.5688400268554688, 0.587890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 9.0, 9.0, 13.0, 13.0, 15.0, 26.0, 19.0, 36.0, 33.0, 41.0, 50.0, 46.0, 59.0, 70.0, 58.0, 61.0, 56.0, 55.0, 53.0, 47.0, 43.0, 35.0, 26.0, 36.0, 16.0, 17.0, 11.0, 14.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4093017578125, -3.283447265625, -3.1575927734375, -3.03173828125, -2.9058837890625, -2.780029296875, -2.6541748046875, -2.5283203125, -2.4024658203125, -2.276611328125, -2.1507568359375, -2.02490234375, -1.8990478515625, -1.773193359375, -1.6473388671875, -1.521484375, -1.3956298828125, -1.269775390625, -1.1439208984375, -1.01806640625, -0.8922119140625, -0.766357421875, -0.6405029296875, -0.5146484375, -0.3887939453125, -0.262939453125, -0.1370849609375, -0.01123046875, 0.1146240234375, 0.240478515625, 0.3663330078125, 0.4921875, 0.6180419921875, 0.743896484375, 0.8697509765625, 0.99560546875, 1.1214599609375, 1.247314453125, 1.3731689453125, 1.4990234375, 1.6248779296875, 1.750732421875, 1.8765869140625, 2.00244140625, 2.1282958984375, 2.254150390625, 2.3800048828125, 2.505859375, 2.6317138671875, 2.757568359375, 2.8834228515625, 3.00927734375, 3.1351318359375, 3.260986328125, 3.3868408203125, 3.5126953125, 3.6385498046875, 3.764404296875, 3.8902587890625, 4.01611328125, 4.1419677734375, 4.267822265625, 4.3936767578125, 4.51953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 20.0, 25.0, 37.0, 66.0, 91.0, 152.0, 271.0, 517.0, 891.0, 1761.0, 3407.0, 7594.0, 20829.0, 75326.0, 378474.0, 431378.0, 88468.0, 22913.0, 8504.0, 3674.0, 1885.0, 1026.0, 507.0, 274.0, 153.0, 104.0, 65.0, 38.0, 33.0, 19.0, 12.0, 7.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.22216796875, -0.21632957458496094, -0.21049118041992188, -0.2046527862548828, -0.19881439208984375, -0.1929759979248047, -0.18713760375976562, -0.18129920959472656, -0.1754608154296875, -0.16962242126464844, -0.16378402709960938, -0.1579456329345703, -0.15210723876953125, -0.1462688446044922, -0.14043045043945312, -0.13459205627441406, -0.128753662109375, -0.12291526794433594, -0.11707687377929688, -0.11123847961425781, -0.10540008544921875, -0.09956169128417969, -0.09372329711914062, -0.08788490295410156, -0.0820465087890625, -0.07620811462402344, -0.07036972045898438, -0.06453132629394531, -0.05869293212890625, -0.05285453796386719, -0.047016143798828125, -0.04117774963378906, -0.03533935546875, -0.029500961303710938, -0.023662567138671875, -0.017824172973632812, -0.01198577880859375, -0.0061473846435546875, -0.000308990478515625, 0.0055294036865234375, 0.0113677978515625, 0.017206192016601562, 0.023044586181640625, 0.028882980346679688, 0.03472137451171875, 0.04055976867675781, 0.046398162841796875, 0.05223655700683594, 0.058074951171875, 0.06391334533691406, 0.06975173950195312, 0.07559013366699219, 0.08142852783203125, 0.08726692199707031, 0.09310531616210938, 0.09894371032714844, 0.1047821044921875, 0.11062049865722656, 0.11645889282226562, 0.12229728698730469, 0.12813568115234375, 0.1339740753173828, 0.13981246948242188, 0.14565086364746094, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 9.0, 19.0, 25.0, 33.0, 41.0, 70.0, 101.0, 102.0, 132.0, 120.0, 91.0, 70.0, 52.0, 35.0, 25.0, 19.0, 15.0, 4.0, 4.0, 9.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011783838272094727, -0.00011319946497678757, -0.00010856054723262787, -0.00010392162948846817, -9.928271174430847e-05, -9.464379400014877e-05, -9.000487625598907e-05, -8.536595851182938e-05, -8.072704076766968e-05, -7.608812302350998e-05, -7.144920527935028e-05, -6.681028753519058e-05, -6.217136979103088e-05, -5.7532452046871185e-05, -5.289353430271149e-05, -4.825461655855179e-05, -4.361569881439209e-05, -3.897678107023239e-05, -3.433786332607269e-05, -2.9698945581912994e-05, -2.5060027837753296e-05, -2.0421110093593597e-05, -1.57821923494339e-05, -1.11432746052742e-05, -6.504356861114502e-06, -1.8654391169548035e-06, 2.773478627204895e-06, 7.4123963713645935e-06, 1.2051314115524292e-05, 1.669023185968399e-05, 2.132914960384369e-05, 2.5968067348003387e-05, 3.0606985092163086e-05, 3.5245902836322784e-05, 3.988482058048248e-05, 4.452373832464218e-05, 4.916265606880188e-05, 5.380157381296158e-05, 5.844049155712128e-05, 6.307940930128098e-05, 6.771832704544067e-05, 7.235724478960037e-05, 7.699616253376007e-05, 8.163508027791977e-05, 8.627399802207947e-05, 9.091291576623917e-05, 9.555183351039886e-05, 0.00010019075125455856, 0.00010482966899871826, 0.00010946858674287796, 0.00011410750448703766, 0.00011874642223119736, 0.00012338533997535706, 0.00012802425771951675, 0.00013266317546367645, 0.00013730209320783615, 0.00014194101095199585, 0.00014657992869615555, 0.00015121884644031525, 0.00015585776418447495, 0.00016049668192863464, 0.00016513559967279434, 0.00016977451741695404, 0.00017441343516111374, 0.00017905235290527344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 13.0, 4.0, 14.0, 12.0, 15.0, 23.0, 36.0, 67.0, 66.0, 137.0, 188.0, 366.0, 647.0, 1184.0, 2266.0, 4590.0, 10643.0, 29567.0, 108000.0, 451810.0, 327216.0, 73766.0, 21596.0, 8270.0, 3830.0, 1847.0, 956.0, 546.0, 320.0, 180.0, 126.0, 74.0, 54.0, 40.0, 23.0, 10.0, 12.0, 9.0, 12.0, 7.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166259765625, -0.16049957275390625, -0.1547393798828125, -0.14897918701171875, -0.143218994140625, -0.13745880126953125, -0.1316986083984375, -0.12593841552734375, -0.12017822265625, -0.11441802978515625, -0.1086578369140625, -0.10289764404296875, -0.097137451171875, -0.09137725830078125, -0.0856170654296875, -0.07985687255859375, -0.0740966796875, -0.06833648681640625, -0.0625762939453125, -0.05681610107421875, -0.051055908203125, -0.04529571533203125, -0.0395355224609375, -0.03377532958984375, -0.02801513671875, -0.02225494384765625, -0.0164947509765625, -0.01073455810546875, -0.004974365234375, 0.00078582763671875, 0.0065460205078125, 0.01230621337890625, 0.01806640625, 0.02382659912109375, 0.0295867919921875, 0.03534698486328125, 0.041107177734375, 0.04686737060546875, 0.0526275634765625, 0.05838775634765625, 0.06414794921875, 0.06990814208984375, 0.0756683349609375, 0.08142852783203125, 0.087188720703125, 0.09294891357421875, 0.0987091064453125, 0.10446929931640625, 0.1102294921875, 0.11598968505859375, 0.1217498779296875, 0.12751007080078125, 0.133270263671875, 0.13903045654296875, 0.1447906494140625, 0.15055084228515625, 0.15631103515625, 0.16207122802734375, 0.1678314208984375, 0.17359161376953125, 0.179351806640625, 0.18511199951171875, 0.1908721923828125, 0.19663238525390625, 0.202392578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 12.0, 12.0, 22.0, 10.0, 18.0, 38.0, 42.0, 39.0, 56.0, 82.0, 86.0, 94.0, 93.0, 80.0, 69.0, 63.0, 47.0, 38.0, 22.0, 21.0, 14.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037109375, -0.03561687469482422, -0.03412437438964844, -0.032631874084472656, -0.031139373779296875, -0.029646873474121094, -0.028154373168945312, -0.02666187286376953, -0.02516937255859375, -0.02367687225341797, -0.022184371948242188, -0.020691871643066406, -0.019199371337890625, -0.017706871032714844, -0.016214370727539062, -0.014721870422363281, -0.0132293701171875, -0.011736869812011719, -0.010244369506835938, -0.008751869201660156, -0.007259368896484375, -0.005766868591308594, -0.0042743682861328125, -0.0027818679809570312, -0.00128936767578125, 0.00020313262939453125, 0.0016956329345703125, 0.0031881332397460938, 0.004680633544921875, 0.006173133850097656, 0.0076656341552734375, 0.009158134460449219, 0.010650634765625, 0.012143135070800781, 0.013635635375976562, 0.015128135681152344, 0.016620635986328125, 0.018113136291503906, 0.019605636596679688, 0.02109813690185547, 0.02259063720703125, 0.02408313751220703, 0.025575637817382812, 0.027068138122558594, 0.028560638427734375, 0.030053138732910156, 0.03154563903808594, 0.03303813934326172, 0.0345306396484375, 0.03602313995361328, 0.03751564025878906, 0.039008140563964844, 0.040500640869140625, 0.041993141174316406, 0.04348564147949219, 0.04497814178466797, 0.04647064208984375, 0.04796314239501953, 0.04945564270019531, 0.050948143005371094, 0.052440643310546875, 0.053933143615722656, 0.05542564392089844, 0.05691814422607422, 0.05841064453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 10.0, 7.0, 19.0, 26.0, 39.0, 66.0, 94.0, 175.0, 165.0, 137.0, 104.0, 72.0, 31.0, 17.0, 10.0, 8.0, 7.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.084479808807373, -4.936653137207031, -4.7888264656066895, -4.641000270843506, -4.493173599243164, -4.345346927642822, -4.1975202560424805, -4.049693584442139, -3.901867151260376, -3.754040479660034, -3.6062140464782715, -3.4583873748779297, -3.310560703277588, -3.162734270095825, -3.0149075984954834, -2.8670811653137207, -2.719254493713379, -2.571427822113037, -2.4236013889312744, -2.2757747173309326, -2.12794828414917, -1.9801216125488281, -1.8322949409484863, -1.684468388557434, -1.5366418361663818, -1.3888152837753296, -1.2409887313842773, -1.0931620597839355, -0.9453355073928833, -0.797508955001831, -0.649682343006134, -0.501855731010437, -0.35402917861938477, -0.20620259642601013, -0.0583760142326355, 0.08945056796073914, 0.23727715015411377, 0.385103702545166, 0.532930314540863, 0.6807569265365601, 0.8285834789276123, 0.9764100313186646, 1.1242365837097168, 1.2720632553100586, 1.4198898077011108, 1.567716360092163, 1.7155430316925049, 1.8633695840835571, 2.0111961364746094, 2.159022808074951, 2.306849241256714, 2.4546759128570557, 2.6025023460388184, 2.75032901763916, 2.898155689239502, 3.0459823608398438, 3.1938087940216064, 3.3416354656219482, 3.489461898803711, 3.6372885704040527, 3.7851152420043945, 3.9329416751861572, 4.08076810836792, 4.228594779968262, 4.3764214515686035]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 17.0, 13.0, 22.0, 28.0, 39.0, 51.0, 50.0, 51.0, 68.0, 85.0, 95.0, 68.0, 79.0, 62.0, 55.0, 55.0, 35.0, 33.0, 22.0, 22.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4835197925567627, -3.3976821899414062, -3.31184458732605, -3.2260069847106934, -3.140169620513916, -3.0543320178985596, -2.968494415283203, -2.8826568126678467, -2.7968192100524902, -2.710981607437134, -2.6251440048217773, -2.539306640625, -2.4534690380096436, -2.367631435394287, -2.2817938327789307, -2.195956230163574, -2.110118865966797, -2.0242812633514404, -1.9384437799453735, -1.852606177330017, -1.7667686939239502, -1.6809310913085938, -1.5950934886932373, -1.5092558860778809, -1.423418402671814, -1.3375808000564575, -1.2517433166503906, -1.1659057140350342, -1.0800681114196777, -0.9942306280136108, -0.9083930253982544, -0.8225554823875427, -0.7367181777954102, -0.6508806347846985, -0.5650430917739868, -0.47920548915863037, -0.3933679461479187, -0.30753040313720703, -0.22169280052185059, -0.13585525751113892, -0.050017714500427246, 0.03581984341144562, 0.12165740132331848, 0.20749497413635254, 0.2933325171470642, 0.3791700601577759, 0.4650076627731323, 0.550845205783844, 0.6366827487945557, 0.7225202918052673, 0.808357834815979, 0.8941954374313354, 0.9800329804420471, 1.0658705234527588, 1.1517081260681152, 1.2375457286834717, 1.3233832120895386, 1.409220814704895, 1.495058298110962, 1.5808959007263184, 1.6667335033416748, 1.7525709867477417, 1.8384085893630981, 1.924246072769165, 2.0100836753845215]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 8.0, 14.0, 22.0, 42.0, 65.0, 157.0, 244.0, 519.0, 1053.0, 2354.0, 6112.0, 19030.0, 79613.0, 644098.0, 238707.0, 38524.0, 11053.0, 3887.0, 1583.0, 687.0, 370.0, 178.0, 88.0, 51.0, 29.0, 22.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.19921875, -3.09173583984375, -2.9842529296875, -2.87677001953125, -2.769287109375, -2.66180419921875, -2.5543212890625, -2.44683837890625, -2.33935546875, -2.23187255859375, -2.1243896484375, -2.01690673828125, -1.909423828125, -1.80194091796875, -1.6944580078125, -1.58697509765625, -1.4794921875, -1.37200927734375, -1.2645263671875, -1.15704345703125, -1.049560546875, -0.94207763671875, -0.8345947265625, -0.72711181640625, -0.61962890625, -0.51214599609375, -0.4046630859375, -0.29718017578125, -0.189697265625, -0.08221435546875, 0.0252685546875, 0.13275146484375, 0.240234375, 0.34771728515625, 0.4552001953125, 0.56268310546875, 0.670166015625, 0.77764892578125, 0.8851318359375, 0.99261474609375, 1.10009765625, 1.20758056640625, 1.3150634765625, 1.42254638671875, 1.530029296875, 1.63751220703125, 1.7449951171875, 1.85247802734375, 1.9599609375, 2.06744384765625, 2.1749267578125, 2.28240966796875, 2.389892578125, 2.49737548828125, 2.6048583984375, 2.71234130859375, 2.81982421875, 2.92730712890625, 3.0347900390625, 3.14227294921875, 3.249755859375, 3.35723876953125, 3.4647216796875, 3.57220458984375, 3.6796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 4.0, 8.0, 11.0, 11.0, 14.0, 10.0, 32.0, 23.0, 33.0, 35.0, 43.0, 70.0, 60.0, 57.0, 78.0, 56.0, 54.0, 71.0, 41.0, 49.0, 49.0, 39.0, 34.0, 21.0, 22.0, 18.0, 13.0, 7.0, 5.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-6.9296875, -6.764923095703125, -6.60015869140625, -6.435394287109375, -6.2706298828125, -6.105865478515625, -5.94110107421875, -5.776336669921875, -5.611572265625, -5.446807861328125, -5.28204345703125, -5.117279052734375, -4.9525146484375, -4.787750244140625, -4.62298583984375, -4.458221435546875, -4.29345703125, -4.128692626953125, -3.96392822265625, -3.799163818359375, -3.6343994140625, -3.469635009765625, -3.30487060546875, -3.140106201171875, -2.975341796875, -2.810577392578125, -2.64581298828125, -2.481048583984375, -2.3162841796875, -2.151519775390625, -1.98675537109375, -1.821990966796875, -1.6572265625, -1.492462158203125, -1.32769775390625, -1.162933349609375, -0.9981689453125, -0.833404541015625, -0.66864013671875, -0.503875732421875, -0.339111328125, -0.174346923828125, -0.00958251953125, 0.155181884765625, 0.3199462890625, 0.484710693359375, 0.64947509765625, 0.814239501953125, 0.97900390625, 1.143768310546875, 1.30853271484375, 1.473297119140625, 1.6380615234375, 1.802825927734375, 1.96759033203125, 2.132354736328125, 2.297119140625, 2.461883544921875, 2.62664794921875, 2.791412353515625, 2.9561767578125, 3.120941162109375, 3.28570556640625, 3.450469970703125, 3.615234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 12.0, 12.0, 14.0, 14.0, 16.0, 22.0, 21.0, 21.0, 25.0, 26.0, 27.0, 24.0, 33.0, 41.0, 47.0, 88.0, 342.0, 5564.0, 915583.0, 123997.0, 1963.0, 218.0, 76.0, 38.0, 30.0, 25.0, 20.0, 33.0, 26.0, 16.0, 20.0, 19.0, 18.0, 15.0, 14.0, 8.0, 11.0, 9.0, 8.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.0078125, -9.67236328125, -9.3369140625, -9.00146484375, -8.666015625, -8.33056640625, -7.9951171875, -7.65966796875, -7.32421875, -6.98876953125, -6.6533203125, -6.31787109375, -5.982421875, -5.64697265625, -5.3115234375, -4.97607421875, -4.640625, -4.30517578125, -3.9697265625, -3.63427734375, -3.298828125, -2.96337890625, -2.6279296875, -2.29248046875, -1.95703125, -1.62158203125, -1.2861328125, -0.95068359375, -0.615234375, -0.27978515625, 0.0556640625, 0.39111328125, 0.7265625, 1.06201171875, 1.3974609375, 1.73291015625, 2.068359375, 2.40380859375, 2.7392578125, 3.07470703125, 3.41015625, 3.74560546875, 4.0810546875, 4.41650390625, 4.751953125, 5.08740234375, 5.4228515625, 5.75830078125, 6.09375, 6.42919921875, 6.7646484375, 7.10009765625, 7.435546875, 7.77099609375, 8.1064453125, 8.44189453125, 8.77734375, 9.11279296875, 9.4482421875, 9.78369140625, 10.119140625, 10.45458984375, 10.7900390625, 11.12548828125, 11.4609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 13.0, 21.0, 20.0, 17.0, 12.0, 21.0, 30.0, 23.0, 21.0, 27.0, 29.0, 27.0, 42.0, 34.0, 37.0, 43.0, 42.0, 44.0, 38.0, 31.0, 50.0, 24.0, 27.0, 24.0, 22.0, 34.0, 22.0, 22.0, 19.0, 23.0, 20.0, 17.0, 13.0, 6.0, 10.0, 14.0, 8.0, 11.0, 5.0, 10.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.630859375, -3.502593994140625, -3.37432861328125, -3.246063232421875, -3.1177978515625, -2.989532470703125, -2.86126708984375, -2.733001708984375, -2.604736328125, -2.476470947265625, -2.34820556640625, -2.219940185546875, -2.0916748046875, -1.963409423828125, -1.83514404296875, -1.706878662109375, -1.57861328125, -1.450347900390625, -1.32208251953125, -1.193817138671875, -1.0655517578125, -0.937286376953125, -0.80902099609375, -0.680755615234375, -0.552490234375, -0.424224853515625, -0.29595947265625, -0.167694091796875, -0.0394287109375, 0.088836669921875, 0.21710205078125, 0.345367431640625, 0.4736328125, 0.601898193359375, 0.73016357421875, 0.858428955078125, 0.9866943359375, 1.114959716796875, 1.24322509765625, 1.371490478515625, 1.499755859375, 1.628021240234375, 1.75628662109375, 1.884552001953125, 2.0128173828125, 2.141082763671875, 2.26934814453125, 2.397613525390625, 2.52587890625, 2.654144287109375, 2.78240966796875, 2.910675048828125, 3.0389404296875, 3.167205810546875, 3.29547119140625, 3.423736572265625, 3.552001953125, 3.680267333984375, 3.80853271484375, 3.936798095703125, 4.0650634765625, 4.193328857421875, 4.32159423828125, 4.449859619140625, 4.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 7.0, 21.0, 24.0, 35.0, 85.0, 145.0, 298.0, 627.0, 1408.0, 4508.0, 20673.0, 259957.0, 711070.0, 39692.0, 6552.0, 1915.0, 751.0, 331.0, 154.0, 98.0, 55.0, 40.0, 23.0, 19.0, 8.0, 12.0, 2.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1396484375, -1.0904388427734375, -1.041229248046875, -0.9920196533203125, -0.94281005859375, -0.8936004638671875, -0.844390869140625, -0.7951812744140625, -0.7459716796875, -0.6967620849609375, -0.647552490234375, -0.5983428955078125, -0.54913330078125, -0.4999237060546875, -0.450714111328125, -0.4015045166015625, -0.352294921875, -0.3030853271484375, -0.253875732421875, -0.2046661376953125, -0.15545654296875, -0.1062469482421875, -0.057037353515625, -0.0078277587890625, 0.0413818359375, 0.0905914306640625, 0.139801025390625, 0.1890106201171875, 0.23822021484375, 0.2874298095703125, 0.336639404296875, 0.3858489990234375, 0.43505859375, 0.4842681884765625, 0.533477783203125, 0.5826873779296875, 0.63189697265625, 0.6811065673828125, 0.730316162109375, 0.7795257568359375, 0.8287353515625, 0.8779449462890625, 0.927154541015625, 0.9763641357421875, 1.02557373046875, 1.0747833251953125, 1.123992919921875, 1.1732025146484375, 1.222412109375, 1.2716217041015625, 1.320831298828125, 1.3700408935546875, 1.41925048828125, 1.4684600830078125, 1.517669677734375, 1.5668792724609375, 1.6160888671875, 1.6652984619140625, 1.714508056640625, 1.7637176513671875, 1.81292724609375, 1.8621368408203125, 1.911346435546875, 1.9605560302734375, 2.009765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 7.0, 15.0, 15.0, 25.0, 35.0, 47.0, 71.0, 107.0, 182.0, 142.0, 118.0, 76.0, 33.0, 31.0, 18.0, 19.0, 14.0, 12.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002149343490600586, -0.00020877830684185028, -0.00020262226462364197, -0.00019646622240543365, -0.00019031018018722534, -0.00018415413796901703, -0.00017799809575080872, -0.0001718420535326004, -0.0001656860113143921, -0.00015952996909618378, -0.00015337392687797546, -0.00014721788465976715, -0.00014106184244155884, -0.00013490580022335052, -0.0001287497580051422, -0.0001225937157869339, -0.00011643767356872559, -0.00011028163135051727, -0.00010412558913230896, -9.796954691410065e-05, -9.181350469589233e-05, -8.565746247768402e-05, -7.950142025947571e-05, -7.33453780412674e-05, -6.718933582305908e-05, -6.103329360485077e-05, -5.4877251386642456e-05, -4.872120916843414e-05, -4.256516695022583e-05, -3.640912473201752e-05, -3.0253082513809204e-05, -2.409704029560089e-05, -1.7940998077392578e-05, -1.1784955859184265e-05, -5.628913640975952e-06, 5.271285772323608e-07, 6.683170795440674e-06, 1.2839213013648987e-05, 1.89952552318573e-05, 2.5151297450065613e-05, 3.1307339668273926e-05, 3.746338188648224e-05, 4.361942410469055e-05, 4.9775466322898865e-05, 5.593150854110718e-05, 6.208755075931549e-05, 6.82435929775238e-05, 7.439963519573212e-05, 8.055567741394043e-05, 8.671171963214874e-05, 9.286776185035706e-05, 9.902380406856537e-05, 0.00010517984628677368, 0.000111335888504982, 0.00011749193072319031, 0.00012364797294139862, 0.00012980401515960693, 0.00013596005737781525, 0.00014211609959602356, 0.00014827214181423187, 0.00015442818403244019, 0.0001605842262506485, 0.0001667402684688568, 0.00017289631068706512, 0.00017905235290527344]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 11.0, 17.0, 25.0, 44.0, 47.0, 92.0, 147.0, 218.0, 359.0, 613.0, 1109.0, 2104.0, 4314.0, 10179.0, 30302.0, 145194.0, 678716.0, 128470.0, 28017.0, 9730.0, 4184.0, 2006.0, 1115.0, 565.0, 323.0, 197.0, 133.0, 104.0, 55.0, 45.0, 24.0, 26.0, 14.0, 9.0, 8.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.033203125, -1.0040740966796875, -0.974945068359375, -0.9458160400390625, -0.91668701171875, -0.8875579833984375, -0.858428955078125, -0.8292999267578125, -0.8001708984375, -0.7710418701171875, -0.741912841796875, -0.7127838134765625, -0.68365478515625, -0.6545257568359375, -0.625396728515625, -0.5962677001953125, -0.567138671875, -0.5380096435546875, -0.508880615234375, -0.4797515869140625, -0.45062255859375, -0.4214935302734375, -0.392364501953125, -0.3632354736328125, -0.3341064453125, -0.3049774169921875, -0.275848388671875, -0.2467193603515625, -0.21759033203125, -0.1884613037109375, -0.159332275390625, -0.1302032470703125, -0.10107421875, -0.0719451904296875, -0.042816162109375, -0.0136871337890625, 0.01544189453125, 0.0445709228515625, 0.073699951171875, 0.1028289794921875, 0.1319580078125, 0.1610870361328125, 0.190216064453125, 0.2193450927734375, 0.24847412109375, 0.2776031494140625, 0.306732177734375, 0.3358612060546875, 0.364990234375, 0.3941192626953125, 0.423248291015625, 0.4523773193359375, 0.48150634765625, 0.5106353759765625, 0.539764404296875, 0.5688934326171875, 0.5980224609375, 0.6271514892578125, 0.656280517578125, 0.6854095458984375, 0.71453857421875, 0.7436676025390625, 0.772796630859375, 0.8019256591796875, 0.8310546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 2.0, 7.0, 7.0, 12.0, 22.0, 39.0, 42.0, 53.0, 89.0, 151.0, 187.0, 146.0, 76.0, 44.0, 34.0, 22.0, 17.0, 9.0, 10.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6259765625, -0.6065673828125, -0.587158203125, -0.5677490234375, -0.54833984375, -0.5289306640625, -0.509521484375, -0.4901123046875, -0.470703125, -0.4512939453125, -0.431884765625, -0.4124755859375, -0.39306640625, -0.3736572265625, -0.354248046875, -0.3348388671875, -0.3154296875, -0.2960205078125, -0.276611328125, -0.2572021484375, -0.23779296875, -0.2183837890625, -0.198974609375, -0.1795654296875, -0.16015625, -0.1407470703125, -0.121337890625, -0.1019287109375, -0.08251953125, -0.0631103515625, -0.043701171875, -0.0242919921875, -0.0048828125, 0.0145263671875, 0.033935546875, 0.0533447265625, 0.07275390625, 0.0921630859375, 0.111572265625, 0.1309814453125, 0.150390625, 0.1697998046875, 0.189208984375, 0.2086181640625, 0.22802734375, 0.2474365234375, 0.266845703125, 0.2862548828125, 0.3056640625, 0.3250732421875, 0.344482421875, 0.3638916015625, 0.38330078125, 0.4027099609375, 0.422119140625, 0.4415283203125, 0.4609375, 0.4803466796875, 0.499755859375, 0.5191650390625, 0.53857421875, 0.5579833984375, 0.577392578125, 0.5968017578125, 0.6162109375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 12.0, 15.0, 9.0, 16.0, 42.0, 40.0, 59.0, 88.0, 129.0, 130.0, 105.0, 98.0, 78.0, 61.0, 34.0, 17.0, 13.0, 17.0, 9.0, 6.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.66705322265625, -7.446164608001709, -7.225276470184326, -7.004387855529785, -6.783499240875244, -6.562610626220703, -6.34172248840332, -6.120833873748779, -5.899945259094238, -5.679056644439697, -5.4581685066223145, -5.237279891967773, -5.016391277313232, -4.795502662658691, -4.574614524841309, -4.353725910186768, -4.132837295532227, -3.9119489192962646, -3.6910603046417236, -3.4701719284057617, -3.2492833137512207, -3.028394937515259, -2.807506561279297, -2.586617946624756, -2.365729808807373, -2.144841432571411, -1.9239528179168701, -1.7030644416809082, -1.4821758270263672, -1.2612874507904053, -1.0403989553451538, -0.8195104598999023, -0.5986218452453613, -0.37773334980010986, -0.1568448841571808, 0.06404358148574829, 0.28493207693099976, 0.5058205127716064, 0.7267090082168579, 0.9475975036621094, 1.1684859991073608, 1.3893744945526123, 1.6102629899978638, 1.8311514854431152, 2.052039861679077, 2.272928237915039, 2.49381685256958, 2.714705467224121, 2.935593843460083, 3.156482219696045, 3.377370834350586, 3.598259210586548, 3.819147825241089, 4.040036201477051, 4.260924816131592, 4.481813430786133, 4.702701568603516, 4.923590183258057, 5.1444783210754395, 5.3653669357299805, 5.5862555503845215, 5.8071441650390625, 6.028032302856445, 6.248920917510986, 6.469809532165527]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 4.0, 8.0, 7.0, 11.0, 8.0, 11.0, 12.0, 21.0, 12.0, 21.0, 24.0, 31.0, 31.0, 39.0, 41.0, 41.0, 40.0, 52.0, 33.0, 48.0, 40.0, 32.0, 37.0, 40.0, 35.0, 36.0, 34.0, 31.0, 27.0, 32.0, 25.0, 27.0, 20.0, 11.0, 14.0, 14.0, 14.0, 3.0, 5.0, 4.0, 10.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.317837238311768, -7.08499002456665, -6.852142810821533, -6.619295597076416, -6.386447906494141, -6.153600692749023, -5.920753479003906, -5.687906265258789, -5.455059051513672, -5.222211837768555, -4.9893646240234375, -4.75651741027832, -4.523670196533203, -4.290822982788086, -4.0579752922058105, -3.8251280784606934, -3.592280864715576, -3.359433650970459, -3.126586437225342, -2.8937389850616455, -2.6608917713165283, -2.428044557571411, -2.195197105407715, -1.9623498916625977, -1.7295026779174805, -1.4966554641723633, -1.2638081312179565, -1.0309607982635498, -0.7981135845184326, -0.5652663707733154, -0.3324190378189087, -0.09957170486450195, 0.13327550888061523, 0.3661227822303772, 0.5989700555801392, 0.8318173289299011, 1.064664602279663, 1.2975118160247803, 1.530359148979187, 1.7632064819335938, 1.996053695678711, 2.228900909423828, 2.4617481231689453, 2.6945955753326416, 2.927442789077759, 3.160290002822876, 3.3931374549865723, 3.6259846687316895, 3.8588318824768066, 4.091679096221924, 4.324526309967041, 4.557373523712158, 4.790221214294434, 5.023068428039551, 5.255915641784668, 5.488762855529785, 5.721610069274902, 5.9544572830200195, 6.187304496765137, 6.420151710510254, 6.652998924255371, 6.885846138000488, 7.118693828582764, 7.351541042327881, 7.584388256072998]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 3.0, 8.0, 8.0, 17.0, 20.0, 30.0, 26.0, 72.0, 85.0, 156.0, 293.0, 640.0, 1775.0, 6013.0, 31885.0, 641030.0, 3408779.0, 87095.0, 11616.0, 2821.0, 941.0, 414.0, 203.0, 109.0, 64.0, 48.0, 29.0, 27.0, 12.0, 10.0, 8.0, 8.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.1796875, -6.9698486328125, -6.760009765625, -6.5501708984375, -6.34033203125, -6.1304931640625, -5.920654296875, -5.7108154296875, -5.5009765625, -5.2911376953125, -5.081298828125, -4.8714599609375, -4.66162109375, -4.4517822265625, -4.241943359375, -4.0321044921875, -3.822265625, -3.6124267578125, -3.402587890625, -3.1927490234375, -2.98291015625, -2.7730712890625, -2.563232421875, -2.3533935546875, -2.1435546875, -1.9337158203125, -1.723876953125, -1.5140380859375, -1.30419921875, -1.0943603515625, -0.884521484375, -0.6746826171875, -0.46484375, -0.2550048828125, -0.045166015625, 0.1646728515625, 0.37451171875, 0.5843505859375, 0.794189453125, 1.0040283203125, 1.2138671875, 1.4237060546875, 1.633544921875, 1.8433837890625, 2.05322265625, 2.2630615234375, 2.472900390625, 2.6827392578125, 2.892578125, 3.1024169921875, 3.312255859375, 3.5220947265625, 3.73193359375, 3.9417724609375, 4.151611328125, 4.3614501953125, 4.5712890625, 4.7811279296875, 4.990966796875, 5.2008056640625, 5.41064453125, 5.6204833984375, 5.830322265625, 6.0401611328125, 6.25]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 7.0, 6.0, 10.0, 19.0, 25.0, 26.0, 32.0, 59.0, 56.0, 61.0, 80.0, 84.0, 82.0, 70.0, 64.0, 61.0, 52.0, 51.0, 35.0, 26.0, 17.0, 13.0, 13.0, 13.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.908203125, -3.808563232421875, -3.70892333984375, -3.609283447265625, -3.5096435546875, -3.410003662109375, -3.31036376953125, -3.210723876953125, -3.111083984375, -3.011444091796875, -2.91180419921875, -2.812164306640625, -2.7125244140625, -2.612884521484375, -2.51324462890625, -2.413604736328125, -2.31396484375, -2.214324951171875, -2.11468505859375, -2.015045166015625, -1.9154052734375, -1.815765380859375, -1.71612548828125, -1.616485595703125, -1.516845703125, -1.417205810546875, -1.31756591796875, -1.217926025390625, -1.1182861328125, -1.018646240234375, -0.91900634765625, -0.819366455078125, -0.7197265625, -0.620086669921875, -0.52044677734375, -0.420806884765625, -0.3211669921875, -0.221527099609375, -0.12188720703125, -0.022247314453125, 0.077392578125, 0.177032470703125, 0.27667236328125, 0.376312255859375, 0.4759521484375, 0.575592041015625, 0.67523193359375, 0.774871826171875, 0.87451171875, 0.974151611328125, 1.07379150390625, 1.173431396484375, 1.2730712890625, 1.372711181640625, 1.47235107421875, 1.571990966796875, 1.671630859375, 1.771270751953125, 1.87091064453125, 1.970550537109375, 2.0701904296875, 2.169830322265625, 2.26947021484375, 2.369110107421875, 2.46875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 15.0, 31.0, 43.0, 113.0, 308.0, 1645.0, 53296.0, 4120618.0, 16792.0, 969.0, 219.0, 98.0, 43.0, 22.0, 21.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -9.880859375, -9.37109375, -8.861328125, -8.3515625, -7.841796875, -7.33203125, -6.822265625, -6.3125, -5.802734375, -5.29296875, -4.783203125, -4.2734375, -3.763671875, -3.25390625, -2.744140625, -2.234375, -1.724609375, -1.21484375, -0.705078125, -0.1953125, 0.314453125, 0.82421875, 1.333984375, 1.84375, 2.353515625, 2.86328125, 3.373046875, 3.8828125, 4.392578125, 4.90234375, 5.412109375, 5.921875, 6.431640625, 6.94140625, 7.451171875, 7.9609375, 8.470703125, 8.98046875, 9.490234375, 10.0, 10.509765625, 11.01953125, 11.529296875, 12.0390625, 12.548828125, 13.05859375, 13.568359375, 14.078125, 14.587890625, 15.09765625, 15.607421875, 16.1171875, 16.626953125, 17.13671875, 17.646484375, 18.15625, 18.666015625, 19.17578125, 19.685546875, 20.1953125, 20.705078125, 21.21484375, 21.724609375, 22.234375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 9.0, 6.0, 9.0, 17.0, 26.0, 22.0, 31.0, 43.0, 75.0, 99.0, 120.0, 153.0, 226.0, 407.0, 727.0, 751.0, 420.0, 273.0, 188.0, 133.0, 65.0, 70.0, 49.0, 35.0, 18.0, 21.0, 22.0, 7.0, 13.0, 4.0, 2.0, 9.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89794921875, -0.8680801391601562, -0.8382110595703125, -0.8083419799804688, -0.778472900390625, -0.7486038208007812, -0.7187347412109375, -0.6888656616210938, -0.65899658203125, -0.6291275024414062, -0.5992584228515625, -0.5693893432617188, -0.539520263671875, -0.5096511840820312, -0.4797821044921875, -0.44991302490234375, -0.4200439453125, -0.39017486572265625, -0.3603057861328125, -0.33043670654296875, -0.300567626953125, -0.27069854736328125, -0.2408294677734375, -0.21096038818359375, -0.18109130859375, -0.15122222900390625, -0.1213531494140625, -0.09148406982421875, -0.061614990234375, -0.03174591064453125, -0.0018768310546875, 0.02799224853515625, 0.057861328125, 0.08773040771484375, 0.1175994873046875, 0.14746856689453125, 0.177337646484375, 0.20720672607421875, 0.2370758056640625, 0.26694488525390625, 0.29681396484375, 0.32668304443359375, 0.3565521240234375, 0.38642120361328125, 0.416290283203125, 0.44615936279296875, 0.4760284423828125, 0.5058975219726562, 0.5357666015625, 0.5656356811523438, 0.5955047607421875, 0.6253738403320312, 0.655242919921875, 0.6851119995117188, 0.7149810791015625, 0.7448501586914062, 0.77471923828125, 0.8045883178710938, 0.8344573974609375, 0.8643264770507812, 0.894195556640625, 0.9240646362304688, 0.9539337158203125, 0.9838027954101562, 1.013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 16.0, 11.0, 15.0, 28.0, 28.0, 52.0, 64.0, 71.0, 100.0, 107.0, 118.0, 75.0, 69.0, 59.0, 36.0, 34.0, 21.0, 21.0, 8.0, 13.0, 14.0, 7.0, 0.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.490677356719971, -4.362713813781738, -4.234749794006348, -4.106786251068115, -3.9788224697113037, -3.850858688354492, -3.7228951454162598, -3.5949313640594482, -3.4669675827026367, -3.339003801345825, -3.2110402584075928, -3.0830764770507812, -2.9551126956939697, -2.827148914337158, -2.699185371398926, -2.5712215900421143, -2.443258047103882, -2.3152942657470703, -2.187330722808838, -2.0593669414520264, -1.9314031600952148, -1.8034394979476929, -1.675475835800171, -1.5475120544433594, -1.4195483922958374, -1.2915847301483154, -1.163620948791504, -1.035657286643982, -0.9076935648918152, -0.7797298431396484, -0.6517661809921265, -0.5238024592399597, -0.39583897590637207, -0.2678752541542053, -0.13991156220436096, -0.011947870254516602, 0.11601585149765015, 0.2439795732498169, 0.37194323539733887, 0.4999069571495056, 0.6278706789016724, 0.7558344006538391, 0.8837981224060059, 1.0117617845535278, 1.1397254467010498, 1.2676892280578613, 1.3956528902053833, 1.5236165523529053, 1.6515803337097168, 1.7795439958572388, 1.9075077772140503, 2.0354714393615723, 2.163435220718384, 2.2913990020751953, 2.4193625450134277, 2.5473263263702393, 2.675290107727051, 2.8032538890838623, 2.9312174320220947, 3.0591812133789062, 3.1871449947357178, 3.3151087760925293, 3.4430723190307617, 3.5710361003875732, 3.6989996433258057]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 12.0, 13.0, 9.0, 13.0, 23.0, 35.0, 32.0, 29.0, 41.0, 55.0, 66.0, 61.0, 53.0, 63.0, 67.0, 55.0, 41.0, 56.0, 55.0, 42.0, 27.0, 28.0, 22.0, 23.0, 17.0, 21.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.8028132915496826, -3.7039666175842285, -3.6051201820373535, -3.5062735080718994, -3.4074270725250244, -3.3085803985595703, -3.2097339630126953, -3.110887289047241, -3.012040615081787, -2.913193941116333, -2.814347505569458, -2.715500831604004, -2.616654396057129, -2.517807722091675, -2.4189610481262207, -2.3201146125793457, -2.2212681770324707, -2.1224215030670166, -2.0235750675201416, -1.9247283935546875, -1.825881838798523, -1.7270352840423584, -1.6281887292861938, -1.5293421745300293, -1.4304955005645752, -1.3316489458084106, -1.232802391052246, -1.133955717086792, -1.0351091623306274, -0.9362626075744629, -0.8374160528182983, -0.738569438457489, -0.6397228240966797, -0.5408762693405151, -0.4420296549797058, -0.34318310022354126, -0.24433651566505432, -0.14548993110656738, -0.04664337635040283, 0.052203238010406494, 0.15104979276657104, 0.24989637732505798, 0.3487429618835449, 0.4475895166397095, 0.546436071395874, 0.6452826857566833, 0.7441292405128479, 0.8429758548736572, 0.9418224096298218, 1.0406689643859863, 1.1395155191421509, 1.2383620738983154, 1.3372087478637695, 1.436055302619934, 1.5349018573760986, 1.6337485313415527, 1.7325949668884277, 1.8314415216445923, 1.9302880764007568, 2.029134750366211, 2.127981185913086, 2.22682785987854, 2.325674533843994, 2.424520969390869, 2.5233676433563232]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 7.0, 13.0, 36.0, 22.0, 42.0, 62.0, 101.0, 153.0, 290.0, 549.0, 1260.0, 3028.0, 9263.0, 40415.0, 293162.0, 577431.0, 96677.0, 17533.0, 4918.0, 1746.0, 829.0, 407.0, 206.0, 133.0, 83.0, 43.0, 36.0, 21.0, 17.0, 12.0, 10.0, 4.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7158203125, -0.692901611328125, -0.66998291015625, -0.647064208984375, -0.6241455078125, -0.601226806640625, -0.57830810546875, -0.555389404296875, -0.532470703125, -0.509552001953125, -0.48663330078125, -0.463714599609375, -0.4407958984375, -0.417877197265625, -0.39495849609375, -0.372039794921875, -0.34912109375, -0.326202392578125, -0.30328369140625, -0.280364990234375, -0.2574462890625, -0.234527587890625, -0.21160888671875, -0.188690185546875, -0.165771484375, -0.142852783203125, -0.11993408203125, -0.097015380859375, -0.0740966796875, -0.051177978515625, -0.02825927734375, -0.005340576171875, 0.017578125, 0.040496826171875, 0.06341552734375, 0.086334228515625, 0.1092529296875, 0.132171630859375, 0.15509033203125, 0.178009033203125, 0.200927734375, 0.223846435546875, 0.24676513671875, 0.269683837890625, 0.2926025390625, 0.315521240234375, 0.33843994140625, 0.361358642578125, 0.38427734375, 0.407196044921875, 0.43011474609375, 0.453033447265625, 0.4759521484375, 0.498870849609375, 0.52178955078125, 0.544708251953125, 0.567626953125, 0.590545654296875, 0.61346435546875, 0.636383056640625, 0.6593017578125, 0.682220458984375, 0.70513916015625, 0.728057861328125, 0.7509765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 7.0, 14.0, 14.0, 23.0, 24.0, 22.0, 44.0, 44.0, 51.0, 56.0, 67.0, 77.0, 59.0, 69.0, 55.0, 64.0, 57.0, 51.0, 35.0, 32.0, 31.0, 22.0, 21.0, 16.0, 14.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.17523193359375, -2.1043701171875, -2.03350830078125, -1.962646484375, -1.89178466796875, -1.8209228515625, -1.75006103515625, -1.67919921875, -1.60833740234375, -1.5374755859375, -1.46661376953125, -1.395751953125, -1.32489013671875, -1.2540283203125, -1.18316650390625, -1.1123046875, -1.04144287109375, -0.9705810546875, -0.89971923828125, -0.828857421875, -0.75799560546875, -0.6871337890625, -0.61627197265625, -0.54541015625, -0.47454833984375, -0.4036865234375, -0.33282470703125, -0.261962890625, -0.19110107421875, -0.1202392578125, -0.04937744140625, 0.021484375, 0.09234619140625, 0.1632080078125, 0.23406982421875, 0.304931640625, 0.37579345703125, 0.4466552734375, 0.51751708984375, 0.58837890625, 0.65924072265625, 0.7301025390625, 0.80096435546875, 0.871826171875, 0.94268798828125, 1.0135498046875, 1.08441162109375, 1.1552734375, 1.22613525390625, 1.2969970703125, 1.36785888671875, 1.438720703125, 1.50958251953125, 1.5804443359375, 1.65130615234375, 1.72216796875, 1.79302978515625, 1.8638916015625, 1.93475341796875, 2.005615234375, 2.07647705078125, 2.1473388671875, 2.21820068359375, 2.2890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 19.0, 19.0, 24.0, 34.0, 54.0, 91.0, 113.0, 221.0, 344.0, 637.0, 1262.0, 2637.0, 5809.0, 16577.0, 58124.0, 238949.0, 464340.0, 190392.0, 45623.0, 13358.0, 5119.0, 2238.0, 1010.0, 584.0, 347.0, 191.0, 140.0, 85.0, 57.0, 40.0, 21.0, 14.0, 19.0, 12.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.49609375, -0.4828338623046875, -0.469573974609375, -0.4563140869140625, -0.44305419921875, -0.4297943115234375, -0.416534423828125, -0.4032745361328125, -0.3900146484375, -0.3767547607421875, -0.363494873046875, -0.3502349853515625, -0.33697509765625, -0.3237152099609375, -0.310455322265625, -0.2971954345703125, -0.283935546875, -0.2706756591796875, -0.257415771484375, -0.2441558837890625, -0.23089599609375, -0.2176361083984375, -0.204376220703125, -0.1911163330078125, -0.1778564453125, -0.1645965576171875, -0.151336669921875, -0.1380767822265625, -0.12481689453125, -0.1115570068359375, -0.098297119140625, -0.0850372314453125, -0.07177734375, -0.0585174560546875, -0.045257568359375, -0.0319976806640625, -0.01873779296875, -0.0054779052734375, 0.007781982421875, 0.0210418701171875, 0.0343017578125, 0.0475616455078125, 0.060821533203125, 0.0740814208984375, 0.08734130859375, 0.1006011962890625, 0.113861083984375, 0.1271209716796875, 0.140380859375, 0.1536407470703125, 0.166900634765625, 0.1801605224609375, 0.19342041015625, 0.2066802978515625, 0.219940185546875, 0.2332000732421875, 0.2464599609375, 0.2597198486328125, 0.272979736328125, 0.2862396240234375, 0.29949951171875, 0.3127593994140625, 0.326019287109375, 0.3392791748046875, 0.3525390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 10.0, 5.0, 7.0, 12.0, 17.0, 26.0, 18.0, 20.0, 20.0, 38.0, 33.0, 41.0, 51.0, 58.0, 54.0, 61.0, 71.0, 58.0, 51.0, 50.0, 46.0, 38.0, 39.0, 37.0, 27.0, 29.0, 28.0, 14.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.17578125, -4.061065673828125, -3.94635009765625, -3.831634521484375, -3.7169189453125, -3.602203369140625, -3.48748779296875, -3.372772216796875, -3.258056640625, -3.143341064453125, -3.02862548828125, -2.913909912109375, -2.7991943359375, -2.684478759765625, -2.56976318359375, -2.455047607421875, -2.34033203125, -2.225616455078125, -2.11090087890625, -1.996185302734375, -1.8814697265625, -1.766754150390625, -1.65203857421875, -1.537322998046875, -1.422607421875, -1.307891845703125, -1.19317626953125, -1.078460693359375, -0.9637451171875, -0.849029541015625, -0.73431396484375, -0.619598388671875, -0.5048828125, -0.390167236328125, -0.27545166015625, -0.160736083984375, -0.0460205078125, 0.068695068359375, 0.18341064453125, 0.298126220703125, 0.412841796875, 0.527557373046875, 0.64227294921875, 0.756988525390625, 0.8717041015625, 0.986419677734375, 1.10113525390625, 1.215850830078125, 1.33056640625, 1.445281982421875, 1.55999755859375, 1.674713134765625, 1.7894287109375, 1.904144287109375, 2.01885986328125, 2.133575439453125, 2.248291015625, 2.363006591796875, 2.47772216796875, 2.592437744140625, 2.7071533203125, 2.821868896484375, 2.93658447265625, 3.051300048828125, 3.166015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 14.0, 7.0, 7.0, 15.0, 19.0, 48.0, 47.0, 88.0, 155.0, 321.0, 589.0, 1228.0, 2783.0, 7110.0, 22831.0, 104706.0, 494179.0, 329133.0, 60742.0, 15220.0, 5202.0, 2078.0, 937.0, 456.0, 224.0, 161.0, 87.0, 62.0, 28.0, 32.0, 11.0, 14.0, 4.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.20093536376953125, -0.1953277587890625, -0.18972015380859375, -0.184112548828125, -0.17850494384765625, -0.1728973388671875, -0.16728973388671875, -0.16168212890625, -0.15607452392578125, -0.1504669189453125, -0.14485931396484375, -0.139251708984375, -0.13364410400390625, -0.1280364990234375, -0.12242889404296875, -0.1168212890625, -0.11121368408203125, -0.1056060791015625, -0.09999847412109375, -0.094390869140625, -0.08878326416015625, -0.0831756591796875, -0.07756805419921875, -0.07196044921875, -0.06635284423828125, -0.0607452392578125, -0.05513763427734375, -0.049530029296875, -0.04392242431640625, -0.0383148193359375, -0.03270721435546875, -0.027099609375, -0.02149200439453125, -0.0158843994140625, -0.01027679443359375, -0.004669189453125, 0.00093841552734375, 0.0065460205078125, 0.01215362548828125, 0.01776123046875, 0.02336883544921875, 0.0289764404296875, 0.03458404541015625, 0.040191650390625, 0.04579925537109375, 0.0514068603515625, 0.05701446533203125, 0.0626220703125, 0.06822967529296875, 0.0738372802734375, 0.07944488525390625, 0.085052490234375, 0.09066009521484375, 0.0962677001953125, 0.10187530517578125, 0.10748291015625, 0.11309051513671875, 0.1186981201171875, 0.12430572509765625, 0.129913330078125, 0.13552093505859375, 0.1411285400390625, 0.14673614501953125, 0.15234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 9.0, 11.0, 13.0, 11.0, 16.0, 31.0, 26.0, 29.0, 37.0, 56.0, 61.0, 81.0, 66.0, 79.0, 74.0, 66.0, 66.0, 46.0, 42.0, 43.0, 37.0, 23.0, 18.0, 8.0, 13.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208917617797852e-05, -8.940789848566055e-05, -8.672662079334259e-05, -8.404534310102463e-05, -8.136406540870667e-05, -7.86827877163887e-05, -7.600151002407074e-05, -7.332023233175278e-05, -7.063895463943481e-05, -6.795767694711685e-05, -6.527639925479889e-05, -6.259512156248093e-05, -5.9913843870162964e-05, -5.7232566177845e-05, -5.455128848552704e-05, -5.1870010793209076e-05, -4.918873310089111e-05, -4.650745540857315e-05, -4.382617771625519e-05, -4.1144900023937225e-05, -3.846362233161926e-05, -3.57823446393013e-05, -3.310106694698334e-05, -3.0419789254665375e-05, -2.7738511562347412e-05, -2.505723387002945e-05, -2.2375956177711487e-05, -1.9694678485393524e-05, -1.701340079307556e-05, -1.4332123100757599e-05, -1.1650845408439636e-05, -8.969567716121674e-06, -6.288290023803711e-06, -3.6070123314857483e-06, -9.257346391677856e-07, 1.755543053150177e-06, 4.43682074546814e-06, 7.118098437786102e-06, 9.799376130104065e-06, 1.2480653822422028e-05, 1.516193151473999e-05, 1.7843209207057953e-05, 2.0524486899375916e-05, 2.3205764591693878e-05, 2.588704228401184e-05, 2.8568319976329803e-05, 3.1249597668647766e-05, 3.393087536096573e-05, 3.661215305328369e-05, 3.9293430745601654e-05, 4.197470843791962e-05, 4.465598613023758e-05, 4.733726382255554e-05, 5.0018541514873505e-05, 5.269981920719147e-05, 5.538109689950943e-05, 5.806237459182739e-05, 6.0743652284145355e-05, 6.342492997646332e-05, 6.610620766878128e-05, 6.878748536109924e-05, 7.14687630534172e-05, 7.415004074573517e-05, 7.683131843805313e-05, 7.95125961303711e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 14.0, 19.0, 37.0, 44.0, 76.0, 195.0, 400.0, 777.0, 1872.0, 5334.0, 22871.0, 282742.0, 671391.0, 49536.0, 8487.0, 2671.0, 1034.0, 482.0, 253.0, 125.0, 64.0, 49.0, 22.0, 20.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.32990264892578125, -0.3199615478515625, -0.31002044677734375, -0.300079345703125, -0.29013824462890625, -0.2801971435546875, -0.27025604248046875, -0.26031494140625, -0.25037384033203125, -0.2404327392578125, -0.23049163818359375, -0.220550537109375, -0.21060943603515625, -0.2006683349609375, -0.19072723388671875, -0.1807861328125, -0.17084503173828125, -0.1609039306640625, -0.15096282958984375, -0.141021728515625, -0.13108062744140625, -0.1211395263671875, -0.11119842529296875, -0.10125732421875, -0.09131622314453125, -0.0813751220703125, -0.07143402099609375, -0.061492919921875, -0.05155181884765625, -0.0416107177734375, -0.03166961669921875, -0.021728515625, -0.01178741455078125, -0.0018463134765625, 0.00809478759765625, 0.018035888671875, 0.02797698974609375, 0.0379180908203125, 0.04785919189453125, 0.05780029296875, 0.06774139404296875, 0.0776824951171875, 0.08762359619140625, 0.097564697265625, 0.10750579833984375, 0.1174468994140625, 0.12738800048828125, 0.1373291015625, 0.14727020263671875, 0.1572113037109375, 0.16715240478515625, 0.177093505859375, 0.18703460693359375, 0.1969757080078125, 0.20691680908203125, 0.21685791015625, 0.22679901123046875, 0.2367401123046875, 0.24668121337890625, 0.256622314453125, 0.26656341552734375, 0.2765045166015625, 0.28644561767578125, 0.29638671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 8.0, 13.0, 22.0, 27.0, 36.0, 69.0, 82.0, 152.0, 166.0, 150.0, 107.0, 51.0, 38.0, 23.0, 13.0, 6.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.0611572265625, -0.05908203125, -0.0570068359375, -0.054931640625, -0.0528564453125, -0.05078125, -0.0487060546875, -0.046630859375, -0.0445556640625, -0.04248046875, -0.0404052734375, -0.038330078125, -0.0362548828125, -0.0341796875, -0.0321044921875, -0.030029296875, -0.0279541015625, -0.02587890625, -0.0238037109375, -0.021728515625, -0.0196533203125, -0.017578125, -0.0155029296875, -0.013427734375, -0.0113525390625, -0.00927734375, -0.0072021484375, -0.005126953125, -0.0030517578125, -0.0009765625, 0.0010986328125, 0.003173828125, 0.0052490234375, 0.00732421875, 0.0093994140625, 0.011474609375, 0.0135498046875, 0.015625, 0.0177001953125, 0.019775390625, 0.0218505859375, 0.02392578125, 0.0260009765625, 0.028076171875, 0.0301513671875, 0.0322265625, 0.0343017578125, 0.036376953125, 0.0384521484375, 0.04052734375, 0.0426025390625, 0.044677734375, 0.0467529296875, 0.048828125, 0.0509033203125, 0.052978515625, 0.0550537109375, 0.05712890625, 0.0592041015625, 0.061279296875, 0.0633544921875, 0.0654296875, 0.0675048828125, 0.069580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 19.0, 24.0, 33.0, 31.0, 70.0, 88.0, 118.0, 107.0, 127.0, 82.0, 65.0, 55.0, 36.0, 30.0, 17.0, 18.0, 16.0, 8.0, 5.0, 6.0, 1.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2435925006866455, -3.153115749359131, -3.062638998031616, -2.9721622467041016, -2.881685256958008, -2.791208505630493, -2.7007317543029785, -2.610255002975464, -2.519778251647949, -2.4293015003204346, -2.33882474899292, -2.2483479976654053, -2.1578712463378906, -2.067394256591797, -1.9769175052642822, -1.8864407539367676, -1.795964002609253, -1.7054872512817383, -1.6150104999542236, -1.5245336294174194, -1.4340568780899048, -1.3435801267623901, -1.253103256225586, -1.1626265048980713, -1.0721497535705566, -0.981673002243042, -0.8911961913108826, -0.8007193803787231, -0.7102426290512085, -0.6197658777236938, -0.5292890667915344, -0.438812255859375, -0.34833574295043945, -0.2578589618206024, -0.16738218069076538, -0.07690539956092834, 0.013571381568908691, 0.10404816269874573, 0.19452494382858276, 0.2850017547607422, 0.37547850608825684, 0.46595528721809387, 0.5564320683479309, 0.6469088792800903, 0.737385630607605, 0.8278623819351196, 0.918339192867279, 1.0088160037994385, 1.0992927551269531, 1.1897695064544678, 1.2802462577819824, 1.3707231283187866, 1.4611998796463013, 1.551676630973816, 1.6421535015106201, 1.7326302528381348, 1.8231070041656494, 1.913583755493164, 2.0040605068206787, 2.0945372581481934, 2.185014247894287, 2.2754909992218018, 2.3659677505493164, 2.456444501876831, 2.5469212532043457]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 12.0, 12.0, 20.0, 22.0, 35.0, 28.0, 46.0, 57.0, 59.0, 79.0, 64.0, 74.0, 91.0, 46.0, 66.0, 70.0, 45.0, 28.0, 33.0, 27.0, 20.0, 17.0, 14.0, 11.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.759587049484253, -2.686246871948242, -2.6129066944122314, -2.5395665168762207, -2.46622633934021, -2.392886161804199, -2.3195459842681885, -2.2462058067321777, -2.172865629196167, -2.0995254516601562, -2.0261852741241455, -1.9528450965881348, -1.879504919052124, -1.8061647415161133, -1.7328245639801025, -1.6594843864440918, -1.5861440896987915, -1.5128039121627808, -1.43946373462677, -1.3661235570907593, -1.2927833795547485, -1.2194432020187378, -1.1461029052734375, -1.0727627277374268, -0.9994226098060608, -0.92608243227005, -0.8527422547340393, -0.7794020175933838, -0.706061840057373, -0.6327216625213623, -0.5593814849853516, -0.4860413074493408, -0.41270124912261963, -0.3393610715866089, -0.26602089405059814, -0.19268068671226501, -0.11934050917625427, -0.04600033164024353, 0.0273398756980896, 0.10068005323410034, 0.17402023077011108, 0.24736040830612183, 0.32070058584213257, 0.3940407931804657, 0.46738097071647644, 0.5407211780548096, 0.6140613555908203, 0.687401533126831, 0.7607417106628418, 0.8340818881988525, 0.9074220657348633, 0.980762243270874, 1.0541024208068848, 1.1274425983428955, 1.2007827758789062, 1.274122953414917, 1.3474631309509277, 1.4208033084869385, 1.4941434860229492, 1.56748366355896, 1.6408238410949707, 1.7141640186309814, 1.7875041961669922, 1.860844373703003, 1.9341846704483032]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 14.0, 20.0, 28.0, 29.0, 48.0, 65.0, 110.0, 158.0, 310.0, 509.0, 912.0, 1704.0, 3366.0, 7353.0, 18630.0, 60834.0, 296499.0, 507023.0, 103733.0, 27608.0, 10160.0, 4573.0, 2173.0, 1164.0, 631.0, 348.0, 188.0, 121.0, 83.0, 52.0, 25.0, 21.0, 19.0, 14.0, 4.0, 8.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84765625, -2.75634765625, -2.6650390625, -2.57373046875, -2.482421875, -2.39111328125, -2.2998046875, -2.20849609375, -2.1171875, -2.02587890625, -1.9345703125, -1.84326171875, -1.751953125, -1.66064453125, -1.5693359375, -1.47802734375, -1.38671875, -1.29541015625, -1.2041015625, -1.11279296875, -1.021484375, -0.93017578125, -0.8388671875, -0.74755859375, -0.65625, -0.56494140625, -0.4736328125, -0.38232421875, -0.291015625, -0.19970703125, -0.1083984375, -0.01708984375, 0.07421875, 0.16552734375, 0.2568359375, 0.34814453125, 0.439453125, 0.53076171875, 0.6220703125, 0.71337890625, 0.8046875, 0.89599609375, 0.9873046875, 1.07861328125, 1.169921875, 1.26123046875, 1.3525390625, 1.44384765625, 1.53515625, 1.62646484375, 1.7177734375, 1.80908203125, 1.900390625, 1.99169921875, 2.0830078125, 2.17431640625, 2.265625, 2.35693359375, 2.4482421875, 2.53955078125, 2.630859375, 2.72216796875, 2.8134765625, 2.90478515625, 2.99609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 9.0, 3.0, 5.0, 16.0, 13.0, 12.0, 19.0, 27.0, 25.0, 26.0, 32.0, 37.0, 51.0, 62.0, 53.0, 65.0, 66.0, 75.0, 61.0, 46.0, 38.0, 44.0, 34.0, 28.0, 23.0, 15.0, 22.0, 20.0, 19.0, 11.0, 5.0, 12.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.28125, -4.14056396484375, -3.9998779296875, -3.85919189453125, -3.718505859375, -3.57781982421875, -3.4371337890625, -3.29644775390625, -3.15576171875, -3.01507568359375, -2.8743896484375, -2.73370361328125, -2.593017578125, -2.45233154296875, -2.3116455078125, -2.17095947265625, -2.0302734375, -1.88958740234375, -1.7489013671875, -1.60821533203125, -1.467529296875, -1.32684326171875, -1.1861572265625, -1.04547119140625, -0.90478515625, -0.76409912109375, -0.6234130859375, -0.48272705078125, -0.342041015625, -0.20135498046875, -0.0606689453125, 0.08001708984375, 0.220703125, 0.36138916015625, 0.5020751953125, 0.64276123046875, 0.783447265625, 0.92413330078125, 1.0648193359375, 1.20550537109375, 1.34619140625, 1.48687744140625, 1.6275634765625, 1.76824951171875, 1.908935546875, 2.04962158203125, 2.1903076171875, 2.33099365234375, 2.4716796875, 2.61236572265625, 2.7530517578125, 2.89373779296875, 3.034423828125, 3.17510986328125, 3.3157958984375, 3.45648193359375, 3.59716796875, 3.73785400390625, 3.8785400390625, 4.01922607421875, 4.159912109375, 4.30059814453125, 4.4412841796875, 4.58197021484375, 4.72265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 8.0, 14.0, 11.0, 15.0, 11.0, 17.0, 16.0, 26.0, 24.0, 23.0, 34.0, 24.0, 52.0, 45.0, 48.0, 104.0, 411.0, 5130.0, 725483.0, 312707.0, 3478.0, 354.0, 82.0, 62.0, 42.0, 33.0, 32.0, 25.0, 31.0, 27.0, 23.0, 12.0, 12.0, 22.0, 13.0, 11.0, 12.0, 13.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0], "bins": [-11.5546875, -11.19287109375, -10.8310546875, -10.46923828125, -10.107421875, -9.74560546875, -9.3837890625, -9.02197265625, -8.66015625, -8.29833984375, -7.9365234375, -7.57470703125, -7.212890625, -6.85107421875, -6.4892578125, -6.12744140625, -5.765625, -5.40380859375, -5.0419921875, -4.68017578125, -4.318359375, -3.95654296875, -3.5947265625, -3.23291015625, -2.87109375, -2.50927734375, -2.1474609375, -1.78564453125, -1.423828125, -1.06201171875, -0.7001953125, -0.33837890625, 0.0234375, 0.38525390625, 0.7470703125, 1.10888671875, 1.470703125, 1.83251953125, 2.1943359375, 2.55615234375, 2.91796875, 3.27978515625, 3.6416015625, 4.00341796875, 4.365234375, 4.72705078125, 5.0888671875, 5.45068359375, 5.8125, 6.17431640625, 6.5361328125, 6.89794921875, 7.259765625, 7.62158203125, 7.9833984375, 8.34521484375, 8.70703125, 9.06884765625, 9.4306640625, 9.79248046875, 10.154296875, 10.51611328125, 10.8779296875, 11.23974609375, 11.6015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 5.0, 7.0, 12.0, 7.0, 14.0, 17.0, 20.0, 21.0, 23.0, 15.0, 26.0, 33.0, 34.0, 38.0, 27.0, 27.0, 36.0, 45.0, 41.0, 39.0, 32.0, 40.0, 31.0, 43.0, 34.0, 28.0, 30.0, 31.0, 25.0, 23.0, 26.0, 21.0, 14.0, 22.0, 11.0, 12.0, 19.0, 8.0, 11.0, 2.0, 6.0, 5.0, 2.0, 4.0, 0.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.77734375, -3.65057373046875, -3.5238037109375, -3.39703369140625, -3.270263671875, -3.14349365234375, -3.0167236328125, -2.88995361328125, -2.76318359375, -2.63641357421875, -2.5096435546875, -2.38287353515625, -2.256103515625, -2.12933349609375, -2.0025634765625, -1.87579345703125, -1.7490234375, -1.62225341796875, -1.4954833984375, -1.36871337890625, -1.241943359375, -1.11517333984375, -0.9884033203125, -0.86163330078125, -0.73486328125, -0.60809326171875, -0.4813232421875, -0.35455322265625, -0.227783203125, -0.10101318359375, 0.0257568359375, 0.15252685546875, 0.279296875, 0.40606689453125, 0.5328369140625, 0.65960693359375, 0.786376953125, 0.91314697265625, 1.0399169921875, 1.16668701171875, 1.29345703125, 1.42022705078125, 1.5469970703125, 1.67376708984375, 1.800537109375, 1.92730712890625, 2.0540771484375, 2.18084716796875, 2.3076171875, 2.43438720703125, 2.5611572265625, 2.68792724609375, 2.814697265625, 2.94146728515625, 3.0682373046875, 3.19500732421875, 3.32177734375, 3.44854736328125, 3.5753173828125, 3.70208740234375, 3.828857421875, 3.95562744140625, 4.0823974609375, 4.20916748046875, 4.3359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 15.0, 23.0, 19.0, 50.0, 90.0, 139.0, 247.0, 488.0, 943.0, 2012.0, 5286.0, 18294.0, 114226.0, 736898.0, 138859.0, 20778.0, 5824.0, 2265.0, 1002.0, 484.0, 243.0, 136.0, 83.0, 48.0, 34.0, 16.0, 13.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2421875, -1.2028045654296875, -1.163421630859375, -1.1240386962890625, -1.08465576171875, -1.0452728271484375, -1.005889892578125, -0.9665069580078125, -0.9271240234375, -0.8877410888671875, -0.848358154296875, -0.8089752197265625, -0.76959228515625, -0.7302093505859375, -0.690826416015625, -0.6514434814453125, -0.612060546875, -0.5726776123046875, -0.533294677734375, -0.4939117431640625, -0.45452880859375, -0.4151458740234375, -0.375762939453125, -0.3363800048828125, -0.2969970703125, -0.2576141357421875, -0.218231201171875, -0.1788482666015625, -0.13946533203125, -0.1000823974609375, -0.060699462890625, -0.0213165283203125, 0.01806640625, 0.0574493408203125, 0.096832275390625, 0.1362152099609375, 0.17559814453125, 0.2149810791015625, 0.254364013671875, 0.2937469482421875, 0.3331298828125, 0.3725128173828125, 0.411895751953125, 0.4512786865234375, 0.49066162109375, 0.5300445556640625, 0.569427490234375, 0.6088104248046875, 0.648193359375, 0.6875762939453125, 0.726959228515625, 0.7663421630859375, 0.80572509765625, 0.8451080322265625, 0.884490966796875, 0.9238739013671875, 0.9632568359375, 1.0026397705078125, 1.042022705078125, 1.0814056396484375, 1.12078857421875, 1.1601715087890625, 1.199554443359375, 1.2389373779296875, 1.2783203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 2.0, 7.0, 8.0, 8.0, 8.0, 11.0, 16.0, 17.0, 34.0, 60.0, 65.0, 75.0, 84.0, 135.0, 90.0, 77.0, 61.0, 60.0, 44.0, 32.0, 18.0, 19.0, 11.0, 10.0, 10.0, 4.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00015783309936523438, -0.00015268847346305847, -0.00014754384756088257, -0.00014239922165870667, -0.00013725459575653076, -0.00013210996985435486, -0.00012696534395217896, -0.00012182071805000305, -0.00011667609214782715, -0.00011153146624565125, -0.00010638684034347534, -0.00010124221444129944, -9.609758853912354e-05, -9.095296263694763e-05, -8.580833673477173e-05, -8.066371083259583e-05, -7.551908493041992e-05, -7.037445902824402e-05, -6.522983312606812e-05, -6.008520722389221e-05, -5.494058132171631e-05, -4.9795955419540405e-05, -4.46513295173645e-05, -3.95067036151886e-05, -3.4362077713012695e-05, -2.9217451810836792e-05, -2.407282590866089e-05, -1.8928200006484985e-05, -1.3783574104309082e-05, -8.638948202133179e-06, -3.4943222999572754e-06, 1.650303602218628e-06, 6.794929504394531e-06, 1.1939555406570435e-05, 1.7084181308746338e-05, 2.222880721092224e-05, 2.7373433113098145e-05, 3.251805901527405e-05, 3.766268491744995e-05, 4.2807310819625854e-05, 4.795193672180176e-05, 5.309656262397766e-05, 5.8241188526153564e-05, 6.338581442832947e-05, 6.853044033050537e-05, 7.367506623268127e-05, 7.881969213485718e-05, 8.396431803703308e-05, 8.910894393920898e-05, 9.425356984138489e-05, 9.939819574356079e-05, 0.0001045428216457367, 0.0001096874475479126, 0.0001148320734500885, 0.0001199766993522644, 0.0001251213252544403, 0.0001302659511566162, 0.00013541057705879211, 0.00014055520296096802, 0.00014569982886314392, 0.00015084445476531982, 0.00015598908066749573, 0.00016113370656967163, 0.00016627833247184753, 0.00017142295837402344]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 4.0, 8.0, 10.0, 5.0, 24.0, 29.0, 40.0, 51.0, 76.0, 132.0, 197.0, 320.0, 546.0, 1049.0, 2164.0, 5183.0, 14551.0, 58375.0, 384336.0, 480786.0, 72006.0, 17373.0, 6005.0, 2515.0, 1161.0, 603.0, 368.0, 212.0, 134.0, 90.0, 59.0, 34.0, 24.0, 24.0, 17.0, 15.0, 8.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96728515625, -0.9361495971679688, -0.9050140380859375, -0.8738784790039062, -0.842742919921875, -0.8116073608398438, -0.7804718017578125, -0.7493362426757812, -0.71820068359375, -0.6870651245117188, -0.6559295654296875, -0.6247940063476562, -0.593658447265625, -0.5625228881835938, -0.5313873291015625, -0.5002517700195312, -0.4691162109375, -0.43798065185546875, -0.4068450927734375, -0.37570953369140625, -0.344573974609375, -0.31343841552734375, -0.2823028564453125, -0.25116729736328125, -0.22003173828125, -0.18889617919921875, -0.1577606201171875, -0.12662506103515625, -0.095489501953125, -0.06435394287109375, -0.0332183837890625, -0.00208282470703125, 0.029052734375, 0.06018829345703125, 0.0913238525390625, 0.12245941162109375, 0.153594970703125, 0.18473052978515625, 0.2158660888671875, 0.24700164794921875, 0.27813720703125, 0.30927276611328125, 0.3404083251953125, 0.37154388427734375, 0.402679443359375, 0.43381500244140625, 0.4649505615234375, 0.49608612060546875, 0.5272216796875, 0.5583572387695312, 0.5894927978515625, 0.6206283569335938, 0.651763916015625, 0.6828994750976562, 0.7140350341796875, 0.7451705932617188, 0.77630615234375, 0.8074417114257812, 0.8385772705078125, 0.8697128295898438, 0.900848388671875, 0.9319839477539062, 0.9631195068359375, 0.9942550659179688, 1.025390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 8.0, 6.0, 8.0, 21.0, 21.0, 22.0, 29.0, 28.0, 60.0, 78.0, 87.0, 94.0, 107.0, 83.0, 76.0, 75.0, 54.0, 36.0, 30.0, 17.0, 14.0, 4.0, 6.0, 6.0, 10.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3915596008300781, -0.37662506103515625, -0.3616905212402344, -0.3467559814453125, -0.3318214416503906, -0.31688690185546875, -0.3019523620605469, -0.287017822265625, -0.2720832824707031, -0.25714874267578125, -0.24221420288085938, -0.2272796630859375, -0.21234512329101562, -0.19741058349609375, -0.18247604370117188, -0.16754150390625, -0.15260696411132812, -0.13767242431640625, -0.12273788452148438, -0.1078033447265625, -0.09286880493164062, -0.07793426513671875, -0.06299972534179688, -0.048065185546875, -0.033130645751953125, -0.01819610595703125, -0.003261566162109375, 0.0116729736328125, 0.026607513427734375, 0.04154205322265625, 0.056476593017578125, 0.0714111328125, 0.08634567260742188, 0.10128021240234375, 0.11621475219726562, 0.1311492919921875, 0.14608383178710938, 0.16101837158203125, 0.17595291137695312, 0.190887451171875, 0.20582199096679688, 0.22075653076171875, 0.23569107055664062, 0.2506256103515625, 0.2655601501464844, 0.28049468994140625, 0.2954292297363281, 0.31036376953125, 0.3252983093261719, 0.34023284912109375, 0.3551673889160156, 0.3701019287109375, 0.3850364685058594, 0.39997100830078125, 0.4149055480957031, 0.429840087890625, 0.4447746276855469, 0.45970916748046875, 0.4746437072753906, 0.4895782470703125, 0.5045127868652344, 0.5194473266601562, 0.5343818664550781, 0.54931640625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 10.0, 11.0, 20.0, 35.0, 52.0, 128.0, 207.0, 203.0, 152.0, 73.0, 52.0, 25.0, 16.0, 11.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.38946008682251, -5.03520393371582, -4.680947780609131, -4.326691627502441, -3.972435712814331, -3.6181795597076416, -3.2639236450195312, -2.909667491912842, -2.5554113388061523, -2.201155185699463, -1.846899151802063, -1.492643117904663, -1.1383869647979736, -0.7841308116912842, -0.42987489700317383, -0.07561874389648438, 0.2786374092102051, 0.6328935027122498, 0.9871495962142944, 1.3414056301116943, 1.6956617832183838, 2.0499179363250732, 2.4041738510131836, 2.758430004119873, 3.1126861572265625, 3.466942310333252, 3.8211984634399414, 4.175454139709473, 4.52971076965332, 4.883966445922852, 5.238222599029541, 5.5924787521362305, 5.946735382080078, 6.300991535186768, 6.655247688293457, 7.009503364562988, 7.363759994506836, 7.718015670776367, 8.072271347045898, 8.426527976989746, 8.780784606933594, 9.135040283203125, 9.489296913146973, 9.843552589416504, 10.197809219360352, 10.552064895629883, 10.906320571899414, 11.260577201843262, 11.614832878112793, 11.969088554382324, 12.323345184326172, 12.677600860595703, 13.03185749053955, 13.386113166809082, 13.74036979675293, 14.094625473022461, 14.448881149291992, 14.803136825561523, 15.157393455505371, 15.511649131774902, 15.86590576171875, 16.22016143798828, 16.574417114257812, 16.928672790527344, 17.282930374145508]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 2.0, 9.0, 11.0, 13.0, 12.0, 14.0, 17.0, 27.0, 18.0, 36.0, 32.0, 30.0, 34.0, 36.0, 37.0, 30.0, 38.0, 43.0, 43.0, 36.0, 54.0, 41.0, 38.0, 30.0, 37.0, 49.0, 19.0, 26.0, 24.0, 20.0, 23.0, 15.0, 18.0, 13.0, 12.0, 8.0, 8.0, 10.0, 5.0, 2.0, 5.0, 7.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1865620613098145, -6.943087577819824, -6.699612617492676, -6.4561381340026855, -6.212663650512695, -5.969188690185547, -5.725714206695557, -5.482239723205566, -5.238764762878418, -4.995290279388428, -4.751815319061279, -4.508340835571289, -4.264866352081299, -4.021391868591309, -3.77791690826416, -3.53444242477417, -3.2909679412841797, -3.0474932193756104, -2.80401873588562, -2.560544013977051, -2.3170695304870605, -2.073594808578491, -1.8301200866699219, -1.586645483970642, -1.3431708812713623, -1.0996962785720825, -0.856221616268158, -0.6127469539642334, -0.3692723512649536, -0.12579774856567383, 0.11767697334289551, 0.3611515760421753, 0.6046266555786133, 0.8481012582778931, 1.0915758609771729, 1.3350505828857422, 1.578525185585022, 1.8219997882843018, 2.065474510192871, 2.3089489936828613, 2.5524237155914307, 2.7958984375, 3.0393729209899902, 3.2828476428985596, 3.526322364807129, 3.769796848297119, 4.013271331787109, 4.256746292114258, 4.500220775604248, 4.743695259094238, 4.987170219421387, 5.230644702911377, 5.474119186401367, 5.717594146728516, 5.961068630218506, 6.204543113708496, 6.4480180740356445, 6.691492557525635, 6.934967517852783, 7.178442001342773, 7.421916484832764, 7.665390968322754, 7.908865928649902, 8.15234088897705, 8.395814895629883]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 6.0, 16.0, 25.0, 28.0, 50.0, 63.0, 115.0, 136.0, 220.0, 354.0, 657.0, 1183.0, 2451.0, 5655.0, 16456.0, 71271.0, 992198.0, 2938674.0, 127088.0, 23582.0, 7538.0, 3099.0, 1465.0, 755.0, 432.0, 262.0, 170.0, 89.0, 61.0, 42.0, 37.0, 32.0, 16.0, 19.0, 8.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.181640625, -3.059967041015625, -2.93829345703125, -2.816619873046875, -2.6949462890625, -2.573272705078125, -2.45159912109375, -2.329925537109375, -2.208251953125, -2.086578369140625, -1.96490478515625, -1.843231201171875, -1.7215576171875, -1.599884033203125, -1.47821044921875, -1.356536865234375, -1.23486328125, -1.113189697265625, -0.99151611328125, -0.869842529296875, -0.7481689453125, -0.626495361328125, -0.50482177734375, -0.383148193359375, -0.261474609375, -0.139801025390625, -0.01812744140625, 0.103546142578125, 0.2252197265625, 0.346893310546875, 0.46856689453125, 0.590240478515625, 0.7119140625, 0.833587646484375, 0.95526123046875, 1.076934814453125, 1.1986083984375, 1.320281982421875, 1.44195556640625, 1.563629150390625, 1.685302734375, 1.806976318359375, 1.92864990234375, 2.050323486328125, 2.1719970703125, 2.293670654296875, 2.41534423828125, 2.537017822265625, 2.65869140625, 2.780364990234375, 2.90203857421875, 3.023712158203125, 3.1453857421875, 3.267059326171875, 3.38873291015625, 3.510406494140625, 3.632080078125, 3.753753662109375, 3.87542724609375, 3.997100830078125, 4.1187744140625, 4.240447998046875, 4.36212158203125, 4.483795166015625, 4.60546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 6.0, 9.0, 13.0, 16.0, 36.0, 28.0, 38.0, 45.0, 59.0, 65.0, 70.0, 77.0, 58.0, 62.0, 82.0, 54.0, 62.0, 49.0, 32.0, 26.0, 22.0, 22.0, 16.0, 11.0, 13.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.802154541015625, -2.71368408203125, -2.625213623046875, -2.5367431640625, -2.448272705078125, -2.35980224609375, -2.271331787109375, -2.182861328125, -2.094390869140625, -2.00592041015625, -1.917449951171875, -1.8289794921875, -1.740509033203125, -1.65203857421875, -1.563568115234375, -1.47509765625, -1.386627197265625, -1.29815673828125, -1.209686279296875, -1.1212158203125, -1.032745361328125, -0.94427490234375, -0.855804443359375, -0.767333984375, -0.678863525390625, -0.59039306640625, -0.501922607421875, -0.4134521484375, -0.324981689453125, -0.23651123046875, -0.148040771484375, -0.0595703125, 0.028900146484375, 0.11737060546875, 0.205841064453125, 0.2943115234375, 0.382781982421875, 0.47125244140625, 0.559722900390625, 0.648193359375, 0.736663818359375, 0.82513427734375, 0.913604736328125, 1.0020751953125, 1.090545654296875, 1.17901611328125, 1.267486572265625, 1.35595703125, 1.444427490234375, 1.53289794921875, 1.621368408203125, 1.7098388671875, 1.798309326171875, 1.88677978515625, 1.975250244140625, 2.063720703125, 2.152191162109375, 2.24066162109375, 2.329132080078125, 2.4176025390625, 2.506072998046875, 2.59454345703125, 2.683013916015625, 2.771484375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 11.0, 7.0, 11.0, 21.0, 30.0, 45.0, 85.0, 127.0, 342.0, 1472.0, 27982.0, 4120721.0, 40904.0, 1743.0, 397.0, 153.0, 70.0, 54.0, 27.0, 28.0, 16.0, 7.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.2430419921875, -13.853271484375, -13.4635009765625, -13.07373046875, -12.6839599609375, -12.294189453125, -11.9044189453125, -11.5146484375, -11.1248779296875, -10.735107421875, -10.3453369140625, -9.95556640625, -9.5657958984375, -9.176025390625, -8.7862548828125, -8.396484375, -8.0067138671875, -7.616943359375, -7.2271728515625, -6.83740234375, -6.4476318359375, -6.057861328125, -5.6680908203125, -5.2783203125, -4.8885498046875, -4.498779296875, -4.1090087890625, -3.71923828125, -3.3294677734375, -2.939697265625, -2.5499267578125, -2.16015625, -1.7703857421875, -1.380615234375, -0.9908447265625, -0.60107421875, -0.2113037109375, 0.178466796875, 0.5682373046875, 0.9580078125, 1.3477783203125, 1.737548828125, 2.1273193359375, 2.51708984375, 2.9068603515625, 3.296630859375, 3.6864013671875, 4.076171875, 4.4659423828125, 4.855712890625, 5.2454833984375, 5.63525390625, 6.0250244140625, 6.414794921875, 6.8045654296875, 7.1943359375, 7.5841064453125, 7.973876953125, 8.3636474609375, 8.75341796875, 9.1431884765625, 9.532958984375, 9.9227294921875, 10.3125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 21.0, 14.0, 17.0, 29.0, 26.0, 43.0, 74.0, 96.0, 166.0, 273.0, 457.0, 1092.0, 755.0, 378.0, 195.0, 122.0, 92.0, 58.0, 48.0, 24.0, 21.0, 16.0, 17.0, 6.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.97039794921875, -0.9407958984375, -0.91119384765625, -0.881591796875, -0.85198974609375, -0.8223876953125, -0.79278564453125, -0.76318359375, -0.73358154296875, -0.7039794921875, -0.67437744140625, -0.644775390625, -0.61517333984375, -0.5855712890625, -0.55596923828125, -0.5263671875, -0.49676513671875, -0.4671630859375, -0.43756103515625, -0.407958984375, -0.37835693359375, -0.3487548828125, -0.31915283203125, -0.28955078125, -0.25994873046875, -0.2303466796875, -0.20074462890625, -0.171142578125, -0.14154052734375, -0.1119384765625, -0.08233642578125, -0.052734375, -0.02313232421875, 0.0064697265625, 0.03607177734375, 0.065673828125, 0.09527587890625, 0.1248779296875, 0.15447998046875, 0.18408203125, 0.21368408203125, 0.2432861328125, 0.27288818359375, 0.302490234375, 0.33209228515625, 0.3616943359375, 0.39129638671875, 0.4208984375, 0.45050048828125, 0.4801025390625, 0.50970458984375, 0.539306640625, 0.56890869140625, 0.5985107421875, 0.62811279296875, 0.65771484375, 0.68731689453125, 0.7169189453125, 0.74652099609375, 0.776123046875, 0.80572509765625, 0.8353271484375, 0.86492919921875, 0.89453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 8.0, 6.0, 9.0, 18.0, 19.0, 27.0, 48.0, 72.0, 73.0, 100.0, 104.0, 111.0, 96.0, 87.0, 52.0, 37.0, 40.0, 17.0, 12.0, 8.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.718958854675293, -3.6025497913360596, -3.486140727996826, -3.3697316646575928, -3.2533226013183594, -3.136913537979126, -3.0205044746398926, -2.9040956497192383, -2.787686347961426, -2.6712772846221924, -2.554868221282959, -2.4384591579437256, -2.322050094604492, -2.205641031265259, -2.0892319679260254, -1.9728230237960815, -1.8564140796661377, -1.7400050163269043, -1.623595952987671, -1.5071868896484375, -1.390777826309204, -1.2743687629699707, -1.1579598188400269, -1.0415507555007935, -0.9251416921615601, -0.8087326288223267, -0.6923235654830933, -0.5759145617485046, -0.45950549840927124, -0.34309643507003784, -0.22668743133544922, -0.11027836799621582, 0.0061304569244384766, 0.12253950536251068, 0.23894855380058289, 0.3553575873374939, 0.4717666506767273, 0.5881757140159607, 0.7045847177505493, 0.8209937810897827, 0.9374028444290161, 1.0538119077682495, 1.170220971107483, 1.2866299152374268, 1.4030389785766602, 1.5194480419158936, 1.635857105255127, 1.7522661685943604, 1.8686752319335938, 1.9850842952728271, 2.1014933586120605, 2.217902421951294, 2.3343114852905273, 2.4507205486297607, 2.567129611968994, 2.6835384368896484, 2.799947738647461, 2.9163568019866943, 3.0327658653259277, 3.149174928665161, 3.2655839920043945, 3.381993055343628, 3.4984021186828613, 3.6148109436035156, 3.731220006942749]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 12.0, 17.0, 20.0, 21.0, 33.0, 31.0, 35.0, 38.0, 55.0, 55.0, 64.0, 74.0, 61.0, 51.0, 67.0, 58.0, 60.0, 49.0, 41.0, 32.0, 25.0, 22.0, 15.0, 12.0, 10.0, 11.0, 7.0, 7.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.964372158050537, -2.870063543319702, -2.775754928588867, -2.6814465522766113, -2.5871379375457764, -2.4928293228149414, -2.3985207080841064, -2.3042120933532715, -2.2099037170410156, -2.1155951023101807, -2.0212864875793457, -1.9269779920578003, -1.8326694965362549, -1.73836088180542, -1.644052267074585, -1.54974365234375, -1.455435037612915, -1.36112642288208, -1.2668179273605347, -1.1725093126296997, -1.0782008171081543, -0.9838922023773193, -0.8895835876464844, -0.7952750325202942, -0.700966477394104, -0.6066579222679138, -0.5123493671417236, -0.41804075241088867, -0.3237321972846985, -0.2294236421585083, -0.13511502742767334, -0.040806472301483154, 0.05350208282470703, 0.1478106528520584, 0.2421192228794098, 0.33642780780792236, 0.43073636293411255, 0.5250449180603027, 0.6193535327911377, 0.7136620879173279, 0.8079706430435181, 0.9022791981697083, 0.9965877532958984, 1.0908963680267334, 1.1852049827575684, 1.2795134782791138, 1.3738220930099487, 1.4681305885314941, 1.562439203262329, 1.656747817993164, 1.7510563135147095, 1.8453649282455444, 1.9396734237670898, 2.033982038497925, 2.1282906532287598, 2.2225992679595947, 2.3169078826904297, 2.4112164974212646, 2.5055251121520996, 2.5998334884643555, 2.6941421031951904, 2.7884507179260254, 2.8827593326568604, 2.9770679473876953, 3.071376323699951]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 8.0, 10.0, 15.0, 30.0, 42.0, 62.0, 98.0, 208.0, 471.0, 1231.0, 3376.0, 12123.0, 59278.0, 370261.0, 491907.0, 86372.0, 16438.0, 4167.0, 1365.0, 520.0, 245.0, 119.0, 59.0, 46.0, 27.0, 14.0, 18.0, 13.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4714012145996094, -0.45574188232421875, -0.4400825500488281, -0.4244232177734375, -0.4087638854980469, -0.39310455322265625, -0.3774452209472656, -0.361785888671875, -0.3461265563964844, -0.33046722412109375, -0.3148078918457031, -0.2991485595703125, -0.2834892272949219, -0.26782989501953125, -0.2521705627441406, -0.23651123046875, -0.22085189819335938, -0.20519256591796875, -0.18953323364257812, -0.1738739013671875, -0.15821456909179688, -0.14255523681640625, -0.12689590454101562, -0.111236572265625, -0.09557723999023438, -0.07991790771484375, -0.06425857543945312, -0.0485992431640625, -0.032939910888671875, -0.01728057861328125, -0.001621246337890625, 0.0140380859375, 0.029697418212890625, 0.04535675048828125, 0.061016082763671875, 0.0766754150390625, 0.09233474731445312, 0.10799407958984375, 0.12365341186523438, 0.139312744140625, 0.15497207641601562, 0.17063140869140625, 0.18629074096679688, 0.2019500732421875, 0.21760940551757812, 0.23326873779296875, 0.24892807006835938, 0.26458740234375, 0.2802467346191406, 0.29590606689453125, 0.3115653991699219, 0.3272247314453125, 0.3428840637207031, 0.35854339599609375, 0.3742027282714844, 0.389862060546875, 0.4055213928222656, 0.42118072509765625, 0.4368400573730469, 0.4524993896484375, 0.4681587219238281, 0.48381805419921875, 0.4994773864746094, 0.51513671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 14.0, 16.0, 17.0, 29.0, 32.0, 45.0, 59.0, 66.0, 82.0, 90.0, 86.0, 70.0, 85.0, 68.0, 58.0, 45.0, 25.0, 24.0, 15.0, 14.0, 7.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.8203125, -2.74053955078125, -2.6607666015625, -2.58099365234375, -2.501220703125, -2.42144775390625, -2.3416748046875, -2.26190185546875, -2.18212890625, -2.10235595703125, -2.0225830078125, -1.94281005859375, -1.863037109375, -1.78326416015625, -1.7034912109375, -1.62371826171875, -1.5439453125, -1.46417236328125, -1.3843994140625, -1.30462646484375, -1.224853515625, -1.14508056640625, -1.0653076171875, -0.98553466796875, -0.90576171875, -0.82598876953125, -0.7462158203125, -0.66644287109375, -0.586669921875, -0.50689697265625, -0.4271240234375, -0.34735107421875, -0.267578125, -0.18780517578125, -0.1080322265625, -0.02825927734375, 0.051513671875, 0.13128662109375, 0.2110595703125, 0.29083251953125, 0.37060546875, 0.45037841796875, 0.5301513671875, 0.60992431640625, 0.689697265625, 0.76947021484375, 0.8492431640625, 0.92901611328125, 1.0087890625, 1.08856201171875, 1.1683349609375, 1.24810791015625, 1.327880859375, 1.40765380859375, 1.4874267578125, 1.56719970703125, 1.64697265625, 1.72674560546875, 1.8065185546875, 1.88629150390625, 1.966064453125, 2.04583740234375, 2.1256103515625, 2.20538330078125, 2.28515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 7.0, 18.0, 15.0, 23.0, 30.0, 46.0, 67.0, 92.0, 120.0, 181.0, 311.0, 475.0, 948.0, 1865.0, 4090.0, 11101.0, 33998.0, 118573.0, 341070.0, 352817.0, 126051.0, 36329.0, 11511.0, 4487.0, 1886.0, 955.0, 515.0, 310.0, 193.0, 153.0, 93.0, 71.0, 40.0, 34.0, 27.0, 17.0, 14.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2750968933105469, -0.26528167724609375, -0.2554664611816406, -0.2456512451171875, -0.23583602905273438, -0.22602081298828125, -0.21620559692382812, -0.206390380859375, -0.19657516479492188, -0.18675994873046875, -0.17694473266601562, -0.1671295166015625, -0.15731430053710938, -0.14749908447265625, -0.13768386840820312, -0.12786865234375, -0.11805343627929688, -0.10823822021484375, -0.09842300415039062, -0.0886077880859375, -0.07879257202148438, -0.06897735595703125, -0.059162139892578125, -0.049346923828125, -0.039531707763671875, -0.02971649169921875, -0.019901275634765625, -0.0100860595703125, -0.000270843505859375, 0.00954437255859375, 0.019359588623046875, 0.0291748046875, 0.038990020751953125, 0.04880523681640625, 0.058620452880859375, 0.0684356689453125, 0.07825088500976562, 0.08806610107421875, 0.09788131713867188, 0.107696533203125, 0.11751174926757812, 0.12732696533203125, 0.13714218139648438, 0.1469573974609375, 0.15677261352539062, 0.16658782958984375, 0.17640304565429688, 0.18621826171875, 0.19603347778320312, 0.20584869384765625, 0.21566390991210938, 0.2254791259765625, 0.23529434204101562, 0.24510955810546875, 0.2549247741699219, 0.264739990234375, 0.2745552062988281, 0.28437042236328125, 0.2941856384277344, 0.3040008544921875, 0.3138160705566406, 0.32363128662109375, 0.3334465026855469, 0.34326171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 6.0, 5.0, 14.0, 17.0, 18.0, 17.0, 31.0, 32.0, 35.0, 42.0, 52.0, 40.0, 45.0, 49.0, 44.0, 63.0, 65.0, 43.0, 64.0, 45.0, 46.0, 33.0, 33.0, 25.0, 26.0, 24.0, 10.0, 16.0, 8.0, 9.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.92083740234375, -2.8143310546875, -2.70782470703125, -2.601318359375, -2.49481201171875, -2.3883056640625, -2.28179931640625, -2.17529296875, -2.06878662109375, -1.9622802734375, -1.85577392578125, -1.749267578125, -1.64276123046875, -1.5362548828125, -1.42974853515625, -1.3232421875, -1.21673583984375, -1.1102294921875, -1.00372314453125, -0.897216796875, -0.79071044921875, -0.6842041015625, -0.57769775390625, -0.47119140625, -0.36468505859375, -0.2581787109375, -0.15167236328125, -0.045166015625, 0.06134033203125, 0.1678466796875, 0.27435302734375, 0.380859375, 0.48736572265625, 0.5938720703125, 0.70037841796875, 0.806884765625, 0.91339111328125, 1.0198974609375, 1.12640380859375, 1.23291015625, 1.33941650390625, 1.4459228515625, 1.55242919921875, 1.658935546875, 1.76544189453125, 1.8719482421875, 1.97845458984375, 2.0849609375, 2.19146728515625, 2.2979736328125, 2.40447998046875, 2.510986328125, 2.61749267578125, 2.7239990234375, 2.83050537109375, 2.93701171875, 3.04351806640625, 3.1500244140625, 3.25653076171875, 3.363037109375, 3.46954345703125, 3.5760498046875, 3.68255615234375, 3.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 4.0, 12.0, 15.0, 29.0, 52.0, 67.0, 137.0, 303.0, 659.0, 1832.0, 7820.0, 101507.0, 886482.0, 42041.0, 5123.0, 1415.0, 540.0, 216.0, 125.0, 65.0, 36.0, 22.0, 15.0, 12.0, 1.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43505859375, -0.42240142822265625, -0.4097442626953125, -0.39708709716796875, -0.384429931640625, -0.37177276611328125, -0.3591156005859375, -0.34645843505859375, -0.33380126953125, -0.32114410400390625, -0.3084869384765625, -0.29582977294921875, -0.283172607421875, -0.27051544189453125, -0.2578582763671875, -0.24520111083984375, -0.2325439453125, -0.21988677978515625, -0.2072296142578125, -0.19457244873046875, -0.181915283203125, -0.16925811767578125, -0.1566009521484375, -0.14394378662109375, -0.13128662109375, -0.11862945556640625, -0.1059722900390625, -0.09331512451171875, -0.080657958984375, -0.06800079345703125, -0.0553436279296875, -0.04268646240234375, -0.030029296875, -0.01737213134765625, -0.0047149658203125, 0.00794219970703125, 0.020599365234375, 0.03325653076171875, 0.0459136962890625, 0.05857086181640625, 0.07122802734375, 0.08388519287109375, 0.0965423583984375, 0.10919952392578125, 0.121856689453125, 0.13451385498046875, 0.1471710205078125, 0.15982818603515625, 0.1724853515625, 0.18514251708984375, 0.1977996826171875, 0.21045684814453125, 0.223114013671875, 0.23577117919921875, 0.2484283447265625, 0.26108551025390625, 0.27374267578125, 0.28639984130859375, 0.2990570068359375, 0.31171417236328125, 0.324371337890625, 0.33702850341796875, 0.3496856689453125, 0.36234283447265625, 0.375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 6.0, 10.0, 14.0, 16.0, 35.0, 52.0, 78.0, 95.0, 94.0, 116.0, 123.0, 87.0, 88.0, 56.0, 33.0, 31.0, 14.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010162591934204102, -9.807851165533066e-05, -9.45311039686203e-05, -9.098369628190994e-05, -8.743628859519958e-05, -8.388888090848923e-05, -8.034147322177887e-05, -7.679406553506851e-05, -7.324665784835815e-05, -6.96992501616478e-05, -6.615184247493744e-05, -6.260443478822708e-05, -5.9057027101516724e-05, -5.5509619414806366e-05, -5.196221172809601e-05, -4.841480404138565e-05, -4.486739635467529e-05, -4.1319988667964935e-05, -3.777258098125458e-05, -3.422517329454422e-05, -3.067776560783386e-05, -2.7130357921123505e-05, -2.3582950234413147e-05, -2.003554254770279e-05, -1.648813486099243e-05, -1.2940727174282074e-05, -9.393319487571716e-06, -5.845911800861359e-06, -2.298504114151001e-06, 1.2489035725593567e-06, 4.796311259269714e-06, 8.343718945980072e-06, 1.189112663269043e-05, 1.5438534319400787e-05, 1.8985942006111145e-05, 2.2533349692821503e-05, 2.608075737953186e-05, 2.9628165066242218e-05, 3.3175572752952576e-05, 3.672298043966293e-05, 4.027038812637329e-05, 4.381779581308365e-05, 4.7365203499794006e-05, 5.0912611186504364e-05, 5.446001887321472e-05, 5.800742655992508e-05, 6.155483424663544e-05, 6.51022419333458e-05, 6.864964962005615e-05, 7.219705730676651e-05, 7.574446499347687e-05, 7.929187268018723e-05, 8.283928036689758e-05, 8.638668805360794e-05, 8.99340957403183e-05, 9.348150342702866e-05, 9.702891111373901e-05, 0.00010057631880044937, 0.00010412372648715973, 0.00010767113417387009, 0.00011121854186058044, 0.0001147659495472908, 0.00011831335723400116, 0.00012186076492071152, 0.00012540817260742188]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 11.0, 19.0, 25.0, 34.0, 52.0, 69.0, 149.0, 187.0, 368.0, 714.0, 1501.0, 4258.0, 19823.0, 342446.0, 640002.0, 29756.0, 5344.0, 1872.0, 816.0, 439.0, 233.0, 147.0, 98.0, 54.0, 49.0, 30.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.383544921875, -0.3734779357910156, -0.36341094970703125, -0.3533439636230469, -0.3432769775390625, -0.3332099914550781, -0.32314300537109375, -0.3130760192871094, -0.303009033203125, -0.2929420471191406, -0.28287506103515625, -0.2728080749511719, -0.2627410888671875, -0.2526741027832031, -0.24260711669921875, -0.23254013061523438, -0.22247314453125, -0.21240615844726562, -0.20233917236328125, -0.19227218627929688, -0.1822052001953125, -0.17213821411132812, -0.16207122802734375, -0.15200424194335938, -0.141937255859375, -0.13187026977539062, -0.12180328369140625, -0.11173629760742188, -0.1016693115234375, -0.09160232543945312, -0.08153533935546875, -0.07146835327148438, -0.0614013671875, -0.051334381103515625, -0.04126739501953125, -0.031200408935546875, -0.0211334228515625, -0.011066436767578125, -0.00099945068359375, 0.009067535400390625, 0.019134521484375, 0.029201507568359375, 0.03926849365234375, 0.049335479736328125, 0.0594024658203125, 0.06946945190429688, 0.07953643798828125, 0.08960342407226562, 0.09967041015625, 0.10973739624023438, 0.11980438232421875, 0.12987136840820312, 0.1399383544921875, 0.15000534057617188, 0.16007232666015625, 0.17013931274414062, 0.180206298828125, 0.19027328491210938, 0.20034027099609375, 0.21040725708007812, 0.2204742431640625, 0.23054122924804688, 0.24060821533203125, 0.2506752014160156, 0.2607421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 13.0, 19.0, 38.0, 53.0, 78.0, 128.0, 181.0, 158.0, 118.0, 73.0, 46.0, 26.0, 8.0, 10.0, 13.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.044464111328125, -0.0427403450012207, -0.041016578674316406, -0.03929281234741211, -0.03756904602050781, -0.035845279693603516, -0.03412151336669922, -0.03239774703979492, -0.030673980712890625, -0.028950214385986328, -0.02722644805908203, -0.025502681732177734, -0.023778915405273438, -0.02205514907836914, -0.020331382751464844, -0.018607616424560547, -0.01688385009765625, -0.015160083770751953, -0.013436317443847656, -0.01171255111694336, -0.009988784790039062, -0.008265018463134766, -0.006541252136230469, -0.004817485809326172, -0.003093719482421875, -0.0013699531555175781, 0.00035381317138671875, 0.0020775794982910156, 0.0038013458251953125, 0.005525112152099609, 0.007248878479003906, 0.008972644805908203, 0.0106964111328125, 0.012420177459716797, 0.014143943786621094, 0.01586771011352539, 0.017591476440429688, 0.019315242767333984, 0.02103900909423828, 0.022762775421142578, 0.024486541748046875, 0.026210308074951172, 0.02793407440185547, 0.029657840728759766, 0.03138160705566406, 0.03310537338256836, 0.034829139709472656, 0.03655290603637695, 0.03827667236328125, 0.04000043869018555, 0.041724205017089844, 0.04344797134399414, 0.04517173767089844, 0.046895503997802734, 0.04861927032470703, 0.05034303665161133, 0.052066802978515625, 0.05379056930541992, 0.05551433563232422, 0.057238101959228516, 0.05896186828613281, 0.06068563461303711, 0.062409400939941406, 0.0641331672668457, 0.06585693359375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 8.0, 10.0, 8.0, 23.0, 23.0, 45.0, 85.0, 118.0, 146.0, 141.0, 140.0, 81.0, 56.0, 36.0, 15.0, 15.0, 10.0, 5.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5170416831970215, -2.4128308296203613, -2.308619737625122, -2.204408884048462, -2.1001977920532227, -1.9959869384765625, -1.8917760848999023, -1.7875651121139526, -1.683354139328003, -1.5791431665420532, -1.4749321937561035, -1.3707213401794434, -1.2665103673934937, -1.162299394607544, -1.0580885410308838, -0.9538775682449341, -0.8496665954589844, -0.7454556226730347, -0.6412447094917297, -0.5370337963104248, -0.4328228235244751, -0.3286118507385254, -0.22440093755722046, -0.12019002437591553, -0.01597905158996582, 0.0882318913936615, 0.19244283437728882, 0.29665377736091614, 0.40086472034454346, 0.5050756931304932, 0.6092866063117981, 0.713497519493103, 0.8177084922790527, 0.9219194650650024, 1.0261304378509521, 1.1303412914276123, 1.234552264213562, 1.3387632369995117, 1.4429740905761719, 1.5471850633621216, 1.6513960361480713, 1.755607008934021, 1.8598179817199707, 1.9640288352966309, 2.068239688873291, 2.1724507808685303, 2.2766616344451904, 2.3808727264404297, 2.48508358001709, 2.58929443359375, 2.6935055255889893, 2.7977163791656494, 2.9019274711608887, 3.006138324737549, 3.110349178314209, 3.214560031890869, 3.3187711238861084, 3.4229819774627686, 3.527193069458008, 3.631403923034668, 3.735614776611328, 3.8398258686065674, 3.9440367221832275, 4.048247814178467, 4.152458667755127]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 2.0, 5.0, 16.0, 13.0, 17.0, 30.0, 32.0, 37.0, 50.0, 58.0, 76.0, 91.0, 79.0, 79.0, 75.0, 77.0, 70.0, 51.0, 34.0, 26.0, 25.0, 10.0, 10.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6410934925079346, -2.565190076828003, -2.489286422729492, -2.4133830070495605, -2.337479591369629, -2.2615761756896973, -2.1856727600097656, -2.109769105911255, -2.0338656902313232, -1.9579622745513916, -1.8820587396621704, -1.8061552047729492, -1.7302517890930176, -1.654348373413086, -1.5784448385238647, -1.5025413036346436, -1.426637887954712, -1.3507344722747803, -1.274830937385559, -1.198927402496338, -1.1230239868164062, -1.0471205711364746, -0.9712170362472534, -0.895313560962677, -0.8194100856781006, -0.7435066103935242, -0.6676031351089478, -0.5916996598243713, -0.5157961845397949, -0.4398927092552185, -0.3639892339706421, -0.2880857586860657, -0.21218228340148926, -0.13627880811691284, -0.060375332832336426, 0.01552814245223999, 0.0914316177368164, 0.16733509302139282, 0.24323856830596924, 0.31914204359054565, 0.39504551887512207, 0.4709489941596985, 0.5468524694442749, 0.6227559447288513, 0.6986594200134277, 0.7745628952980042, 0.8504663705825806, 0.926369845867157, 1.0022733211517334, 1.078176736831665, 1.1540802717208862, 1.2299838066101074, 1.305887222290039, 1.3817906379699707, 1.457694172859192, 1.533597707748413, 1.6095011234283447, 1.6854045391082764, 1.7613080739974976, 1.8372116088867188, 1.9131150245666504, 1.989018440246582, 2.0649218559265137, 2.1408255100250244, 2.216728925704956]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 5.0, 23.0, 22.0, 20.0, 44.0, 85.0, 242.0, 1084.0, 6908.0, 95837.0, 876674.0, 61129.0, 5227.0, 805.0, 202.0, 75.0, 35.0, 30.0, 14.0, 13.0, 14.0, 11.0, 7.0, 5.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.6015625, -9.36407470703125, -9.1265869140625, -8.88909912109375, -8.651611328125, -8.41412353515625, -8.1766357421875, -7.93914794921875, -7.70166015625, -7.46417236328125, -7.2266845703125, -6.98919677734375, -6.751708984375, -6.51422119140625, -6.2767333984375, -6.03924560546875, -5.8017578125, -5.56427001953125, -5.3267822265625, -5.08929443359375, -4.851806640625, -4.61431884765625, -4.3768310546875, -4.13934326171875, -3.90185546875, -3.66436767578125, -3.4268798828125, -3.18939208984375, -2.951904296875, -2.71441650390625, -2.4769287109375, -2.23944091796875, -2.001953125, -1.76446533203125, -1.5269775390625, -1.28948974609375, -1.052001953125, -0.81451416015625, -0.5770263671875, -0.33953857421875, -0.10205078125, 0.13543701171875, 0.3729248046875, 0.61041259765625, 0.847900390625, 1.08538818359375, 1.3228759765625, 1.56036376953125, 1.7978515625, 2.03533935546875, 2.2728271484375, 2.51031494140625, 2.747802734375, 2.98529052734375, 3.2227783203125, 3.46026611328125, 3.69775390625, 3.93524169921875, 4.1727294921875, 4.41021728515625, 4.647705078125, 4.88519287109375, 5.1226806640625, 5.36016845703125, 5.59765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 11.0, 19.0, 37.0, 52.0, 117.0, 148.0, 176.0, 164.0, 133.0, 62.0, 37.0, 20.0, 11.0, 8.0, 3.0, 5.0, 2.0, 3.0], "bins": [-21.4375, -21.03033447265625, -20.6231689453125, -20.21600341796875, -19.808837890625, -19.40167236328125, -18.9945068359375, -18.58734130859375, -18.18017578125, -17.77301025390625, -17.3658447265625, -16.95867919921875, -16.551513671875, -16.14434814453125, -15.7371826171875, -15.33001708984375, -14.9228515625, -14.51568603515625, -14.1085205078125, -13.70135498046875, -13.294189453125, -12.88702392578125, -12.4798583984375, -12.07269287109375, -11.66552734375, -11.25836181640625, -10.8511962890625, -10.44403076171875, -10.036865234375, -9.62969970703125, -9.2225341796875, -8.81536865234375, -8.408203125, -8.00103759765625, -7.5938720703125, -7.18670654296875, -6.779541015625, -6.37237548828125, -5.9652099609375, -5.55804443359375, -5.15087890625, -4.74371337890625, -4.3365478515625, -3.92938232421875, -3.522216796875, -3.11505126953125, -2.7078857421875, -2.30072021484375, -1.8935546875, -1.48638916015625, -1.0792236328125, -0.67205810546875, -0.264892578125, 0.14227294921875, 0.5494384765625, 0.95660400390625, 1.36376953125, 1.77093505859375, 2.1781005859375, 2.58526611328125, 2.992431640625, 3.39959716796875, 3.8067626953125, 4.21392822265625, 4.62109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 7.0, 4.0, 7.0, 6.0, 16.0, 24.0, 26.0, 25.0, 45.0, 60.0, 61.0, 83.0, 97.0, 148.0, 272.0, 784.0, 3442.0, 33726.0, 846382.0, 152673.0, 8192.0, 1325.0, 407.0, 180.0, 120.0, 88.0, 76.0, 73.0, 45.0, 38.0, 28.0, 19.0, 20.0, 16.0, 10.0, 11.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.24609375, -6.04278564453125, -5.8394775390625, -5.63616943359375, -5.432861328125, -5.22955322265625, -5.0262451171875, -4.82293701171875, -4.61962890625, -4.41632080078125, -4.2130126953125, -4.00970458984375, -3.806396484375, -3.60308837890625, -3.3997802734375, -3.19647216796875, -2.9931640625, -2.78985595703125, -2.5865478515625, -2.38323974609375, -2.179931640625, -1.97662353515625, -1.7733154296875, -1.57000732421875, -1.36669921875, -1.16339111328125, -0.9600830078125, -0.75677490234375, -0.553466796875, -0.35015869140625, -0.1468505859375, 0.05645751953125, 0.259765625, 0.46307373046875, 0.6663818359375, 0.86968994140625, 1.072998046875, 1.27630615234375, 1.4796142578125, 1.68292236328125, 1.88623046875, 2.08953857421875, 2.2928466796875, 2.49615478515625, 2.699462890625, 2.90277099609375, 3.1060791015625, 3.30938720703125, 3.5126953125, 3.71600341796875, 3.9193115234375, 4.12261962890625, 4.325927734375, 4.52923583984375, 4.7325439453125, 4.93585205078125, 5.13916015625, 5.34246826171875, 5.5457763671875, 5.74908447265625, 5.952392578125, 6.15570068359375, 6.3590087890625, 6.56231689453125, 6.765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 11.0, 20.0, 12.0, 22.0, 20.0, 33.0, 34.0, 34.0, 38.0, 50.0, 52.0, 51.0, 43.0, 44.0, 48.0, 66.0, 43.0, 47.0, 42.0, 42.0, 40.0, 31.0, 28.0, 31.0, 27.0, 22.0, 18.0, 13.0, 9.0, 4.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-6.23828125, -6.07025146484375, -5.9022216796875, -5.73419189453125, -5.566162109375, -5.39813232421875, -5.2301025390625, -5.06207275390625, -4.89404296875, -4.72601318359375, -4.5579833984375, -4.38995361328125, -4.221923828125, -4.05389404296875, -3.8858642578125, -3.71783447265625, -3.5498046875, -3.38177490234375, -3.2137451171875, -3.04571533203125, -2.877685546875, -2.70965576171875, -2.5416259765625, -2.37359619140625, -2.20556640625, -2.03753662109375, -1.8695068359375, -1.70147705078125, -1.533447265625, -1.36541748046875, -1.1973876953125, -1.02935791015625, -0.861328125, -0.69329833984375, -0.5252685546875, -0.35723876953125, -0.189208984375, -0.02117919921875, 0.1468505859375, 0.31488037109375, 0.48291015625, 0.65093994140625, 0.8189697265625, 0.98699951171875, 1.155029296875, 1.32305908203125, 1.4910888671875, 1.65911865234375, 1.8271484375, 1.99517822265625, 2.1632080078125, 2.33123779296875, 2.499267578125, 2.66729736328125, 2.8353271484375, 3.00335693359375, 3.17138671875, 3.33941650390625, 3.5074462890625, 3.67547607421875, 3.843505859375, 4.01153564453125, 4.1795654296875, 4.34759521484375, 4.515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 11.0, 4.0, 17.0, 15.0, 21.0, 22.0, 54.0, 67.0, 109.0, 168.0, 292.0, 474.0, 847.0, 1555.0, 3119.0, 6629.0, 16204.0, 44914.0, 164306.0, 514087.0, 208017.0, 54344.0, 18476.0, 7454.0, 3398.0, 1681.0, 945.0, 519.0, 290.0, 181.0, 121.0, 67.0, 50.0, 28.0, 18.0, 16.0, 5.0, 9.0, 3.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5119857788085938, -0.4927215576171875, -0.47345733642578125, -0.454193115234375, -0.43492889404296875, -0.4156646728515625, -0.39640045166015625, -0.37713623046875, -0.35787200927734375, -0.3386077880859375, -0.31934356689453125, -0.300079345703125, -0.28081512451171875, -0.2615509033203125, -0.24228668212890625, -0.2230224609375, -0.20375823974609375, -0.1844940185546875, -0.16522979736328125, -0.145965576171875, -0.12670135498046875, -0.1074371337890625, -0.08817291259765625, -0.06890869140625, -0.04964447021484375, -0.0303802490234375, -0.01111602783203125, 0.008148193359375, 0.02741241455078125, 0.0466766357421875, 0.06594085693359375, 0.085205078125, 0.10446929931640625, 0.1237335205078125, 0.14299774169921875, 0.162261962890625, 0.18152618408203125, 0.2007904052734375, 0.22005462646484375, 0.23931884765625, 0.25858306884765625, 0.2778472900390625, 0.29711151123046875, 0.316375732421875, 0.33563995361328125, 0.3549041748046875, 0.37416839599609375, 0.3934326171875, 0.41269683837890625, 0.4319610595703125, 0.45122528076171875, 0.470489501953125, 0.48975372314453125, 0.5090179443359375, 0.5282821655273438, 0.54754638671875, 0.5668106079101562, 0.5860748291015625, 0.6053390502929688, 0.624603271484375, 0.6438674926757812, 0.6631317138671875, 0.6823959350585938, 0.70166015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 6.0, 4.0, 17.0, 13.0, 10.0, 19.0, 30.0, 36.0, 45.0, 73.0, 85.0, 77.0, 88.0, 97.0, 94.0, 58.0, 60.0, 47.0, 31.0, 20.0, 15.0, 13.0, 15.0, 12.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012350082397460938, -0.00011936761438846588, -0.00011523440480232239, -0.0001111011952161789, -0.0001069679856300354, -0.0001028347760438919, -9.870156645774841e-05, -9.456835687160492e-05, -9.043514728546143e-05, -8.630193769931793e-05, -8.216872811317444e-05, -7.803551852703094e-05, -7.390230894088745e-05, -6.976909935474396e-05, -6.563588976860046e-05, -6.150268018245697e-05, -5.7369470596313477e-05, -5.323626101016998e-05, -4.910305142402649e-05, -4.4969841837882996e-05, -4.08366322517395e-05, -3.670342266559601e-05, -3.2570213079452515e-05, -2.843700349330902e-05, -2.4303793907165527e-05, -2.0170584321022034e-05, -1.603737473487854e-05, -1.1904165148735046e-05, -7.770955562591553e-06, -3.637745976448059e-06, 4.954636096954346e-07, 4.628673195838928e-06, 8.761882781982422e-06, 1.2895092368125916e-05, 1.702830195426941e-05, 2.1161511540412903e-05, 2.5294721126556396e-05, 2.942793071269989e-05, 3.3561140298843384e-05, 3.769434988498688e-05, 4.182755947113037e-05, 4.5960769057273865e-05, 5.009397864341736e-05, 5.422718822956085e-05, 5.8360397815704346e-05, 6.249360740184784e-05, 6.662681698799133e-05, 7.076002657413483e-05, 7.489323616027832e-05, 7.902644574642181e-05, 8.315965533256531e-05, 8.72928649187088e-05, 9.14260745048523e-05, 9.555928409099579e-05, 9.969249367713928e-05, 0.00010382570326328278, 0.00010795891284942627, 0.00011209212243556976, 0.00011622533202171326, 0.00012035854160785675, 0.00012449175119400024, 0.00012862496078014374, 0.00013275817036628723, 0.00013689137995243073, 0.00014102458953857422]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 8.0, 8.0, 11.0, 17.0, 20.0, 28.0, 47.0, 86.0, 123.0, 182.0, 339.0, 562.0, 1142.0, 2651.0, 6641.0, 21524.0, 98873.0, 596953.0, 257356.0, 43035.0, 11348.0, 3923.0, 1696.0, 779.0, 447.0, 266.0, 155.0, 89.0, 71.0, 50.0, 38.0, 21.0, 14.0, 6.0, 8.0, 2.0, 7.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.93017578125, -0.9017715454101562, -0.8733673095703125, -0.8449630737304688, -0.816558837890625, -0.7881546020507812, -0.7597503662109375, -0.7313461303710938, -0.70294189453125, -0.6745376586914062, -0.6461334228515625, -0.6177291870117188, -0.589324951171875, -0.5609207153320312, -0.5325164794921875, -0.5041122436523438, -0.4757080078125, -0.44730377197265625, -0.4188995361328125, -0.39049530029296875, -0.362091064453125, -0.33368682861328125, -0.3052825927734375, -0.27687835693359375, -0.24847412109375, -0.22006988525390625, -0.1916656494140625, -0.16326141357421875, -0.134857177734375, -0.10645294189453125, -0.0780487060546875, -0.04964447021484375, -0.021240234375, 0.00716400146484375, 0.0355682373046875, 0.06397247314453125, 0.092376708984375, 0.12078094482421875, 0.1491851806640625, 0.17758941650390625, 0.20599365234375, 0.23439788818359375, 0.2628021240234375, 0.29120635986328125, 0.319610595703125, 0.34801483154296875, 0.3764190673828125, 0.40482330322265625, 0.4332275390625, 0.46163177490234375, 0.4900360107421875, 0.5184402465820312, 0.546844482421875, 0.5752487182617188, 0.6036529541015625, 0.6320571899414062, 0.66046142578125, 0.6888656616210938, 0.7172698974609375, 0.7456741333007812, 0.774078369140625, 0.8024826049804688, 0.8308868408203125, 0.8592910766601562, 0.8876953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 11.0, 13.0, 4.0, 6.0, 9.0, 10.0, 23.0, 18.0, 35.0, 39.0, 57.0, 67.0, 77.0, 104.0, 112.0, 69.0, 62.0, 67.0, 59.0, 33.0, 31.0, 19.0, 14.0, 16.0, 14.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.3756523132324219, -0.36238861083984375, -0.3491249084472656, -0.3358612060546875, -0.3225975036621094, -0.30933380126953125, -0.2960700988769531, -0.282806396484375, -0.2695426940917969, -0.25627899169921875, -0.24301528930664062, -0.2297515869140625, -0.21648788452148438, -0.20322418212890625, -0.18996047973632812, -0.17669677734375, -0.16343307495117188, -0.15016937255859375, -0.13690567016601562, -0.1236419677734375, -0.11037826538085938, -0.09711456298828125, -0.08385086059570312, -0.070587158203125, -0.057323455810546875, -0.04405975341796875, -0.030796051025390625, -0.0175323486328125, -0.004268646240234375, 0.00899505615234375, 0.022258758544921875, 0.0355224609375, 0.048786163330078125, 0.06204986572265625, 0.07531356811523438, 0.0885772705078125, 0.10184097290039062, 0.11510467529296875, 0.12836837768554688, 0.141632080078125, 0.15489578247070312, 0.16815948486328125, 0.18142318725585938, 0.1946868896484375, 0.20795059204101562, 0.22121429443359375, 0.23447799682617188, 0.24774169921875, 0.2610054016113281, 0.27426910400390625, 0.2875328063964844, 0.3007965087890625, 0.3140602111816406, 0.32732391357421875, 0.3405876159667969, 0.353851318359375, 0.3671150207519531, 0.38037872314453125, 0.3936424255371094, 0.4069061279296875, 0.4201698303222656, 0.43343353271484375, 0.4466972351074219, 0.4599609375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 23.0, 106.0, 559.0, 262.0, 41.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.55836868286133, -31.56367301940918, -30.56897735595703, -29.574281692504883, -28.579586029052734, -27.584890365600586, -26.590194702148438, -25.595497131347656, -24.60080337524414, -23.606107711791992, -22.611412048339844, -21.616716384887695, -20.622020721435547, -19.6273250579834, -18.63262939453125, -17.63793182373047, -16.64323616027832, -15.648540496826172, -14.653844833374023, -13.659149169921875, -12.664453506469727, -11.669757843017578, -10.675061225891113, -9.680365562438965, -8.685669898986816, -7.690974235534668, -6.6962785720825195, -5.701582431793213, -4.7068867683410645, -3.712191104888916, -2.7174949645996094, -1.722799301147461, -0.7281036376953125, 0.2665921449661255, 1.2612879276275635, 2.255983829498291, 3.2506794929504395, 4.245375156402588, 5.2400712966918945, 6.234766960144043, 7.229462623596191, 8.22415828704834, 9.218853950500488, 10.213550567626953, 11.208246231079102, 12.20294189453125, 13.197637557983398, 14.192333221435547, 15.187028884887695, 16.181724548339844, 17.176420211791992, 18.17111587524414, 19.16581153869629, 20.160507202148438, 21.15520477294922, 22.149898529052734, 23.144596099853516, 24.139291763305664, 25.133987426757812, 26.12868309020996, 27.12337875366211, 28.118074417114258, 29.112770080566406, 30.107467651367188, 31.102161407470703]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 14.0, 17.0, 20.0, 19.0, 28.0, 30.0, 52.0, 45.0, 59.0, 67.0, 63.0, 76.0, 62.0, 78.0, 66.0, 53.0, 53.0, 40.0, 35.0, 31.0, 22.0, 23.0, 15.0, 11.0, 5.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.181644439697266, -16.769371032714844, -16.357097625732422, -15.944825172424316, -15.532552719116211, -15.120279312133789, -14.708006858825684, -14.295733451843262, -13.883460998535156, -13.471187591552734, -13.058915138244629, -12.646641731262207, -12.234369277954102, -11.82209587097168, -11.409823417663574, -10.997550010681152, -10.585277557373047, -10.173004150390625, -9.76073169708252, -9.348458290100098, -8.936185836791992, -8.52391242980957, -8.111639976501465, -7.699366569519043, -7.287093162536621, -6.874820232391357, -6.462547302246094, -6.05027437210083, -5.638001441955566, -5.2257280349731445, -4.813455581665039, -4.401182174682617, -3.9889097213745117, -3.576636791229248, -3.1643638610839844, -2.7520909309387207, -2.339818000793457, -1.9275448322296143, -1.5152719020843506, -1.102998971939087, -0.6907260417938232, -0.2784530818462372, 0.13381987810134888, 0.5460928678512573, 0.958365797996521, 1.3706388473510742, 1.782911777496338, 2.1951847076416016, 2.6074576377868652, 3.019730567932129, 3.4320034980773926, 3.8442764282226562, 4.25654935836792, 4.668822288513184, 5.0810956954956055, 5.493368148803711, 5.905641555786133, 6.3179144859313965, 6.73018741607666, 7.142460346221924, 7.5547332763671875, 7.967006683349609, 8.379279136657715, 8.791552543640137, 9.203824996948242]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 6.0, 8.0, 9.0, 8.0, 10.0, 20.0, 15.0, 27.0, 24.0, 35.0, 64.0, 70.0, 77.0, 147.0, 175.0, 380.0, 958.0, 2851.0, 12565.0, 137615.0, 3896699.0, 125356.0, 12266.0, 2786.0, 960.0, 430.0, 236.0, 119.0, 112.0, 51.0, 43.0, 28.0, 22.0, 28.0, 18.0, 14.0, 18.0, 7.0, 9.0, 5.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6875, -5.512451171875, -5.33740234375, -5.162353515625, -4.9873046875, -4.812255859375, -4.63720703125, -4.462158203125, -4.287109375, -4.112060546875, -3.93701171875, -3.761962890625, -3.5869140625, -3.411865234375, -3.23681640625, -3.061767578125, -2.88671875, -2.711669921875, -2.53662109375, -2.361572265625, -2.1865234375, -2.011474609375, -1.83642578125, -1.661376953125, -1.486328125, -1.311279296875, -1.13623046875, -0.961181640625, -0.7861328125, -0.611083984375, -0.43603515625, -0.260986328125, -0.0859375, 0.089111328125, 0.26416015625, 0.439208984375, 0.6142578125, 0.789306640625, 0.96435546875, 1.139404296875, 1.314453125, 1.489501953125, 1.66455078125, 1.839599609375, 2.0146484375, 2.189697265625, 2.36474609375, 2.539794921875, 2.71484375, 2.889892578125, 3.06494140625, 3.239990234375, 3.4150390625, 3.590087890625, 3.76513671875, 3.940185546875, 4.115234375, 4.290283203125, 4.46533203125, 4.640380859375, 4.8154296875, 4.990478515625, 5.16552734375, 5.340576171875, 5.515625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 4.0, 9.0, 7.0, 15.0, 22.0, 27.0, 22.0, 39.0, 41.0, 48.0, 70.0, 68.0, 71.0, 63.0, 74.0, 62.0, 66.0, 48.0, 44.0, 30.0, 31.0, 31.0, 15.0, 18.0, 13.0, 14.0, 6.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.62890625, -2.548675537109375, -2.46844482421875, -2.388214111328125, -2.3079833984375, -2.227752685546875, -2.14752197265625, -2.067291259765625, -1.987060546875, -1.906829833984375, -1.82659912109375, -1.746368408203125, -1.6661376953125, -1.585906982421875, -1.50567626953125, -1.425445556640625, -1.34521484375, -1.264984130859375, -1.18475341796875, -1.104522705078125, -1.0242919921875, -0.944061279296875, -0.86383056640625, -0.783599853515625, -0.703369140625, -0.623138427734375, -0.54290771484375, -0.462677001953125, -0.3824462890625, -0.302215576171875, -0.22198486328125, -0.141754150390625, -0.0615234375, 0.018707275390625, 0.09893798828125, 0.179168701171875, 0.2593994140625, 0.339630126953125, 0.41986083984375, 0.500091552734375, 0.580322265625, 0.660552978515625, 0.74078369140625, 0.821014404296875, 0.9012451171875, 0.981475830078125, 1.06170654296875, 1.141937255859375, 1.22216796875, 1.302398681640625, 1.38262939453125, 1.462860107421875, 1.5430908203125, 1.623321533203125, 1.70355224609375, 1.783782958984375, 1.864013671875, 1.944244384765625, 2.02447509765625, 2.104705810546875, 2.1849365234375, 2.265167236328125, 2.34539794921875, 2.425628662109375, 2.505859375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 5.0, 13.0, 10.0, 34.0, 23.0, 41.0, 76.0, 135.0, 248.0, 795.0, 4284.0, 99885.0, 4060329.0, 25237.0, 2206.0, 484.0, 179.0, 91.0, 59.0, 24.0, 22.0, 16.0, 21.0, 8.0, 4.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.29833984375, -9.0107421875, -8.72314453125, -8.435546875, -8.14794921875, -7.8603515625, -7.57275390625, -7.28515625, -6.99755859375, -6.7099609375, -6.42236328125, -6.134765625, -5.84716796875, -5.5595703125, -5.27197265625, -4.984375, -4.69677734375, -4.4091796875, -4.12158203125, -3.833984375, -3.54638671875, -3.2587890625, -2.97119140625, -2.68359375, -2.39599609375, -2.1083984375, -1.82080078125, -1.533203125, -1.24560546875, -0.9580078125, -0.67041015625, -0.3828125, -0.09521484375, 0.1923828125, 0.47998046875, 0.767578125, 1.05517578125, 1.3427734375, 1.63037109375, 1.91796875, 2.20556640625, 2.4931640625, 2.78076171875, 3.068359375, 3.35595703125, 3.6435546875, 3.93115234375, 4.21875, 4.50634765625, 4.7939453125, 5.08154296875, 5.369140625, 5.65673828125, 5.9443359375, 6.23193359375, 6.51953125, 6.80712890625, 7.0947265625, 7.38232421875, 7.669921875, 7.95751953125, 8.2451171875, 8.53271484375, 8.8203125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 12.0, 11.0, 34.0, 16.0, 55.0, 87.0, 136.0, 239.0, 584.0, 1632.0, 598.0, 262.0, 134.0, 76.0, 55.0, 29.0, 25.0, 23.0, 12.0, 10.0, 6.0, 3.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.9434814453125, -0.910400390625, -0.8773193359375, -0.84423828125, -0.8111572265625, -0.778076171875, -0.7449951171875, -0.7119140625, -0.6788330078125, -0.645751953125, -0.6126708984375, -0.57958984375, -0.5465087890625, -0.513427734375, -0.4803466796875, -0.447265625, -0.4141845703125, -0.381103515625, -0.3480224609375, -0.31494140625, -0.2818603515625, -0.248779296875, -0.2156982421875, -0.1826171875, -0.1495361328125, -0.116455078125, -0.0833740234375, -0.05029296875, -0.0172119140625, 0.015869140625, 0.0489501953125, 0.08203125, 0.1151123046875, 0.148193359375, 0.1812744140625, 0.21435546875, 0.2474365234375, 0.280517578125, 0.3135986328125, 0.3466796875, 0.3797607421875, 0.412841796875, 0.4459228515625, 0.47900390625, 0.5120849609375, 0.545166015625, 0.5782470703125, 0.611328125, 0.6444091796875, 0.677490234375, 0.7105712890625, 0.74365234375, 0.7767333984375, 0.809814453125, 0.8428955078125, 0.8759765625, 0.9090576171875, 0.942138671875, 0.9752197265625, 1.00830078125, 1.0413818359375, 1.074462890625, 1.1075439453125, 1.140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 10.0, 2.0, 6.0, 2.0, 7.0, 3.0, 10.0, 9.0, 9.0, 16.0, 21.0, 21.0, 33.0, 57.0, 78.0, 77.0, 107.0, 104.0, 99.0, 73.0, 60.0, 43.0, 24.0, 32.0, 30.0, 15.0, 12.0, 8.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.676827907562256, -2.5784897804260254, -2.480151653289795, -2.3818135261535645, -2.283475160598755, -2.1851370334625244, -2.086798906326294, -1.9884607791900635, -1.8901225328445435, -1.791784405708313, -1.693446159362793, -1.5951080322265625, -1.496769905090332, -1.398431658744812, -1.3000935316085815, -1.2017552852630615, -1.103417158126831, -1.0050790309906006, -0.9067407846450806, -0.8084026575088501, -0.7100644707679749, -0.6117262840270996, -0.5133881568908691, -0.4150499701499939, -0.31671178340911865, -0.2183736115694046, -0.12003543972969055, -0.021697282791137695, 0.07664090394973755, 0.1749790906906128, 0.27331721782684326, 0.3716554045677185, 0.46999359130859375, 0.568331778049469, 0.6666699647903442, 0.7650080919265747, 0.86334627866745, 0.9616844654083252, 1.0600225925445557, 1.1583607196807861, 1.2566989660263062, 1.3550370931625366, 1.4533753395080566, 1.551713466644287, 1.6500515937805176, 1.7483898401260376, 1.846727967262268, 1.945066213607788, 2.0434043407440186, 2.141742467880249, 2.2400805950164795, 2.338418960571289, 2.4367570877075195, 2.53509521484375, 2.6334333419799805, 2.731771469116211, 2.8301095962524414, 2.928447723388672, 3.0267858505249023, 3.125123977661133, 3.2234623432159424, 3.321800470352173, 3.4201385974884033, 3.518476724624634, 3.6168150901794434]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 5.0, 13.0, 9.0, 15.0, 15.0, 29.0, 25.0, 37.0, 39.0, 51.0, 60.0, 51.0, 60.0, 61.0, 52.0, 55.0, 49.0, 51.0, 46.0, 43.0, 28.0, 32.0, 26.0, 25.0, 27.0, 15.0, 14.0, 12.0, 10.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.384866952896118, -2.3088696002960205, -2.232872486114502, -2.1568751335144043, -2.0808777809143066, -2.004880666732788, -1.9288833141326904, -1.8528860807418823, -1.7768888473510742, -1.7008916139602661, -1.624894380569458, -1.5488970279693604, -1.4728997945785522, -1.3969025611877441, -1.3209052085876465, -1.2449079751968384, -1.1689107418060303, -1.0929135084152222, -1.016916275024414, -0.9409189224243164, -0.8649216890335083, -0.7889244556427002, -0.7129271626472473, -0.6369298696517944, -0.5609326362609863, -0.48493537306785583, -0.40893810987472534, -0.33294084668159485, -0.25694358348846436, -0.18094632029533386, -0.10494905710220337, -0.02895176410675049, 0.047045230865478516, 0.12304249405860901, 0.1990397572517395, 0.27503702044487, 0.3510342836380005, 0.427031546831131, 0.5030288100242615, 0.5790261030197144, 0.6550233364105225, 0.7310205698013306, 0.8070178627967834, 0.8830151557922363, 0.9590123891830444, 1.0350096225738525, 1.1110069751739502, 1.1870042085647583, 1.2630014419555664, 1.3389986753463745, 1.4149959087371826, 1.4909932613372803, 1.5669904947280884, 1.6429877281188965, 1.7189850807189941, 1.7949823141098022, 1.8709795475006104, 1.9469767808914185, 2.0229740142822266, 2.098971366882324, 2.174968719482422, 2.2509658336639404, 2.326963186264038, 2.4029603004455566, 2.4789576530456543]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 7.0, 14.0, 7.0, 30.0, 53.0, 68.0, 86.0, 125.0, 265.0, 421.0, 779.0, 1354.0, 2672.0, 5580.0, 12198.0, 29630.0, 80675.0, 221649.0, 368276.0, 202828.0, 72691.0, 27167.0, 11463.0, 5150.0, 2448.0, 1237.0, 660.0, 395.0, 235.0, 124.0, 88.0, 54.0, 43.0, 26.0, 9.0, 12.0, 7.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2457275390625, -0.23815536499023438, -0.23058319091796875, -0.22301101684570312, -0.2154388427734375, -0.20786666870117188, -0.20029449462890625, -0.19272232055664062, -0.185150146484375, -0.17757797241210938, -0.17000579833984375, -0.16243362426757812, -0.1548614501953125, -0.14728927612304688, -0.13971710205078125, -0.13214492797851562, -0.12457275390625, -0.11700057983398438, -0.10942840576171875, -0.10185623168945312, -0.0942840576171875, -0.08671188354492188, -0.07913970947265625, -0.07156753540039062, -0.063995361328125, -0.056423187255859375, -0.04885101318359375, -0.041278839111328125, -0.0337066650390625, -0.026134490966796875, -0.01856231689453125, -0.010990142822265625, -0.00341796875, 0.004154205322265625, 0.01172637939453125, 0.019298553466796875, 0.0268707275390625, 0.034442901611328125, 0.04201507568359375, 0.049587249755859375, 0.057159423828125, 0.06473159790039062, 0.07230377197265625, 0.07987594604492188, 0.0874481201171875, 0.09502029418945312, 0.10259246826171875, 0.11016464233398438, 0.11773681640625, 0.12530899047851562, 0.13288116455078125, 0.14045333862304688, 0.1480255126953125, 0.15559768676757812, 0.16316986083984375, 0.17074203491210938, 0.178314208984375, 0.18588638305664062, 0.19345855712890625, 0.20103073120117188, 0.2086029052734375, 0.21617507934570312, 0.22374725341796875, 0.23131942749023438, 0.2388916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 17.0, 11.0, 17.0, 37.0, 53.0, 52.0, 64.0, 74.0, 101.0, 88.0, 82.0, 65.0, 70.0, 46.0, 43.0, 40.0, 22.0, 20.0, 27.0, 12.0, 10.0, 9.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.90234375, -2.82733154296875, -2.7523193359375, -2.67730712890625, -2.602294921875, -2.52728271484375, -2.4522705078125, -2.37725830078125, -2.30224609375, -2.22723388671875, -2.1522216796875, -2.07720947265625, -2.002197265625, -1.92718505859375, -1.8521728515625, -1.77716064453125, -1.7021484375, -1.62713623046875, -1.5521240234375, -1.47711181640625, -1.402099609375, -1.32708740234375, -1.2520751953125, -1.17706298828125, -1.10205078125, -1.02703857421875, -0.9520263671875, -0.87701416015625, -0.802001953125, -0.72698974609375, -0.6519775390625, -0.57696533203125, -0.501953125, -0.42694091796875, -0.3519287109375, -0.27691650390625, -0.201904296875, -0.12689208984375, -0.0518798828125, 0.02313232421875, 0.09814453125, 0.17315673828125, 0.2481689453125, 0.32318115234375, 0.398193359375, 0.47320556640625, 0.5482177734375, 0.62322998046875, 0.6982421875, 0.77325439453125, 0.8482666015625, 0.92327880859375, 0.998291015625, 1.07330322265625, 1.1483154296875, 1.22332763671875, 1.29833984375, 1.37335205078125, 1.4483642578125, 1.52337646484375, 1.598388671875, 1.67340087890625, 1.7484130859375, 1.82342529296875, 1.8984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 6.0, 7.0, 8.0, 1.0, 21.0, 17.0, 27.0, 46.0, 45.0, 88.0, 105.0, 120.0, 197.0, 358.0, 535.0, 875.0, 1592.0, 3433.0, 8473.0, 24553.0, 79099.0, 239742.0, 388488.0, 203819.0, 63299.0, 19939.0, 7246.0, 2949.0, 1384.0, 746.0, 418.0, 265.0, 187.0, 126.0, 94.0, 64.0, 54.0, 36.0, 31.0, 19.0, 10.0, 9.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2359619140625, -0.2276592254638672, -0.21935653686523438, -0.21105384826660156, -0.20275115966796875, -0.19444847106933594, -0.18614578247070312, -0.1778430938720703, -0.1695404052734375, -0.1612377166748047, -0.15293502807617188, -0.14463233947753906, -0.13632965087890625, -0.12802696228027344, -0.11972427368164062, -0.11142158508300781, -0.103118896484375, -0.09481620788574219, -0.08651351928710938, -0.07821083068847656, -0.06990814208984375, -0.06160545349121094, -0.053302764892578125, -0.04500007629394531, -0.0366973876953125, -0.028394699096679688, -0.020092010498046875, -0.011789321899414062, -0.00348663330078125, 0.0048160552978515625, 0.013118743896484375, 0.021421432495117188, 0.02972412109375, 0.03802680969238281, 0.046329498291015625, 0.05463218688964844, 0.06293487548828125, 0.07123756408691406, 0.07954025268554688, 0.08784294128417969, 0.0961456298828125, 0.10444831848144531, 0.11275100708007812, 0.12105369567871094, 0.12935638427734375, 0.13765907287597656, 0.14596176147460938, 0.1542644500732422, 0.162567138671875, 0.1708698272705078, 0.17917251586914062, 0.18747520446777344, 0.19577789306640625, 0.20408058166503906, 0.21238327026367188, 0.2206859588623047, 0.2289886474609375, 0.2372913360595703, 0.24559402465820312, 0.25389671325683594, 0.26219940185546875, 0.27050209045410156, 0.2788047790527344, 0.2871074676513672, 0.29541015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 13.0, 8.0, 7.0, 14.0, 27.0, 16.0, 22.0, 21.0, 36.0, 45.0, 39.0, 44.0, 48.0, 44.0, 51.0, 53.0, 52.0, 50.0, 52.0, 51.0, 35.0, 55.0, 38.0, 39.0, 30.0, 27.0, 8.0, 13.0, 17.0, 7.0, 5.0, 6.0, 6.0, 1.0, 4.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.794921875, -3.69329833984375, -3.5916748046875, -3.49005126953125, -3.388427734375, -3.28680419921875, -3.1851806640625, -3.08355712890625, -2.98193359375, -2.88031005859375, -2.7786865234375, -2.67706298828125, -2.575439453125, -2.47381591796875, -2.3721923828125, -2.27056884765625, -2.1689453125, -2.06732177734375, -1.9656982421875, -1.86407470703125, -1.762451171875, -1.66082763671875, -1.5592041015625, -1.45758056640625, -1.35595703125, -1.25433349609375, -1.1527099609375, -1.05108642578125, -0.949462890625, -0.84783935546875, -0.7462158203125, -0.64459228515625, -0.54296875, -0.44134521484375, -0.3397216796875, -0.23809814453125, -0.136474609375, -0.03485107421875, 0.0667724609375, 0.16839599609375, 0.27001953125, 0.37164306640625, 0.4732666015625, 0.57489013671875, 0.676513671875, 0.77813720703125, 0.8797607421875, 0.98138427734375, 1.0830078125, 1.18463134765625, 1.2862548828125, 1.38787841796875, 1.489501953125, 1.59112548828125, 1.6927490234375, 1.79437255859375, 1.89599609375, 1.99761962890625, 2.0992431640625, 2.20086669921875, 2.302490234375, 2.40411376953125, 2.5057373046875, 2.60736083984375, 2.708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 5.0, 16.0, 19.0, 26.0, 39.0, 60.0, 66.0, 103.0, 186.0, 321.0, 494.0, 958.0, 2044.0, 5114.0, 16498.0, 74225.0, 383241.0, 445559.0, 89533.0, 19422.0, 5887.0, 2233.0, 1075.0, 505.0, 309.0, 205.0, 110.0, 89.0, 49.0, 32.0, 30.0, 24.0, 20.0, 7.0, 7.0, 2.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.123046875, -0.11881256103515625, -0.1145782470703125, -0.11034393310546875, -0.106109619140625, -0.10187530517578125, -0.0976409912109375, -0.09340667724609375, -0.08917236328125, -0.08493804931640625, -0.0807037353515625, -0.07646942138671875, -0.072235107421875, -0.06800079345703125, -0.0637664794921875, -0.05953216552734375, -0.0552978515625, -0.05106353759765625, -0.0468292236328125, -0.04259490966796875, -0.038360595703125, -0.03412628173828125, -0.0298919677734375, -0.02565765380859375, -0.02142333984375, -0.01718902587890625, -0.0129547119140625, -0.00872039794921875, -0.004486083984375, -0.00025177001953125, 0.0039825439453125, 0.00821685791015625, 0.012451171875, 0.01668548583984375, 0.0209197998046875, 0.02515411376953125, 0.029388427734375, 0.03362274169921875, 0.0378570556640625, 0.04209136962890625, 0.04632568359375, 0.05055999755859375, 0.0547943115234375, 0.05902862548828125, 0.063262939453125, 0.06749725341796875, 0.0717315673828125, 0.07596588134765625, 0.0802001953125, 0.08443450927734375, 0.0886688232421875, 0.09290313720703125, 0.097137451171875, 0.10137176513671875, 0.1056060791015625, 0.10984039306640625, 0.11407470703125, 0.11830902099609375, 0.1225433349609375, 0.12677764892578125, 0.131011962890625, 0.13524627685546875, 0.1394805908203125, 0.14371490478515625, 0.14794921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 6.0, 6.0, 11.0, 15.0, 14.0, 34.0, 47.0, 54.0, 81.0, 85.0, 108.0, 115.0, 100.0, 86.0, 64.0, 45.0, 32.0, 27.0, 20.0, 17.0, 15.0, 2.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001232624053955078, -0.00012029241770505905, -0.00011732243001461029, -0.00011435244232416153, -0.00011138245463371277, -0.00010841246694326401, -0.00010544247925281525, -0.00010247249156236649, -9.950250387191772e-05, -9.653251618146896e-05, -9.35625284910202e-05, -9.059254080057144e-05, -8.762255311012268e-05, -8.465256541967392e-05, -8.168257772922516e-05, -7.87125900387764e-05, -7.574260234832764e-05, -7.277261465787888e-05, -6.980262696743011e-05, -6.683263927698135e-05, -6.386265158653259e-05, -6.089266389608383e-05, -5.792267620563507e-05, -5.495268851518631e-05, -5.198270082473755e-05, -4.901271313428879e-05, -4.604272544384003e-05, -4.3072737753391266e-05, -4.0102750062942505e-05, -3.7132762372493744e-05, -3.416277468204498e-05, -3.119278699159622e-05, -2.822279930114746e-05, -2.52528116106987e-05, -2.228282392024994e-05, -1.9312836229801178e-05, -1.6342848539352417e-05, -1.3372860848903656e-05, -1.0402873158454895e-05, -7.432885468006134e-06, -4.462897777557373e-06, -1.492910087108612e-06, 1.477077603340149e-06, 4.44706529378891e-06, 7.417052984237671e-06, 1.0387040674686432e-05, 1.3357028365135193e-05, 1.6327016055583954e-05, 1.9297003746032715e-05, 2.2266991436481476e-05, 2.5236979126930237e-05, 2.8206966817378998e-05, 3.117695450782776e-05, 3.414694219827652e-05, 3.711692988872528e-05, 4.008691757917404e-05, 4.30569052696228e-05, 4.6026892960071564e-05, 4.8996880650520325e-05, 5.1966868340969086e-05, 5.493685603141785e-05, 5.790684372186661e-05, 6.087683141231537e-05, 6.384681910276413e-05, 6.681680679321289e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 9.0, 19.0, 28.0, 37.0, 55.0, 97.0, 249.0, 640.0, 2083.0, 9092.0, 71176.0, 704578.0, 234217.0, 20740.0, 3763.0, 1044.0, 341.0, 153.0, 93.0, 36.0, 34.0, 20.0, 17.0, 4.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1907958984375, -0.18437767028808594, -0.17795944213867188, -0.1715412139892578, -0.16512298583984375, -0.1587047576904297, -0.15228652954101562, -0.14586830139160156, -0.1394500732421875, -0.13303184509277344, -0.12661361694335938, -0.12019538879394531, -0.11377716064453125, -0.10735893249511719, -0.10094070434570312, -0.09452247619628906, -0.088104248046875, -0.08168601989746094, -0.07526779174804688, -0.06884956359863281, -0.06243133544921875, -0.05601310729980469, -0.049594879150390625, -0.04317665100097656, -0.0367584228515625, -0.030340194702148438, -0.023921966552734375, -0.017503738403320312, -0.01108551025390625, -0.0046672821044921875, 0.001750946044921875, 0.008169174194335938, 0.01458740234375, 0.021005630493164062, 0.027423858642578125, 0.03384208679199219, 0.04026031494140625, 0.04667854309082031, 0.053096771240234375, 0.05951499938964844, 0.0659332275390625, 0.07235145568847656, 0.07876968383789062, 0.08518791198730469, 0.09160614013671875, 0.09802436828613281, 0.10444259643554688, 0.11086082458496094, 0.117279052734375, 0.12369728088378906, 0.13011550903320312, 0.1365337371826172, 0.14295196533203125, 0.1493701934814453, 0.15578842163085938, 0.16220664978027344, 0.1686248779296875, 0.17504310607910156, 0.18146133422851562, 0.1878795623779297, 0.19429779052734375, 0.2007160186767578, 0.20713424682617188, 0.21355247497558594, 0.219970703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 6.0, 11.0, 12.0, 17.0, 22.0, 28.0, 44.0, 50.0, 50.0, 64.0, 89.0, 99.0, 82.0, 74.0, 70.0, 62.0, 35.0, 43.0, 30.0, 28.0, 15.0, 14.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0281829833984375, -0.02735733985900879, -0.026531696319580078, -0.025706052780151367, -0.024880409240722656, -0.024054765701293945, -0.023229122161865234, -0.022403478622436523, -0.021577835083007812, -0.0207521915435791, -0.01992654800415039, -0.01910090446472168, -0.01827526092529297, -0.017449617385864258, -0.016623973846435547, -0.015798330307006836, -0.014972686767578125, -0.014147043228149414, -0.013321399688720703, -0.012495756149291992, -0.011670112609863281, -0.01084446907043457, -0.01001882553100586, -0.009193181991577148, -0.008367538452148438, -0.0075418949127197266, -0.006716251373291016, -0.005890607833862305, -0.005064964294433594, -0.004239320755004883, -0.003413677215576172, -0.002588033676147461, -0.00176239013671875, -0.0009367465972900391, -0.00011110305786132812, 0.0007145404815673828, 0.0015401840209960938, 0.0023658275604248047, 0.0031914710998535156, 0.0040171146392822266, 0.0048427581787109375, 0.0056684017181396484, 0.006494045257568359, 0.00731968879699707, 0.008145332336425781, 0.008970975875854492, 0.009796619415283203, 0.010622262954711914, 0.011447906494140625, 0.012273550033569336, 0.013099193572998047, 0.013924837112426758, 0.014750480651855469, 0.01557612419128418, 0.01640176773071289, 0.0172274112701416, 0.018053054809570312, 0.018878698348999023, 0.019704341888427734, 0.020529985427856445, 0.021355628967285156, 0.022181272506713867, 0.023006916046142578, 0.02383255958557129, 0.024658203125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 3.0, 13.0, 8.0, 11.0, 10.0, 24.0, 31.0, 44.0, 89.0, 133.0, 150.0, 155.0, 101.0, 62.0, 53.0, 28.0, 25.0, 10.0, 12.0, 1.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9297759532928467, -1.8323655128479004, -1.734955072402954, -1.6375447511672974, -1.540134310722351, -1.4427238702774048, -1.345313549041748, -1.2479031085968018, -1.1504926681518555, -1.0530822277069092, -0.9556718468666077, -0.8582614660263062, -0.7608510255813599, -0.6634405851364136, -0.5660302042961121, -0.46861982345581055, -0.37120938301086426, -0.27379897236824036, -0.17638856172561646, -0.07897815108299255, 0.018432259559631348, 0.11584267020225525, 0.21325308084487915, 0.31066346168518066, 0.40807390213012695, 0.5054843425750732, 0.6028947234153748, 0.7003051042556763, 0.7977155447006226, 0.8951259851455688, 0.9925363659858704, 1.0899467468261719, 1.1873574256896973, 1.2847678661346436, 1.3821783065795898, 1.4795886278152466, 1.5769990682601929, 1.6744095087051392, 1.771819829940796, 1.8692302703857422, 1.9666407108306885, 2.0640511512756348, 2.161461591720581, 2.2588720321655273, 2.3562822341918945, 2.453692674636841, 2.551103115081787, 2.6485135555267334, 2.7459239959716797, 2.843334436416626, 2.9407448768615723, 3.0381553173065186, 3.135565757751465, 3.232975959777832, 3.3303864002227783, 3.4277968406677246, 3.525207281112671, 3.622617721557617, 3.7200281620025635, 3.8174386024475098, 3.914848804473877, 4.012259483337402, 4.1096696853637695, 4.207079887390137, 4.304490566253662]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 9.0, 5.0, 4.0, 11.0, 14.0, 21.0, 16.0, 38.0, 51.0, 59.0, 78.0, 85.0, 90.0, 89.0, 84.0, 65.0, 66.0, 42.0, 44.0, 32.0, 31.0, 21.0, 14.0, 13.0, 5.0, 7.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.9620790481567383, -2.8868136405944824, -2.8115482330322266, -2.7362828254699707, -2.661017417907715, -2.585752010345459, -2.510486602783203, -2.435220956802368, -2.3599555492401123, -2.2846901416778564, -2.2094247341156006, -2.1341593265533447, -2.058893918991089, -1.9836283922195435, -1.9083629846572876, -1.8330974578857422, -1.7578321695327759, -1.68256676197052, -1.6073013544082642, -1.5320358276367188, -1.456770420074463, -1.381505012512207, -1.3062396049499512, -1.2309741973876953, -1.1557087898254395, -1.0804433822631836, -1.0051779747009277, -0.9299125075340271, -0.8546470403671265, -0.7793816328048706, -0.7041162252426147, -0.6288507580757141, -0.5535851716995239, -0.4783197343349457, -0.40305429697036743, -0.3277888894081116, -0.2525234520435333, -0.17725801467895508, -0.10199260711669922, -0.026727139949798584, 0.048538267612457275, 0.12380369752645493, 0.19906912744045258, 0.27433454990386963, 0.3495999872684479, 0.4248654246330261, 0.500130832195282, 0.5753962993621826, 0.6506617069244385, 0.7259271144866943, 0.801192581653595, 0.8764579892158508, 0.9517234563827515, 1.0269888639450073, 1.1022542715072632, 1.1775197982788086, 1.2527852058410645, 1.3280506134033203, 1.4033160209655762, 1.478581428527832, 1.5538469552993774, 1.6291123628616333, 1.7043777704238892, 1.7796432971954346, 1.8549085855484009]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 15.0, 22.0, 18.0, 57.0, 83.0, 180.0, 453.0, 1308.0, 4412.0, 20735.0, 177501.0, 756125.0, 71941.0, 11362.0, 2756.0, 843.0, 364.0, 151.0, 81.0, 32.0, 27.0, 15.0, 9.0, 12.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55859375, -3.44122314453125, -3.3238525390625, -3.20648193359375, -3.089111328125, -2.97174072265625, -2.8543701171875, -2.73699951171875, -2.61962890625, -2.50225830078125, -2.3848876953125, -2.26751708984375, -2.150146484375, -2.03277587890625, -1.9154052734375, -1.79803466796875, -1.6806640625, -1.56329345703125, -1.4459228515625, -1.32855224609375, -1.211181640625, -1.09381103515625, -0.9764404296875, -0.85906982421875, -0.74169921875, -0.62432861328125, -0.5069580078125, -0.38958740234375, -0.272216796875, -0.15484619140625, -0.0374755859375, 0.07989501953125, 0.197265625, 0.31463623046875, 0.4320068359375, 0.54937744140625, 0.666748046875, 0.78411865234375, 0.9014892578125, 1.01885986328125, 1.13623046875, 1.25360107421875, 1.3709716796875, 1.48834228515625, 1.605712890625, 1.72308349609375, 1.8404541015625, 1.95782470703125, 2.0751953125, 2.19256591796875, 2.3099365234375, 2.42730712890625, 2.544677734375, 2.66204833984375, 2.7794189453125, 2.89678955078125, 3.01416015625, 3.13153076171875, 3.2489013671875, 3.36627197265625, 3.483642578125, 3.60101318359375, 3.7183837890625, 3.83575439453125, 3.953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 9.0, 20.0, 33.0, 78.0, 142.0, 176.0, 184.0, 151.0, 89.0, 57.0, 35.0, 19.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-20.765625, -20.36798095703125, -19.9703369140625, -19.57269287109375, -19.175048828125, -18.77740478515625, -18.3797607421875, -17.98211669921875, -17.58447265625, -17.18682861328125, -16.7891845703125, -16.39154052734375, -15.993896484375, -15.59625244140625, -15.1986083984375, -14.80096435546875, -14.4033203125, -14.00567626953125, -13.6080322265625, -13.21038818359375, -12.812744140625, -12.41510009765625, -12.0174560546875, -11.61981201171875, -11.22216796875, -10.82452392578125, -10.4268798828125, -10.02923583984375, -9.631591796875, -9.23394775390625, -8.8363037109375, -8.43865966796875, -8.041015625, -7.64337158203125, -7.2457275390625, -6.84808349609375, -6.450439453125, -6.05279541015625, -5.6551513671875, -5.25750732421875, -4.85986328125, -4.46221923828125, -4.0645751953125, -3.66693115234375, -3.269287109375, -2.87164306640625, -2.4739990234375, -2.07635498046875, -1.6787109375, -1.28106689453125, -0.8834228515625, -0.48577880859375, -0.088134765625, 0.30950927734375, 0.7071533203125, 1.10479736328125, 1.50244140625, 1.90008544921875, 2.2977294921875, 2.69537353515625, 3.093017578125, 3.49066162109375, 3.8883056640625, 4.28594970703125, 4.68359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 10.0, 7.0, 11.0, 22.0, 36.0, 51.0, 75.0, 113.0, 214.0, 350.0, 771.0, 1997.0, 7234.0, 47887.0, 756436.0, 208986.0, 18030.0, 3902.0, 1215.0, 510.0, 278.0, 159.0, 61.0, 56.0, 38.0, 38.0, 23.0, 10.0, 12.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.916015625, -2.82122802734375, -2.7264404296875, -2.63165283203125, -2.536865234375, -2.44207763671875, -2.3472900390625, -2.25250244140625, -2.15771484375, -2.06292724609375, -1.9681396484375, -1.87335205078125, -1.778564453125, -1.68377685546875, -1.5889892578125, -1.49420166015625, -1.3994140625, -1.30462646484375, -1.2098388671875, -1.11505126953125, -1.020263671875, -0.92547607421875, -0.8306884765625, -0.73590087890625, -0.64111328125, -0.54632568359375, -0.4515380859375, -0.35675048828125, -0.261962890625, -0.16717529296875, -0.0723876953125, 0.02239990234375, 0.1171875, 0.21197509765625, 0.3067626953125, 0.40155029296875, 0.496337890625, 0.59112548828125, 0.6859130859375, 0.78070068359375, 0.87548828125, 0.97027587890625, 1.0650634765625, 1.15985107421875, 1.254638671875, 1.34942626953125, 1.4442138671875, 1.53900146484375, 1.6337890625, 1.72857666015625, 1.8233642578125, 1.91815185546875, 2.012939453125, 2.10772705078125, 2.2025146484375, 2.29730224609375, 2.39208984375, 2.48687744140625, 2.5816650390625, 2.67645263671875, 2.771240234375, 2.86602783203125, 2.9608154296875, 3.05560302734375, 3.150390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 7.0, 10.0, 12.0, 17.0, 13.0, 17.0, 26.0, 30.0, 26.0, 26.0, 39.0, 38.0, 38.0, 31.0, 41.0, 38.0, 41.0, 37.0, 44.0, 45.0, 45.0, 38.0, 39.0, 36.0, 41.0, 32.0, 19.0, 26.0, 20.0, 18.0, 10.0, 11.0, 8.0, 13.0, 7.0, 8.0, 12.0, 5.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.1112060546875, -3.976318359375, -3.8414306640625, -3.70654296875, -3.5716552734375, -3.436767578125, -3.3018798828125, -3.1669921875, -3.0321044921875, -2.897216796875, -2.7623291015625, -2.62744140625, -2.4925537109375, -2.357666015625, -2.2227783203125, -2.087890625, -1.9530029296875, -1.818115234375, -1.6832275390625, -1.54833984375, -1.4134521484375, -1.278564453125, -1.1436767578125, -1.0087890625, -0.8739013671875, -0.739013671875, -0.6041259765625, -0.46923828125, -0.3343505859375, -0.199462890625, -0.0645751953125, 0.0703125, 0.2052001953125, 0.340087890625, 0.4749755859375, 0.60986328125, 0.7447509765625, 0.879638671875, 1.0145263671875, 1.1494140625, 1.2843017578125, 1.419189453125, 1.5540771484375, 1.68896484375, 1.8238525390625, 1.958740234375, 2.0936279296875, 2.228515625, 2.3634033203125, 2.498291015625, 2.6331787109375, 2.76806640625, 2.9029541015625, 3.037841796875, 3.1727294921875, 3.3076171875, 3.4425048828125, 3.577392578125, 3.7122802734375, 3.84716796875, 3.9820556640625, 4.116943359375, 4.2518310546875, 4.38671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 6.0, 4.0, 3.0, 4.0, 10.0, 14.0, 13.0, 14.0, 30.0, 34.0, 39.0, 74.0, 69.0, 108.0, 188.0, 244.0, 420.0, 611.0, 1065.0, 1843.0, 3390.0, 6355.0, 13637.0, 32414.0, 92517.0, 356980.0, 377154.0, 97465.0, 34458.0, 14420.0, 6752.0, 3328.0, 1849.0, 1075.0, 678.0, 430.0, 293.0, 175.0, 112.0, 83.0, 59.0, 49.0, 25.0, 19.0, 9.0, 14.0, 10.0, 7.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.427490234375, -0.4132499694824219, -0.39900970458984375, -0.3847694396972656, -0.3705291748046875, -0.3562889099121094, -0.34204864501953125, -0.3278083801269531, -0.313568115234375, -0.2993278503417969, -0.28508758544921875, -0.2708473205566406, -0.2566070556640625, -0.24236679077148438, -0.22812652587890625, -0.21388626098632812, -0.19964599609375, -0.18540573120117188, -0.17116546630859375, -0.15692520141601562, -0.1426849365234375, -0.12844467163085938, -0.11420440673828125, -0.09996414184570312, -0.085723876953125, -0.07148361206054688, -0.05724334716796875, -0.043003082275390625, -0.0287628173828125, -0.014522552490234375, -0.00028228759765625, 0.013957977294921875, 0.0281982421875, 0.042438507080078125, 0.05667877197265625, 0.07091903686523438, 0.0851593017578125, 0.09939956665039062, 0.11363983154296875, 0.12788009643554688, 0.142120361328125, 0.15636062622070312, 0.17060089111328125, 0.18484115600585938, 0.1990814208984375, 0.21332168579101562, 0.22756195068359375, 0.24180221557617188, 0.25604248046875, 0.2702827453613281, 0.28452301025390625, 0.2987632751464844, 0.3130035400390625, 0.3272438049316406, 0.34148406982421875, 0.3557243347167969, 0.369964599609375, 0.3842048645019531, 0.39844512939453125, 0.4126853942871094, 0.4269256591796875, 0.4411659240722656, 0.45540618896484375, 0.4696464538574219, 0.48388671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 7.0, 3.0, 4.0, 9.0, 10.0, 17.0, 26.0, 29.0, 27.0, 34.0, 49.0, 58.0, 104.0, 105.0, 125.0, 97.0, 63.0, 48.0, 40.0, 31.0, 20.0, 14.0, 12.0, 13.0, 9.0, 10.0, 2.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00012373924255371094, -0.00011987611651420593, -0.00011601299047470093, -0.00011214986443519592, -0.00010828673839569092, -0.00010442361235618591, -0.00010056048631668091, -9.66973602771759e-05, -9.28342342376709e-05, -8.89711081981659e-05, -8.510798215866089e-05, -8.124485611915588e-05, -7.738173007965088e-05, -7.351860404014587e-05, -6.965547800064087e-05, -6.579235196113586e-05, -6.192922592163086e-05, -5.8066099882125854e-05, -5.420297384262085e-05, -5.0339847803115845e-05, -4.647672176361084e-05, -4.2613595724105835e-05, -3.875046968460083e-05, -3.4887343645095825e-05, -3.102421760559082e-05, -2.7161091566085815e-05, -2.329796552658081e-05, -1.9434839487075806e-05, -1.55717134475708e-05, -1.1708587408065796e-05, -7.845461368560791e-06, -3.982335329055786e-06, -1.1920928955078125e-07, 3.7439167499542236e-06, 7.6070427894592285e-06, 1.1470168828964233e-05, 1.5333294868469238e-05, 1.9196420907974243e-05, 2.3059546947479248e-05, 2.6922672986984253e-05, 3.078579902648926e-05, 3.464892506599426e-05, 3.851205110549927e-05, 4.237517714500427e-05, 4.623830318450928e-05, 5.010142922401428e-05, 5.396455526351929e-05, 5.782768130302429e-05, 6.16908073425293e-05, 6.55539333820343e-05, 6.94170594215393e-05, 7.328018546104431e-05, 7.714331150054932e-05, 8.100643754005432e-05, 8.486956357955933e-05, 8.873268961906433e-05, 9.259581565856934e-05, 9.645894169807434e-05, 0.00010032206773757935, 0.00010418519377708435, 0.00010804831981658936, 0.00011191144585609436, 0.00011577457189559937, 0.00011963769793510437, 0.00012350082397460938]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 2.0, 7.0, 14.0, 23.0, 22.0, 24.0, 60.0, 71.0, 117.0, 170.0, 273.0, 550.0, 888.0, 1853.0, 4104.0, 10722.0, 36693.0, 205627.0, 650645.0, 100163.0, 22547.0, 7681.0, 3059.0, 1374.0, 679.0, 427.0, 231.0, 170.0, 89.0, 66.0, 60.0, 25.0, 22.0, 29.0, 15.0, 10.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.70751953125, -0.6833877563476562, -0.6592559814453125, -0.6351242065429688, -0.610992431640625, -0.5868606567382812, -0.5627288818359375, -0.5385971069335938, -0.51446533203125, -0.49033355712890625, -0.4662017822265625, -0.44207000732421875, -0.417938232421875, -0.39380645751953125, -0.3696746826171875, -0.34554290771484375, -0.3214111328125, -0.29727935791015625, -0.2731475830078125, -0.24901580810546875, -0.224884033203125, -0.20075225830078125, -0.1766204833984375, -0.15248870849609375, -0.12835693359375, -0.10422515869140625, -0.0800933837890625, -0.05596160888671875, -0.031829833984375, -0.00769805908203125, 0.0164337158203125, 0.04056549072265625, 0.064697265625, 0.08882904052734375, 0.1129608154296875, 0.13709259033203125, 0.161224365234375, 0.18535614013671875, 0.2094879150390625, 0.23361968994140625, 0.25775146484375, 0.28188323974609375, 0.3060150146484375, 0.33014678955078125, 0.354278564453125, 0.37841033935546875, 0.4025421142578125, 0.42667388916015625, 0.4508056640625, 0.47493743896484375, 0.4990692138671875, 0.5232009887695312, 0.547332763671875, 0.5714645385742188, 0.5955963134765625, 0.6197280883789062, 0.64385986328125, 0.6679916381835938, 0.6921234130859375, 0.7162551879882812, 0.740386962890625, 0.7645187377929688, 0.7886505126953125, 0.8127822875976562, 0.8369140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 10.0, 11.0, 21.0, 17.0, 18.0, 25.0, 32.0, 35.0, 47.0, 63.0, 72.0, 101.0, 98.0, 82.0, 72.0, 49.0, 44.0, 40.0, 25.0, 17.0, 14.0, 14.0, 11.0, 15.0, 10.0, 9.0, 4.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36669921875, -0.3563041687011719, -0.34590911865234375, -0.3355140686035156, -0.3251190185546875, -0.3147239685058594, -0.30432891845703125, -0.2939338684082031, -0.283538818359375, -0.2731437683105469, -0.26274871826171875, -0.2523536682128906, -0.2419586181640625, -0.23156356811523438, -0.22116851806640625, -0.21077346801757812, -0.20037841796875, -0.18998336791992188, -0.17958831787109375, -0.16919326782226562, -0.1587982177734375, -0.14840316772460938, -0.13800811767578125, -0.12761306762695312, -0.117218017578125, -0.10682296752929688, -0.09642791748046875, -0.08603286743164062, -0.0756378173828125, -0.06524276733398438, -0.05484771728515625, -0.044452667236328125, -0.0340576171875, -0.023662567138671875, -0.01326751708984375, -0.002872467041015625, 0.0075225830078125, 0.017917633056640625, 0.02831268310546875, 0.038707733154296875, 0.049102783203125, 0.059497833251953125, 0.06989288330078125, 0.08028793334960938, 0.0906829833984375, 0.10107803344726562, 0.11147308349609375, 0.12186813354492188, 0.13226318359375, 0.14265823364257812, 0.15305328369140625, 0.16344833374023438, 0.1738433837890625, 0.18423843383789062, 0.19463348388671875, 0.20502853393554688, 0.215423583984375, 0.22581863403320312, 0.23621368408203125, 0.24660873413085938, 0.2570037841796875, 0.2673988342285156, 0.27779388427734375, 0.2881889343261719, 0.298583984375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 8.0, 12.0, 28.0, 94.0, 333.0, 365.0, 103.0, 33.0, 14.0, 5.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.957146644592285, -10.350625991821289, -9.74410629272461, -9.137585639953613, -8.531065940856934, -7.9245452880859375, -7.3180251121521, -6.711504936218262, -6.104984760284424, -5.498464584350586, -4.891944408416748, -4.28542423248291, -3.678903818130493, -3.0723836421966553, -2.4658632278442383, -1.8593430519104004, -1.2528228759765625, -0.6463026404380798, -0.03978240489959717, 0.5667378902435303, 1.1732580661773682, 1.779778242111206, 2.386298656463623, 2.992818832397461, 3.599339008331299, 4.205859184265137, 4.812379360198975, 5.4188995361328125, 6.025420188903809, 6.631939888000488, 7.238460540771484, 7.844980716705322, 8.451499938964844, 9.05802059173584, 9.66454029083252, 10.271060943603516, 10.877580642700195, 11.484101295471191, 12.090621948242188, 12.697141647338867, 13.303661346435547, 13.910181999206543, 14.516701698303223, 15.123222351074219, 15.729742050170898, 16.336261749267578, 16.94278335571289, 17.54930305480957, 18.15582275390625, 18.76234245300293, 19.368864059448242, 19.975383758544922, 20.5819034576416, 21.18842315673828, 21.794944763183594, 22.401464462280273, 23.007986068725586, 23.614505767822266, 24.221027374267578, 24.827547073364258, 25.434066772460938, 26.040586471557617, 26.64710807800293, 27.25362777709961, 27.86014747619629]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 13.0, 13.0, 18.0, 27.0, 30.0, 44.0, 45.0, 56.0, 59.0, 56.0, 71.0, 58.0, 71.0, 69.0, 52.0, 68.0, 38.0, 41.0, 43.0, 32.0, 23.0, 13.0, 12.0, 13.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.36768341064453, -17.93861198425293, -17.509538650512695, -17.080467224121094, -16.651395797729492, -16.222322463989258, -15.793251037597656, -15.364178657531738, -14.93510627746582, -14.506033897399902, -14.0769624710083, -13.647890090942383, -13.218817710876465, -12.789745330810547, -12.360673904418945, -11.931601524353027, -11.502530097961426, -11.073457717895508, -10.644386291503906, -10.215313911437988, -9.78624153137207, -9.357170104980469, -8.92809772491455, -8.499025344848633, -8.069953918457031, -7.6408820152282715, -7.2118096351623535, -6.782737731933594, -6.353665351867676, -5.924593448638916, -5.495521545410156, -5.066449165344238, -4.63737678527832, -4.2083048820495605, -3.7792325019836426, -3.350160598754883, -2.921088457107544, -2.492016315460205, -2.0629444122314453, -1.6338722705841064, -1.2048001289367676, -0.7757280468940735, -0.3466559648513794, 0.08241605758666992, 0.5114881992340088, 0.9405603408813477, 1.3696322441101074, 1.7987043857574463, 2.227776527404785, 2.656848669052124, 3.085920810699463, 3.5149927139282227, 3.9440648555755615, 4.3731369972229, 4.80220890045166, 5.231281280517578, 5.660353183746338, 6.089425086975098, 6.518497467041016, 6.947569370269775, 7.376641273498535, 7.805713653564453, 8.234785079956055, 8.663857460021973, 9.09292984008789]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 16.0, 15.0, 25.0, 34.0, 53.0, 102.0, 135.0, 206.0, 376.0, 580.0, 1054.0, 2029.0, 4658.0, 12200.0, 48435.0, 549766.0, 3395785.0, 140877.0, 23619.0, 7532.0, 3136.0, 1537.0, 845.0, 455.0, 276.0, 186.0, 103.0, 75.0, 38.0, 59.0, 17.0, 17.0, 13.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.412109375, -3.303009033203125, -3.19390869140625, -3.084808349609375, -2.9757080078125, -2.866607666015625, -2.75750732421875, -2.648406982421875, -2.539306640625, -2.430206298828125, -2.32110595703125, -2.212005615234375, -2.1029052734375, -1.993804931640625, -1.88470458984375, -1.775604248046875, -1.66650390625, -1.557403564453125, -1.44830322265625, -1.339202880859375, -1.2301025390625, -1.121002197265625, -1.01190185546875, -0.902801513671875, -0.793701171875, -0.684600830078125, -0.57550048828125, -0.466400146484375, -0.3572998046875, -0.248199462890625, -0.13909912109375, -0.029998779296875, 0.0791015625, 0.188201904296875, 0.29730224609375, 0.406402587890625, 0.5155029296875, 0.624603271484375, 0.73370361328125, 0.842803955078125, 0.951904296875, 1.061004638671875, 1.17010498046875, 1.279205322265625, 1.3883056640625, 1.497406005859375, 1.60650634765625, 1.715606689453125, 1.82470703125, 1.933807373046875, 2.04290771484375, 2.152008056640625, 2.2611083984375, 2.370208740234375, 2.47930908203125, 2.588409423828125, 2.697509765625, 2.806610107421875, 2.91571044921875, 3.024810791015625, 3.1339111328125, 3.243011474609375, 3.35211181640625, 3.461212158203125, 3.5703125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 7.0, 19.0, 12.0, 14.0, 15.0, 25.0, 39.0, 52.0, 66.0, 68.0, 81.0, 69.0, 75.0, 78.0, 61.0, 47.0, 35.0, 45.0, 33.0, 24.0, 25.0, 12.0, 9.0, 15.0, 19.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02734375, -1.958282470703125, -1.88922119140625, -1.820159912109375, -1.7510986328125, -1.682037353515625, -1.61297607421875, -1.543914794921875, -1.474853515625, -1.405792236328125, -1.33673095703125, -1.267669677734375, -1.1986083984375, -1.129547119140625, -1.06048583984375, -0.991424560546875, -0.92236328125, -0.853302001953125, -0.78424072265625, -0.715179443359375, -0.6461181640625, -0.577056884765625, -0.50799560546875, -0.438934326171875, -0.369873046875, -0.300811767578125, -0.23175048828125, -0.162689208984375, -0.0936279296875, -0.024566650390625, 0.04449462890625, 0.113555908203125, 0.1826171875, 0.251678466796875, 0.32073974609375, 0.389801025390625, 0.4588623046875, 0.527923583984375, 0.59698486328125, 0.666046142578125, 0.735107421875, 0.804168701171875, 0.87322998046875, 0.942291259765625, 1.0113525390625, 1.080413818359375, 1.14947509765625, 1.218536376953125, 1.28759765625, 1.356658935546875, 1.42572021484375, 1.494781494140625, 1.5638427734375, 1.632904052734375, 1.70196533203125, 1.771026611328125, 1.840087890625, 1.909149169921875, 1.97821044921875, 2.047271728515625, 2.1163330078125, 2.185394287109375, 2.25445556640625, 2.323516845703125, 2.392578125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 14.0, 16.0, 31.0, 35.0, 45.0, 81.0, 149.0, 239.0, 421.0, 971.0, 2608.0, 9637.0, 64408.0, 3642105.0, 439564.0, 25731.0, 5095.0, 1579.0, 669.0, 348.0, 180.0, 105.0, 66.0, 45.0, 33.0, 24.0, 11.0, 13.0, 7.0, 7.0, 8.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.08551025390625, -3.9483642578125, -3.81121826171875, -3.674072265625, -3.53692626953125, -3.3997802734375, -3.26263427734375, -3.12548828125, -2.98834228515625, -2.8511962890625, -2.71405029296875, -2.576904296875, -2.43975830078125, -2.3026123046875, -2.16546630859375, -2.0283203125, -1.89117431640625, -1.7540283203125, -1.61688232421875, -1.479736328125, -1.34259033203125, -1.2054443359375, -1.06829833984375, -0.93115234375, -0.79400634765625, -0.6568603515625, -0.51971435546875, -0.382568359375, -0.24542236328125, -0.1082763671875, 0.02886962890625, 0.166015625, 0.30316162109375, 0.4403076171875, 0.57745361328125, 0.714599609375, 0.85174560546875, 0.9888916015625, 1.12603759765625, 1.26318359375, 1.40032958984375, 1.5374755859375, 1.67462158203125, 1.811767578125, 1.94891357421875, 2.0860595703125, 2.22320556640625, 2.3603515625, 2.49749755859375, 2.6346435546875, 2.77178955078125, 2.908935546875, 3.04608154296875, 3.1832275390625, 3.32037353515625, 3.45751953125, 3.59466552734375, 3.7318115234375, 3.86895751953125, 4.006103515625, 4.14324951171875, 4.2803955078125, 4.41754150390625, 4.5546875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 6.0, 10.0, 14.0, 11.0, 31.0, 20.0, 46.0, 55.0, 74.0, 88.0, 173.0, 283.0, 595.0, 1046.0, 653.0, 327.0, 184.0, 113.0, 82.0, 66.0, 47.0, 30.0, 30.0, 16.0, 13.0, 12.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6375045776367188, -0.6143646240234375, -0.5912246704101562, -0.568084716796875, -0.5449447631835938, -0.5218048095703125, -0.49866485595703125, -0.47552490234375, -0.45238494873046875, -0.4292449951171875, -0.40610504150390625, -0.382965087890625, -0.35982513427734375, -0.3366851806640625, -0.31354522705078125, -0.2904052734375, -0.26726531982421875, -0.2441253662109375, -0.22098541259765625, -0.197845458984375, -0.17470550537109375, -0.1515655517578125, -0.12842559814453125, -0.10528564453125, -0.08214569091796875, -0.0590057373046875, -0.03586578369140625, -0.012725830078125, 0.01041412353515625, 0.0335540771484375, 0.05669403076171875, 0.079833984375, 0.10297393798828125, 0.1261138916015625, 0.14925384521484375, 0.172393798828125, 0.19553375244140625, 0.2186737060546875, 0.24181365966796875, 0.26495361328125, 0.28809356689453125, 0.3112335205078125, 0.33437347412109375, 0.357513427734375, 0.38065338134765625, 0.4037933349609375, 0.42693328857421875, 0.4500732421875, 0.47321319580078125, 0.4963531494140625, 0.5194931030273438, 0.542633056640625, 0.5657730102539062, 0.5889129638671875, 0.6120529174804688, 0.63519287109375, 0.6583328247070312, 0.6814727783203125, 0.7046127319335938, 0.727752685546875, 0.7508926391601562, 0.7740325927734375, 0.7971725463867188, 0.8203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 8.0, 17.0, 24.0, 56.0, 84.0, 139.0, 190.0, 139.0, 104.0, 70.0, 37.0, 37.0, 15.0, 12.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.906198978424072, -4.765286922454834, -4.624375343322754, -4.483463287353516, -4.342551231384277, -4.201639652252197, -4.060727596282959, -3.9198157787323, -3.7789039611816406, -3.6379921436309814, -3.497080087661743, -3.356168270111084, -3.215256452560425, -3.0743446350097656, -2.9334325790405273, -2.792520761489868, -2.65160870552063, -2.5106968879699707, -2.3697848320007324, -2.2288730144500732, -2.087961196899414, -1.9470492601394653, -1.8061373233795166, -1.6652255058288574, -1.5243135690689087, -1.38340163230896, -1.2424898147583008, -1.101577877998352, -0.9606660008430481, -0.8197541236877441, -0.6788421869277954, -0.5379303097724915, -0.3970184326171875, -0.25610655546188354, -0.1151946485042572, 0.02571725845336914, 0.1666291356086731, 0.30754101276397705, 0.4484529495239258, 0.5893648266792297, 0.7302767038345337, 0.8711885809898376, 1.0121004581451416, 1.1530123949050903, 1.293924331665039, 1.4348361492156982, 1.575748085975647, 1.7166600227355957, 1.8575718402862549, 1.9984837770462036, 2.1393957138061523, 2.2803075313568115, 2.4212193489074707, 2.562131404876709, 2.703043222427368, 2.8439550399780273, 2.9848670959472656, 3.125778913497925, 3.266690969467163, 3.4076027870178223, 3.5485146045684814, 3.6894264221191406, 3.830338478088379, 3.971250295639038, 4.112162113189697]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 7.0, 13.0, 20.0, 18.0, 14.0, 17.0, 37.0, 40.0, 27.0, 45.0, 40.0, 53.0, 53.0, 61.0, 65.0, 61.0, 41.0, 51.0, 49.0, 43.0, 24.0, 31.0, 36.0, 23.0, 15.0, 15.0, 18.0, 13.0, 9.0, 9.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7863608598709106, -1.7207067012786865, -1.6550525426864624, -1.5893983840942383, -1.5237441062927246, -1.4580899477005005, -1.3924357891082764, -1.3267816305160522, -1.2611274719238281, -1.195473313331604, -1.1298191547393799, -1.0641648769378662, -0.9985107183456421, -0.932856559753418, -0.8672024011611938, -0.8015482425689697, -0.735893964767456, -0.6702398061752319, -0.604585587978363, -0.5389314293861389, -0.4732772409915924, -0.4076230525970459, -0.3419688940048218, -0.27631470561027527, -0.21066051721572876, -0.14500632882118225, -0.07935215532779694, -0.013697981834411621, 0.05195620656013489, 0.1176103949546814, 0.18326455354690552, 0.24891874194145203, 0.3145730495452881, 0.3802272379398346, 0.4458814263343811, 0.5115355849266052, 0.5771898031234741, 0.6428439617156982, 0.7084981203079224, 0.7741522789001465, 0.8398064970970154, 0.9054606556892395, 0.9711148738861084, 1.0367690324783325, 1.1024231910705566, 1.1680774688720703, 1.2337315082550049, 1.2993857860565186, 1.3650399446487427, 1.4306941032409668, 1.496348261833191, 1.562002420425415, 1.6276566982269287, 1.6933108568191528, 1.758965015411377, 1.824619174003601, 1.8902733325958252, 1.9559274911880493, 2.0215816497802734, 2.087235927581787, 2.1528899669647217, 2.2185442447662354, 2.28419828414917, 2.3498525619506836, 2.4155068397521973]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 13.0, 17.0, 28.0, 38.0, 57.0, 84.0, 137.0, 249.0, 431.0, 719.0, 1341.0, 2669.0, 5740.0, 13176.0, 33859.0, 98176.0, 284134.0, 369496.0, 152609.0, 50918.0, 19028.0, 7936.0, 3647.0, 1834.0, 959.0, 499.0, 288.0, 193.0, 122.0, 65.0, 32.0, 11.0, 16.0, 11.0, 11.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2335205078125, -0.22669219970703125, -0.2198638916015625, -0.21303558349609375, -0.206207275390625, -0.19937896728515625, -0.1925506591796875, -0.18572235107421875, -0.17889404296875, -0.17206573486328125, -0.1652374267578125, -0.15840911865234375, -0.151580810546875, -0.14475250244140625, -0.1379241943359375, -0.13109588623046875, -0.124267578125, -0.11743927001953125, -0.1106109619140625, -0.10378265380859375, -0.096954345703125, -0.09012603759765625, -0.0832977294921875, -0.07646942138671875, -0.06964111328125, -0.06281280517578125, -0.0559844970703125, -0.04915618896484375, -0.042327880859375, -0.03549957275390625, -0.0286712646484375, -0.02184295654296875, -0.0150146484375, -0.00818634033203125, -0.0013580322265625, 0.00547027587890625, 0.012298583984375, 0.01912689208984375, 0.0259552001953125, 0.03278350830078125, 0.03961181640625, 0.04644012451171875, 0.0532684326171875, 0.06009674072265625, 0.066925048828125, 0.07375335693359375, 0.0805816650390625, 0.08740997314453125, 0.09423828125, 0.10106658935546875, 0.1078948974609375, 0.11472320556640625, 0.121551513671875, 0.12837982177734375, 0.1352081298828125, 0.14203643798828125, 0.14886474609375, 0.15569305419921875, 0.1625213623046875, 0.16934967041015625, 0.176177978515625, 0.18300628662109375, 0.1898345947265625, 0.19666290283203125, 0.2034912109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 6.0, 16.0, 21.0, 17.0, 26.0, 30.0, 42.0, 43.0, 64.0, 66.0, 76.0, 83.0, 55.0, 66.0, 53.0, 61.0, 46.0, 35.0, 29.0, 32.0, 25.0, 22.0, 10.0, 9.0, 13.0, 13.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.5955963134765625, -1.540802001953125, -1.4860076904296875, -1.43121337890625, -1.3764190673828125, -1.321624755859375, -1.2668304443359375, -1.2120361328125, -1.1572418212890625, -1.102447509765625, -1.0476531982421875, -0.99285888671875, -0.9380645751953125, -0.883270263671875, -0.8284759521484375, -0.773681640625, -0.7188873291015625, -0.664093017578125, -0.6092987060546875, -0.55450439453125, -0.4997100830078125, -0.444915771484375, -0.3901214599609375, -0.3353271484375, -0.2805328369140625, -0.225738525390625, -0.1709442138671875, -0.11614990234375, -0.0613555908203125, -0.006561279296875, 0.0482330322265625, 0.10302734375, 0.1578216552734375, 0.212615966796875, 0.2674102783203125, 0.32220458984375, 0.3769989013671875, 0.431793212890625, 0.4865875244140625, 0.5413818359375, 0.5961761474609375, 0.650970458984375, 0.7057647705078125, 0.76055908203125, 0.8153533935546875, 0.870147705078125, 0.9249420166015625, 0.979736328125, 1.0345306396484375, 1.089324951171875, 1.1441192626953125, 1.19891357421875, 1.2537078857421875, 1.308502197265625, 1.3632965087890625, 1.4180908203125, 1.4728851318359375, 1.527679443359375, 1.5824737548828125, 1.63726806640625, 1.6920623779296875, 1.746856689453125, 1.8016510009765625, 1.8564453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 13.0, 9.0, 19.0, 24.0, 38.0, 40.0, 63.0, 98.0, 154.0, 180.0, 310.0, 530.0, 1021.0, 2294.0, 5874.0, 18895.0, 73060.0, 270229.0, 432472.0, 176810.0, 45570.0, 12695.0, 4209.0, 1778.0, 824.0, 468.0, 253.0, 177.0, 131.0, 75.0, 78.0, 36.0, 31.0, 27.0, 17.0, 13.0, 7.0, 4.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.261962890625, -0.2541027069091797, -0.24624252319335938, -0.23838233947753906, -0.23052215576171875, -0.22266197204589844, -0.21480178833007812, -0.2069416046142578, -0.1990814208984375, -0.1912212371826172, -0.18336105346679688, -0.17550086975097656, -0.16764068603515625, -0.15978050231933594, -0.15192031860351562, -0.1440601348876953, -0.136199951171875, -0.1283397674560547, -0.12047958374023438, -0.11261940002441406, -0.10475921630859375, -0.09689903259277344, -0.08903884887695312, -0.08117866516113281, -0.0733184814453125, -0.06545829772949219, -0.057598114013671875, -0.04973793029785156, -0.04187774658203125, -0.03401756286621094, -0.026157379150390625, -0.018297195434570312, -0.01043701171875, -0.0025768280029296875, 0.005283355712890625, 0.013143539428710938, 0.02100372314453125, 0.028863906860351562, 0.036724090576171875, 0.04458427429199219, 0.0524444580078125, 0.06030464172363281, 0.06816482543945312, 0.07602500915527344, 0.08388519287109375, 0.09174537658691406, 0.09960556030273438, 0.10746574401855469, 0.115325927734375, 0.12318611145019531, 0.13104629516601562, 0.13890647888183594, 0.14676666259765625, 0.15462684631347656, 0.16248703002929688, 0.1703472137451172, 0.1782073974609375, 0.1860675811767578, 0.19392776489257812, 0.20178794860839844, 0.20964813232421875, 0.21750831604003906, 0.22536849975585938, 0.2332286834716797, 0.2410888671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 4.0, 3.0, 5.0, 10.0, 4.0, 10.0, 16.0, 20.0, 13.0, 20.0, 24.0, 32.0, 26.0, 39.0, 46.0, 54.0, 54.0, 51.0, 64.0, 60.0, 58.0, 38.0, 39.0, 44.0, 45.0, 30.0, 28.0, 31.0, 33.0, 18.0, 18.0, 11.0, 10.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.181640625, -3.088714599609375, -2.99578857421875, -2.902862548828125, -2.8099365234375, -2.717010498046875, -2.62408447265625, -2.531158447265625, -2.438232421875, -2.345306396484375, -2.25238037109375, -2.159454345703125, -2.0665283203125, -1.973602294921875, -1.88067626953125, -1.787750244140625, -1.69482421875, -1.601898193359375, -1.50897216796875, -1.416046142578125, -1.3231201171875, -1.230194091796875, -1.13726806640625, -1.044342041015625, -0.951416015625, -0.858489990234375, -0.76556396484375, -0.672637939453125, -0.5797119140625, -0.486785888671875, -0.39385986328125, -0.300933837890625, -0.2080078125, -0.115081787109375, -0.02215576171875, 0.070770263671875, 0.1636962890625, 0.256622314453125, 0.34954833984375, 0.442474365234375, 0.535400390625, 0.628326416015625, 0.72125244140625, 0.814178466796875, 0.9071044921875, 1.000030517578125, 1.09295654296875, 1.185882568359375, 1.27880859375, 1.371734619140625, 1.46466064453125, 1.557586669921875, 1.6505126953125, 1.743438720703125, 1.83636474609375, 1.929290771484375, 2.022216796875, 2.115142822265625, 2.20806884765625, 2.300994873046875, 2.3939208984375, 2.486846923828125, 2.57977294921875, 2.672698974609375, 2.765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 13.0, 29.0, 34.0, 33.0, 92.0, 117.0, 190.0, 394.0, 656.0, 1373.0, 3350.0, 10500.0, 74894.0, 775706.0, 157590.0, 15696.0, 4314.0, 1695.0, 822.0, 422.0, 220.0, 131.0, 78.0, 59.0, 42.0, 16.0, 17.0, 14.0, 10.0, 4.0, 7.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.167236328125, -0.1615924835205078, -0.15594863891601562, -0.15030479431152344, -0.14466094970703125, -0.13901710510253906, -0.13337326049804688, -0.1277294158935547, -0.1220855712890625, -0.11644172668457031, -0.11079788208007812, -0.10515403747558594, -0.09951019287109375, -0.09386634826660156, -0.08822250366210938, -0.08257865905761719, -0.076934814453125, -0.07129096984863281, -0.06564712524414062, -0.06000328063964844, -0.05435943603515625, -0.04871559143066406, -0.043071746826171875, -0.03742790222167969, -0.0317840576171875, -0.026140213012695312, -0.020496368408203125, -0.014852523803710938, -0.00920867919921875, -0.0035648345947265625, 0.002079010009765625, 0.0077228546142578125, 0.01336669921875, 0.019010543823242188, 0.024654388427734375, 0.030298233032226562, 0.03594207763671875, 0.04158592224121094, 0.047229766845703125, 0.05287361145019531, 0.0585174560546875, 0.06416130065917969, 0.06980514526367188, 0.07544898986816406, 0.08109283447265625, 0.08673667907714844, 0.09238052368164062, 0.09802436828613281, 0.103668212890625, 0.10931205749511719, 0.11495590209960938, 0.12059974670410156, 0.12624359130859375, 0.13188743591308594, 0.13753128051757812, 0.1431751251220703, 0.1488189697265625, 0.1544628143310547, 0.16010665893554688, 0.16575050354003906, 0.17139434814453125, 0.17703819274902344, 0.18268203735351562, 0.1883258819580078, 0.1939697265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 10.0, 2.0, 15.0, 18.0, 28.0, 55.0, 103.0, 212.0, 252.0, 164.0, 77.0, 30.0, 14.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001590251922607422, -0.00015451014041900635, -0.0001499950885772705, -0.00014548003673553467, -0.00014096498489379883, -0.000136449933052063, -0.00013193488121032715, -0.0001274198293685913, -0.00012290477752685547, -0.00011838972568511963, -0.00011387467384338379, -0.00010935962200164795, -0.00010484457015991211, -0.00010032951831817627, -9.581446647644043e-05, -9.129941463470459e-05, -8.678436279296875e-05, -8.226931095123291e-05, -7.775425910949707e-05, -7.323920726776123e-05, -6.872415542602539e-05, -6.420910358428955e-05, -5.969405174255371e-05, -5.517899990081787e-05, -5.066394805908203e-05, -4.614889621734619e-05, -4.163384437561035e-05, -3.711879253387451e-05, -3.260374069213867e-05, -2.8088688850402832e-05, -2.3573637008666992e-05, -1.9058585166931152e-05, -1.4543533325195312e-05, -1.0028481483459473e-05, -5.513429641723633e-06, -9.98377799987793e-07, 3.516674041748047e-06, 8.031725883483887e-06, 1.2546777725219727e-05, 1.7061829566955566e-05, 2.1576881408691406e-05, 2.6091933250427246e-05, 3.0606985092163086e-05, 3.5122036933898926e-05, 3.9637088775634766e-05, 4.4152140617370605e-05, 4.8667192459106445e-05, 5.3182244300842285e-05, 5.7697296142578125e-05, 6.221234798431396e-05, 6.67273998260498e-05, 7.124245166778564e-05, 7.575750350952148e-05, 8.027255535125732e-05, 8.478760719299316e-05, 8.9302659034729e-05, 9.381771087646484e-05, 9.833276271820068e-05, 0.00010284781455993652, 0.00010736286640167236, 0.0001118779182434082, 0.00011639297008514404, 0.00012090802192687988, 0.00012542307376861572, 0.00012993812561035156]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 12.0, 11.0, 23.0, 23.0, 29.0, 45.0, 67.0, 101.0, 120.0, 207.0, 336.0, 599.0, 1248.0, 3188.0, 9822.0, 58798.0, 736624.0, 208219.0, 20139.0, 5098.0, 1832.0, 839.0, 390.0, 268.0, 135.0, 113.0, 71.0, 52.0, 31.0, 28.0, 23.0, 16.0, 8.0, 10.0, 6.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.209228515625, -0.20337295532226562, -0.19751739501953125, -0.19166183471679688, -0.1858062744140625, -0.17995071411132812, -0.17409515380859375, -0.16823959350585938, -0.162384033203125, -0.15652847290039062, -0.15067291259765625, -0.14481735229492188, -0.1389617919921875, -0.13310623168945312, -0.12725067138671875, -0.12139511108398438, -0.11553955078125, -0.10968399047851562, -0.10382843017578125, -0.09797286987304688, -0.0921173095703125, -0.08626174926757812, -0.08040618896484375, -0.07455062866210938, -0.068695068359375, -0.06283950805664062, -0.05698394775390625, -0.051128387451171875, -0.0452728271484375, -0.039417266845703125, -0.03356170654296875, -0.027706146240234375, -0.0218505859375, -0.015995025634765625, -0.01013946533203125, -0.004283905029296875, 0.0015716552734375, 0.007427215576171875, 0.01328277587890625, 0.019138336181640625, 0.024993896484375, 0.030849456787109375, 0.03670501708984375, 0.042560577392578125, 0.0484161376953125, 0.054271697998046875, 0.06012725830078125, 0.06598281860351562, 0.07183837890625, 0.07769393920898438, 0.08354949951171875, 0.08940505981445312, 0.0952606201171875, 0.10111618041992188, 0.10697174072265625, 0.11282730102539062, 0.118682861328125, 0.12453842163085938, 0.13039398193359375, 0.13624954223632812, 0.1421051025390625, 0.14796066284179688, 0.15381622314453125, 0.15967178344726562, 0.16552734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 5.0, 14.0, 12.0, 22.0, 24.0, 43.0, 40.0, 72.0, 101.0, 112.0, 120.0, 94.0, 84.0, 52.0, 48.0, 32.0, 33.0, 12.0, 14.0, 16.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03656005859375, -0.03555583953857422, -0.03455162048339844, -0.033547401428222656, -0.032543182373046875, -0.031538963317871094, -0.030534744262695312, -0.02953052520751953, -0.02852630615234375, -0.02752208709716797, -0.026517868041992188, -0.025513648986816406, -0.024509429931640625, -0.023505210876464844, -0.022500991821289062, -0.02149677276611328, -0.0204925537109375, -0.01948833465576172, -0.018484115600585938, -0.017479896545410156, -0.016475677490234375, -0.015471458435058594, -0.014467239379882812, -0.013463020324707031, -0.01245880126953125, -0.011454582214355469, -0.010450363159179688, -0.009446144104003906, -0.008441925048828125, -0.007437705993652344, -0.0064334869384765625, -0.005429267883300781, -0.004425048828125, -0.0034208297729492188, -0.0024166107177734375, -0.0014123916625976562, -0.000408172607421875, 0.0005960464477539062, 0.0016002655029296875, 0.0026044845581054688, 0.00360870361328125, 0.004612922668457031, 0.0056171417236328125, 0.006621360778808594, 0.007625579833984375, 0.008629798889160156, 0.009634017944335938, 0.010638236999511719, 0.0116424560546875, 0.012646675109863281, 0.013650894165039062, 0.014655113220214844, 0.015659332275390625, 0.016663551330566406, 0.017667770385742188, 0.01867198944091797, 0.01967620849609375, 0.02068042755126953, 0.021684646606445312, 0.022688865661621094, 0.023693084716796875, 0.024697303771972656, 0.025701522827148438, 0.02670574188232422, 0.0277099609375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 10.0, 13.0, 24.0, 32.0, 115.0, 266.0, 285.0, 128.0, 58.0, 27.0, 13.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.100545883178711, -3.9370317459106445, -3.773517608642578, -3.6100034713745117, -3.4464893341064453, -3.282975196838379, -3.1194610595703125, -2.955946922302246, -2.7924327850341797, -2.6289186477661133, -2.465404510498047, -2.3018903732299805, -2.138376235961914, -1.9748620986938477, -1.8113479614257812, -1.6478338241577148, -1.4843196868896484, -1.320805549621582, -1.1572914123535156, -0.9937772750854492, -0.8302631378173828, -0.6667490005493164, -0.50323486328125, -0.3397207260131836, -0.1762065887451172, -0.012692451477050781, 0.15082168579101562, 0.31433582305908203, 0.47784996032714844, 0.6413640975952148, 0.8048782348632812, 0.9683923721313477, 1.1319069862365723, 1.2954211235046387, 1.458935260772705, 1.6224493980407715, 1.785963535308838, 1.9494776725769043, 2.1129918098449707, 2.276505947113037, 2.4400200843811035, 2.60353422164917, 2.7670483589172363, 2.9305624961853027, 3.094076633453369, 3.2575907707214355, 3.421104907989502, 3.5846190452575684, 3.7481331825256348, 3.911647319793701, 4.075161457061768, 4.238675594329834, 4.4021897315979, 4.565703868865967, 4.729218006134033, 4.8927321434021, 5.056246280670166, 5.219760417938232, 5.383274555206299, 5.546788692474365, 5.710302829742432, 5.873816967010498, 6.0373311042785645, 6.200845241546631, 6.364359378814697]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 17.0, 16.0, 28.0, 29.0, 35.0, 50.0, 60.0, 54.0, 67.0, 82.0, 86.0, 72.0, 73.0, 60.0, 38.0, 34.0, 40.0, 30.0, 23.0, 10.0, 11.0, 13.0, 9.0, 6.0, 10.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6169227361679077, -1.5615910291671753, -1.5062594413757324, -1.450927734375, -1.3955961465835571, -1.3402644395828247, -1.2849328517913818, -1.2296011447906494, -1.174269437789917, -1.1189377307891846, -1.0636061429977417, -1.0082744359970093, -0.9529428482055664, -0.897611141204834, -0.8422794938087463, -0.7869478464126587, -0.7316162586212158, -0.6762846112251282, -0.6209529638290405, -0.5656212568283081, -0.5102896690368652, -0.4549579918384552, -0.39962631464004517, -0.3442946672439575, -0.2889630198478699, -0.23363137245178223, -0.1782997101545334, -0.12296804785728455, -0.0676364004611969, -0.012304753065109253, 0.04302692413330078, 0.09835857152938843, 0.15369033813476562, 0.20902198553085327, 0.2643536329269409, 0.31968531012535095, 0.3750169575214386, 0.43034860491752625, 0.4856802821159363, 0.5410119295120239, 0.5963435769081116, 0.6516752243041992, 0.7070068717002869, 0.7623385190963745, 0.8176702260971069, 0.8730018138885498, 0.9283335208892822, 0.9836651682853699, 1.0389968156814575, 1.09432852268219, 1.1496601104736328, 1.2049918174743652, 1.260323405265808, 1.3156551122665405, 1.3709867000579834, 1.4263184070587158, 1.4816501140594482, 1.5369818210601807, 1.5923134088516235, 1.647645115852356, 1.7029767036437988, 1.7583084106445312, 1.8136401176452637, 1.8689717054367065, 1.9243032932281494]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 19.0, 13.0, 25.0, 35.0, 51.0, 83.0, 100.0, 143.0, 235.0, 359.0, 565.0, 835.0, 1442.0, 2433.0, 4662.0, 9154.0, 20178.0, 53350.0, 194108.0, 528481.0, 151479.0, 44947.0, 17543.0, 8204.0, 4141.0, 2195.0, 1354.0, 849.0, 505.0, 349.0, 200.0, 145.0, 100.0, 88.0, 49.0, 34.0, 22.0, 14.0, 11.0, 12.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1552734375, -1.1172943115234375, -1.079315185546875, -1.0413360595703125, -1.00335693359375, -0.9653778076171875, -0.927398681640625, -0.8894195556640625, -0.8514404296875, -0.8134613037109375, -0.775482177734375, -0.7375030517578125, -0.69952392578125, -0.6615447998046875, -0.623565673828125, -0.5855865478515625, -0.547607421875, -0.5096282958984375, -0.471649169921875, -0.4336700439453125, -0.39569091796875, -0.3577117919921875, -0.319732666015625, -0.2817535400390625, -0.2437744140625, -0.2057952880859375, -0.167816162109375, -0.1298370361328125, -0.09185791015625, -0.0538787841796875, -0.015899658203125, 0.0220794677734375, 0.06005859375, 0.0980377197265625, 0.136016845703125, 0.1739959716796875, 0.21197509765625, 0.2499542236328125, 0.287933349609375, 0.3259124755859375, 0.3638916015625, 0.4018707275390625, 0.439849853515625, 0.4778289794921875, 0.51580810546875, 0.5537872314453125, 0.591766357421875, 0.6297454833984375, 0.667724609375, 0.7057037353515625, 0.743682861328125, 0.7816619873046875, 0.81964111328125, 0.8576202392578125, 0.895599365234375, 0.9335784912109375, 0.9715576171875, 1.0095367431640625, 1.047515869140625, 1.0854949951171875, 1.12347412109375, 1.1614532470703125, 1.199432373046875, 1.2374114990234375, 1.275390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 7.0, 2.0, 10.0, 10.0, 22.0, 24.0, 28.0, 38.0, 35.0, 40.0, 56.0, 63.0, 68.0, 85.0, 80.0, 71.0, 54.0, 57.0, 53.0, 33.0, 32.0, 25.0, 24.0, 17.0, 14.0, 9.0, 6.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817901611328125, -3.67681884765625, -3.535736083984375, -3.3946533203125, -3.253570556640625, -3.11248779296875, -2.971405029296875, -2.830322265625, -2.689239501953125, -2.54815673828125, -2.407073974609375, -2.2659912109375, -2.124908447265625, -1.98382568359375, -1.842742919921875, -1.70166015625, -1.560577392578125, -1.41949462890625, -1.278411865234375, -1.1373291015625, -0.996246337890625, -0.85516357421875, -0.714080810546875, -0.572998046875, -0.431915283203125, -0.29083251953125, -0.149749755859375, -0.0086669921875, 0.132415771484375, 0.27349853515625, 0.414581298828125, 0.5556640625, 0.696746826171875, 0.83782958984375, 0.978912353515625, 1.1199951171875, 1.261077880859375, 1.40216064453125, 1.543243408203125, 1.684326171875, 1.825408935546875, 1.96649169921875, 2.107574462890625, 2.2486572265625, 2.389739990234375, 2.53082275390625, 2.671905517578125, 2.81298828125, 2.954071044921875, 3.09515380859375, 3.236236572265625, 3.3773193359375, 3.518402099609375, 3.65948486328125, 3.800567626953125, 3.941650390625, 4.082733154296875, 4.22381591796875, 4.364898681640625, 4.5059814453125, 4.647064208984375, 4.78814697265625, 4.929229736328125, 5.0703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 12.0, 21.0, 26.0, 40.0, 51.0, 71.0, 109.0, 193.0, 346.0, 580.0, 1158.0, 2592.0, 6358.0, 20128.0, 94393.0, 662087.0, 210294.0, 33664.0, 9460.0, 3561.0, 1540.0, 747.0, 409.0, 210.0, 157.0, 94.0, 65.0, 40.0, 29.0, 23.0, 16.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.26171875, -1.217742919921875, -1.17376708984375, -1.129791259765625, -1.0858154296875, -1.041839599609375, -0.99786376953125, -0.953887939453125, -0.909912109375, -0.865936279296875, -0.82196044921875, -0.777984619140625, -0.7340087890625, -0.690032958984375, -0.64605712890625, -0.602081298828125, -0.55810546875, -0.514129638671875, -0.47015380859375, -0.426177978515625, -0.3822021484375, -0.338226318359375, -0.29425048828125, -0.250274658203125, -0.206298828125, -0.162322998046875, -0.11834716796875, -0.074371337890625, -0.0303955078125, 0.013580322265625, 0.05755615234375, 0.101531982421875, 0.1455078125, 0.189483642578125, 0.23345947265625, 0.277435302734375, 0.3214111328125, 0.365386962890625, 0.40936279296875, 0.453338623046875, 0.497314453125, 0.541290283203125, 0.58526611328125, 0.629241943359375, 0.6732177734375, 0.717193603515625, 0.76116943359375, 0.805145263671875, 0.84912109375, 0.893096923828125, 0.93707275390625, 0.981048583984375, 1.0250244140625, 1.069000244140625, 1.11297607421875, 1.156951904296875, 1.200927734375, 1.244903564453125, 1.28887939453125, 1.332855224609375, 1.3768310546875, 1.420806884765625, 1.46478271484375, 1.508758544921875, 1.552734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 7.0, 12.0, 6.0, 11.0, 11.0, 10.0, 15.0, 19.0, 19.0, 28.0, 36.0, 29.0, 36.0, 48.0, 43.0, 37.0, 50.0, 42.0, 42.0, 45.0, 47.0, 41.0, 39.0, 41.0, 34.0, 31.0, 40.0, 33.0, 30.0, 19.0, 16.0, 17.0, 11.0, 8.0, 13.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.1729736328125, -4.041259765625, -3.9095458984375, -3.77783203125, -3.6461181640625, -3.514404296875, -3.3826904296875, -3.2509765625, -3.1192626953125, -2.987548828125, -2.8558349609375, -2.72412109375, -2.5924072265625, -2.460693359375, -2.3289794921875, -2.197265625, -2.0655517578125, -1.933837890625, -1.8021240234375, -1.67041015625, -1.5386962890625, -1.406982421875, -1.2752685546875, -1.1435546875, -1.0118408203125, -0.880126953125, -0.7484130859375, -0.61669921875, -0.4849853515625, -0.353271484375, -0.2215576171875, -0.08984375, 0.0418701171875, 0.173583984375, 0.3052978515625, 0.43701171875, 0.5687255859375, 0.700439453125, 0.8321533203125, 0.9638671875, 1.0955810546875, 1.227294921875, 1.3590087890625, 1.49072265625, 1.6224365234375, 1.754150390625, 1.8858642578125, 2.017578125, 2.1492919921875, 2.281005859375, 2.4127197265625, 2.54443359375, 2.6761474609375, 2.807861328125, 2.9395751953125, 3.0712890625, 3.2030029296875, 3.334716796875, 3.4664306640625, 3.59814453125, 3.7298583984375, 3.861572265625, 3.9932861328125, 4.125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 11.0, 18.0, 39.0, 44.0, 125.0, 308.0, 1245.0, 9409.0, 481812.0, 543592.0, 10184.0, 1223.0, 330.0, 107.0, 52.0, 17.0, 15.0, 9.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.583984375, -1.5443954467773438, -1.5048065185546875, -1.4652175903320312, -1.425628662109375, -1.3860397338867188, -1.3464508056640625, -1.3068618774414062, -1.26727294921875, -1.2276840209960938, -1.1880950927734375, -1.1485061645507812, -1.108917236328125, -1.0693283081054688, -1.0297393798828125, -0.9901504516601562, -0.9505615234375, -0.9109725952148438, -0.8713836669921875, -0.8317947387695312, -0.792205810546875, -0.7526168823242188, -0.7130279541015625, -0.6734390258789062, -0.63385009765625, -0.5942611694335938, -0.5546722412109375, -0.5150833129882812, -0.475494384765625, -0.43590545654296875, -0.3963165283203125, -0.35672760009765625, -0.317138671875, -0.27754974365234375, -0.2379608154296875, -0.19837188720703125, -0.158782958984375, -0.11919403076171875, -0.0796051025390625, -0.04001617431640625, -0.00042724609375, 0.03916168212890625, 0.0787506103515625, 0.11833953857421875, 0.157928466796875, 0.19751739501953125, 0.2371063232421875, 0.27669525146484375, 0.3162841796875, 0.35587310791015625, 0.3954620361328125, 0.43505096435546875, 0.474639892578125, 0.5142288208007812, 0.5538177490234375, 0.5934066772460938, 0.63299560546875, 0.6725845336914062, 0.7121734619140625, 0.7517623901367188, 0.791351318359375, 0.8309402465820312, 0.8705291748046875, 0.9101181030273438, 0.94970703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 13.0, 28.0, 66.0, 110.0, 228.0, 232.0, 116.0, 78.0, 38.0, 28.0, 18.0, 14.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001556873321533203, -0.00015014410018920898, -0.00014460086822509766, -0.00013905763626098633, -0.000133514404296875, -0.00012797117233276367, -0.00012242794036865234, -0.00011688470840454102, -0.00011134147644042969, -0.00010579824447631836, -0.00010025501251220703, -9.47117805480957e-05, -8.916854858398438e-05, -8.362531661987305e-05, -7.808208465576172e-05, -7.253885269165039e-05, -6.699562072753906e-05, -6.145238876342773e-05, -5.5909156799316406e-05, -5.036592483520508e-05, -4.482269287109375e-05, -3.927946090698242e-05, -3.3736228942871094e-05, -2.8192996978759766e-05, -2.2649765014648438e-05, -1.710653305053711e-05, -1.1563301086425781e-05, -6.020069122314453e-06, -4.76837158203125e-07, 5.066394805908203e-06, 1.0609626770019531e-05, 1.615285873413086e-05, 2.1696090698242188e-05, 2.7239322662353516e-05, 3.2782554626464844e-05, 3.832578659057617e-05, 4.38690185546875e-05, 4.941225051879883e-05, 5.4955482482910156e-05, 6.0498714447021484e-05, 6.604194641113281e-05, 7.158517837524414e-05, 7.712841033935547e-05, 8.26716423034668e-05, 8.821487426757812e-05, 9.375810623168945e-05, 9.930133819580078e-05, 0.00010484457015991211, 0.00011038780212402344, 0.00011593103408813477, 0.0001214742660522461, 0.00012701749801635742, 0.00013256072998046875, 0.00013810396194458008, 0.0001436471939086914, 0.00014919042587280273, 0.00015473365783691406, 0.0001602768898010254, 0.00016582012176513672, 0.00017136335372924805, 0.00017690658569335938, 0.0001824498176574707, 0.00018799304962158203, 0.00019353628158569336, 0.0001990795135498047]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 15.0, 22.0, 47.0, 99.0, 252.0, 675.0, 2571.0, 15849.0, 491806.0, 517155.0, 16229.0, 2602.0, 775.0, 226.0, 93.0, 55.0, 25.0, 16.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92529296875, -0.8910293579101562, -0.8567657470703125, -0.8225021362304688, -0.788238525390625, -0.7539749145507812, -0.7197113037109375, -0.6854476928710938, -0.65118408203125, -0.6169204711914062, -0.5826568603515625, -0.5483932495117188, -0.514129638671875, -0.47986602783203125, -0.4456024169921875, -0.41133880615234375, -0.3770751953125, -0.34281158447265625, -0.3085479736328125, -0.27428436279296875, -0.240020751953125, -0.20575714111328125, -0.1714935302734375, -0.13722991943359375, -0.10296630859375, -0.06870269775390625, -0.0344390869140625, -0.00017547607421875, 0.034088134765625, 0.06835174560546875, 0.1026153564453125, 0.13687896728515625, 0.171142578125, 0.20540618896484375, 0.2396697998046875, 0.27393341064453125, 0.308197021484375, 0.34246063232421875, 0.3767242431640625, 0.41098785400390625, 0.44525146484375, 0.47951507568359375, 0.5137786865234375, 0.5480422973632812, 0.582305908203125, 0.6165695190429688, 0.6508331298828125, 0.6850967407226562, 0.7193603515625, 0.7536239624023438, 0.7878875732421875, 0.8221511840820312, 0.856414794921875, 0.8906784057617188, 0.9249420166015625, 0.9592056274414062, 0.99346923828125, 1.0277328491210938, 1.0619964599609375, 1.0962600708007812, 1.130523681640625, 1.1647872924804688, 1.1990509033203125, 1.2333145141601562, 1.267578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 13.0, 32.0, 60.0, 90.0, 162.0, 224.0, 163.0, 103.0, 51.0, 29.0, 23.0, 16.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6420707702636719, -0.6239852905273438, -0.6058998107910156, -0.5878143310546875, -0.5697288513183594, -0.5516433715820312, -0.5335578918457031, -0.515472412109375, -0.4973869323730469, -0.47930145263671875, -0.4612159729003906, -0.4431304931640625, -0.4250450134277344, -0.40695953369140625, -0.3888740539550781, -0.37078857421875, -0.3527030944824219, -0.33461761474609375, -0.3165321350097656, -0.2984466552734375, -0.2803611755371094, -0.26227569580078125, -0.24419021606445312, -0.226104736328125, -0.20801925659179688, -0.18993377685546875, -0.17184829711914062, -0.1537628173828125, -0.13567733764648438, -0.11759185791015625, -0.09950637817382812, -0.0814208984375, -0.06333541870117188, -0.04524993896484375, -0.027164459228515625, -0.0090789794921875, 0.009006500244140625, 0.02709197998046875, 0.045177459716796875, 0.063262939453125, 0.08134841918945312, 0.09943389892578125, 0.11751937866210938, 0.1356048583984375, 0.15369033813476562, 0.17177581787109375, 0.18986129760742188, 0.20794677734375, 0.22603225708007812, 0.24411773681640625, 0.2622032165527344, 0.2802886962890625, 0.2983741760253906, 0.31645965576171875, 0.3345451354980469, 0.352630615234375, 0.3707160949707031, 0.38880157470703125, 0.4068870544433594, 0.4249725341796875, 0.4430580139160156, 0.46114349365234375, 0.4792289733886719, 0.497314453125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 14.0, 28.0, 221.0, 639.0, 87.0, 18.0, 4.0, 3.0, 1.0], "bins": [-57.02280807495117, -56.044891357421875, -55.06697082519531, -54.089054107666016, -53.11113739013672, -52.133216857910156, -51.15530014038086, -50.17738342285156, -49.199462890625, -48.2215461730957, -47.24362564086914, -46.265708923339844, -45.28779220581055, -44.309871673583984, -43.33195495605469, -42.354034423828125, -41.37611770629883, -40.39820098876953, -39.42028045654297, -38.44236373901367, -37.464447021484375, -36.48652648925781, -35.508609771728516, -34.53069305419922, -33.552772521972656, -32.57485580444336, -31.59693717956543, -30.6190185546875, -29.64109992980957, -28.66318130493164, -27.685264587402344, -26.707345962524414, -25.729429244995117, -24.751510620117188, -23.77359390258789, -22.79567527770996, -21.81775665283203, -20.839839935302734, -19.861921310424805, -18.884002685546875, -17.906084060668945, -16.928165435791016, -15.950247764587402, -14.972330093383789, -13.99441146850586, -13.016493797302246, -12.038576126098633, -11.060657501220703, -10.082738876342773, -9.10482120513916, -8.12690258026123, -7.148984909057617, -6.1710662841796875, -5.193148612976074, -4.215230464935303, -3.2373123168945312, -2.259394645690918, -1.2814764976501465, -0.30355846881866455, 0.6743595600128174, 1.6522777080535889, 2.6301956176757812, 3.6081137657165527, 4.586031913757324, 5.563950061798096]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 7.0, 10.0, 16.0, 12.0, 17.0, 17.0, 27.0, 25.0, 22.0, 25.0, 29.0, 42.0, 34.0, 41.0, 49.0, 32.0, 33.0, 39.0, 47.0, 37.0, 41.0, 31.0, 34.0, 43.0, 19.0, 26.0, 25.0, 23.0, 21.0, 15.0, 19.0, 21.0, 20.0, 18.0, 13.0, 6.0, 9.0, 9.0, 5.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.727214336395264, -6.497513294219971, -6.2678117752075195, -6.038110733032227, -5.808409690856934, -5.578708648681641, -5.349007606506348, -5.1193060874938965, -4.8896050453186035, -4.6599040031433105, -4.430202484130859, -4.200501441955566, -3.9708003997802734, -3.7410993576049805, -3.5113980770111084, -3.2816967964172363, -3.0519957542419434, -2.8222947120666504, -2.5925934314727783, -2.3628921508789062, -2.1331911087036133, -1.9034899473190308, -1.6737887859344482, -1.4440876245498657, -1.2143864631652832, -0.9846853017807007, -0.7549841403961182, -0.5252829790115356, -0.2955818176269531, -0.0658806562423706, 0.16382050514221191, 0.39352166652679443, 0.6232233047485352, 0.8529244661331177, 1.0826256275177002, 1.3123267889022827, 1.5420279502868652, 1.7717291116714478, 2.0014302730560303, 2.2311315536499023, 2.4608325958251953, 2.6905336380004883, 2.9202349185943604, 3.1499361991882324, 3.3796372413635254, 3.6093382835388184, 3.8390395641326904, 4.0687408447265625, 4.2984418869018555, 4.528142929077148, 4.757843971252441, 4.987545490264893, 5.2172465324401855, 5.4469475746154785, 5.67664909362793, 5.906350135803223, 6.136051177978516, 6.365752220153809, 6.595453262329102, 6.825154781341553, 7.054855823516846, 7.284556865692139, 7.51425838470459, 7.743959426879883, 7.973660469055176]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 17.0, 16.0, 23.0, 34.0, 42.0, 66.0, 92.0, 139.0, 193.0, 321.0, 496.0, 777.0, 1330.0, 2385.0, 4661.0, 10608.0, 31128.0, 141712.0, 2584516.0, 1272444.0, 100071.0, 24427.0, 9067.0, 4097.0, 2132.0, 1255.0, 763.0, 484.0, 341.0, 220.0, 134.0, 87.0, 53.0, 42.0, 40.0, 19.0, 13.0, 8.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.033203125, -1.965240478515625, -1.89727783203125, -1.829315185546875, -1.7613525390625, -1.693389892578125, -1.62542724609375, -1.557464599609375, -1.489501953125, -1.421539306640625, -1.35357666015625, -1.285614013671875, -1.2176513671875, -1.149688720703125, -1.08172607421875, -1.013763427734375, -0.94580078125, -0.877838134765625, -0.80987548828125, -0.741912841796875, -0.6739501953125, -0.605987548828125, -0.53802490234375, -0.470062255859375, -0.402099609375, -0.334136962890625, -0.26617431640625, -0.198211669921875, -0.1302490234375, -0.062286376953125, 0.00567626953125, 0.073638916015625, 0.1416015625, 0.209564208984375, 0.27752685546875, 0.345489501953125, 0.4134521484375, 0.481414794921875, 0.54937744140625, 0.617340087890625, 0.685302734375, 0.753265380859375, 0.82122802734375, 0.889190673828125, 0.9571533203125, 1.025115966796875, 1.09307861328125, 1.161041259765625, 1.22900390625, 1.296966552734375, 1.36492919921875, 1.432891845703125, 1.5008544921875, 1.568817138671875, 1.63677978515625, 1.704742431640625, 1.772705078125, 1.840667724609375, 1.90863037109375, 1.976593017578125, 2.0445556640625, 2.112518310546875, 2.18048095703125, 2.248443603515625, 2.31640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 6.0, 7.0, 10.0, 8.0, 15.0, 22.0, 40.0, 37.0, 49.0, 58.0, 78.0, 77.0, 87.0, 67.0, 83.0, 65.0, 54.0, 56.0, 31.0, 25.0, 25.0, 18.0, 15.0, 12.0, 11.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.095703125, -2.0281982421875, -1.960693359375, -1.8931884765625, -1.82568359375, -1.7581787109375, -1.690673828125, -1.6231689453125, -1.5556640625, -1.4881591796875, -1.420654296875, -1.3531494140625, -1.28564453125, -1.2181396484375, -1.150634765625, -1.0831298828125, -1.015625, -0.9481201171875, -0.880615234375, -0.8131103515625, -0.74560546875, -0.6781005859375, -0.610595703125, -0.5430908203125, -0.4755859375, -0.4080810546875, -0.340576171875, -0.2730712890625, -0.20556640625, -0.1380615234375, -0.070556640625, -0.0030517578125, 0.064453125, 0.1319580078125, 0.199462890625, 0.2669677734375, 0.33447265625, 0.4019775390625, 0.469482421875, 0.5369873046875, 0.6044921875, 0.6719970703125, 0.739501953125, 0.8070068359375, 0.87451171875, 0.9420166015625, 1.009521484375, 1.0770263671875, 1.14453125, 1.2120361328125, 1.279541015625, 1.3470458984375, 1.41455078125, 1.4820556640625, 1.549560546875, 1.6170654296875, 1.6845703125, 1.7520751953125, 1.819580078125, 1.8870849609375, 1.95458984375, 2.0220947265625, 2.089599609375, 2.1571044921875, 2.224609375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 9.0, 9.0, 14.0, 31.0, 30.0, 69.0, 133.0, 223.0, 596.0, 2024.0, 10606.0, 188176.0, 3933832.0, 51001.0, 5348.0, 1280.0, 442.0, 211.0, 106.0, 49.0, 27.0, 12.0, 23.0, 11.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.3787841796875, -4.218505859375, -4.0582275390625, -3.89794921875, -3.7376708984375, -3.577392578125, -3.4171142578125, -3.2568359375, -3.0965576171875, -2.936279296875, -2.7760009765625, -2.61572265625, -2.4554443359375, -2.295166015625, -2.1348876953125, -1.974609375, -1.8143310546875, -1.654052734375, -1.4937744140625, -1.33349609375, -1.1732177734375, -1.012939453125, -0.8526611328125, -0.6923828125, -0.5321044921875, -0.371826171875, -0.2115478515625, -0.05126953125, 0.1090087890625, 0.269287109375, 0.4295654296875, 0.58984375, 0.7501220703125, 0.910400390625, 1.0706787109375, 1.23095703125, 1.3912353515625, 1.551513671875, 1.7117919921875, 1.8720703125, 2.0323486328125, 2.192626953125, 2.3529052734375, 2.51318359375, 2.6734619140625, 2.833740234375, 2.9940185546875, 3.154296875, 3.3145751953125, 3.474853515625, 3.6351318359375, 3.79541015625, 3.9556884765625, 4.115966796875, 4.2762451171875, 4.4365234375, 4.5968017578125, 4.757080078125, 4.9173583984375, 5.07763671875, 5.2379150390625, 5.398193359375, 5.5584716796875, 5.71875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 9.0, 11.0, 12.0, 27.0, 33.0, 58.0, 69.0, 132.0, 264.0, 505.0, 1435.0, 716.0, 359.0, 177.0, 76.0, 67.0, 32.0, 27.0, 16.0, 10.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93212890625, -0.9052200317382812, -0.8783111572265625, -0.8514022827148438, -0.824493408203125, -0.7975845336914062, -0.7706756591796875, -0.7437667846679688, -0.71685791015625, -0.6899490356445312, -0.6630401611328125, -0.6361312866210938, -0.609222412109375, -0.5823135375976562, -0.5554046630859375, -0.5284957885742188, -0.5015869140625, -0.47467803955078125, -0.4477691650390625, -0.42086029052734375, -0.393951416015625, -0.36704254150390625, -0.3401336669921875, -0.31322479248046875, -0.28631591796875, -0.25940704345703125, -0.2324981689453125, -0.20558929443359375, -0.178680419921875, -0.15177154541015625, -0.1248626708984375, -0.09795379638671875, -0.071044921875, -0.04413604736328125, -0.0172271728515625, 0.00968170166015625, 0.036590576171875, 0.06349945068359375, 0.0904083251953125, 0.11731719970703125, 0.14422607421875, 0.17113494873046875, 0.1980438232421875, 0.22495269775390625, 0.251861572265625, 0.27877044677734375, 0.3056793212890625, 0.33258819580078125, 0.3594970703125, 0.38640594482421875, 0.4133148193359375, 0.44022369384765625, 0.467132568359375, 0.49404144287109375, 0.5209503173828125, 0.5478591918945312, 0.57476806640625, 0.6016769409179688, 0.6285858154296875, 0.6554946899414062, 0.682403564453125, 0.7093124389648438, 0.7362213134765625, 0.7631301879882812, 0.7900390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 8.0, 8.0, 12.0, 11.0, 19.0, 29.0, 51.0, 77.0, 158.0, 204.0, 166.0, 96.0, 57.0, 36.0, 17.0, 15.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.210004806518555, -5.067798137664795, -4.925590991973877, -4.783384323120117, -4.641177177429199, -4.4989705085754395, -4.35676383972168, -4.214556694030762, -4.072350025177002, -3.930143117904663, -3.787936210632324, -3.6457295417785645, -3.5035226345062256, -3.3613157272338867, -3.219109058380127, -3.076902151107788, -2.934695243835449, -2.7924883365631104, -2.6502814292907715, -2.5080747604370117, -2.365867853164673, -2.223660945892334, -2.081454277038574, -1.9392473697662354, -1.7970404624938965, -1.6548335552215576, -1.5126267671585083, -1.370419979095459, -1.2282130718231201, -1.0860061645507812, -0.9437993764877319, -0.8015925288200378, -0.6593859195709229, -0.5171790719032288, -0.37497222423553467, -0.23276537656784058, -0.09055852890014648, 0.05164831876754761, 0.1938551664352417, 0.3360620141029358, 0.4782688617706299, 0.620475709438324, 0.7626825571060181, 0.9048894047737122, 1.0470962524414062, 1.1893031597137451, 1.3315099477767944, 1.4737167358398438, 1.6159236431121826, 1.7581305503845215, 1.9003373384475708, 2.04254412651062, 2.184751033782959, 2.326957941055298, 2.4691648483276367, 2.6113715171813965, 2.7535784244537354, 2.895785331726074, 3.037992000579834, 3.180198907852173, 3.3224058151245117, 3.4646127223968506, 3.6068196296691895, 3.749026298522949, 3.891233205795288]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 3.0, 1.0, 5.0, 7.0, 2.0, 9.0, 3.0, 12.0, 12.0, 18.0, 25.0, 30.0, 35.0, 45.0, 46.0, 61.0, 71.0, 76.0, 64.0, 55.0, 55.0, 50.0, 55.0, 41.0, 34.0, 34.0, 30.0, 28.0, 15.0, 20.0, 14.0, 8.0, 8.0, 12.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9250521659851074, -1.8598415851593018, -1.794631004333496, -1.7294204235076904, -1.6642097234725952, -1.5989991426467896, -1.5337885618209839, -1.4685779809951782, -1.403367280960083, -1.3381567001342773, -1.2729461193084717, -1.207735538482666, -1.1425248384475708, -1.0773142576217651, -1.0121036767959595, -0.9468930959701538, -0.8816825151443481, -0.8164719343185425, -0.751261293888092, -0.6860507130622864, -0.6208400726318359, -0.5556294918060303, -0.4904189109802246, -0.42520830035209656, -0.3599976897239685, -0.29478707909584045, -0.2295764833688736, -0.16436588764190674, -0.09915527701377869, -0.033944666385650635, 0.03126591444015503, 0.09647652506828308, 0.16168713569641113, 0.22689774632453918, 0.29210835695266724, 0.3573189377784729, 0.42252954840660095, 0.487740159034729, 0.5529507398605347, 0.6181613206863403, 0.6833719611167908, 0.7485825419425964, 0.8137931823730469, 0.8790037631988525, 0.9442143440246582, 1.0094249248504639, 1.0746355056762695, 1.1398462057113647, 1.2050567865371704, 1.270267367362976, 1.3354779481887817, 1.400688648223877, 1.4658992290496826, 1.5311098098754883, 1.596320390701294, 1.6615309715270996, 1.7267415523529053, 1.791952133178711, 1.8571627140045166, 1.9223732948303223, 1.9875839948654175, 2.0527944564819336, 2.1180052757263184, 2.183215856552124, 2.2484264373779297]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 11.0, 24.0, 29.0, 71.0, 78.0, 190.0, 317.0, 576.0, 1265.0, 2916.0, 7994.0, 24983.0, 97619.0, 413008.0, 378325.0, 86668.0, 21956.0, 7273.0, 2760.0, 1181.0, 539.0, 261.0, 197.0, 90.0, 59.0, 39.0, 29.0, 19.0, 14.0, 10.0, 7.0, 3.0, 4.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273193359375, -0.2649040222167969, -0.25661468505859375, -0.24832534790039062, -0.2400360107421875, -0.23174667358398438, -0.22345733642578125, -0.21516799926757812, -0.206878662109375, -0.19858932495117188, -0.19029998779296875, -0.18201065063476562, -0.1737213134765625, -0.16543197631835938, -0.15714263916015625, -0.14885330200195312, -0.14056396484375, -0.13227462768554688, -0.12398529052734375, -0.11569595336914062, -0.1074066162109375, -0.09911727905273438, -0.09082794189453125, -0.08253860473632812, -0.074249267578125, -0.06595993041992188, -0.05767059326171875, -0.049381256103515625, -0.0410919189453125, -0.032802581787109375, -0.02451324462890625, -0.016223907470703125, -0.0079345703125, 0.000354766845703125, 0.00864410400390625, 0.016933441162109375, 0.0252227783203125, 0.033512115478515625, 0.04180145263671875, 0.050090789794921875, 0.058380126953125, 0.06666946411132812, 0.07495880126953125, 0.08324813842773438, 0.0915374755859375, 0.09982681274414062, 0.10811614990234375, 0.11640548706054688, 0.12469482421875, 0.13298416137695312, 0.14127349853515625, 0.14956283569335938, 0.1578521728515625, 0.16614151000976562, 0.17443084716796875, 0.18272018432617188, 0.191009521484375, 0.19929885864257812, 0.20758819580078125, 0.21587753295898438, 0.2241668701171875, 0.23245620727539062, 0.24074554443359375, 0.24903488159179688, 0.25732421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 3.0, 4.0, 8.0, 11.0, 17.0, 14.0, 20.0, 30.0, 35.0, 55.0, 47.0, 85.0, 81.0, 60.0, 81.0, 62.0, 71.0, 49.0, 47.0, 35.0, 23.0, 31.0, 26.0, 27.0, 18.0, 5.0, 12.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.52313232421875, -1.4710693359375, -1.41900634765625, -1.366943359375, -1.31488037109375, -1.2628173828125, -1.21075439453125, -1.15869140625, -1.10662841796875, -1.0545654296875, -1.00250244140625, -0.950439453125, -0.89837646484375, -0.8463134765625, -0.79425048828125, -0.7421875, -0.69012451171875, -0.6380615234375, -0.58599853515625, -0.533935546875, -0.48187255859375, -0.4298095703125, -0.37774658203125, -0.32568359375, -0.27362060546875, -0.2215576171875, -0.16949462890625, -0.117431640625, -0.06536865234375, -0.0133056640625, 0.03875732421875, 0.0908203125, 0.14288330078125, 0.1949462890625, 0.24700927734375, 0.299072265625, 0.35113525390625, 0.4031982421875, 0.45526123046875, 0.50732421875, 0.55938720703125, 0.6114501953125, 0.66351318359375, 0.715576171875, 0.76763916015625, 0.8197021484375, 0.87176513671875, 0.923828125, 0.97589111328125, 1.0279541015625, 1.08001708984375, 1.132080078125, 1.18414306640625, 1.2362060546875, 1.28826904296875, 1.34033203125, 1.39239501953125, 1.4444580078125, 1.49652099609375, 1.548583984375, 1.60064697265625, 1.6527099609375, 1.70477294921875, 1.7568359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 8.0, 15.0, 14.0, 18.0, 25.0, 45.0, 63.0, 71.0, 127.0, 153.0, 215.0, 293.0, 462.0, 761.0, 1476.0, 3586.0, 9540.0, 33069.0, 124339.0, 359523.0, 348481.0, 118261.0, 31639.0, 9302.0, 3321.0, 1495.0, 754.0, 473.0, 258.0, 219.0, 158.0, 100.0, 77.0, 59.0, 32.0, 37.0, 24.0, 22.0, 8.0, 6.0, 12.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1920166015625, -0.18581771850585938, -0.17961883544921875, -0.17341995239257812, -0.1672210693359375, -0.16102218627929688, -0.15482330322265625, -0.14862442016601562, -0.142425537109375, -0.13622665405273438, -0.13002777099609375, -0.12382888793945312, -0.1176300048828125, -0.11143112182617188, -0.10523223876953125, -0.09903335571289062, -0.09283447265625, -0.08663558959960938, -0.08043670654296875, -0.07423782348632812, -0.0680389404296875, -0.061840057373046875, -0.05564117431640625, -0.049442291259765625, -0.043243408203125, -0.037044525146484375, -0.03084564208984375, -0.024646759033203125, -0.0184478759765625, -0.012248992919921875, -0.00605010986328125, 0.000148773193359375, 0.00634765625, 0.012546539306640625, 0.01874542236328125, 0.024944305419921875, 0.0311431884765625, 0.037342071533203125, 0.04354095458984375, 0.049739837646484375, 0.055938720703125, 0.062137603759765625, 0.06833648681640625, 0.07453536987304688, 0.0807342529296875, 0.08693313598632812, 0.09313201904296875, 0.09933090209960938, 0.10552978515625, 0.11172866821289062, 0.11792755126953125, 0.12412643432617188, 0.1303253173828125, 0.13652420043945312, 0.14272308349609375, 0.14892196655273438, 0.155120849609375, 0.16131973266601562, 0.16751861572265625, 0.17371749877929688, 0.1799163818359375, 0.18611526489257812, 0.19231414794921875, 0.19851303100585938, 0.2047119140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 10.0, 6.0, 9.0, 13.0, 17.0, 20.0, 23.0, 19.0, 20.0, 24.0, 32.0, 47.0, 28.0, 39.0, 34.0, 50.0, 49.0, 45.0, 43.0, 41.0, 45.0, 39.0, 35.0, 39.0, 37.0, 34.0, 28.0, 23.0, 21.0, 20.0, 18.0, 12.0, 13.0, 11.0, 8.0, 4.0, 10.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.31640625, -2.24383544921875, -2.1712646484375, -2.09869384765625, -2.026123046875, -1.95355224609375, -1.8809814453125, -1.80841064453125, -1.73583984375, -1.66326904296875, -1.5906982421875, -1.51812744140625, -1.445556640625, -1.37298583984375, -1.3004150390625, -1.22784423828125, -1.1552734375, -1.08270263671875, -1.0101318359375, -0.93756103515625, -0.864990234375, -0.79241943359375, -0.7198486328125, -0.64727783203125, -0.57470703125, -0.50213623046875, -0.4295654296875, -0.35699462890625, -0.284423828125, -0.21185302734375, -0.1392822265625, -0.06671142578125, 0.005859375, 0.07843017578125, 0.1510009765625, 0.22357177734375, 0.296142578125, 0.36871337890625, 0.4412841796875, 0.51385498046875, 0.58642578125, 0.65899658203125, 0.7315673828125, 0.80413818359375, 0.876708984375, 0.94927978515625, 1.0218505859375, 1.09442138671875, 1.1669921875, 1.23956298828125, 1.3121337890625, 1.38470458984375, 1.457275390625, 1.52984619140625, 1.6024169921875, 1.67498779296875, 1.74755859375, 1.82012939453125, 1.8927001953125, 1.96527099609375, 2.037841796875, 2.11041259765625, 2.1829833984375, 2.25555419921875, 2.328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 9.0, 18.0, 20.0, 47.0, 97.0, 217.0, 630.0, 2024.0, 11669.0, 195606.0, 790763.0, 41070.0, 4705.0, 993.0, 323.0, 152.0, 75.0, 52.0, 32.0, 11.0, 11.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2197265625, -0.21452713012695312, -0.20932769775390625, -0.20412826538085938, -0.1989288330078125, -0.19372940063476562, -0.18852996826171875, -0.18333053588867188, -0.178131103515625, -0.17293167114257812, -0.16773223876953125, -0.16253280639648438, -0.1573333740234375, -0.15213394165039062, -0.14693450927734375, -0.14173507690429688, -0.13653564453125, -0.13133621215820312, -0.12613677978515625, -0.12093734741210938, -0.1157379150390625, -0.11053848266601562, -0.10533905029296875, -0.10013961791992188, -0.094940185546875, -0.08974075317382812, -0.08454132080078125, -0.07934188842773438, -0.0741424560546875, -0.06894302368164062, -0.06374359130859375, -0.058544158935546875, -0.0533447265625, -0.048145294189453125, -0.04294586181640625, -0.037746429443359375, -0.0325469970703125, -0.027347564697265625, -0.02214813232421875, -0.016948699951171875, -0.011749267578125, -0.006549835205078125, -0.00135040283203125, 0.003849029541015625, 0.0090484619140625, 0.014247894287109375, 0.01944732666015625, 0.024646759033203125, 0.02984619140625, 0.035045623779296875, 0.04024505615234375, 0.045444488525390625, 0.0506439208984375, 0.055843353271484375, 0.06104278564453125, 0.06624221801757812, 0.071441650390625, 0.07664108276367188, 0.08184051513671875, 0.08703994750976562, 0.0922393798828125, 0.09743881225585938, 0.10263824462890625, 0.10783767700195312, 0.113037109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 27.0, 34.0, 41.0, 108.0, 129.0, 142.0, 149.0, 135.0, 90.0, 49.0, 30.0, 15.0, 20.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00011348724365234375, -0.00011090654879808426, -0.00010832585394382477, -0.00010574515908956528, -0.00010316446423530579, -0.0001005837693810463, -9.80030745267868e-05, -9.542237967252731e-05, -9.284168481826782e-05, -9.026098996400833e-05, -8.768029510974884e-05, -8.509960025548935e-05, -8.251890540122986e-05, -7.993821054697037e-05, -7.735751569271088e-05, -7.477682083845139e-05, -7.21961259841919e-05, -6.96154311299324e-05, -6.703473627567291e-05, -6.445404142141342e-05, -6.187334656715393e-05, -5.929265171289444e-05, -5.671195685863495e-05, -5.413126200437546e-05, -5.155056715011597e-05, -4.8969872295856476e-05, -4.6389177441596985e-05, -4.3808482587337494e-05, -4.1227787733078e-05, -3.864709287881851e-05, -3.606639802455902e-05, -3.348570317029953e-05, -3.090500831604004e-05, -2.8324313461780548e-05, -2.5743618607521057e-05, -2.3162923753261566e-05, -2.0582228899002075e-05, -1.8001534044742584e-05, -1.5420839190483093e-05, -1.2840144336223602e-05, -1.0259449481964111e-05, -7.67875462770462e-06, -5.098059773445129e-06, -2.5173649191856384e-06, 6.332993507385254e-08, 2.6440247893333435e-06, 5.2247196435928345e-06, 7.805414497852325e-06, 1.0386109352111816e-05, 1.2966804206371307e-05, 1.55474990606308e-05, 1.812819391489029e-05, 2.070888876914978e-05, 2.328958362340927e-05, 2.5870278477668762e-05, 2.8450973331928253e-05, 3.1031668186187744e-05, 3.3612363040447235e-05, 3.6193057894706726e-05, 3.877375274896622e-05, 4.135444760322571e-05, 4.39351424574852e-05, 4.651583731174469e-05, 4.909653216600418e-05, 5.167722702026367e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 7.0, 12.0, 9.0, 17.0, 15.0, 46.0, 87.0, 179.0, 442.0, 1507.0, 10669.0, 430810.0, 589175.0, 13101.0, 1634.0, 472.0, 165.0, 84.0, 47.0, 32.0, 15.0, 9.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.28076171875, -0.27392005920410156, -0.2670783996582031, -0.2602367401123047, -0.25339508056640625, -0.2465534210205078, -0.23971176147460938, -0.23287010192871094, -0.2260284423828125, -0.21918678283691406, -0.21234512329101562, -0.2055034637451172, -0.19866180419921875, -0.1918201446533203, -0.18497848510742188, -0.17813682556152344, -0.171295166015625, -0.16445350646972656, -0.15761184692382812, -0.1507701873779297, -0.14392852783203125, -0.1370868682861328, -0.13024520874023438, -0.12340354919433594, -0.1165618896484375, -0.10972023010253906, -0.10287857055664062, -0.09603691101074219, -0.08919525146484375, -0.08235359191894531, -0.07551193237304688, -0.06867027282714844, -0.06182861328125, -0.05498695373535156, -0.048145294189453125, -0.04130363464355469, -0.03446197509765625, -0.027620315551757812, -0.020778656005859375, -0.013936996459960938, -0.0070953369140625, -0.0002536773681640625, 0.006587982177734375, 0.013429641723632812, 0.02027130126953125, 0.027112960815429688, 0.033954620361328125, 0.04079627990722656, 0.047637939453125, 0.05447959899902344, 0.061321258544921875, 0.06816291809082031, 0.07500457763671875, 0.08184623718261719, 0.08868789672851562, 0.09552955627441406, 0.1023712158203125, 0.10921287536621094, 0.11605453491210938, 0.12289619445800781, 0.12973785400390625, 0.1365795135498047, 0.14342117309570312, 0.15026283264160156, 0.1571044921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 19.0, 24.0, 77.0, 149.0, 262.0, 234.0, 113.0, 51.0, 30.0, 13.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036895751953125, -0.0352787971496582, -0.033661842346191406, -0.03204488754272461, -0.030427932739257812, -0.028810977935791016, -0.02719402313232422, -0.025577068328857422, -0.023960113525390625, -0.022343158721923828, -0.02072620391845703, -0.019109249114990234, -0.017492294311523438, -0.01587533950805664, -0.014258384704589844, -0.012641429901123047, -0.01102447509765625, -0.009407520294189453, -0.007790565490722656, -0.006173610687255859, -0.0045566558837890625, -0.0029397010803222656, -0.0013227462768554688, 0.0002942085266113281, 0.001911163330078125, 0.003528118133544922, 0.005145072937011719, 0.006762027740478516, 0.008378982543945312, 0.00999593734741211, 0.011612892150878906, 0.013229846954345703, 0.0148468017578125, 0.016463756561279297, 0.018080711364746094, 0.01969766616821289, 0.021314620971679688, 0.022931575775146484, 0.02454853057861328, 0.026165485382080078, 0.027782440185546875, 0.029399394989013672, 0.03101634979248047, 0.032633304595947266, 0.03425025939941406, 0.03586721420288086, 0.037484169006347656, 0.03910112380981445, 0.04071807861328125, 0.04233503341674805, 0.043951988220214844, 0.04556894302368164, 0.04718589782714844, 0.048802852630615234, 0.05041980743408203, 0.05203676223754883, 0.053653717041015625, 0.05527067184448242, 0.05688762664794922, 0.058504581451416016, 0.06012153625488281, 0.06173849105834961, 0.0633554458618164, 0.0649724006652832, 0.06658935546875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 4.0, 10.0, 12.0, 11.0, 21.0, 32.0, 59.0, 129.0, 224.0, 213.0, 107.0, 66.0, 29.0, 30.0, 17.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4636218547821045, -3.3551101684570312, -3.246598482131958, -3.1380867958068848, -3.0295751094818115, -2.9210634231567383, -2.812551736831665, -2.704040050506592, -2.5955283641815186, -2.4870166778564453, -2.378504991531372, -2.269993305206299, -2.1614816188812256, -2.0529699325561523, -1.944458246231079, -1.8359465599060059, -1.7274348735809326, -1.6189231872558594, -1.5104115009307861, -1.401899814605713, -1.2933881282806396, -1.1848764419555664, -1.0763647556304932, -0.9678530693054199, -0.8593413829803467, -0.7508296966552734, -0.6423180103302002, -0.533806324005127, -0.4252946376800537, -0.31678295135498047, -0.20827126502990723, -0.09975957870483398, 0.008751869201660156, 0.1172635555267334, 0.22577524185180664, 0.3342869281768799, 0.4427986145019531, 0.5513103008270264, 0.6598219871520996, 0.7683336734771729, 0.8768453598022461, 0.9853570461273193, 1.0938687324523926, 1.2023804187774658, 1.310892105102539, 1.4194037914276123, 1.5279154777526855, 1.6364271640777588, 1.744938850402832, 1.8534505367279053, 1.9619622230529785, 2.0704739093780518, 2.178985595703125, 2.2874972820281982, 2.3960089683532715, 2.5045206546783447, 2.613032341003418, 2.721544027328491, 2.8300557136535645, 2.9385673999786377, 3.047079086303711, 3.155590772628784, 3.2641024589538574, 3.3726141452789307, 3.481125831604004]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 9.0, 1.0, 5.0, 5.0, 10.0, 9.0, 14.0, 25.0, 29.0, 28.0, 45.0, 50.0, 64.0, 84.0, 74.0, 73.0, 58.0, 61.0, 63.0, 47.0, 44.0, 40.0, 25.0, 32.0, 20.0, 16.0, 13.0, 11.0, 6.0, 11.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5008580684661865, -1.452011227607727, -1.4031645059585571, -1.3543176651000977, -1.3054708242416382, -1.2566239833831787, -1.2077772617340088, -1.1589304208755493, -1.1100835800170898, -1.0612367391586304, -1.0123900175094604, -0.963543176651001, -0.9146963357925415, -0.8658495545387268, -0.8170027732849121, -0.7681559324264526, -0.7193092107772827, -0.670462429523468, -0.6216155886650085, -0.5727688074111938, -0.5239219665527344, -0.4750751852989197, -0.426228404045105, -0.3773815929889679, -0.3285347819328308, -0.2796879708766937, -0.23084117472171783, -0.18199437856674194, -0.13314756751060486, -0.08430075645446777, -0.035453975200653076, 0.013392835855484009, 0.06223952770233154, 0.11108633130788803, 0.15993313491344452, 0.2087799310684204, 0.2576267421245575, 0.3064735531806946, 0.3553203344345093, 0.40416714549064636, 0.45301395654678345, 0.5018607378005981, 0.5507075786590576, 0.5995543599128723, 0.648401141166687, 0.6972479820251465, 0.7460947632789612, 0.7949415445327759, 0.8437883853912354, 0.89263516664505, 0.9414820075035095, 0.9903287887573242, 1.0391756296157837, 1.0880224704742432, 1.136869192123413, 1.1857160329818726, 1.234562873840332, 1.2834097146987915, 1.3322564363479614, 1.381103277206421, 1.4299501180648804, 1.4787969589233398, 1.5276436805725098, 1.5764905214309692, 1.6253372430801392]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 3.0, 8.0, 8.0, 23.0, 25.0, 26.0, 33.0, 56.0, 73.0, 93.0, 141.0, 188.0, 285.0, 402.0, 672.0, 1062.0, 1910.0, 3350.0, 6794.0, 16386.0, 55945.0, 543165.0, 344691.0, 44998.0, 14403.0, 6180.0, 2945.0, 1724.0, 990.0, 647.0, 419.0, 256.0, 148.0, 126.0, 108.0, 64.0, 49.0, 35.0, 32.0, 14.0, 20.0, 12.0, 7.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.7451171875, -1.6936798095703125, -1.642242431640625, -1.5908050537109375, -1.53936767578125, -1.4879302978515625, -1.436492919921875, -1.3850555419921875, -1.3336181640625, -1.2821807861328125, -1.230743408203125, -1.1793060302734375, -1.12786865234375, -1.0764312744140625, -1.024993896484375, -0.9735565185546875, -0.922119140625, -0.8706817626953125, -0.819244384765625, -0.7678070068359375, -0.71636962890625, -0.6649322509765625, -0.613494873046875, -0.5620574951171875, -0.5106201171875, -0.4591827392578125, -0.407745361328125, -0.3563079833984375, -0.30487060546875, -0.2534332275390625, -0.201995849609375, -0.1505584716796875, -0.09912109375, -0.0476837158203125, 0.003753662109375, 0.0551910400390625, 0.10662841796875, 0.1580657958984375, 0.209503173828125, 0.2609405517578125, 0.3123779296875, 0.3638153076171875, 0.415252685546875, 0.4666900634765625, 0.51812744140625, 0.5695648193359375, 0.621002197265625, 0.6724395751953125, 0.723876953125, 0.7753143310546875, 0.826751708984375, 0.8781890869140625, 0.92962646484375, 0.9810638427734375, 1.032501220703125, 1.0839385986328125, 1.1353759765625, 1.1868133544921875, 1.238250732421875, 1.2896881103515625, 1.34112548828125, 1.3925628662109375, 1.444000244140625, 1.4954376220703125, 1.546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 6.0, 2.0, 8.0, 4.0, 7.0, 5.0, 9.0, 18.0, 21.0, 23.0, 45.0, 55.0, 66.0, 95.0, 99.0, 79.0, 63.0, 72.0, 62.0, 53.0, 45.0, 38.0, 36.0, 21.0, 13.0, 15.0, 8.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.9921875, -3.86663818359375, -3.7410888671875, -3.61553955078125, -3.489990234375, -3.36444091796875, -3.2388916015625, -3.11334228515625, -2.98779296875, -2.86224365234375, -2.7366943359375, -2.61114501953125, -2.485595703125, -2.36004638671875, -2.2344970703125, -2.10894775390625, -1.9833984375, -1.85784912109375, -1.7322998046875, -1.60675048828125, -1.481201171875, -1.35565185546875, -1.2301025390625, -1.10455322265625, -0.97900390625, -0.85345458984375, -0.7279052734375, -0.60235595703125, -0.476806640625, -0.35125732421875, -0.2257080078125, -0.10015869140625, 0.025390625, 0.15093994140625, 0.2764892578125, 0.40203857421875, 0.527587890625, 0.65313720703125, 0.7786865234375, 0.90423583984375, 1.02978515625, 1.15533447265625, 1.2808837890625, 1.40643310546875, 1.531982421875, 1.65753173828125, 1.7830810546875, 1.90863037109375, 2.0341796875, 2.15972900390625, 2.2852783203125, 2.41082763671875, 2.536376953125, 2.66192626953125, 2.7874755859375, 2.91302490234375, 3.03857421875, 3.16412353515625, 3.2896728515625, 3.41522216796875, 3.540771484375, 3.66632080078125, 3.7918701171875, 3.91741943359375, 4.04296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 9.0, 12.0, 17.0, 39.0, 65.0, 83.0, 165.0, 265.0, 552.0, 1031.0, 2395.0, 6653.0, 25597.0, 329164.0, 635779.0, 33327.0, 7960.0, 2800.0, 1224.0, 596.0, 295.0, 185.0, 112.0, 60.0, 43.0, 33.0, 19.0, 14.0, 8.0, 5.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.587890625, -1.527008056640625, -1.46612548828125, -1.405242919921875, -1.3443603515625, -1.283477783203125, -1.22259521484375, -1.161712646484375, -1.100830078125, -1.039947509765625, -0.97906494140625, -0.918182373046875, -0.8572998046875, -0.796417236328125, -0.73553466796875, -0.674652099609375, -0.61376953125, -0.552886962890625, -0.49200439453125, -0.431121826171875, -0.3702392578125, -0.309356689453125, -0.24847412109375, -0.187591552734375, -0.126708984375, -0.065826416015625, -0.00494384765625, 0.055938720703125, 0.1168212890625, 0.177703857421875, 0.23858642578125, 0.299468994140625, 0.3603515625, 0.421234130859375, 0.48211669921875, 0.542999267578125, 0.6038818359375, 0.664764404296875, 0.72564697265625, 0.786529541015625, 0.847412109375, 0.908294677734375, 0.96917724609375, 1.030059814453125, 1.0909423828125, 1.151824951171875, 1.21270751953125, 1.273590087890625, 1.33447265625, 1.395355224609375, 1.45623779296875, 1.517120361328125, 1.5780029296875, 1.638885498046875, 1.69976806640625, 1.760650634765625, 1.821533203125, 1.882415771484375, 1.94329833984375, 2.004180908203125, 2.0650634765625, 2.125946044921875, 2.18682861328125, 2.247711181640625, 2.30859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 0.0, 3.0, 7.0, 6.0, 5.0, 5.0, 10.0, 12.0, 11.0, 11.0, 17.0, 22.0, 27.0, 25.0, 29.0, 26.0, 40.0, 39.0, 44.0, 42.0, 43.0, 48.0, 48.0, 34.0, 34.0, 45.0, 37.0, 44.0, 32.0, 32.0, 22.0, 28.0, 26.0, 23.0, 20.0, 15.0, 20.0, 17.0, 9.0, 9.0, 5.0, 8.0, 7.0, 1.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.16015625, -3.055450439453125, -2.95074462890625, -2.846038818359375, -2.7413330078125, -2.636627197265625, -2.53192138671875, -2.427215576171875, -2.322509765625, -2.217803955078125, -2.11309814453125, -2.008392333984375, -1.9036865234375, -1.798980712890625, -1.69427490234375, -1.589569091796875, -1.48486328125, -1.380157470703125, -1.27545166015625, -1.170745849609375, -1.0660400390625, -0.961334228515625, -0.85662841796875, -0.751922607421875, -0.647216796875, -0.542510986328125, -0.43780517578125, -0.333099365234375, -0.2283935546875, -0.123687744140625, -0.01898193359375, 0.085723876953125, 0.1904296875, 0.295135498046875, 0.39984130859375, 0.504547119140625, 0.6092529296875, 0.713958740234375, 0.81866455078125, 0.923370361328125, 1.028076171875, 1.132781982421875, 1.23748779296875, 1.342193603515625, 1.4468994140625, 1.551605224609375, 1.65631103515625, 1.761016845703125, 1.86572265625, 1.970428466796875, 2.07513427734375, 2.179840087890625, 2.2845458984375, 2.389251708984375, 2.49395751953125, 2.598663330078125, 2.703369140625, 2.808074951171875, 2.91278076171875, 3.017486572265625, 3.1221923828125, 3.226898193359375, 3.33160400390625, 3.436309814453125, 3.541015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 8.0, 15.0, 21.0, 38.0, 58.0, 111.0, 189.0, 372.0, 719.0, 2169.0, 6543.0, 29291.0, 682685.0, 295464.0, 22057.0, 5466.0, 1802.0, 696.0, 332.0, 197.0, 105.0, 60.0, 41.0, 25.0, 24.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0224609375, -0.9904327392578125, -0.958404541015625, -0.9263763427734375, -0.89434814453125, -0.8623199462890625, -0.830291748046875, -0.7982635498046875, -0.7662353515625, -0.7342071533203125, -0.702178955078125, -0.6701507568359375, -0.63812255859375, -0.6060943603515625, -0.574066162109375, -0.5420379638671875, -0.510009765625, -0.4779815673828125, -0.445953369140625, -0.4139251708984375, -0.38189697265625, -0.3498687744140625, -0.317840576171875, -0.2858123779296875, -0.2537841796875, -0.2217559814453125, -0.189727783203125, -0.1576995849609375, -0.12567138671875, -0.0936431884765625, -0.061614990234375, -0.0295867919921875, 0.00244140625, 0.0344696044921875, 0.066497802734375, 0.0985260009765625, 0.13055419921875, 0.1625823974609375, 0.194610595703125, 0.2266387939453125, 0.2586669921875, 0.2906951904296875, 0.322723388671875, 0.3547515869140625, 0.38677978515625, 0.4188079833984375, 0.450836181640625, 0.4828643798828125, 0.514892578125, 0.5469207763671875, 0.578948974609375, 0.6109771728515625, 0.64300537109375, 0.6750335693359375, 0.707061767578125, 0.7390899658203125, 0.7711181640625, 0.8031463623046875, 0.835174560546875, 0.8672027587890625, 0.89923095703125, 0.9312591552734375, 0.963287353515625, 0.9953155517578125, 1.02734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 9.0, 19.0, 17.0, 38.0, 77.0, 150.0, 390.0, 112.0, 61.0, 34.0, 16.0, 22.0, 8.0, 5.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.0002191103994846344, -0.00021291524171829224, -0.00020672008395195007, -0.0002005249261856079, -0.00019432976841926575, -0.00018813461065292358, -0.00018193945288658142, -0.00017574429512023926, -0.0001695491373538971, -0.00016335397958755493, -0.00015715882182121277, -0.0001509636640548706, -0.00014476850628852844, -0.00013857334852218628, -0.00013237819075584412, -0.00012618303298950195, -0.00011998787522315979, -0.00011379271745681763, -0.00010759755969047546, -0.0001014024019241333, -9.520724415779114e-05, -8.901208639144897e-05, -8.281692862510681e-05, -7.662177085876465e-05, -7.042661309242249e-05, -6.423145532608032e-05, -5.803629755973816e-05, -5.1841139793395996e-05, -4.564598202705383e-05, -3.945082426071167e-05, -3.325566649436951e-05, -2.7060508728027344e-05, -2.086535096168518e-05, -1.4670193195343018e-05, -8.475035429000854e-06, -2.2798776626586914e-06, 3.915280103683472e-06, 1.0110437870025635e-05, 1.6305595636367798e-05, 2.250075340270996e-05, 2.8695911169052124e-05, 3.489106893539429e-05, 4.108622670173645e-05, 4.728138446807861e-05, 5.3476542234420776e-05, 5.967170000076294e-05, 6.58668577671051e-05, 7.206201553344727e-05, 7.825717329978943e-05, 8.445233106613159e-05, 9.064748883247375e-05, 9.684264659881592e-05, 0.00010303780436515808, 0.00010923296213150024, 0.00011542811989784241, 0.00012162327766418457, 0.00012781843543052673, 0.0001340135931968689, 0.00014020875096321106, 0.00014640390872955322, 0.00015259906649589539, 0.00015879422426223755, 0.0001649893820285797, 0.00017118453979492188]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 11.0, 16.0, 18.0, 25.0, 23.0, 31.0, 42.0, 65.0, 75.0, 109.0, 181.0, 264.0, 538.0, 983.0, 2062.0, 4775.0, 13587.0, 63189.0, 773865.0, 152679.0, 22947.0, 7044.0, 2895.0, 1276.0, 705.0, 386.0, 231.0, 149.0, 111.0, 73.0, 53.0, 25.0, 21.0, 27.0, 10.0, 16.0, 14.0, 8.0, 2.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.794921875, -0.771331787109375, -0.74774169921875, -0.724151611328125, -0.7005615234375, -0.676971435546875, -0.65338134765625, -0.629791259765625, -0.606201171875, -0.582611083984375, -0.55902099609375, -0.535430908203125, -0.5118408203125, -0.488250732421875, -0.46466064453125, -0.441070556640625, -0.41748046875, -0.393890380859375, -0.37030029296875, -0.346710205078125, -0.3231201171875, -0.299530029296875, -0.27593994140625, -0.252349853515625, -0.228759765625, -0.205169677734375, -0.18157958984375, -0.157989501953125, -0.1343994140625, -0.110809326171875, -0.08721923828125, -0.063629150390625, -0.0400390625, -0.016448974609375, 0.00714111328125, 0.030731201171875, 0.0543212890625, 0.077911376953125, 0.10150146484375, 0.125091552734375, 0.148681640625, 0.172271728515625, 0.19586181640625, 0.219451904296875, 0.2430419921875, 0.266632080078125, 0.29022216796875, 0.313812255859375, 0.33740234375, 0.360992431640625, 0.38458251953125, 0.408172607421875, 0.4317626953125, 0.455352783203125, 0.47894287109375, 0.502532958984375, 0.526123046875, 0.549713134765625, 0.57330322265625, 0.596893310546875, 0.6204833984375, 0.644073486328125, 0.66766357421875, 0.691253662109375, 0.71484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 8.0, 13.0, 10.0, 15.0, 12.0, 30.0, 39.0, 30.0, 61.0, 112.0, 232.0, 139.0, 61.0, 51.0, 37.0, 21.0, 23.0, 14.0, 14.0, 9.0, 7.0, 2.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3388671875, -0.3288421630859375, -0.318817138671875, -0.3087921142578125, -0.29876708984375, -0.2887420654296875, -0.278717041015625, -0.2686920166015625, -0.2586669921875, -0.2486419677734375, -0.238616943359375, -0.2285919189453125, -0.21856689453125, -0.2085418701171875, -0.198516845703125, -0.1884918212890625, -0.178466796875, -0.1684417724609375, -0.158416748046875, -0.1483917236328125, -0.13836669921875, -0.1283416748046875, -0.118316650390625, -0.1082916259765625, -0.0982666015625, -0.0882415771484375, -0.078216552734375, -0.0681915283203125, -0.05816650390625, -0.0481414794921875, -0.038116455078125, -0.0280914306640625, -0.01806640625, -0.0080413818359375, 0.001983642578125, 0.0120086669921875, 0.02203369140625, 0.0320587158203125, 0.042083740234375, 0.0521087646484375, 0.0621337890625, 0.0721588134765625, 0.082183837890625, 0.0922088623046875, 0.10223388671875, 0.1122589111328125, 0.122283935546875, 0.1323089599609375, 0.142333984375, 0.1523590087890625, 0.162384033203125, 0.1724090576171875, 0.18243408203125, 0.1924591064453125, 0.202484130859375, 0.2125091552734375, 0.2225341796875, 0.2325592041015625, 0.242584228515625, 0.2526092529296875, 0.26263427734375, 0.2726593017578125, 0.282684326171875, 0.2927093505859375, 0.302734375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 11.0, 18.0, 30.0, 82.0, 229.0, 366.0, 162.0, 57.0, 23.0, 7.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68994665145874, -4.275148391723633, -3.8603501319885254, -3.445551872253418, -3.0307536125183105, -2.6159555912017822, -2.201157331466675, -1.7863590717315674, -1.37156081199646, -0.9567625522613525, -0.5419643521308899, -0.12716615200042725, 0.2876321077346802, 0.702430248260498, 1.1172285079956055, 1.532026767730713, 1.9468250274658203, 2.3616232872009277, 2.776421546936035, 3.1912198066711426, 3.60601806640625, 4.020815849304199, 4.435614585876465, 4.850412368774414, 5.26521110534668, 5.680009365081787, 6.0948076248168945, 6.509605884552002, 6.924404144287109, 7.339201927185059, 7.754000663757324, 8.168798446655273, 8.583596229553223, 8.998394012451172, 9.413192749023438, 9.827990531921387, 10.242789268493652, 10.657587051391602, 11.072385787963867, 11.487183570861816, 11.901982307434082, 12.316780090332031, 12.731578826904297, 13.146376609802246, 13.561175346374512, 13.975973129272461, 14.390771865844727, 14.805569648742676, 15.220367431640625, 15.635165214538574, 16.049962997436523, 16.46476173400879, 16.879560470581055, 17.29435920715332, 17.709156036376953, 18.12395477294922, 18.538753509521484, 18.95355224609375, 19.368349075317383, 19.78314781188965, 20.197946548461914, 20.61274528503418, 21.027542114257812, 21.442340850830078, 21.857139587402344]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 18.0, 15.0, 25.0, 28.0, 20.0, 14.0, 34.0, 30.0, 30.0, 34.0, 36.0, 31.0, 41.0, 41.0, 32.0, 38.0, 27.0, 38.0, 46.0, 31.0, 30.0, 37.0, 36.0, 31.0, 19.0, 30.0, 28.0, 5.0, 17.0, 18.0, 12.0, 16.0, 16.0, 4.0, 2.0, 9.0, 5.0, 4.0, 2.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.528428554534912, -5.359193801879883, -5.189959526062012, -5.020724773406982, -4.851490020751953, -4.682255744934082, -4.513020992279053, -4.343786239624023, -4.174551963806152, -4.005317211151123, -3.836082696914673, -3.6668481826782227, -3.4976136684417725, -3.3283791542053223, -3.159144401550293, -2.9899098873138428, -2.8206751346588135, -2.6514406204223633, -2.482205867767334, -2.312971353530884, -2.1437368392944336, -1.9745022058486938, -1.805267572402954, -1.636033058166504, -1.4667984247207642, -1.2975637912750244, -1.1283292770385742, -0.9590946435928345, -0.7898600697517395, -0.6206254959106445, -0.4513908624649048, -0.2821563482284546, -0.11292171478271484, 0.05631287395954132, 0.22554746270179749, 0.39478206634521484, 0.5640166401863098, 0.7332512140274048, 0.9024858474731445, 1.0717203617095947, 1.2409549951553345, 1.4101896286010742, 1.5794241428375244, 1.7486587762832642, 1.917893409729004, 2.087127923965454, 2.2563624382019043, 2.4255971908569336, 2.594831705093384, 2.764066219329834, 2.9333009719848633, 3.1025354862213135, 3.2717700004577637, 3.441004753112793, 3.610239267349243, 3.7794737815856934, 3.9487085342407227, 4.117943286895752, 4.287177562713623, 4.456412315368652, 4.625647068023682, 4.794881343841553, 4.964116096496582, 5.133350372314453, 5.302585124969482]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 10.0, 11.0, 14.0, 18.0, 30.0, 49.0, 65.0, 102.0, 149.0, 267.0, 417.0, 800.0, 1568.0, 3382.0, 9402.0, 36615.0, 365435.0, 3605318.0, 137071.0, 21415.0, 6444.0, 2708.0, 1237.0, 651.0, 396.0, 246.0, 155.0, 94.0, 64.0, 44.0, 31.0, 24.0, 18.0, 8.0, 9.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.591796875, -3.50048828125, -3.4091796875, -3.31787109375, -3.2265625, -3.13525390625, -3.0439453125, -2.95263671875, -2.861328125, -2.77001953125, -2.6787109375, -2.58740234375, -2.49609375, -2.40478515625, -2.3134765625, -2.22216796875, -2.130859375, -2.03955078125, -1.9482421875, -1.85693359375, -1.765625, -1.67431640625, -1.5830078125, -1.49169921875, -1.400390625, -1.30908203125, -1.2177734375, -1.12646484375, -1.03515625, -0.94384765625, -0.8525390625, -0.76123046875, -0.669921875, -0.57861328125, -0.4873046875, -0.39599609375, -0.3046875, -0.21337890625, -0.1220703125, -0.03076171875, 0.060546875, 0.15185546875, 0.2431640625, 0.33447265625, 0.42578125, 0.51708984375, 0.6083984375, 0.69970703125, 0.791015625, 0.88232421875, 0.9736328125, 1.06494140625, 1.15625, 1.24755859375, 1.3388671875, 1.43017578125, 1.521484375, 1.61279296875, 1.7041015625, 1.79541015625, 1.88671875, 1.97802734375, 2.0693359375, 2.16064453125, 2.251953125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 5.0, 4.0, 8.0, 14.0, 12.0, 20.0, 20.0, 21.0, 25.0, 55.0, 49.0, 62.0, 64.0, 76.0, 85.0, 70.0, 62.0, 54.0, 46.0, 40.0, 46.0, 25.0, 21.0, 19.0, 18.0, 7.0, 10.0, 6.0, 10.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.76171875, -1.7061309814453125, -1.650543212890625, -1.5949554443359375, -1.53936767578125, -1.4837799072265625, -1.428192138671875, -1.3726043701171875, -1.3170166015625, -1.2614288330078125, -1.205841064453125, -1.1502532958984375, -1.09466552734375, -1.0390777587890625, -0.983489990234375, -0.9279022216796875, -0.872314453125, -0.8167266845703125, -0.761138916015625, -0.7055511474609375, -0.64996337890625, -0.5943756103515625, -0.538787841796875, -0.4832000732421875, -0.4276123046875, -0.3720245361328125, -0.316436767578125, -0.2608489990234375, -0.20526123046875, -0.1496734619140625, -0.094085693359375, -0.0384979248046875, 0.01708984375, 0.0726776123046875, 0.128265380859375, 0.1838531494140625, 0.23944091796875, 0.2950286865234375, 0.350616455078125, 0.4062042236328125, 0.4617919921875, 0.5173797607421875, 0.572967529296875, 0.6285552978515625, 0.68414306640625, 0.7397308349609375, 0.795318603515625, 0.8509063720703125, 0.906494140625, 0.9620819091796875, 1.017669677734375, 1.0732574462890625, 1.12884521484375, 1.1844329833984375, 1.240020751953125, 1.2956085205078125, 1.3511962890625, 1.4067840576171875, 1.462371826171875, 1.5179595947265625, 1.57354736328125, 1.6291351318359375, 1.684722900390625, 1.7403106689453125, 1.7958984375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 18.0, 19.0, 24.0, 51.0, 69.0, 110.0, 226.0, 407.0, 1058.0, 2782.0, 10882.0, 78259.0, 3782767.0, 288476.0, 21510.0, 4796.0, 1538.0, 561.0, 250.0, 164.0, 90.0, 56.0, 44.0, 25.0, 18.0, 16.0, 6.0, 4.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6953125, -3.582305908203125, -3.46929931640625, -3.356292724609375, -3.2432861328125, -3.130279541015625, -3.01727294921875, -2.904266357421875, -2.791259765625, -2.678253173828125, -2.56524658203125, -2.452239990234375, -2.3392333984375, -2.226226806640625, -2.11322021484375, -2.000213623046875, -1.88720703125, -1.774200439453125, -1.66119384765625, -1.548187255859375, -1.4351806640625, -1.322174072265625, -1.20916748046875, -1.096160888671875, -0.983154296875, -0.870147705078125, -0.75714111328125, -0.644134521484375, -0.5311279296875, -0.418121337890625, -0.30511474609375, -0.192108154296875, -0.0791015625, 0.033905029296875, 0.14691162109375, 0.259918212890625, 0.3729248046875, 0.485931396484375, 0.59893798828125, 0.711944580078125, 0.824951171875, 0.937957763671875, 1.05096435546875, 1.163970947265625, 1.2769775390625, 1.389984130859375, 1.50299072265625, 1.615997314453125, 1.72900390625, 1.842010498046875, 1.95501708984375, 2.068023681640625, 2.1810302734375, 2.294036865234375, 2.40704345703125, 2.520050048828125, 2.633056640625, 2.746063232421875, 2.85906982421875, 2.972076416015625, 3.0850830078125, 3.198089599609375, 3.31109619140625, 3.424102783203125, 3.537109375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 5.0, 6.0, 9.0, 6.0, 18.0, 25.0, 26.0, 50.0, 48.0, 81.0, 133.0, 201.0, 364.0, 728.0, 1132.0, 479.0, 286.0, 131.0, 94.0, 61.0, 40.0, 30.0, 33.0, 16.0, 12.0, 12.0, 11.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.544921875, -0.5256195068359375, -0.506317138671875, -0.4870147705078125, -0.46771240234375, -0.4484100341796875, -0.429107666015625, -0.4098052978515625, -0.3905029296875, -0.3712005615234375, -0.351898193359375, -0.3325958251953125, -0.31329345703125, -0.2939910888671875, -0.274688720703125, -0.2553863525390625, -0.236083984375, -0.2167816162109375, -0.197479248046875, -0.1781768798828125, -0.15887451171875, -0.1395721435546875, -0.120269775390625, -0.1009674072265625, -0.0816650390625, -0.0623626708984375, -0.043060302734375, -0.0237579345703125, -0.00445556640625, 0.0148468017578125, 0.034149169921875, 0.0534515380859375, 0.07275390625, 0.0920562744140625, 0.111358642578125, 0.1306610107421875, 0.14996337890625, 0.1692657470703125, 0.188568115234375, 0.2078704833984375, 0.2271728515625, 0.2464752197265625, 0.265777587890625, 0.2850799560546875, 0.30438232421875, 0.3236846923828125, 0.342987060546875, 0.3622894287109375, 0.381591796875, 0.4008941650390625, 0.420196533203125, 0.4394989013671875, 0.45880126953125, 0.4781036376953125, 0.497406005859375, 0.5167083740234375, 0.5360107421875, 0.5553131103515625, 0.574615478515625, 0.5939178466796875, 0.61322021484375, 0.6325225830078125, 0.651824951171875, 0.6711273193359375, 0.6904296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 10.0, 9.0, 4.0, 14.0, 18.0, 26.0, 35.0, 53.0, 88.0, 156.0, 170.0, 156.0, 94.0, 55.0, 32.0, 19.0, 18.0, 15.0, 9.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.264806270599365, -4.1411027908325195, -4.017398834228516, -3.89369535446167, -3.769991874694824, -3.6462881565093994, -3.5225844383239746, -3.398880958557129, -3.275177240371704, -3.1514735221862793, -3.0277700424194336, -2.904066324234009, -2.780362844467163, -2.6566591262817383, -2.5329556465148926, -2.4092519283294678, -2.285548210144043, -2.161844491958618, -2.0381410121917725, -1.9144372940063477, -1.7907336950302124, -1.6670300960540771, -1.543326497077942, -1.4196228981018066, -1.295919418334961, -1.1722158193588257, -1.0485122203826904, -0.9248085618019104, -0.8011049032211304, -0.6774013042449951, -0.5536977052688599, -0.42999404668807983, -0.3062903881072998, -0.18258675932884216, -0.058883145451545715, 0.06482046842575073, 0.18852409720420837, 0.312227725982666, 0.43593132495880127, 0.5596349835395813, 0.6833385825157166, 0.8070421814918518, 0.9307458400726318, 1.054449439048767, 1.1781530380249023, 1.3018567562103271, 1.4255602359771729, 1.5492639541625977, 1.672967553138733, 1.7966711521148682, 1.9203747510910034, 2.0440783500671387, 2.1677820682525635, 2.2914857864379883, 2.415189266204834, 2.538892984390259, 2.6625964641571045, 2.7863001823425293, 2.910003662109375, 3.0337073802948, 3.1574108600616455, 3.2811145782470703, 3.404818058013916, 3.528521776199341, 3.6522254943847656]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 6.0, 9.0, 12.0, 19.0, 13.0, 16.0, 25.0, 26.0, 35.0, 44.0, 37.0, 55.0, 49.0, 62.0, 55.0, 62.0, 55.0, 48.0, 62.0, 39.0, 45.0, 32.0, 36.0, 20.0, 23.0, 18.0, 13.0, 18.0, 9.0, 9.0, 5.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0225017070770264, -1.9644750356674194, -1.906448245048523, -1.848421573638916, -1.7903947830200195, -1.7323681116104126, -1.6743413209915161, -1.6163146495819092, -1.5582878589630127, -1.5002611875534058, -1.4422343969345093, -1.3842077255249023, -1.3261809349060059, -1.268154263496399, -1.2101274728775024, -1.1521008014678955, -1.094074010848999, -1.036047339439392, -0.9780205488204956, -0.9199938178062439, -0.8619670867919922, -0.8039404153823853, -0.7459136247634888, -0.6878869533538818, -0.6298602819442749, -0.5718335509300232, -0.5138068199157715, -0.4557800889015198, -0.39775335788726807, -0.33972665667533875, -0.28169992566108704, -0.22367319464683533, -0.16564643383026123, -0.10761970281600952, -0.04959297925233841, 0.008433744311332703, 0.06646047532558441, 0.12448719143867493, 0.18251392245292664, 0.24054065346717834, 0.29856738448143005, 0.35659411549568176, 0.41462084650993347, 0.4726475477218628, 0.5306742787361145, 0.5887010097503662, 0.6467277407646179, 0.7047544717788696, 0.7627812027931213, 0.820807933807373, 0.8788346648216248, 0.9368613958358765, 0.9948881268501282, 1.0529148578643799, 1.1109415292739868, 1.1689683198928833, 1.2269949913024902, 1.2850216627120972, 1.3430484533309937, 1.4010751247406006, 1.459101915359497, 1.517128586769104, 1.5751553773880005, 1.6331820487976074, 1.691208839416504]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 9.0, 16.0, 18.0, 26.0, 39.0, 60.0, 101.0, 124.0, 182.0, 339.0, 596.0, 952.0, 1824.0, 3691.0, 7796.0, 18026.0, 46948.0, 145246.0, 375740.0, 291902.0, 96456.0, 32988.0, 13046.0, 5882.0, 2894.0, 1576.0, 835.0, 458.0, 263.0, 167.0, 108.0, 73.0, 50.0, 34.0, 25.0, 21.0, 9.0, 7.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1845703125, -0.17911338806152344, -0.17365646362304688, -0.1681995391845703, -0.16274261474609375, -0.1572856903076172, -0.15182876586914062, -0.14637184143066406, -0.1409149169921875, -0.13545799255371094, -0.13000106811523438, -0.12454414367675781, -0.11908721923828125, -0.11363029479980469, -0.10817337036132812, -0.10271644592285156, -0.097259521484375, -0.09180259704589844, -0.08634567260742188, -0.08088874816894531, -0.07543182373046875, -0.06997489929199219, -0.06451797485351562, -0.05906105041503906, -0.0536041259765625, -0.04814720153808594, -0.042690277099609375, -0.03723335266113281, -0.03177642822265625, -0.026319503784179688, -0.020862579345703125, -0.015405654907226562, -0.00994873046875, -0.0044918060302734375, 0.000965118408203125, 0.0064220428466796875, 0.01187896728515625, 0.017335891723632812, 0.022792816162109375, 0.028249740600585938, 0.0337066650390625, 0.03916358947753906, 0.044620513916015625, 0.05007743835449219, 0.05553436279296875, 0.06099128723144531, 0.06644821166992188, 0.07190513610839844, 0.077362060546875, 0.08281898498535156, 0.08827590942382812, 0.09373283386230469, 0.09918975830078125, 0.10464668273925781, 0.11010360717773438, 0.11556053161621094, 0.1210174560546875, 0.12647438049316406, 0.13193130493164062, 0.1373882293701172, 0.14284515380859375, 0.1483020782470703, 0.15375900268554688, 0.15921592712402344, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 3.0, 3.0, 8.0, 8.0, 16.0, 7.0, 14.0, 21.0, 29.0, 32.0, 45.0, 46.0, 69.0, 58.0, 86.0, 73.0, 80.0, 58.0, 59.0, 51.0, 49.0, 35.0, 32.0, 23.0, 14.0, 19.0, 13.0, 10.0, 4.0, 9.0, 6.0, 1.0, 4.0, 1.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5859375, -1.5360260009765625, -1.486114501953125, -1.4362030029296875, -1.38629150390625, -1.3363800048828125, -1.286468505859375, -1.2365570068359375, -1.1866455078125, -1.1367340087890625, -1.086822509765625, -1.0369110107421875, -0.98699951171875, -0.9370880126953125, -0.887176513671875, -0.8372650146484375, -0.787353515625, -0.7374420166015625, -0.687530517578125, -0.6376190185546875, -0.58770751953125, -0.5377960205078125, -0.487884521484375, -0.4379730224609375, -0.3880615234375, -0.3381500244140625, -0.288238525390625, -0.2383270263671875, -0.18841552734375, -0.1385040283203125, -0.088592529296875, -0.0386810302734375, 0.01123046875, 0.0611419677734375, 0.111053466796875, 0.1609649658203125, 0.21087646484375, 0.2607879638671875, 0.310699462890625, 0.3606109619140625, 0.4105224609375, 0.4604339599609375, 0.510345458984375, 0.5602569580078125, 0.61016845703125, 0.6600799560546875, 0.709991455078125, 0.7599029541015625, 0.809814453125, 0.8597259521484375, 0.909637451171875, 0.9595489501953125, 1.00946044921875, 1.0593719482421875, 1.109283447265625, 1.1591949462890625, 1.2091064453125, 1.2590179443359375, 1.308929443359375, 1.3588409423828125, 1.40875244140625, 1.4586639404296875, 1.508575439453125, 1.5584869384765625, 1.6083984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 10.0, 25.0, 23.0, 48.0, 64.0, 113.0, 156.0, 264.0, 432.0, 758.0, 1735.0, 4443.0, 15756.0, 74413.0, 370327.0, 449231.0, 100853.0, 20100.0, 5524.0, 2031.0, 942.0, 520.0, 292.0, 178.0, 108.0, 64.0, 51.0, 25.0, 19.0, 13.0, 10.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2098388671875, -0.20209312438964844, -0.19434738159179688, -0.1866016387939453, -0.17885589599609375, -0.1711101531982422, -0.16336441040039062, -0.15561866760253906, -0.1478729248046875, -0.14012718200683594, -0.13238143920898438, -0.12463569641113281, -0.11688995361328125, -0.10914421081542969, -0.10139846801757812, -0.09365272521972656, -0.085906982421875, -0.07816123962402344, -0.07041549682617188, -0.06266975402832031, -0.05492401123046875, -0.04717826843261719, -0.039432525634765625, -0.03168678283691406, -0.0239410400390625, -0.016195297241210938, -0.008449554443359375, -0.0007038116455078125, 0.00704193115234375, 0.014787673950195312, 0.022533416748046875, 0.030279159545898438, 0.03802490234375, 0.04577064514160156, 0.053516387939453125, 0.06126213073730469, 0.06900787353515625, 0.07675361633300781, 0.08449935913085938, 0.09224510192871094, 0.0999908447265625, 0.10773658752441406, 0.11548233032226562, 0.12322807312011719, 0.13097381591796875, 0.1387195587158203, 0.14646530151367188, 0.15421104431152344, 0.161956787109375, 0.16970252990722656, 0.17744827270507812, 0.1851940155029297, 0.19293975830078125, 0.2006855010986328, 0.20843124389648438, 0.21617698669433594, 0.2239227294921875, 0.23166847229003906, 0.23941421508789062, 0.2471599578857422, 0.25490570068359375, 0.2626514434814453, 0.2703971862792969, 0.27814292907714844, 0.285888671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 8.0, 11.0, 6.0, 16.0, 9.0, 9.0, 19.0, 23.0, 20.0, 24.0, 23.0, 42.0, 46.0, 47.0, 54.0, 53.0, 51.0, 45.0, 60.0, 48.0, 48.0, 47.0, 44.0, 44.0, 36.0, 34.0, 23.0, 18.0, 21.0, 14.0, 17.0, 12.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.108673095703125, -2.02984619140625, -1.951019287109375, -1.8721923828125, -1.793365478515625, -1.71453857421875, -1.635711669921875, -1.556884765625, -1.478057861328125, -1.39923095703125, -1.320404052734375, -1.2415771484375, -1.162750244140625, -1.08392333984375, -1.005096435546875, -0.92626953125, -0.847442626953125, -0.76861572265625, -0.689788818359375, -0.6109619140625, -0.532135009765625, -0.45330810546875, -0.374481201171875, -0.295654296875, -0.216827392578125, -0.13800048828125, -0.059173583984375, 0.0196533203125, 0.098480224609375, 0.17730712890625, 0.256134033203125, 0.3349609375, 0.413787841796875, 0.49261474609375, 0.571441650390625, 0.6502685546875, 0.729095458984375, 0.80792236328125, 0.886749267578125, 0.965576171875, 1.044403076171875, 1.12322998046875, 1.202056884765625, 1.2808837890625, 1.359710693359375, 1.43853759765625, 1.517364501953125, 1.59619140625, 1.675018310546875, 1.75384521484375, 1.832672119140625, 1.9114990234375, 1.990325927734375, 2.06915283203125, 2.147979736328125, 2.226806640625, 2.305633544921875, 2.38446044921875, 2.463287353515625, 2.5421142578125, 2.620941162109375, 2.69976806640625, 2.778594970703125, 2.857421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 10.0, 17.0, 16.0, 32.0, 47.0, 84.0, 196.0, 451.0, 1117.0, 3313.0, 14133.0, 219295.0, 761021.0, 39769.0, 6082.0, 1768.0, 646.0, 254.0, 131.0, 50.0, 34.0, 29.0, 16.0, 13.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1392822265625, -0.13451766967773438, -0.12975311279296875, -0.12498855590820312, -0.1202239990234375, -0.11545944213867188, -0.11069488525390625, -0.10593032836914062, -0.101165771484375, -0.09640121459960938, -0.09163665771484375, -0.08687210083007812, -0.0821075439453125, -0.07734298706054688, -0.07257843017578125, -0.06781387329101562, -0.06304931640625, -0.058284759521484375, -0.05352020263671875, -0.048755645751953125, -0.0439910888671875, -0.039226531982421875, -0.03446197509765625, -0.029697418212890625, -0.024932861328125, -0.020168304443359375, -0.01540374755859375, -0.010639190673828125, -0.0058746337890625, -0.001110076904296875, 0.00365447998046875, 0.008419036865234375, 0.01318359375, 0.017948150634765625, 0.02271270751953125, 0.027477264404296875, 0.0322418212890625, 0.037006378173828125, 0.04177093505859375, 0.046535491943359375, 0.051300048828125, 0.056064605712890625, 0.06082916259765625, 0.06559371948242188, 0.0703582763671875, 0.07512283325195312, 0.07988739013671875, 0.08465194702148438, 0.08941650390625, 0.09418106079101562, 0.09894561767578125, 0.10371017456054688, 0.1084747314453125, 0.11323928833007812, 0.11800384521484375, 0.12276840209960938, 0.127532958984375, 0.13229751586914062, 0.13706207275390625, 0.14182662963867188, 0.1465911865234375, 0.15135574340820312, 0.15612030029296875, 0.16088485717773438, 0.1656494140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 10.0, 17.0, 13.0, 32.0, 40.0, 62.0, 72.0, 100.0, 117.0, 106.0, 116.0, 85.0, 57.0, 41.0, 27.0, 25.0, 16.0, 9.0, 14.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.628036499023438e-05, -6.448943167924881e-05, -6.269849836826324e-05, -6.090756505727768e-05, -5.9116631746292114e-05, -5.732569843530655e-05, -5.5534765124320984e-05, -5.374383181333542e-05, -5.1952898502349854e-05, -5.016196519136429e-05, -4.837103188037872e-05, -4.658009856939316e-05, -4.478916525840759e-05, -4.299823194742203e-05, -4.120729863643646e-05, -3.94163653254509e-05, -3.762543201446533e-05, -3.583449870347977e-05, -3.40435653924942e-05, -3.2252632081508636e-05, -3.046169877052307e-05, -2.8670765459537506e-05, -2.687983214855194e-05, -2.5088898837566376e-05, -2.329796552658081e-05, -2.1507032215595245e-05, -1.971609890460968e-05, -1.7925165593624115e-05, -1.613423228263855e-05, -1.4343298971652985e-05, -1.255236566066742e-05, -1.0761432349681854e-05, -8.970499038696289e-06, -7.179565727710724e-06, -5.388632416725159e-06, -3.5976991057395935e-06, -1.8067657947540283e-06, -1.5832483768463135e-08, 1.775100827217102e-06, 3.5660341382026672e-06, 5.356967449188232e-06, 7.147900760173798e-06, 8.938834071159363e-06, 1.0729767382144928e-05, 1.2520700693130493e-05, 1.4311634004116058e-05, 1.6102567315101624e-05, 1.789350062608719e-05, 1.9684433937072754e-05, 2.147536724805832e-05, 2.3266300559043884e-05, 2.505723387002945e-05, 2.6848167181015015e-05, 2.863910049200058e-05, 3.0430033802986145e-05, 3.222096711397171e-05, 3.4011900424957275e-05, 3.580283373594284e-05, 3.7593767046928406e-05, 3.938470035791397e-05, 4.1175633668899536e-05, 4.29665669798851e-05, 4.4757500290870667e-05, 4.654843360185623e-05, 4.83393669128418e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 14.0, 17.0, 38.0, 52.0, 109.0, 207.0, 477.0, 936.0, 2712.0, 10537.0, 104852.0, 831346.0, 83550.0, 9401.0, 2510.0, 919.0, 403.0, 201.0, 110.0, 53.0, 33.0, 20.0, 13.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1844482421875, -0.17977428436279297, -0.17510032653808594, -0.1704263687133789, -0.16575241088867188, -0.16107845306396484, -0.1564044952392578, -0.15173053741455078, -0.14705657958984375, -0.14238262176513672, -0.1377086639404297, -0.13303470611572266, -0.12836074829101562, -0.1236867904663086, -0.11901283264160156, -0.11433887481689453, -0.1096649169921875, -0.10499095916748047, -0.10031700134277344, -0.0956430435180664, -0.09096908569335938, -0.08629512786865234, -0.08162117004394531, -0.07694721221923828, -0.07227325439453125, -0.06759929656982422, -0.06292533874511719, -0.058251380920410156, -0.053577423095703125, -0.048903465270996094, -0.04422950744628906, -0.03955554962158203, -0.034881591796875, -0.03020763397216797, -0.025533676147460938, -0.020859718322753906, -0.016185760498046875, -0.011511802673339844, -0.0068378448486328125, -0.0021638870239257812, 0.00251007080078125, 0.007184028625488281, 0.011857986450195312, 0.016531944274902344, 0.021205902099609375, 0.025879859924316406, 0.030553817749023438, 0.03522777557373047, 0.0399017333984375, 0.04457569122314453, 0.04924964904785156, 0.053923606872558594, 0.058597564697265625, 0.06327152252197266, 0.06794548034667969, 0.07261943817138672, 0.07729339599609375, 0.08196735382080078, 0.08664131164550781, 0.09131526947021484, 0.09598922729492188, 0.1006631851196289, 0.10533714294433594, 0.11001110076904297, 0.11468505859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 11.0, 10.0, 16.0, 24.0, 45.0, 55.0, 105.0, 146.0, 176.0, 152.0, 103.0, 57.0, 30.0, 19.0, 15.0, 8.0, 5.0, 9.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026214599609375, -0.025096893310546875, -0.02397918701171875, -0.022861480712890625, -0.0217437744140625, -0.020626068115234375, -0.01950836181640625, -0.018390655517578125, -0.01727294921875, -0.016155242919921875, -0.01503753662109375, -0.013919830322265625, -0.0128021240234375, -0.011684417724609375, -0.01056671142578125, -0.009449005126953125, -0.008331298828125, -0.007213592529296875, -0.00609588623046875, -0.004978179931640625, -0.0038604736328125, -0.002742767333984375, -0.00162506103515625, -0.000507354736328125, 0.0006103515625, 0.001728057861328125, 0.00284576416015625, 0.003963470458984375, 0.0050811767578125, 0.006198883056640625, 0.00731658935546875, 0.008434295654296875, 0.009552001953125, 0.010669708251953125, 0.01178741455078125, 0.012905120849609375, 0.0140228271484375, 0.015140533447265625, 0.01625823974609375, 0.017375946044921875, 0.01849365234375, 0.019611358642578125, 0.02072906494140625, 0.021846771240234375, 0.0229644775390625, 0.024082183837890625, 0.02519989013671875, 0.026317596435546875, 0.027435302734375, 0.028553009033203125, 0.02967071533203125, 0.030788421630859375, 0.0319061279296875, 0.033023834228515625, 0.03414154052734375, 0.035259246826171875, 0.036376953125, 0.037494659423828125, 0.03861236572265625, 0.039730072021484375, 0.0408477783203125, 0.041965484619140625, 0.04308319091796875, 0.044200897216796875, 0.045318603515625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 12.0, 9.0, 6.0, 8.0, 20.0, 20.0, 34.0, 52.0, 94.0, 167.0, 196.0, 159.0, 82.0, 47.0, 27.0, 19.0, 11.0, 14.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.8472964763641357, -2.7590572834014893, -2.670818328857422, -2.5825791358947754, -2.494340181350708, -2.4061009883880615, -2.317862033843994, -2.2296228408813477, -2.141383647918701, -2.0531444549560547, -1.9649055004119873, -1.8766663074493408, -1.7884273529052734, -1.700188159942627, -1.61194908618927, -1.523710012435913, -1.4354710578918457, -1.3472319841384888, -1.2589929103851318, -1.1707537174224854, -1.082514762878418, -0.9942756295204163, -0.9060364961624146, -0.8177974224090576, -0.7295583486557007, -0.6413192749023438, -0.5530802011489868, -0.4648410677909851, -0.3766019940376282, -0.28836292028427124, -0.20012378692626953, -0.1118847131729126, -0.023645639419555664, 0.06459344923496246, 0.1528325378894806, 0.2410716414451599, 0.32931071519851685, 0.4175497889518738, 0.5057889223098755, 0.5940279960632324, 0.6822670698165894, 0.7705061435699463, 0.8587452173233032, 0.9469843506813049, 1.0352234840393066, 1.123462438583374, 1.2117016315460205, 1.2999407052993774, 1.3881797790527344, 1.4764188528060913, 1.5646579265594482, 1.6528971195220947, 1.741136074066162, 1.8293752670288086, 1.9176143407821655, 2.0058534145355225, 2.09409236907959, 2.1823315620422363, 2.2705705165863037, 2.35880970954895, 2.4470486640930176, 2.535287857055664, 2.6235270500183105, 2.711766004562378, 2.8000051975250244]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 4.0, 7.0, 7.0, 12.0, 9.0, 18.0, 22.0, 24.0, 34.0, 44.0, 58.0, 58.0, 67.0, 70.0, 69.0, 69.0, 69.0, 64.0, 53.0, 43.0, 32.0, 28.0, 27.0, 17.0, 17.0, 16.0, 9.0, 6.0, 9.0, 7.0, 2.0, 5.0, 2.0, 3.0, 0.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5011661052703857, -1.4553509950637817, -1.4095358848571777, -1.3637208938598633, -1.3179057836532593, -1.2720906734466553, -1.2262755632400513, -1.1804604530334473, -1.1346454620361328, -1.0888303518295288, -1.0430152416229248, -0.9972001910209656, -0.9513851404190063, -0.9055700302124023, -0.8597549200057983, -0.8139398097991943, -0.7681246995925903, -0.7223095893859863, -0.6764945387840271, -0.6306794285774231, -0.5848643779754639, -0.5390492677688599, -0.49323415756225586, -0.44741907715797424, -0.4016039967536926, -0.355788916349411, -0.3099738359451294, -0.2641587257385254, -0.21834364533424377, -0.17252856492996216, -0.12671345472335815, -0.08089837431907654, -0.03508317470550537, 0.010731913149356842, 0.056547001004219055, 0.10236209630966187, 0.14817717671394348, 0.1939922571182251, 0.2398073673248291, 0.2856224477291107, 0.33143752813339233, 0.37725260853767395, 0.42306768894195557, 0.46888279914855957, 0.5146979093551636, 0.5605129599571228, 0.6063280701637268, 0.652143120765686, 0.69795823097229, 0.743773341178894, 0.7895883917808533, 0.8354035019874573, 0.8812185525894165, 0.9270336627960205, 0.9728487730026245, 1.0186638832092285, 1.064478874206543, 1.110293984413147, 1.156109094619751, 1.2019240856170654, 1.2477391958236694, 1.2935543060302734, 1.3393694162368774, 1.3851845264434814, 1.4309996366500854]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 5.0, 9.0, 8.0, 14.0, 30.0, 28.0, 38.0, 62.0, 97.0, 114.0, 196.0, 249.0, 444.0, 739.0, 1293.0, 2669.0, 6072.0, 16585.0, 82805.0, 857637.0, 55176.0, 13706.0, 5164.0, 2301.0, 1155.0, 726.0, 392.0, 251.0, 166.0, 116.0, 94.0, 48.0, 42.0, 32.0, 26.0, 16.0, 16.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.94744873046875, -1.8812255859375, -1.81500244140625, -1.748779296875, -1.68255615234375, -1.6163330078125, -1.55010986328125, -1.48388671875, -1.41766357421875, -1.3514404296875, -1.28521728515625, -1.218994140625, -1.15277099609375, -1.0865478515625, -1.02032470703125, -0.9541015625, -0.88787841796875, -0.8216552734375, -0.75543212890625, -0.689208984375, -0.62298583984375, -0.5567626953125, -0.49053955078125, -0.42431640625, -0.35809326171875, -0.2918701171875, -0.22564697265625, -0.159423828125, -0.09320068359375, -0.0269775390625, 0.03924560546875, 0.10546875, 0.17169189453125, 0.2379150390625, 0.30413818359375, 0.370361328125, 0.43658447265625, 0.5028076171875, 0.56903076171875, 0.63525390625, 0.70147705078125, 0.7677001953125, 0.83392333984375, 0.900146484375, 0.96636962890625, 1.0325927734375, 1.09881591796875, 1.1650390625, 1.23126220703125, 1.2974853515625, 1.36370849609375, 1.429931640625, 1.49615478515625, 1.5623779296875, 1.62860107421875, 1.69482421875, 1.76104736328125, 1.8272705078125, 1.89349365234375, 1.959716796875, 2.02593994140625, 2.0921630859375, 2.15838623046875, 2.224609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 4.0, 4.0, 10.0, 7.0, 14.0, 21.0, 22.0, 37.0, 43.0, 50.0, 64.0, 48.0, 75.0, 81.0, 69.0, 85.0, 55.0, 51.0, 50.0, 40.0, 26.0, 17.0, 28.0, 16.0, 11.0, 12.0, 12.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.44921875, -3.353424072265625, -3.25762939453125, -3.161834716796875, -3.0660400390625, -2.970245361328125, -2.87445068359375, -2.778656005859375, -2.682861328125, -2.587066650390625, -2.49127197265625, -2.395477294921875, -2.2996826171875, -2.203887939453125, -2.10809326171875, -2.012298583984375, -1.91650390625, -1.820709228515625, -1.72491455078125, -1.629119873046875, -1.5333251953125, -1.437530517578125, -1.34173583984375, -1.245941162109375, -1.150146484375, -1.054351806640625, -0.95855712890625, -0.862762451171875, -0.7669677734375, -0.671173095703125, -0.57537841796875, -0.479583740234375, -0.3837890625, -0.287994384765625, -0.19219970703125, -0.096405029296875, -0.0006103515625, 0.095184326171875, 0.19097900390625, 0.286773681640625, 0.382568359375, 0.478363037109375, 0.57415771484375, 0.669952392578125, 0.7657470703125, 0.861541748046875, 0.95733642578125, 1.053131103515625, 1.14892578125, 1.244720458984375, 1.34051513671875, 1.436309814453125, 1.5321044921875, 1.627899169921875, 1.72369384765625, 1.819488525390625, 1.915283203125, 2.011077880859375, 2.10687255859375, 2.202667236328125, 2.2984619140625, 2.394256591796875, 2.49005126953125, 2.585845947265625, 2.681640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 12.0, 24.0, 27.0, 50.0, 96.0, 194.0, 505.0, 1580.0, 7310.0, 88006.0, 927453.0, 18842.0, 3007.0, 803.0, 319.0, 155.0, 62.0, 31.0, 18.0, 11.0, 10.0, 4.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.14404296875, -3.0400390625, -2.93603515625, -2.83203125, -2.72802734375, -2.6240234375, -2.52001953125, -2.416015625, -2.31201171875, -2.2080078125, -2.10400390625, -2.0, -1.89599609375, -1.7919921875, -1.68798828125, -1.583984375, -1.47998046875, -1.3759765625, -1.27197265625, -1.16796875, -1.06396484375, -0.9599609375, -0.85595703125, -0.751953125, -0.64794921875, -0.5439453125, -0.43994140625, -0.3359375, -0.23193359375, -0.1279296875, -0.02392578125, 0.080078125, 0.18408203125, 0.2880859375, 0.39208984375, 0.49609375, 0.60009765625, 0.7041015625, 0.80810546875, 0.912109375, 1.01611328125, 1.1201171875, 1.22412109375, 1.328125, 1.43212890625, 1.5361328125, 1.64013671875, 1.744140625, 1.84814453125, 1.9521484375, 2.05615234375, 2.16015625, 2.26416015625, 2.3681640625, 2.47216796875, 2.576171875, 2.68017578125, 2.7841796875, 2.88818359375, 2.9921875, 3.09619140625, 3.2001953125, 3.30419921875, 3.408203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 8.0, 13.0, 9.0, 15.0, 24.0, 24.0, 37.0, 32.0, 41.0, 45.0, 39.0, 38.0, 49.0, 61.0, 54.0, 60.0, 54.0, 55.0, 40.0, 47.0, 46.0, 36.0, 28.0, 18.0, 22.0, 15.0, 20.0, 13.0, 9.0, 9.0, 5.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.859375, -3.751800537109375, -3.64422607421875, -3.536651611328125, -3.4290771484375, -3.321502685546875, -3.21392822265625, -3.106353759765625, -2.998779296875, -2.891204833984375, -2.78363037109375, -2.676055908203125, -2.5684814453125, -2.460906982421875, -2.35333251953125, -2.245758056640625, -2.13818359375, -2.030609130859375, -1.92303466796875, -1.815460205078125, -1.7078857421875, -1.600311279296875, -1.49273681640625, -1.385162353515625, -1.277587890625, -1.170013427734375, -1.06243896484375, -0.954864501953125, -0.8472900390625, -0.739715576171875, -0.63214111328125, -0.524566650390625, -0.4169921875, -0.309417724609375, -0.20184326171875, -0.094268798828125, 0.0133056640625, 0.120880126953125, 0.22845458984375, 0.336029052734375, 0.443603515625, 0.551177978515625, 0.65875244140625, 0.766326904296875, 0.8739013671875, 0.981475830078125, 1.08905029296875, 1.196624755859375, 1.30419921875, 1.411773681640625, 1.51934814453125, 1.626922607421875, 1.7344970703125, 1.842071533203125, 1.94964599609375, 2.057220458984375, 2.164794921875, 2.272369384765625, 2.37994384765625, 2.487518310546875, 2.5950927734375, 2.702667236328125, 2.81024169921875, 2.917816162109375, 3.025390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 2.0, 8.0, 11.0, 15.0, 15.0, 26.0, 25.0, 66.0, 66.0, 98.0, 210.0, 486.0, 1392.0, 4550.0, 20623.0, 789527.0, 209859.0, 15916.0, 3566.0, 1061.0, 475.0, 205.0, 112.0, 70.0, 37.0, 37.0, 25.0, 16.0, 10.0, 15.0, 7.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0546875, -1.0216522216796875, -0.988616943359375, -0.9555816650390625, -0.92254638671875, -0.8895111083984375, -0.856475830078125, -0.8234405517578125, -0.7904052734375, -0.7573699951171875, -0.724334716796875, -0.6912994384765625, -0.65826416015625, -0.6252288818359375, -0.592193603515625, -0.5591583251953125, -0.526123046875, -0.4930877685546875, -0.460052490234375, -0.4270172119140625, -0.39398193359375, -0.3609466552734375, -0.327911376953125, -0.2948760986328125, -0.2618408203125, -0.2288055419921875, -0.195770263671875, -0.1627349853515625, -0.12969970703125, -0.0966644287109375, -0.063629150390625, -0.0305938720703125, 0.00244140625, 0.0354766845703125, 0.068511962890625, 0.1015472412109375, 0.13458251953125, 0.1676177978515625, 0.200653076171875, 0.2336883544921875, 0.2667236328125, 0.2997589111328125, 0.332794189453125, 0.3658294677734375, 0.39886474609375, 0.4319000244140625, 0.464935302734375, 0.4979705810546875, 0.531005859375, 0.5640411376953125, 0.597076416015625, 0.6301116943359375, 0.66314697265625, 0.6961822509765625, 0.729217529296875, 0.7622528076171875, 0.7952880859375, 0.8283233642578125, 0.861358642578125, 0.8943939208984375, 0.92742919921875, 0.9604644775390625, 0.993499755859375, 1.0265350341796875, 1.0595703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 10.0, 14.0, 36.0, 102.0, 669.0, 90.0, 24.0, 11.0, 11.0, 6.0, 10.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011903047561645508, -0.00010954122990369797, -0.00010005198419094086, -9.056273847818375e-05, -8.107349276542664e-05, -7.158424705266953e-05, -6.209500133991241e-05, -5.2605755627155304e-05, -4.311650991439819e-05, -3.362726420164108e-05, -2.4138018488883972e-05, -1.4648772776126862e-05, -5.159527063369751e-06, 4.32971864938736e-06, 1.381896436214447e-05, 2.330821007490158e-05, 3.279745578765869e-05, 4.22867015004158e-05, 5.177594721317291e-05, 6.126519292593002e-05, 7.075443863868713e-05, 8.024368435144424e-05, 8.973293006420135e-05, 9.922217577695847e-05, 0.00010871142148971558, 0.00011820066720247269, 0.0001276899129152298, 0.0001371791586279869, 0.00014666840434074402, 0.00015615765005350113, 0.00016564689576625824, 0.00017513614147901535, 0.00018462538719177246, 0.00019411463290452957, 0.00020360387861728668, 0.0002130931243300438, 0.0002225823700428009, 0.00023207161575555801, 0.00024156086146831512, 0.00025105010718107224, 0.00026053935289382935, 0.00027002859860658646, 0.00027951784431934357, 0.0002890070900321007, 0.0002984963357448578, 0.0003079855814576149, 0.000317474827170372, 0.0003269640728831291, 0.00033645331859588623, 0.00034594256430864334, 0.00035543181002140045, 0.00036492105573415756, 0.00037441030144691467, 0.0003838995471596718, 0.0003933887928724289, 0.000402878038585186, 0.0004123672842979431, 0.0004218565300107002, 0.00043134577572345734, 0.00044083502143621445, 0.00045032426714897156, 0.00045981351286172867, 0.0004693027585744858, 0.0004787920042872429, 0.00048828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 16.0, 28.0, 53.0, 109.0, 215.0, 535.0, 1502.0, 4686.0, 21203.0, 859715.0, 141652.0, 13758.0, 3226.0, 1040.0, 415.0, 187.0, 67.0, 45.0, 25.0, 17.0, 11.0, 10.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4287109375, -1.3909835815429688, -1.3532562255859375, -1.3155288696289062, -1.277801513671875, -1.2400741577148438, -1.2023468017578125, -1.1646194458007812, -1.12689208984375, -1.0891647338867188, -1.0514373779296875, -1.0137100219726562, -0.975982666015625, -0.9382553100585938, -0.9005279541015625, -0.8628005981445312, -0.8250732421875, -0.7873458862304688, -0.7496185302734375, -0.7118911743164062, -0.674163818359375, -0.6364364624023438, -0.5987091064453125, -0.5609817504882812, -0.52325439453125, -0.48552703857421875, -0.4477996826171875, -0.41007232666015625, -0.372344970703125, -0.33461761474609375, -0.2968902587890625, -0.25916290283203125, -0.221435546875, -0.18370819091796875, -0.1459808349609375, -0.10825347900390625, -0.070526123046875, -0.03279876708984375, 0.0049285888671875, 0.04265594482421875, 0.08038330078125, 0.11811065673828125, 0.1558380126953125, 0.19356536865234375, 0.231292724609375, 0.26902008056640625, 0.3067474365234375, 0.34447479248046875, 0.3822021484375, 0.41992950439453125, 0.4576568603515625, 0.49538421630859375, 0.533111572265625, 0.5708389282226562, 0.6085662841796875, 0.6462936401367188, 0.68402099609375, 0.7217483520507812, 0.7594757080078125, 0.7972030639648438, 0.834930419921875, 0.8726577758789062, 0.9103851318359375, 0.9481124877929688, 0.98583984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 7.0, 11.0, 21.0, 23.0, 71.0, 198.0, 441.0, 87.0, 36.0, 19.0, 16.0, 11.0, 11.0, 5.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.415771484375, -0.4036064147949219, -0.39144134521484375, -0.3792762756347656, -0.3671112060546875, -0.3549461364746094, -0.34278106689453125, -0.3306159973144531, -0.318450927734375, -0.3062858581542969, -0.29412078857421875, -0.2819557189941406, -0.2697906494140625, -0.2576255798339844, -0.24546051025390625, -0.23329544067382812, -0.22113037109375, -0.20896530151367188, -0.19680023193359375, -0.18463516235351562, -0.1724700927734375, -0.16030502319335938, -0.14813995361328125, -0.13597488403320312, -0.123809814453125, -0.11164474487304688, -0.09947967529296875, -0.08731460571289062, -0.0751495361328125, -0.06298446655273438, -0.05081939697265625, -0.038654327392578125, -0.0264892578125, -0.014324188232421875, -0.00215911865234375, 0.010005950927734375, 0.0221710205078125, 0.034336090087890625, 0.04650115966796875, 0.058666229248046875, 0.070831298828125, 0.08299636840820312, 0.09516143798828125, 0.10732650756835938, 0.1194915771484375, 0.13165664672851562, 0.14382171630859375, 0.15598678588867188, 0.16815185546875, 0.18031692504882812, 0.19248199462890625, 0.20464706420898438, 0.2168121337890625, 0.22897720336914062, 0.24114227294921875, 0.2533073425292969, 0.265472412109375, 0.2776374816894531, 0.28980255126953125, 0.3019676208496094, 0.3141326904296875, 0.3262977600097656, 0.33846282958984375, 0.3506278991699219, 0.36279296875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 16.0, 24.0, 60.0, 223.0, 395.0, 191.0, 42.0, 28.0, 12.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.579866409301758, -22.140300750732422, -21.700733184814453, -21.261167526245117, -20.82160186767578, -20.382036209106445, -19.94247055053711, -19.50290298461914, -19.063337326049805, -18.62377166748047, -18.1842041015625, -17.744638442993164, -17.305072784423828, -16.865507125854492, -16.425941467285156, -15.986373901367188, -15.546808242797852, -15.107242584228516, -14.667675971984863, -14.228109359741211, -13.788543701171875, -13.348978042602539, -12.909411430358887, -12.469844818115234, -12.030279159545898, -11.590713500976562, -11.15114688873291, -10.711580276489258, -10.272014617919922, -9.832448959350586, -9.392882347106934, -8.953315734863281, -8.513750076293945, -8.07418441772461, -7.634617805480957, -7.195051670074463, -6.755485534667969, -6.315919399261475, -5.8763532638549805, -5.436787128448486, -4.99722146987915, -4.557655334472656, -4.118089199066162, -3.678523063659668, -3.238956928253174, -2.7993907928466797, -2.3598246574401855, -1.9202585220336914, -1.4806923866271973, -1.0411262512207031, -0.601560115814209, -0.16199398040771484, 0.2775721549987793, 0.7171382904052734, 1.1567044258117676, 1.5962705612182617, 2.035836696624756, 2.47540283203125, 2.914968967437744, 3.3545351028442383, 3.7941012382507324, 4.233667373657227, 4.673233509063721, 5.112799644470215, 5.552365779876709]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 8.0, 9.0, 7.0, 7.0, 16.0, 10.0, 17.0, 21.0, 19.0, 23.0, 35.0, 30.0, 38.0, 28.0, 39.0, 41.0, 37.0, 49.0, 38.0, 37.0, 41.0, 38.0, 39.0, 47.0, 38.0, 30.0, 31.0, 30.0, 30.0, 19.0, 25.0, 16.0, 20.0, 14.0, 11.0, 13.0, 5.0, 10.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.190743923187256, -5.0354743003845215, -4.880205154418945, -4.724935531616211, -4.569665908813477, -4.414396286010742, -4.259126663208008, -4.103857517242432, -3.9485878944396973, -3.793318271636963, -3.6380488872528076, -3.4827795028686523, -3.327509880065918, -3.1722402572631836, -3.0169708728790283, -2.861701488494873, -2.7064318656921387, -2.5511622428894043, -2.395892858505249, -2.2406234741210938, -2.0853538513183594, -1.9300843477249146, -1.7748148441314697, -1.619545340538025, -1.46427583694458, -1.3090063333511353, -1.1537368297576904, -0.9984673261642456, -0.8431978225708008, -0.687928318977356, -0.5326588153839111, -0.3773893117904663, -0.22211933135986328, -0.06684982776641846, 0.08841967582702637, 0.2436891794204712, 0.398958683013916, 0.5542281866073608, 0.7094976902008057, 0.8647671937942505, 1.0200366973876953, 1.1753062009811401, 1.330575704574585, 1.4858452081680298, 1.6411147117614746, 1.7963842153549194, 1.9516537189483643, 2.1069231033325195, 2.262192726135254, 2.4174623489379883, 2.5727317333221436, 2.728001117706299, 2.883270740509033, 3.0385403633117676, 3.193809747695923, 3.349079132080078, 3.5043487548828125, 3.659618377685547, 3.814887762069702, 3.9701571464538574, 4.125426769256592, 4.280696392059326, 4.435965538024902, 4.591235160827637, 4.746504783630371]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 15.0, 18.0, 23.0, 29.0, 34.0, 64.0, 97.0, 203.0, 508.0, 1749.0, 7992.0, 91802.0, 4013111.0, 69599.0, 6551.0, 1439.0, 500.0, 183.0, 98.0, 60.0, 39.0, 22.0, 17.0, 17.0, 15.0, 19.0, 9.0, 6.0, 9.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.390625, -6.21533203125, -6.0400390625, -5.86474609375, -5.689453125, -5.51416015625, -5.3388671875, -5.16357421875, -4.98828125, -4.81298828125, -4.6376953125, -4.46240234375, -4.287109375, -4.11181640625, -3.9365234375, -3.76123046875, -3.5859375, -3.41064453125, -3.2353515625, -3.06005859375, -2.884765625, -2.70947265625, -2.5341796875, -2.35888671875, -2.18359375, -2.00830078125, -1.8330078125, -1.65771484375, -1.482421875, -1.30712890625, -1.1318359375, -0.95654296875, -0.78125, -0.60595703125, -0.4306640625, -0.25537109375, -0.080078125, 0.09521484375, 0.2705078125, 0.44580078125, 0.62109375, 0.79638671875, 0.9716796875, 1.14697265625, 1.322265625, 1.49755859375, 1.6728515625, 1.84814453125, 2.0234375, 2.19873046875, 2.3740234375, 2.54931640625, 2.724609375, 2.89990234375, 3.0751953125, 3.25048828125, 3.42578125, 3.60107421875, 3.7763671875, 3.95166015625, 4.126953125, 4.30224609375, 4.4775390625, 4.65283203125, 4.828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 11.0, 15.0, 14.0, 14.0, 34.0, 33.0, 42.0, 50.0, 72.0, 78.0, 89.0, 92.0, 86.0, 66.0, 80.0, 46.0, 27.0, 25.0, 25.0, 22.0, 17.0, 6.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.89605712890625, -1.8370361328125, -1.77801513671875, -1.718994140625, -1.65997314453125, -1.6009521484375, -1.54193115234375, -1.48291015625, -1.42388916015625, -1.3648681640625, -1.30584716796875, -1.246826171875, -1.18780517578125, -1.1287841796875, -1.06976318359375, -1.0107421875, -0.95172119140625, -0.8927001953125, -0.83367919921875, -0.774658203125, -0.71563720703125, -0.6566162109375, -0.59759521484375, -0.53857421875, -0.47955322265625, -0.4205322265625, -0.36151123046875, -0.302490234375, -0.24346923828125, -0.1844482421875, -0.12542724609375, -0.06640625, -0.00738525390625, 0.0516357421875, 0.11065673828125, 0.169677734375, 0.22869873046875, 0.2877197265625, 0.34674072265625, 0.40576171875, 0.46478271484375, 0.5238037109375, 0.58282470703125, 0.641845703125, 0.70086669921875, 0.7598876953125, 0.81890869140625, 0.8779296875, 0.93695068359375, 0.9959716796875, 1.05499267578125, 1.114013671875, 1.17303466796875, 1.2320556640625, 1.29107666015625, 1.35009765625, 1.40911865234375, 1.4681396484375, 1.52716064453125, 1.586181640625, 1.64520263671875, 1.7042236328125, 1.76324462890625, 1.822265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 10.0, 21.0, 48.0, 42.0, 86.0, 149.0, 372.0, 1113.0, 4557.0, 31237.0, 2786627.0, 1337618.0, 26646.0, 3989.0, 995.0, 398.0, 139.0, 83.0, 34.0, 33.0, 17.0, 10.0, 10.0, 3.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.84765625, -4.69598388671875, -4.5443115234375, -4.39263916015625, -4.240966796875, -4.08929443359375, -3.9376220703125, -3.78594970703125, -3.63427734375, -3.48260498046875, -3.3309326171875, -3.17926025390625, -3.027587890625, -2.87591552734375, -2.7242431640625, -2.57257080078125, -2.4208984375, -2.26922607421875, -2.1175537109375, -1.96588134765625, -1.814208984375, -1.66253662109375, -1.5108642578125, -1.35919189453125, -1.20751953125, -1.05584716796875, -0.9041748046875, -0.75250244140625, -0.600830078125, -0.44915771484375, -0.2974853515625, -0.14581298828125, 0.005859375, 0.15753173828125, 0.3092041015625, 0.46087646484375, 0.612548828125, 0.76422119140625, 0.9158935546875, 1.06756591796875, 1.21923828125, 1.37091064453125, 1.5225830078125, 1.67425537109375, 1.825927734375, 1.97760009765625, 2.1292724609375, 2.28094482421875, 2.4326171875, 2.58428955078125, 2.7359619140625, 2.88763427734375, 3.039306640625, 3.19097900390625, 3.3426513671875, 3.49432373046875, 3.64599609375, 3.79766845703125, 3.9493408203125, 4.10101318359375, 4.252685546875, 4.40435791015625, 4.5560302734375, 4.70770263671875, 4.859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 7.0, 22.0, 17.0, 23.0, 28.0, 45.0, 68.0, 84.0, 94.0, 176.0, 355.0, 597.0, 1052.0, 559.0, 310.0, 203.0, 100.0, 86.0, 61.0, 42.0, 28.0, 22.0, 20.0, 13.0, 8.0, 18.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60546875, -0.5849685668945312, -0.5644683837890625, -0.5439682006835938, -0.523468017578125, -0.5029678344726562, -0.4824676513671875, -0.46196746826171875, -0.44146728515625, -0.42096710205078125, -0.4004669189453125, -0.37996673583984375, -0.359466552734375, -0.33896636962890625, -0.3184661865234375, -0.29796600341796875, -0.2774658203125, -0.25696563720703125, -0.2364654541015625, -0.21596527099609375, -0.195465087890625, -0.17496490478515625, -0.1544647216796875, -0.13396453857421875, -0.11346435546875, -0.09296417236328125, -0.0724639892578125, -0.05196380615234375, -0.031463623046875, -0.01096343994140625, 0.0095367431640625, 0.03003692626953125, 0.050537109375, 0.07103729248046875, 0.0915374755859375, 0.11203765869140625, 0.132537841796875, 0.15303802490234375, 0.1735382080078125, 0.19403839111328125, 0.21453857421875, 0.23503875732421875, 0.2555389404296875, 0.27603912353515625, 0.296539306640625, 0.31703948974609375, 0.3375396728515625, 0.35803985595703125, 0.3785400390625, 0.39904022216796875, 0.4195404052734375, 0.44004058837890625, 0.460540771484375, 0.48104095458984375, 0.5015411376953125, 0.5220413208007812, 0.54254150390625, 0.5630416870117188, 0.5835418701171875, 0.6040420532226562, 0.624542236328125, 0.6450424194335938, 0.6655426025390625, 0.6860427856445312, 0.70654296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 31.0, 35.0, 53.0, 104.0, 152.0, 170.0, 159.0, 122.0, 55.0, 49.0, 17.0, 15.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2743020057678223, -3.1289138793945312, -2.9835257530212402, -2.838137626647949, -2.692749500274658, -2.547361373901367, -2.401973247528076, -2.256585121154785, -2.111196994781494, -1.9658088684082031, -1.820420742034912, -1.675032615661621, -1.52964448928833, -1.384256362915039, -1.2388681173324585, -1.0934799909591675, -0.9480917453765869, -0.8027036190032959, -0.6573154926300049, -0.5119273066520691, -0.3665391802787781, -0.22115105390548706, -0.07576286792755127, 0.06962525844573975, 0.21501338481903076, 0.3604015111923218, 0.5057896375656128, 0.6511778235435486, 0.7965659499168396, 0.9419540762901306, 1.0873422622680664, 1.2327303886413574, 1.3781185150146484, 1.5235066413879395, 1.6688947677612305, 1.8142828941345215, 1.9596710205078125, 2.1050591468811035, 2.2504472732543945, 2.3958353996276855, 2.5412235260009766, 2.6866116523742676, 2.8319997787475586, 2.9773879051208496, 3.1227760314941406, 3.2681641578674316, 3.4135522842407227, 3.5589404106140137, 3.704328775405884, 3.849716901779175, 3.995105028152466, 4.140493392944336, 4.285881519317627, 4.431269645690918, 4.576657772064209, 4.7220458984375, 4.867434024810791, 5.012822151184082, 5.158210277557373, 5.303598403930664, 5.448986530303955, 5.594374656677246, 5.739762783050537, 5.885150909423828, 6.030539035797119]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 12.0, 12.0, 24.0, 13.0, 27.0, 17.0, 32.0, 35.0, 46.0, 44.0, 50.0, 51.0, 60.0, 60.0, 51.0, 49.0, 56.0, 52.0, 45.0, 34.0, 43.0, 27.0, 29.0, 28.0, 16.0, 20.0, 10.0, 11.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.029968023300171, -1.9686391353607178, -1.907310128211975, -1.845981240272522, -1.7846523523330688, -1.7233233451843262, -1.661994457244873, -1.60066556930542, -1.5393366813659668, -1.4780077934265137, -1.416678786277771, -1.3553498983383179, -1.2940210103988647, -1.232692003250122, -1.171363115310669, -1.1100342273712158, -1.0487052202224731, -0.9873762726783752, -0.9260473847389221, -0.8647184371948242, -0.8033895492553711, -0.7420606017112732, -0.6807316541671753, -0.6194027662277222, -0.5580738186836243, -0.49674490094184875, -0.43541598320007324, -0.37408703565597534, -0.31275811791419983, -0.2514292001724243, -0.19010025262832642, -0.1287713348865509, -0.06744253635406494, -0.006113611161708832, 0.05521531403064728, 0.11654424667358398, 0.1778731644153595, 0.239202082157135, 0.3005310297012329, 0.3618599474430084, 0.42318886518478394, 0.48451778292655945, 0.545846700668335, 0.6071756482124329, 0.6685045957565308, 0.7298334836959839, 0.7911624312400818, 0.8524913787841797, 0.9138202667236328, 0.9751492142677307, 1.0364781618118286, 1.0978070497512817, 1.1591359376907349, 1.2204649448394775, 1.2817938327789307, 1.3431227207183838, 1.404451608657837, 1.46578049659729, 1.5271095037460327, 1.5884383916854858, 1.649767279624939, 1.7110962867736816, 1.7724251747131348, 1.833754062652588, 1.8950830698013306]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 5.0, 13.0, 9.0, 13.0, 23.0, 33.0, 39.0, 68.0, 75.0, 127.0, 214.0, 351.0, 536.0, 966.0, 1564.0, 2969.0, 5989.0, 14633.0, 48827.0, 261582.0, 535112.0, 127286.0, 28116.0, 9907.0, 4491.0, 2316.0, 1217.0, 705.0, 408.0, 303.0, 217.0, 113.0, 103.0, 58.0, 48.0, 26.0, 26.0, 10.0, 11.0, 8.0, 12.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.36962890625, -0.35852813720703125, -0.3474273681640625, -0.33632659912109375, -0.325225830078125, -0.31412506103515625, -0.3030242919921875, -0.29192352294921875, -0.28082275390625, -0.26972198486328125, -0.2586212158203125, -0.24752044677734375, -0.236419677734375, -0.22531890869140625, -0.2142181396484375, -0.20311737060546875, -0.1920166015625, -0.18091583251953125, -0.1698150634765625, -0.15871429443359375, -0.147613525390625, -0.13651275634765625, -0.1254119873046875, -0.11431121826171875, -0.10321044921875, -0.09210968017578125, -0.0810089111328125, -0.06990814208984375, -0.058807373046875, -0.04770660400390625, -0.0366058349609375, -0.02550506591796875, -0.014404296875, -0.00330352783203125, 0.0077972412109375, 0.01889801025390625, 0.029998779296875, 0.04109954833984375, 0.0522003173828125, 0.06330108642578125, 0.07440185546875, 0.08550262451171875, 0.0966033935546875, 0.10770416259765625, 0.118804931640625, 0.12990570068359375, 0.1410064697265625, 0.15210723876953125, 0.1632080078125, 0.17430877685546875, 0.1854095458984375, 0.19651031494140625, 0.207611083984375, 0.21871185302734375, 0.2298126220703125, 0.24091339111328125, 0.25201416015625, 0.26311492919921875, 0.2742156982421875, 0.28531646728515625, 0.296417236328125, 0.30751800537109375, 0.3186187744140625, 0.32971954345703125, 0.3408203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 11.0, 9.0, 17.0, 19.0, 16.0, 27.0, 26.0, 46.0, 49.0, 39.0, 64.0, 60.0, 65.0, 71.0, 52.0, 53.0, 42.0, 47.0, 50.0, 35.0, 35.0, 35.0, 26.0, 24.0, 16.0, 11.0, 7.0, 6.0, 10.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6683197021484375, -1.616912841796875, -1.5655059814453125, -1.51409912109375, -1.4626922607421875, -1.411285400390625, -1.3598785400390625, -1.3084716796875, -1.2570648193359375, -1.205657958984375, -1.1542510986328125, -1.10284423828125, -1.0514373779296875, -1.000030517578125, -0.9486236572265625, -0.897216796875, -0.8458099365234375, -0.794403076171875, -0.7429962158203125, -0.69158935546875, -0.6401824951171875, -0.588775634765625, -0.5373687744140625, -0.4859619140625, -0.4345550537109375, -0.383148193359375, -0.3317413330078125, -0.28033447265625, -0.2289276123046875, -0.177520751953125, -0.1261138916015625, -0.07470703125, -0.0233001708984375, 0.028106689453125, 0.0795135498046875, 0.13092041015625, 0.1823272705078125, 0.233734130859375, 0.2851409912109375, 0.3365478515625, 0.3879547119140625, 0.439361572265625, 0.4907684326171875, 0.54217529296875, 0.5935821533203125, 0.644989013671875, 0.6963958740234375, 0.747802734375, 0.7992095947265625, 0.850616455078125, 0.9020233154296875, 0.95343017578125, 1.0048370361328125, 1.056243896484375, 1.1076507568359375, 1.1590576171875, 1.2104644775390625, 1.261871337890625, 1.3132781982421875, 1.36468505859375, 1.4160919189453125, 1.467498779296875, 1.5189056396484375, 1.5703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 1.0, 4.0, 4.0, 6.0, 12.0, 15.0, 18.0, 35.0, 28.0, 53.0, 64.0, 99.0, 116.0, 235.0, 376.0, 561.0, 940.0, 1664.0, 3374.0, 7775.0, 21335.0, 86718.0, 403508.0, 399290.0, 85691.0, 21343.0, 7624.0, 3401.0, 1670.0, 961.0, 550.0, 338.0, 229.0, 146.0, 112.0, 68.0, 46.0, 30.0, 34.0, 22.0, 13.0, 9.0, 13.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.293701171875, -0.2839088439941406, -0.27411651611328125, -0.2643241882324219, -0.2545318603515625, -0.24473953247070312, -0.23494720458984375, -0.22515487670898438, -0.215362548828125, -0.20557022094726562, -0.19577789306640625, -0.18598556518554688, -0.1761932373046875, -0.16640090942382812, -0.15660858154296875, -0.14681625366210938, -0.13702392578125, -0.12723159790039062, -0.11743927001953125, -0.10764694213867188, -0.0978546142578125, -0.08806228637695312, -0.07826995849609375, -0.06847763061523438, -0.058685302734375, -0.048892974853515625, -0.03910064697265625, -0.029308319091796875, -0.0195159912109375, -0.009723663330078125, 6.866455078125e-05, 0.009860992431640625, 0.0196533203125, 0.029445648193359375, 0.03923797607421875, 0.049030303955078125, 0.0588226318359375, 0.06861495971679688, 0.07840728759765625, 0.08819961547851562, 0.097991943359375, 0.10778427124023438, 0.11757659912109375, 0.12736892700195312, 0.1371612548828125, 0.14695358276367188, 0.15674591064453125, 0.16653823852539062, 0.17633056640625, 0.18612289428710938, 0.19591522216796875, 0.20570755004882812, 0.2154998779296875, 0.22529220581054688, 0.23508453369140625, 0.24487686157226562, 0.254669189453125, 0.2644615173339844, 0.27425384521484375, 0.2840461730957031, 0.2938385009765625, 0.3036308288574219, 0.31342315673828125, 0.3232154846191406, 0.3330078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 15.0, 10.0, 12.0, 18.0, 22.0, 24.0, 24.0, 25.0, 31.0, 34.0, 48.0, 49.0, 53.0, 53.0, 66.0, 65.0, 59.0, 47.0, 47.0, 48.0, 48.0, 28.0, 33.0, 27.0, 18.0, 13.0, 18.0, 15.0, 13.0, 13.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.04296875, -2.93072509765625, -2.8184814453125, -2.70623779296875, -2.593994140625, -2.48175048828125, -2.3695068359375, -2.25726318359375, -2.14501953125, -2.03277587890625, -1.9205322265625, -1.80828857421875, -1.696044921875, -1.58380126953125, -1.4715576171875, -1.35931396484375, -1.2470703125, -1.13482666015625, -1.0225830078125, -0.91033935546875, -0.798095703125, -0.68585205078125, -0.5736083984375, -0.46136474609375, -0.34912109375, -0.23687744140625, -0.1246337890625, -0.01239013671875, 0.099853515625, 0.21209716796875, 0.3243408203125, 0.43658447265625, 0.548828125, 0.66107177734375, 0.7733154296875, 0.88555908203125, 0.997802734375, 1.11004638671875, 1.2222900390625, 1.33453369140625, 1.44677734375, 1.55902099609375, 1.6712646484375, 1.78350830078125, 1.895751953125, 2.00799560546875, 2.1202392578125, 2.23248291015625, 2.3447265625, 2.45697021484375, 2.5692138671875, 2.68145751953125, 2.793701171875, 2.90594482421875, 3.0181884765625, 3.13043212890625, 3.24267578125, 3.35491943359375, 3.4671630859375, 3.57940673828125, 3.691650390625, 3.80389404296875, 3.9161376953125, 4.02838134765625, 4.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 2.0, 4.0, 9.0, 10.0, 14.0, 14.0, 18.0, 31.0, 53.0, 83.0, 118.0, 229.0, 331.0, 631.0, 1293.0, 2773.0, 7003.0, 25243.0, 184313.0, 692865.0, 105731.0, 17731.0, 5347.0, 2242.0, 1048.0, 577.0, 338.0, 161.0, 101.0, 77.0, 41.0, 38.0, 27.0, 16.0, 13.0, 4.0, 6.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11956787109375, -0.11575794219970703, -0.11194801330566406, -0.1081380844116211, -0.10432815551757812, -0.10051822662353516, -0.09670829772949219, -0.09289836883544922, -0.08908843994140625, -0.08527851104736328, -0.08146858215332031, -0.07765865325927734, -0.07384872436523438, -0.0700387954711914, -0.06622886657714844, -0.06241893768310547, -0.0586090087890625, -0.05479907989501953, -0.05098915100097656, -0.047179222106933594, -0.043369293212890625, -0.039559364318847656, -0.03574943542480469, -0.03193950653076172, -0.02812957763671875, -0.02431964874267578, -0.020509719848632812, -0.016699790954589844, -0.012889862060546875, -0.009079933166503906, -0.0052700042724609375, -0.0014600753784179688, 0.002349853515625, 0.006159782409667969, 0.009969711303710938, 0.013779640197753906, 0.017589569091796875, 0.021399497985839844, 0.025209426879882812, 0.02901935577392578, 0.03282928466796875, 0.03663921356201172, 0.04044914245605469, 0.044259071350097656, 0.048069000244140625, 0.051878929138183594, 0.05568885803222656, 0.05949878692626953, 0.0633087158203125, 0.06711864471435547, 0.07092857360839844, 0.0747385025024414, 0.07854843139648438, 0.08235836029052734, 0.08616828918457031, 0.08997821807861328, 0.09378814697265625, 0.09759807586669922, 0.10140800476074219, 0.10521793365478516, 0.10902786254882812, 0.1128377914428711, 0.11664772033691406, 0.12045764923095703, 0.124267578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 6.0, 4.0, 4.0, 15.0, 16.0, 23.0, 21.0, 32.0, 46.0, 78.0, 87.0, 78.0, 90.0, 102.0, 100.0, 62.0, 61.0, 46.0, 29.0, 26.0, 14.0, 15.0, 11.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9591064453125e-05, -4.779268056154251e-05, -4.599429666996002e-05, -4.419591277837753e-05, -4.2397528886795044e-05, -4.0599144995212555e-05, -3.8800761103630066e-05, -3.700237721204758e-05, -3.520399332046509e-05, -3.34056094288826e-05, -3.160722553730011e-05, -2.980884164571762e-05, -2.8010457754135132e-05, -2.6212073862552643e-05, -2.4413689970970154e-05, -2.2615306079387665e-05, -2.0816922187805176e-05, -1.9018538296222687e-05, -1.7220154404640198e-05, -1.542177051305771e-05, -1.362338662147522e-05, -1.182500272989273e-05, -1.0026618838310242e-05, -8.228234946727753e-06, -6.429851055145264e-06, -4.631467163562775e-06, -2.8330832719802856e-06, -1.0346993803977966e-06, 7.636845111846924e-07, 2.5620684027671814e-06, 4.36045229434967e-06, 6.1588361859321594e-06, 7.957220077514648e-06, 9.755603969097137e-06, 1.1553987860679626e-05, 1.3352371752262115e-05, 1.5150755643844604e-05, 1.6949139535427094e-05, 1.8747523427009583e-05, 2.054590731859207e-05, 2.234429121017456e-05, 2.414267510175705e-05, 2.594105899333954e-05, 2.7739442884922028e-05, 2.9537826776504517e-05, 3.1336210668087006e-05, 3.3134594559669495e-05, 3.4932978451251984e-05, 3.673136234283447e-05, 3.852974623441696e-05, 4.032813012599945e-05, 4.212651401758194e-05, 4.392489790916443e-05, 4.572328180074692e-05, 4.752166569232941e-05, 4.9320049583911896e-05, 5.1118433475494385e-05, 5.2916817367076874e-05, 5.471520125865936e-05, 5.651358515024185e-05, 5.831196904182434e-05, 6.011035293340683e-05, 6.190873682498932e-05, 6.370712071657181e-05, 6.55055046081543e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 15.0, 14.0, 29.0, 36.0, 72.0, 101.0, 165.0, 282.0, 455.0, 873.0, 1707.0, 3650.0, 9005.0, 28942.0, 209224.0, 680277.0, 84464.0, 17407.0, 6223.0, 2622.0, 1334.0, 648.0, 368.0, 238.0, 151.0, 57.0, 64.0, 34.0, 21.0, 16.0, 7.0, 8.0, 6.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146240234375, -0.14209842681884766, -0.1379566192626953, -0.13381481170654297, -0.12967300415039062, -0.12553119659423828, -0.12138938903808594, -0.1172475814819336, -0.11310577392578125, -0.1089639663696289, -0.10482215881347656, -0.10068035125732422, -0.09653854370117188, -0.09239673614501953, -0.08825492858886719, -0.08411312103271484, -0.0799713134765625, -0.07582950592041016, -0.07168769836425781, -0.06754589080810547, -0.06340408325195312, -0.05926227569580078, -0.05512046813964844, -0.050978660583496094, -0.04683685302734375, -0.042695045471191406, -0.03855323791503906, -0.03441143035888672, -0.030269622802734375, -0.02612781524658203, -0.021986007690429688, -0.017844200134277344, -0.013702392578125, -0.009560585021972656, -0.0054187774658203125, -0.0012769699096679688, 0.002864837646484375, 0.007006645202636719, 0.011148452758789062, 0.015290260314941406, 0.01943206787109375, 0.023573875427246094, 0.027715682983398438, 0.03185749053955078, 0.035999298095703125, 0.04014110565185547, 0.04428291320800781, 0.048424720764160156, 0.0525665283203125, 0.056708335876464844, 0.06085014343261719, 0.06499195098876953, 0.06913375854492188, 0.07327556610107422, 0.07741737365722656, 0.0815591812133789, 0.08570098876953125, 0.0898427963256836, 0.09398460388183594, 0.09812641143798828, 0.10226821899414062, 0.10641002655029297, 0.11055183410644531, 0.11469364166259766, 0.11883544921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 1.0, 3.0, 6.0, 5.0, 8.0, 24.0, 22.0, 36.0, 45.0, 88.0, 107.0, 162.0, 144.0, 108.0, 80.0, 37.0, 32.0, 13.0, 19.0, 10.0, 11.0, 7.0, 6.0, 3.0, 1.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046905517578125, -0.04563283920288086, -0.04436016082763672, -0.04308748245239258, -0.04181480407714844, -0.0405421257019043, -0.039269447326660156, -0.037996768951416016, -0.036724090576171875, -0.035451412200927734, -0.034178733825683594, -0.03290605545043945, -0.03163337707519531, -0.030360698699951172, -0.02908802032470703, -0.02781534194946289, -0.02654266357421875, -0.02526998519897461, -0.02399730682373047, -0.022724628448486328, -0.021451950073242188, -0.020179271697998047, -0.018906593322753906, -0.017633914947509766, -0.016361236572265625, -0.015088558197021484, -0.013815879821777344, -0.012543201446533203, -0.011270523071289062, -0.009997844696044922, -0.008725166320800781, -0.007452487945556641, -0.0061798095703125, -0.004907131195068359, -0.0036344528198242188, -0.002361774444580078, -0.0010890960693359375, 0.00018358230590820312, 0.0014562606811523438, 0.0027289390563964844, 0.004001617431640625, 0.005274295806884766, 0.006546974182128906, 0.007819652557373047, 0.009092330932617188, 0.010365009307861328, 0.011637687683105469, 0.01291036605834961, 0.01418304443359375, 0.01545572280883789, 0.01672840118408203, 0.018001079559326172, 0.019273757934570312, 0.020546436309814453, 0.021819114685058594, 0.023091793060302734, 0.024364471435546875, 0.025637149810791016, 0.026909828186035156, 0.028182506561279297, 0.029455184936523438, 0.030727863311767578, 0.03200054168701172, 0.03327322006225586, 0.0345458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 1.0, 5.0, 7.0, 6.0, 11.0, 22.0, 29.0, 47.0, 82.0, 149.0, 153.0, 147.0, 125.0, 88.0, 54.0, 31.0, 18.0, 11.0, 3.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7874157428741455, -2.6876680850982666, -2.5879201889038086, -2.4881725311279297, -2.388424873352051, -2.288677215576172, -2.188929557800293, -2.089181661605835, -1.989434003829956, -1.8896863460540771, -1.7899385690689087, -1.6901907920837402, -1.5904431343078613, -1.4906954765319824, -1.390947699546814, -1.2911999225616455, -1.1914522647857666, -1.0917046070098877, -0.9919568300247192, -0.8922091126441956, -0.7924613952636719, -0.6927136778831482, -0.5929659605026245, -0.49321824312210083, -0.39347052574157715, -0.29372280836105347, -0.19397509098052979, -0.0942273736000061, 0.005520343780517578, 0.10526806116104126, 0.20501577854156494, 0.3047634959220886, 0.4045112133026123, 0.504258930683136, 0.6040066480636597, 0.7037543654441833, 0.803502082824707, 0.9032498002052307, 1.0029975175857544, 1.1027452945709229, 1.2024929523468018, 1.3022406101226807, 1.4019883871078491, 1.5017361640930176, 1.6014838218688965, 1.7012314796447754, 1.8009792566299438, 1.9007270336151123, 2.000474691390991, 2.10022234916687, 2.199970245361328, 2.299717903137207, 2.399465560913086, 2.499213218688965, 2.5989608764648438, 2.6987087726593018, 2.7984564304351807, 2.8982040882110596, 2.9979519844055176, 3.0976996421813965, 3.1974472999572754, 3.2971949577331543, 3.396942615509033, 3.496690511703491, 3.59643816947937]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 4.0, 13.0, 14.0, 20.0, 28.0, 21.0, 24.0, 48.0, 57.0, 53.0, 61.0, 64.0, 63.0, 56.0, 74.0, 61.0, 59.0, 40.0, 41.0, 41.0, 30.0, 22.0, 22.0, 18.0, 7.0, 10.0, 8.0, 2.0, 5.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6601585149765015, -1.6081640720367432, -1.5561696290969849, -1.5041751861572266, -1.4521807432174683, -1.40018630027771, -1.3481918573379517, -1.2961974143981934, -1.244202971458435, -1.1922085285186768, -1.1402140855789185, -1.0882196426391602, -1.0362251996994019, -0.9842307567596436, -0.9322363138198853, -0.880241870880127, -0.8282474279403687, -0.7762529850006104, -0.724258542060852, -0.6722640991210938, -0.6202696561813354, -0.5682752132415771, -0.5162807703018188, -0.46428632736206055, -0.41229188442230225, -0.36029744148254395, -0.30830299854278564, -0.25630855560302734, -0.20431411266326904, -0.15231966972351074, -0.10032522678375244, -0.04833078384399414, 0.003663778305053711, 0.05565822124481201, 0.10765266418457031, 0.1596471071243286, 0.21164155006408691, 0.2636359930038452, 0.3156304359436035, 0.3676248788833618, 0.4196193218231201, 0.4716137647628784, 0.5236082077026367, 0.575602650642395, 0.6275970935821533, 0.6795915365219116, 0.7315859794616699, 0.7835804224014282, 0.8355748653411865, 0.8875693082809448, 0.9395637512207031, 0.9915581941604614, 1.0435526371002197, 1.095547080039978, 1.1475415229797363, 1.1995359659194946, 1.251530408859253, 1.3035248517990112, 1.3555192947387695, 1.4075137376785278, 1.4595081806182861, 1.5115026235580444, 1.5634970664978027, 1.615491509437561, 1.6674859523773193]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 13.0, 36.0, 40.0, 61.0, 94.0, 132.0, 231.0, 356.0, 633.0, 1265.0, 2530.0, 5990.0, 18944.0, 111448.0, 814344.0, 68303.0, 14404.0, 4999.0, 2170.0, 1063.0, 517.0, 318.0, 202.0, 147.0, 88.0, 55.0, 38.0, 26.0, 25.0, 12.0, 6.0, 10.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.308197021484375, -2.22967529296875, -2.151153564453125, -2.0726318359375, -1.994110107421875, -1.91558837890625, -1.837066650390625, -1.758544921875, -1.680023193359375, -1.60150146484375, -1.522979736328125, -1.4444580078125, -1.365936279296875, -1.28741455078125, -1.208892822265625, -1.13037109375, -1.051849365234375, -0.97332763671875, -0.894805908203125, -0.8162841796875, -0.737762451171875, -0.65924072265625, -0.580718994140625, -0.502197265625, -0.423675537109375, -0.34515380859375, -0.266632080078125, -0.1881103515625, -0.109588623046875, -0.03106689453125, 0.047454833984375, 0.1259765625, 0.204498291015625, 0.28302001953125, 0.361541748046875, 0.4400634765625, 0.518585205078125, 0.59710693359375, 0.675628662109375, 0.754150390625, 0.832672119140625, 0.91119384765625, 0.989715576171875, 1.0682373046875, 1.146759033203125, 1.22528076171875, 1.303802490234375, 1.38232421875, 1.460845947265625, 1.53936767578125, 1.617889404296875, 1.6964111328125, 1.774932861328125, 1.85345458984375, 1.931976318359375, 2.010498046875, 2.089019775390625, 2.16754150390625, 2.246063232421875, 2.3245849609375, 2.403106689453125, 2.48162841796875, 2.560150146484375, 2.638671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 7.0, 3.0, 2.0, 3.0, 12.0, 8.0, 15.0, 17.0, 29.0, 23.0, 23.0, 33.0, 69.0, 74.0, 69.0, 51.0, 97.0, 79.0, 82.0, 63.0, 52.0, 42.0, 31.0, 29.0, 24.0, 18.0, 13.0, 11.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.179107666015625, -3.06719970703125, -2.955291748046875, -2.8433837890625, -2.731475830078125, -2.61956787109375, -2.507659912109375, -2.395751953125, -2.283843994140625, -2.17193603515625, -2.060028076171875, -1.9481201171875, -1.836212158203125, -1.72430419921875, -1.612396240234375, -1.50048828125, -1.388580322265625, -1.27667236328125, -1.164764404296875, -1.0528564453125, -0.940948486328125, -0.82904052734375, -0.717132568359375, -0.605224609375, -0.493316650390625, -0.38140869140625, -0.269500732421875, -0.1575927734375, -0.045684814453125, 0.06622314453125, 0.178131103515625, 0.2900390625, 0.401947021484375, 0.51385498046875, 0.625762939453125, 0.7376708984375, 0.849578857421875, 0.96148681640625, 1.073394775390625, 1.185302734375, 1.297210693359375, 1.40911865234375, 1.521026611328125, 1.6329345703125, 1.744842529296875, 1.85675048828125, 1.968658447265625, 2.08056640625, 2.192474365234375, 2.30438232421875, 2.416290283203125, 2.5281982421875, 2.640106201171875, 2.75201416015625, 2.863922119140625, 2.975830078125, 3.087738037109375, 3.19964599609375, 3.311553955078125, 3.4234619140625, 3.535369873046875, 3.64727783203125, 3.759185791015625, 3.87109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 12.0, 12.0, 21.0, 26.0, 26.0, 58.0, 66.0, 118.0, 237.0, 537.0, 2063.0, 13132.0, 751185.0, 268076.0, 10047.0, 1781.0, 559.0, 206.0, 126.0, 75.0, 53.0, 46.0, 26.0, 14.0, 16.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.48828125, -6.3216552734375, -6.155029296875, -5.9884033203125, -5.82177734375, -5.6551513671875, -5.488525390625, -5.3218994140625, -5.1552734375, -4.9886474609375, -4.822021484375, -4.6553955078125, -4.48876953125, -4.3221435546875, -4.155517578125, -3.9888916015625, -3.822265625, -3.6556396484375, -3.489013671875, -3.3223876953125, -3.15576171875, -2.9891357421875, -2.822509765625, -2.6558837890625, -2.4892578125, -2.3226318359375, -2.156005859375, -1.9893798828125, -1.82275390625, -1.6561279296875, -1.489501953125, -1.3228759765625, -1.15625, -0.9896240234375, -0.822998046875, -0.6563720703125, -0.48974609375, -0.3231201171875, -0.156494140625, 0.0101318359375, 0.1767578125, 0.3433837890625, 0.510009765625, 0.6766357421875, 0.84326171875, 1.0098876953125, 1.176513671875, 1.3431396484375, 1.509765625, 1.6763916015625, 1.843017578125, 2.0096435546875, 2.17626953125, 2.3428955078125, 2.509521484375, 2.6761474609375, 2.8427734375, 3.0093994140625, 3.176025390625, 3.3426513671875, 3.50927734375, 3.6759033203125, 3.842529296875, 4.0091552734375, 4.17578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 13.0, 15.0, 16.0, 21.0, 11.0, 18.0, 37.0, 42.0, 41.0, 43.0, 35.0, 64.0, 50.0, 55.0, 77.0, 56.0, 64.0, 43.0, 54.0, 46.0, 47.0, 23.0, 25.0, 29.0, 19.0, 9.0, 11.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.286163330078125, -5.14263916015625, -4.999114990234375, -4.8555908203125, -4.712066650390625, -4.56854248046875, -4.425018310546875, -4.281494140625, -4.137969970703125, -3.99444580078125, -3.850921630859375, -3.7073974609375, -3.563873291015625, -3.42034912109375, -3.276824951171875, -3.13330078125, -2.989776611328125, -2.84625244140625, -2.702728271484375, -2.5592041015625, -2.415679931640625, -2.27215576171875, -2.128631591796875, -1.985107421875, -1.841583251953125, -1.69805908203125, -1.554534912109375, -1.4110107421875, -1.267486572265625, -1.12396240234375, -0.980438232421875, -0.8369140625, -0.693389892578125, -0.54986572265625, -0.406341552734375, -0.2628173828125, -0.119293212890625, 0.02423095703125, 0.167755126953125, 0.311279296875, 0.454803466796875, 0.59832763671875, 0.741851806640625, 0.8853759765625, 1.028900146484375, 1.17242431640625, 1.315948486328125, 1.45947265625, 1.602996826171875, 1.74652099609375, 1.890045166015625, 2.0335693359375, 2.177093505859375, 2.32061767578125, 2.464141845703125, 2.607666015625, 2.751190185546875, 2.89471435546875, 3.038238525390625, 3.1817626953125, 3.325286865234375, 3.46881103515625, 3.612335205078125, 3.755859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 13.0, 12.0, 13.0, 21.0, 44.0, 84.0, 184.0, 464.0, 2007.0, 15396.0, 326747.0, 680563.0, 19581.0, 2469.0, 549.0, 191.0, 89.0, 40.0, 33.0, 10.0, 7.0, 7.0, 3.0, 6.0, 9.0, 4.0, 2.0, 1.0], "bins": [-1.572265625, -1.538848876953125, -1.50543212890625, -1.472015380859375, -1.4385986328125, -1.405181884765625, -1.37176513671875, -1.338348388671875, -1.304931640625, -1.271514892578125, -1.23809814453125, -1.204681396484375, -1.1712646484375, -1.137847900390625, -1.10443115234375, -1.071014404296875, -1.03759765625, -1.004180908203125, -0.97076416015625, -0.937347412109375, -0.9039306640625, -0.870513916015625, -0.83709716796875, -0.803680419921875, -0.770263671875, -0.736846923828125, -0.70343017578125, -0.670013427734375, -0.6365966796875, -0.603179931640625, -0.56976318359375, -0.536346435546875, -0.5029296875, -0.469512939453125, -0.43609619140625, -0.402679443359375, -0.3692626953125, -0.335845947265625, -0.30242919921875, -0.269012451171875, -0.235595703125, -0.202178955078125, -0.16876220703125, -0.135345458984375, -0.1019287109375, -0.068511962890625, -0.03509521484375, -0.001678466796875, 0.03173828125, 0.065155029296875, 0.09857177734375, 0.131988525390625, 0.1654052734375, 0.198822021484375, 0.23223876953125, 0.265655517578125, 0.299072265625, 0.332489013671875, 0.36590576171875, 0.399322509765625, 0.4327392578125, 0.466156005859375, 0.49957275390625, 0.532989501953125, 0.56640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 3.0, 4.0, 6.0, 11.0, 14.0, 10.0, 19.0, 30.0, 28.0, 62.0, 96.0, 192.0, 196.0, 98.0, 61.0, 38.0, 38.0, 24.0, 6.0, 17.0, 8.0, 7.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.604194641113281e-05, -6.330013275146484e-05, -6.0558319091796875e-05, -5.7816505432128906e-05, -5.507469177246094e-05, -5.233287811279297e-05, -4.9591064453125e-05, -4.684925079345703e-05, -4.410743713378906e-05, -4.1365623474121094e-05, -3.8623809814453125e-05, -3.5881996154785156e-05, -3.314018249511719e-05, -3.039836883544922e-05, -2.765655517578125e-05, -2.491474151611328e-05, -2.2172927856445312e-05, -1.9431114196777344e-05, -1.6689300537109375e-05, -1.3947486877441406e-05, -1.1205673217773438e-05, -8.463859558105469e-06, -5.7220458984375e-06, -2.9802322387695312e-06, -2.384185791015625e-07, 2.5033950805664062e-06, 5.245208740234375e-06, 7.987022399902344e-06, 1.0728836059570312e-05, 1.3470649719238281e-05, 1.621246337890625e-05, 1.895427703857422e-05, 2.1696090698242188e-05, 2.4437904357910156e-05, 2.7179718017578125e-05, 2.9921531677246094e-05, 3.266334533691406e-05, 3.540515899658203e-05, 3.814697265625e-05, 4.088878631591797e-05, 4.363059997558594e-05, 4.6372413635253906e-05, 4.9114227294921875e-05, 5.1856040954589844e-05, 5.459785461425781e-05, 5.733966827392578e-05, 6.008148193359375e-05, 6.282329559326172e-05, 6.556510925292969e-05, 6.830692291259766e-05, 7.104873657226562e-05, 7.37905502319336e-05, 7.653236389160156e-05, 7.927417755126953e-05, 8.20159912109375e-05, 8.475780487060547e-05, 8.749961853027344e-05, 9.02414321899414e-05, 9.298324584960938e-05, 9.572505950927734e-05, 9.846687316894531e-05, 0.00010120868682861328, 0.00010395050048828125, 0.00010669231414794922, 0.00010943412780761719]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 15.0, 29.0, 50.0, 86.0, 193.0, 512.0, 1538.0, 7191.0, 54463.0, 882651.0, 88806.0, 9951.0, 2025.0, 574.0, 227.0, 100.0, 57.0, 25.0, 15.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9176101684570312, -0.8855133056640625, -0.8534164428710938, -0.821319580078125, -0.7892227172851562, -0.7571258544921875, -0.7250289916992188, -0.69293212890625, -0.6608352661132812, -0.6287384033203125, -0.5966415405273438, -0.564544677734375, -0.5324478149414062, -0.5003509521484375, -0.46825408935546875, -0.4361572265625, -0.40406036376953125, -0.3719635009765625, -0.33986663818359375, -0.307769775390625, -0.27567291259765625, -0.2435760498046875, -0.21147918701171875, -0.17938232421875, -0.14728546142578125, -0.1151885986328125, -0.08309173583984375, -0.050994873046875, -0.01889801025390625, 0.0131988525390625, 0.04529571533203125, 0.077392578125, 0.10948944091796875, 0.1415863037109375, 0.17368316650390625, 0.205780029296875, 0.23787689208984375, 0.2699737548828125, 0.30207061767578125, 0.33416748046875, 0.36626434326171875, 0.3983612060546875, 0.43045806884765625, 0.462554931640625, 0.49465179443359375, 0.5267486572265625, 0.5588455200195312, 0.5909423828125, 0.6230392456054688, 0.6551361083984375, 0.6872329711914062, 0.719329833984375, 0.7514266967773438, 0.7835235595703125, 0.8156204223632812, 0.84771728515625, 0.8798141479492188, 0.9119110107421875, 0.9440078735351562, 0.976104736328125, 1.0082015991210938, 1.0402984619140625, 1.0723953247070312, 1.1044921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 7.0, 3.0, 6.0, 6.0, 19.0, 23.0, 18.0, 39.0, 52.0, 67.0, 114.0, 268.0, 115.0, 66.0, 47.0, 31.0, 34.0, 12.0, 17.0, 13.0, 7.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3030548095703125, -0.293121337890625, -0.2831878662109375, -0.27325439453125, -0.2633209228515625, -0.253387451171875, -0.2434539794921875, -0.2335205078125, -0.2235870361328125, -0.213653564453125, -0.2037200927734375, -0.19378662109375, -0.1838531494140625, -0.173919677734375, -0.1639862060546875, -0.154052734375, -0.1441192626953125, -0.134185791015625, -0.1242523193359375, -0.11431884765625, -0.1043853759765625, -0.094451904296875, -0.0845184326171875, -0.0745849609375, -0.0646514892578125, -0.054718017578125, -0.0447845458984375, -0.03485107421875, -0.0249176025390625, -0.014984130859375, -0.0050506591796875, 0.0048828125, 0.0148162841796875, 0.024749755859375, 0.0346832275390625, 0.04461669921875, 0.0545501708984375, 0.064483642578125, 0.0744171142578125, 0.0843505859375, 0.0942840576171875, 0.104217529296875, 0.1141510009765625, 0.12408447265625, 0.1340179443359375, 0.143951416015625, 0.1538848876953125, 0.163818359375, 0.1737518310546875, 0.183685302734375, 0.1936187744140625, 0.20355224609375, 0.2134857177734375, 0.223419189453125, 0.2333526611328125, 0.2432861328125, 0.2532196044921875, 0.263153076171875, 0.2730865478515625, 0.28302001953125, 0.2929534912109375, 0.302886962890625, 0.3128204345703125, 0.32275390625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 9.0, 5.0, 24.0, 50.0, 134.0, 278.0, 271.0, 153.0, 55.0, 12.0, 9.0, 1.0, 6.0, 1.0, 2.0, 0.0, 3.0], "bins": [-21.024106979370117, -20.627666473388672, -20.231225967407227, -19.83478546142578, -19.438343048095703, -19.041902542114258, -18.645462036132812, -18.249021530151367, -17.852581024169922, -17.456140518188477, -17.05970001220703, -16.663259506225586, -16.266817092895508, -15.870377540588379, -15.473936080932617, -15.077495574951172, -14.681055068969727, -14.284614562988281, -13.88817310333252, -13.491732597351074, -13.095292091369629, -12.698851585388184, -12.302410125732422, -11.905969619750977, -11.509528160095215, -11.11308765411377, -10.716646194458008, -10.320205688476562, -9.923765182495117, -9.527324676513672, -9.13088321685791, -8.734442710876465, -8.338001251220703, -7.9415602684021, -7.545119762420654, -7.148678779602051, -6.7522382736206055, -6.355797290802002, -5.959356307983398, -5.562915802001953, -5.166475296020508, -4.770034313201904, -4.373593807220459, -3.9771528244018555, -3.58071231842041, -3.1842713356018066, -2.7878305912017822, -2.391389846801758, -1.9949493408203125, -1.598508596420288, -1.2020678520202637, -0.8056269884109497, -0.4091862440109253, -0.012745499610900879, 0.3836953639984131, 0.7801361083984375, 1.176576852798462, 1.5730175971984863, 1.9694583415985107, 2.365899085998535, 2.7623400688171387, 3.158780574798584, 3.5552215576171875, 3.951662302017212, 4.348103046417236]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 4.0, 8.0, 13.0, 13.0, 10.0, 18.0, 28.0, 15.0, 22.0, 26.0, 35.0, 27.0, 39.0, 31.0, 43.0, 44.0, 44.0, 39.0, 38.0, 48.0, 46.0, 41.0, 35.0, 45.0, 34.0, 37.0, 27.0, 23.0, 34.0, 20.0, 11.0, 14.0, 18.0, 13.0, 13.0, 7.0, 5.0, 8.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.569394111633301, -6.385113716125488, -6.200833320617676, -6.016552925109863, -5.832272529602051, -5.647992134094238, -5.463711738586426, -5.279431343078613, -5.095150947570801, -4.910870552062988, -4.726590156555176, -4.542309761047363, -4.358029365539551, -4.173748970031738, -3.989468574523926, -3.8051881790161133, -3.620907783508301, -3.4366273880004883, -3.252346992492676, -3.0680665969848633, -2.883786201477051, -2.6995058059692383, -2.515225410461426, -2.3309450149536133, -2.146664619445801, -1.9623842239379883, -1.7781038284301758, -1.5938234329223633, -1.4095430374145508, -1.2252626419067383, -1.0409822463989258, -0.8567018508911133, -0.6724214553833008, -0.4881410598754883, -0.3038606643676758, -0.11958026885986328, 0.06470012664794922, 0.24898052215576172, 0.4332609176635742, 0.6175413131713867, 0.8018217086791992, 0.9861021041870117, 1.1703824996948242, 1.3546628952026367, 1.5389432907104492, 1.7232236862182617, 1.9075040817260742, 2.0917844772338867, 2.276064872741699, 2.4603452682495117, 2.644625663757324, 2.8289060592651367, 3.013186454772949, 3.1974668502807617, 3.381747245788574, 3.5660276412963867, 3.750308036804199, 3.9345884323120117, 4.118868827819824, 4.303149223327637, 4.487429618835449, 4.671710014343262, 4.855990409851074, 5.040270805358887, 5.224551200866699]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 11.0, 6.0, 16.0, 22.0, 23.0, 34.0, 28.0, 59.0, 90.0, 130.0, 133.0, 214.0, 333.0, 560.0, 947.0, 2248.0, 6118.0, 24189.0, 248927.0, 3730464.0, 150573.0, 19479.0, 5320.0, 1981.0, 897.0, 462.0, 287.0, 193.0, 151.0, 103.0, 67.0, 60.0, 49.0, 37.0, 17.0, 16.0, 12.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.794921875, -3.684661865234375, -3.57440185546875, -3.464141845703125, -3.3538818359375, -3.243621826171875, -3.13336181640625, -3.023101806640625, -2.912841796875, -2.802581787109375, -2.69232177734375, -2.582061767578125, -2.4718017578125, -2.361541748046875, -2.25128173828125, -2.141021728515625, -2.03076171875, -1.920501708984375, -1.81024169921875, -1.699981689453125, -1.5897216796875, -1.479461669921875, -1.36920166015625, -1.258941650390625, -1.148681640625, -1.038421630859375, -0.92816162109375, -0.817901611328125, -0.7076416015625, -0.597381591796875, -0.48712158203125, -0.376861572265625, -0.2666015625, -0.156341552734375, -0.04608154296875, 0.064178466796875, 0.1744384765625, 0.284698486328125, 0.39495849609375, 0.505218505859375, 0.615478515625, 0.725738525390625, 0.83599853515625, 0.946258544921875, 1.0565185546875, 1.166778564453125, 1.27703857421875, 1.387298583984375, 1.49755859375, 1.607818603515625, 1.71807861328125, 1.828338623046875, 1.9385986328125, 2.048858642578125, 2.15911865234375, 2.269378662109375, 2.379638671875, 2.489898681640625, 2.60015869140625, 2.710418701171875, 2.8206787109375, 2.930938720703125, 3.04119873046875, 3.151458740234375, 3.26171875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 6.0, 6.0, 9.0, 17.0, 16.0, 16.0, 37.0, 27.0, 40.0, 48.0, 68.0, 70.0, 72.0, 76.0, 94.0, 70.0, 54.0, 61.0, 58.0, 34.0, 22.0, 21.0, 14.0, 13.0, 12.0, 10.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.81927490234375, -1.7664794921875, -1.71368408203125, -1.660888671875, -1.60809326171875, -1.5552978515625, -1.50250244140625, -1.44970703125, -1.39691162109375, -1.3441162109375, -1.29132080078125, -1.238525390625, -1.18572998046875, -1.1329345703125, -1.08013916015625, -1.02734375, -0.97454833984375, -0.9217529296875, -0.86895751953125, -0.816162109375, -0.76336669921875, -0.7105712890625, -0.65777587890625, -0.60498046875, -0.55218505859375, -0.4993896484375, -0.44659423828125, -0.393798828125, -0.34100341796875, -0.2882080078125, -0.23541259765625, -0.1826171875, -0.12982177734375, -0.0770263671875, -0.02423095703125, 0.028564453125, 0.08135986328125, 0.1341552734375, 0.18695068359375, 0.23974609375, 0.29254150390625, 0.3453369140625, 0.39813232421875, 0.450927734375, 0.50372314453125, 0.5565185546875, 0.60931396484375, 0.662109375, 0.71490478515625, 0.7677001953125, 0.82049560546875, 0.873291015625, 0.92608642578125, 0.9788818359375, 1.03167724609375, 1.08447265625, 1.13726806640625, 1.1900634765625, 1.24285888671875, 1.295654296875, 1.34844970703125, 1.4012451171875, 1.45404052734375, 1.5068359375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 11.0, 6.0, 13.0, 15.0, 23.0, 45.0, 79.0, 147.0, 333.0, 910.0, 4510.0, 45955.0, 3757299.0, 367265.0, 14408.0, 2212.0, 546.0, 212.0, 109.0, 51.0, 36.0, 29.0, 12.0, 9.0, 14.0, 5.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.46453857421875, -4.2767333984375, -4.08892822265625, -3.901123046875, -3.71331787109375, -3.5255126953125, -3.33770751953125, -3.14990234375, -2.96209716796875, -2.7742919921875, -2.58648681640625, -2.398681640625, -2.21087646484375, -2.0230712890625, -1.83526611328125, -1.6474609375, -1.45965576171875, -1.2718505859375, -1.08404541015625, -0.896240234375, -0.70843505859375, -0.5206298828125, -0.33282470703125, -0.14501953125, 0.04278564453125, 0.2305908203125, 0.41839599609375, 0.606201171875, 0.79400634765625, 0.9818115234375, 1.16961669921875, 1.357421875, 1.54522705078125, 1.7330322265625, 1.92083740234375, 2.108642578125, 2.29644775390625, 2.4842529296875, 2.67205810546875, 2.85986328125, 3.04766845703125, 3.2354736328125, 3.42327880859375, 3.611083984375, 3.79888916015625, 3.9866943359375, 4.17449951171875, 4.3623046875, 4.55010986328125, 4.7379150390625, 4.92572021484375, 5.113525390625, 5.30133056640625, 5.4891357421875, 5.67694091796875, 5.86474609375, 6.05255126953125, 6.2403564453125, 6.42816162109375, 6.615966796875, 6.80377197265625, 6.9915771484375, 7.17938232421875, 7.3671875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 14.0, 8.0, 12.0, 16.0, 20.0, 25.0, 29.0, 39.0, 76.0, 90.0, 131.0, 217.0, 337.0, 571.0, 763.0, 594.0, 382.0, 219.0, 153.0, 93.0, 69.0, 34.0, 44.0, 26.0, 24.0, 13.0, 16.0, 8.0, 10.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7569046020507812, -0.7350006103515625, -0.7130966186523438, -0.691192626953125, -0.6692886352539062, -0.6473846435546875, -0.6254806518554688, -0.60357666015625, -0.5816726684570312, -0.5597686767578125, -0.5378646850585938, -0.515960693359375, -0.49405670166015625, -0.4721527099609375, -0.45024871826171875, -0.4283447265625, -0.40644073486328125, -0.3845367431640625, -0.36263275146484375, -0.340728759765625, -0.31882476806640625, -0.2969207763671875, -0.27501678466796875, -0.25311279296875, -0.23120880126953125, -0.2093048095703125, -0.18740081787109375, -0.165496826171875, -0.14359283447265625, -0.1216888427734375, -0.09978485107421875, -0.077880859375, -0.05597686767578125, -0.0340728759765625, -0.01216888427734375, 0.009735107421875, 0.03163909912109375, 0.0535430908203125, 0.07544708251953125, 0.09735107421875, 0.11925506591796875, 0.1411590576171875, 0.16306304931640625, 0.184967041015625, 0.20687103271484375, 0.2287750244140625, 0.25067901611328125, 0.2725830078125, 0.29448699951171875, 0.3163909912109375, 0.33829498291015625, 0.360198974609375, 0.38210296630859375, 0.4040069580078125, 0.42591094970703125, 0.44781494140625, 0.46971893310546875, 0.4916229248046875, 0.5135269165039062, 0.535430908203125, 0.5573348999023438, 0.5792388916015625, 0.6011428833007812, 0.623046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 13.0, 21.0, 12.0, 28.0, 33.0, 49.0, 65.0, 79.0, 102.0, 122.0, 98.0, 98.0, 88.0, 58.0, 45.0, 26.0, 30.0, 13.0, 11.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.552720069885254, -2.454667091369629, -2.356614351272583, -2.258561372756958, -2.160508632659912, -2.062455654144287, -1.9644027948379517, -1.8663499355316162, -1.7682969570159912, -1.6702440977096558, -1.5721912384033203, -1.4741382598876953, -1.3760854005813599, -1.2780325412750244, -1.179979681968689, -1.0819268226623535, -0.9838739633560181, -0.8858211040496826, -0.7877681851387024, -0.6897153258323669, -0.5916624069213867, -0.49360954761505127, -0.3955566883087158, -0.2975037693977356, -0.19945091009140015, -0.1013980284333229, -0.0033451467752456665, 0.09470772743225098, 0.1927606165409088, 0.29081350564956665, 0.3888663649559021, 0.4869192838668823, 0.5849721431732178, 0.6830250024795532, 0.7810779213905334, 0.8791307806968689, 0.9771836996078491, 1.0752365589141846, 1.17328941822052, 1.2713422775268555, 1.3693952560424805, 1.467448115348816, 1.5655009746551514, 1.6635539531707764, 1.7616068124771118, 1.8596596717834473, 1.9577125310897827, 2.055765390396118, 2.153818130493164, 2.251871109008789, 2.349923849105835, 2.44797682762146, 2.546029567718506, 2.644082546234131, 2.742135524749756, 2.8401882648468018, 2.9382412433624268, 3.0362942218780518, 3.1343469619750977, 3.2323999404907227, 3.3304526805877686, 3.4285056591033936, 3.5265583992004395, 3.6246113777160645, 3.7226643562316895]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 2.0, 4.0, 9.0, 12.0, 11.0, 19.0, 19.0, 18.0, 21.0, 25.0, 23.0, 31.0, 33.0, 38.0, 39.0, 38.0, 46.0, 42.0, 40.0, 53.0, 55.0, 39.0, 49.0, 34.0, 30.0, 36.0, 26.0, 25.0, 28.0, 23.0, 20.0, 23.0, 11.0, 11.0, 15.0, 12.0, 6.0, 5.0, 2.0, 4.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4101009368896484, -1.361124873161316, -1.312148928642273, -1.2631728649139404, -1.2141969203948975, -1.165220856666565, -1.1162447929382324, -1.0672688484191895, -1.0182929039001465, -0.9693168997764587, -0.920340895652771, -0.8713648319244385, -0.8223888874053955, -0.773412823677063, -0.7244368195533752, -0.6754608154296875, -0.626484751701355, -0.5775087475776672, -0.5285327434539795, -0.47955670952796936, -0.4305807054042816, -0.38160470128059387, -0.33262866735458374, -0.283652663230896, -0.23467665910720825, -0.1857006549835205, -0.13672463595867157, -0.08774861693382263, -0.03877261281013489, 0.010203391313552856, 0.05917942523956299, 0.10815542936325073, 0.15713131427764893, 0.20610731840133667, 0.2550833225250244, 0.30405935645103455, 0.3530353605747223, 0.40201136469841003, 0.45098739862442017, 0.4999634027481079, 0.5489394068717957, 0.5979154109954834, 0.6468914151191711, 0.6958674192428589, 0.7448434829711914, 0.7938194274902344, 0.8427954912185669, 0.8917714953422546, 0.9407474994659424, 0.9897235035896301, 1.0386995077133179, 1.0876755714416504, 1.1366515159606934, 1.1856275796890259, 1.2346036434173584, 1.2835795879364014, 1.3325555324554443, 1.3815315961837769, 1.4305075407028198, 1.4794836044311523, 1.5284595489501953, 1.5774356126785278, 1.6264116764068604, 1.6753876209259033, 1.7243636846542358]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 4.0, 6.0, 7.0, 15.0, 25.0, 38.0, 36.0, 77.0, 116.0, 211.0, 366.0, 668.0, 1528.0, 3455.0, 8631.0, 26996.0, 106096.0, 408498.0, 364885.0, 89954.0, 23184.0, 7889.0, 3066.0, 1305.0, 628.0, 340.0, 176.0, 92.0, 78.0, 49.0, 37.0, 23.0, 19.0, 13.0, 9.0, 8.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.25432586669921875, -0.2452239990234375, -0.23612213134765625, -0.227020263671875, -0.21791839599609375, -0.2088165283203125, -0.19971466064453125, -0.19061279296875, -0.18151092529296875, -0.1724090576171875, -0.16330718994140625, -0.154205322265625, -0.14510345458984375, -0.1360015869140625, -0.12689971923828125, -0.1177978515625, -0.10869598388671875, -0.0995941162109375, -0.09049224853515625, -0.081390380859375, -0.07228851318359375, -0.0631866455078125, -0.05408477783203125, -0.04498291015625, -0.03588104248046875, -0.0267791748046875, -0.01767730712890625, -0.008575439453125, 0.00052642822265625, 0.0096282958984375, 0.01873016357421875, 0.02783203125, 0.03693389892578125, 0.0460357666015625, 0.05513763427734375, 0.064239501953125, 0.07334136962890625, 0.0824432373046875, 0.09154510498046875, 0.10064697265625, 0.10974884033203125, 0.1188507080078125, 0.12795257568359375, 0.137054443359375, 0.14615631103515625, 0.1552581787109375, 0.16436004638671875, 0.1734619140625, 0.18256378173828125, 0.1916656494140625, 0.20076751708984375, 0.209869384765625, 0.21897125244140625, 0.2280731201171875, 0.23717498779296875, 0.24627685546875, 0.25537872314453125, 0.2644805908203125, 0.27358245849609375, 0.282684326171875, 0.29178619384765625, 0.3008880615234375, 0.30998992919921875, 0.319091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 2.0, 6.0, 7.0, 4.0, 16.0, 21.0, 18.0, 21.0, 21.0, 30.0, 34.0, 39.0, 35.0, 35.0, 52.0, 48.0, 47.0, 52.0, 50.0, 48.0, 50.0, 48.0, 41.0, 44.0, 32.0, 26.0, 28.0, 22.0, 14.0, 22.0, 17.0, 17.0, 11.0, 6.0, 6.0, 7.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0390625, -1.0032958984375, -0.967529296875, -0.9317626953125, -0.89599609375, -0.8602294921875, -0.824462890625, -0.7886962890625, -0.7529296875, -0.7171630859375, -0.681396484375, -0.6456298828125, -0.60986328125, -0.5740966796875, -0.538330078125, -0.5025634765625, -0.466796875, -0.4310302734375, -0.395263671875, -0.3594970703125, -0.32373046875, -0.2879638671875, -0.252197265625, -0.2164306640625, -0.1806640625, -0.1448974609375, -0.109130859375, -0.0733642578125, -0.03759765625, -0.0018310546875, 0.033935546875, 0.0697021484375, 0.10546875, 0.1412353515625, 0.177001953125, 0.2127685546875, 0.24853515625, 0.2843017578125, 0.320068359375, 0.3558349609375, 0.3916015625, 0.4273681640625, 0.463134765625, 0.4989013671875, 0.53466796875, 0.5704345703125, 0.606201171875, 0.6419677734375, 0.677734375, 0.7135009765625, 0.749267578125, 0.7850341796875, 0.82080078125, 0.8565673828125, 0.892333984375, 0.9281005859375, 0.9638671875, 0.9996337890625, 1.035400390625, 1.0711669921875, 1.10693359375, 1.1427001953125, 1.178466796875, 1.2142333984375, 1.25]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 7.0, 21.0, 26.0, 40.0, 52.0, 91.0, 131.0, 205.0, 357.0, 659.0, 1393.0, 3220.0, 8832.0, 33451.0, 163752.0, 492601.0, 265962.0, 56182.0, 13643.0, 4302.0, 1715.0, 730.0, 440.0, 248.0, 187.0, 97.0, 57.0, 49.0, 24.0, 24.0, 17.0, 9.0, 2.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2464599609375, -0.23785972595214844, -0.22925949096679688, -0.2206592559814453, -0.21205902099609375, -0.2034587860107422, -0.19485855102539062, -0.18625831604003906, -0.1776580810546875, -0.16905784606933594, -0.16045761108398438, -0.1518573760986328, -0.14325714111328125, -0.1346569061279297, -0.12605667114257812, -0.11745643615722656, -0.108856201171875, -0.10025596618652344, -0.09165573120117188, -0.08305549621582031, -0.07445526123046875, -0.06585502624511719, -0.057254791259765625, -0.04865455627441406, -0.0400543212890625, -0.03145408630371094, -0.022853851318359375, -0.014253616333007812, -0.00565338134765625, 0.0029468536376953125, 0.011547088623046875, 0.020147323608398438, 0.02874755859375, 0.03734779357910156, 0.045948028564453125, 0.05454826354980469, 0.06314849853515625, 0.07174873352050781, 0.08034896850585938, 0.08894920349121094, 0.0975494384765625, 0.10614967346191406, 0.11474990844726562, 0.12335014343261719, 0.13195037841796875, 0.1405506134033203, 0.14915084838867188, 0.15775108337402344, 0.166351318359375, 0.17495155334472656, 0.18355178833007812, 0.1921520233154297, 0.20075225830078125, 0.2093524932861328, 0.21795272827148438, 0.22655296325683594, 0.2351531982421875, 0.24375343322753906, 0.2523536682128906, 0.2609539031982422, 0.26955413818359375, 0.2781543731689453, 0.2867546081542969, 0.29535484313964844, 0.303955078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 11.0, 15.0, 13.0, 8.0, 18.0, 9.0, 21.0, 27.0, 30.0, 35.0, 37.0, 26.0, 51.0, 37.0, 41.0, 44.0, 46.0, 58.0, 39.0, 29.0, 35.0, 45.0, 29.0, 30.0, 36.0, 28.0, 19.0, 18.0, 21.0, 16.0, 10.0, 13.0, 10.0, 12.0, 6.0, 6.0, 15.0, 5.0, 7.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.09393310546875, -2.0277099609375, -1.96148681640625, -1.895263671875, -1.82904052734375, -1.7628173828125, -1.69659423828125, -1.63037109375, -1.56414794921875, -1.4979248046875, -1.43170166015625, -1.365478515625, -1.29925537109375, -1.2330322265625, -1.16680908203125, -1.1005859375, -1.03436279296875, -0.9681396484375, -0.90191650390625, -0.835693359375, -0.76947021484375, -0.7032470703125, -0.63702392578125, -0.57080078125, -0.50457763671875, -0.4383544921875, -0.37213134765625, -0.305908203125, -0.23968505859375, -0.1734619140625, -0.10723876953125, -0.041015625, 0.02520751953125, 0.0914306640625, 0.15765380859375, 0.223876953125, 0.29010009765625, 0.3563232421875, 0.42254638671875, 0.48876953125, 0.55499267578125, 0.6212158203125, 0.68743896484375, 0.753662109375, 0.81988525390625, 0.8861083984375, 0.95233154296875, 1.0185546875, 1.08477783203125, 1.1510009765625, 1.21722412109375, 1.283447265625, 1.34967041015625, 1.4158935546875, 1.48211669921875, 1.54833984375, 1.61456298828125, 1.6807861328125, 1.74700927734375, 1.813232421875, 1.87945556640625, 1.9456787109375, 2.01190185546875, 2.078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 15.0, 28.0, 31.0, 50.0, 66.0, 106.0, 189.0, 333.0, 645.0, 1379.0, 3352.0, 10236.0, 40243.0, 230384.0, 584235.0, 138243.0, 26624.0, 7355.0, 2703.0, 1093.0, 530.0, 249.0, 147.0, 80.0, 71.0, 42.0, 30.0, 26.0, 16.0, 18.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.1258544921875, -0.1225738525390625, -0.119293212890625, -0.1160125732421875, -0.11273193359375, -0.1094512939453125, -0.106170654296875, -0.1028900146484375, -0.099609375, -0.0963287353515625, -0.093048095703125, -0.0897674560546875, -0.08648681640625, -0.0832061767578125, -0.079925537109375, -0.0766448974609375, -0.0733642578125, -0.0700836181640625, -0.066802978515625, -0.0635223388671875, -0.06024169921875, -0.0569610595703125, -0.053680419921875, -0.0503997802734375, -0.047119140625, -0.0438385009765625, -0.040557861328125, -0.0372772216796875, -0.03399658203125, -0.0307159423828125, -0.027435302734375, -0.0241546630859375, -0.0208740234375, -0.0175933837890625, -0.014312744140625, -0.0110321044921875, -0.00775146484375, -0.0044708251953125, -0.001190185546875, 0.0020904541015625, 0.00537109375, 0.0086517333984375, 0.011932373046875, 0.0152130126953125, 0.01849365234375, 0.0217742919921875, 0.025054931640625, 0.0283355712890625, 0.0316162109375, 0.0348968505859375, 0.038177490234375, 0.0414581298828125, 0.04473876953125, 0.0480194091796875, 0.051300048828125, 0.0545806884765625, 0.057861328125, 0.0611419677734375, 0.064422607421875, 0.0677032470703125, 0.07098388671875, 0.0742645263671875, 0.077545166015625, 0.0808258056640625, 0.0841064453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 15.0, 13.0, 22.0, 27.0, 46.0, 48.0, 70.0, 84.0, 96.0, 105.0, 114.0, 77.0, 56.0, 53.0, 37.0, 31.0, 24.0, 13.0, 18.0, 8.0, 4.0, 10.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.324052810668945e-05, -6.123911589384079e-05, -5.9237703680992126e-05, -5.723629146814346e-05, -5.52348792552948e-05, -5.3233467042446136e-05, -5.123205482959747e-05, -4.923064261674881e-05, -4.7229230403900146e-05, -4.522781819105148e-05, -4.322640597820282e-05, -4.1224993765354156e-05, -3.922358155250549e-05, -3.722216933965683e-05, -3.5220757126808167e-05, -3.32193449139595e-05, -3.121793270111084e-05, -2.9216520488262177e-05, -2.7215108275413513e-05, -2.521369606256485e-05, -2.3212283849716187e-05, -2.1210871636867523e-05, -1.920945942401886e-05, -1.7208047211170197e-05, -1.5206634998321533e-05, -1.320522278547287e-05, -1.1203810572624207e-05, -9.202398359775543e-06, -7.20098614692688e-06, -5.1995739340782166e-06, -3.1981617212295532e-06, -1.1967495083808899e-06, 8.046627044677734e-07, 2.8060749173164368e-06, 4.8074871301651e-06, 6.8088993430137634e-06, 8.810311555862427e-06, 1.081172376871109e-05, 1.2813135981559753e-05, 1.4814548194408417e-05, 1.681596040725708e-05, 1.8817372620105743e-05, 2.0818784832954407e-05, 2.282019704580307e-05, 2.4821609258651733e-05, 2.6823021471500397e-05, 2.882443368434906e-05, 3.0825845897197723e-05, 3.282725811004639e-05, 3.482867032289505e-05, 3.683008253574371e-05, 3.883149474859238e-05, 4.083290696144104e-05, 4.28343191742897e-05, 4.483573138713837e-05, 4.683714359998703e-05, 4.883855581283569e-05, 5.083996802568436e-05, 5.284138023853302e-05, 5.484279245138168e-05, 5.684420466423035e-05, 5.884561687707901e-05, 6.084702908992767e-05, 6.284844130277634e-05, 6.4849853515625e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 9.0, 14.0, 13.0, 9.0, 13.0, 29.0, 41.0, 50.0, 62.0, 94.0, 139.0, 194.0, 343.0, 574.0, 1056.0, 2080.0, 4543.0, 11026.0, 34572.0, 143975.0, 497216.0, 264014.0, 58813.0, 17030.0, 6421.0, 2888.0, 1402.0, 742.0, 413.0, 248.0, 155.0, 102.0, 80.0, 42.0, 27.0, 31.0, 24.0, 20.0, 12.0, 13.0, 5.0, 2.0, 8.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09637451171875, -0.09323501586914062, -0.09009552001953125, -0.08695602416992188, -0.0838165283203125, -0.08067703247070312, -0.07753753662109375, -0.07439804077148438, -0.071258544921875, -0.06811904907226562, -0.06497955322265625, -0.061840057373046875, -0.0587005615234375, -0.055561065673828125, -0.05242156982421875, -0.049282073974609375, -0.046142578125, -0.043003082275390625, -0.03986358642578125, -0.036724090576171875, -0.0335845947265625, -0.030445098876953125, -0.02730560302734375, -0.024166107177734375, -0.021026611328125, -0.017887115478515625, -0.01474761962890625, -0.011608123779296875, -0.0084686279296875, -0.005329132080078125, -0.00218963623046875, 0.000949859619140625, 0.00408935546875, 0.007228851318359375, 0.01036834716796875, 0.013507843017578125, 0.0166473388671875, 0.019786834716796875, 0.02292633056640625, 0.026065826416015625, 0.029205322265625, 0.032344818115234375, 0.03548431396484375, 0.038623809814453125, 0.0417633056640625, 0.044902801513671875, 0.04804229736328125, 0.051181793212890625, 0.0543212890625, 0.057460784912109375, 0.06060028076171875, 0.06373977661132812, 0.0668792724609375, 0.07001876831054688, 0.07315826416015625, 0.07629776000976562, 0.079437255859375, 0.08257675170898438, 0.08571624755859375, 0.08885574340820312, 0.0919952392578125, 0.09513473510742188, 0.09827423095703125, 0.10141372680664062, 0.10455322265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 6.0, 4.0, 8.0, 8.0, 12.0, 9.0, 38.0, 37.0, 44.0, 41.0, 73.0, 94.0, 83.0, 83.0, 88.0, 82.0, 63.0, 51.0, 44.0, 29.0, 17.0, 26.0, 11.0, 6.0, 12.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0306854248046875, -0.0298919677734375, -0.0290985107421875, -0.0283050537109375, -0.0275115966796875, -0.0267181396484375, -0.0259246826171875, -0.0251312255859375, -0.0243377685546875, -0.0235443115234375, -0.0227508544921875, -0.0219573974609375, -0.0211639404296875, -0.0203704833984375, -0.0195770263671875, -0.0187835693359375, -0.0179901123046875, -0.0171966552734375, -0.0164031982421875, -0.0156097412109375, -0.0148162841796875, -0.0140228271484375, -0.0132293701171875, -0.0124359130859375, -0.0116424560546875, -0.0108489990234375, -0.0100555419921875, -0.0092620849609375, -0.0084686279296875, -0.0076751708984375, -0.0068817138671875, -0.0060882568359375, -0.0052947998046875, -0.0045013427734375, -0.0037078857421875, -0.0029144287109375, -0.0021209716796875, -0.0013275146484375, -0.0005340576171875, 0.0002593994140625, 0.0010528564453125, 0.0018463134765625, 0.0026397705078125, 0.0034332275390625, 0.0042266845703125, 0.0050201416015625, 0.0058135986328125, 0.0066070556640625, 0.0074005126953125, 0.0081939697265625, 0.0089874267578125, 0.0097808837890625, 0.0105743408203125, 0.0113677978515625, 0.0121612548828125, 0.0129547119140625, 0.0137481689453125, 0.0145416259765625, 0.0153350830078125, 0.0161285400390625, 0.0169219970703125, 0.0177154541015625, 0.0185089111328125, 0.0193023681640625, 0.0200958251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 9.0, 10.0, 23.0, 24.0, 35.0, 46.0, 56.0, 63.0, 94.0, 97.0, 88.0, 109.0, 86.0, 60.0, 55.0, 40.0, 23.0, 20.0, 18.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6849658489227295, -1.6311278343200684, -1.5772899389266968, -1.5234519243240356, -1.4696139097213745, -1.415776014328003, -1.3619379997253418, -1.3080999851226807, -1.2542619705200195, -1.2004239559173584, -1.1465860605239868, -1.0927480459213257, -1.0389100313186646, -0.9850720763206482, -0.9312341213226318, -0.8773961067199707, -0.8235582113265991, -0.7697202563285828, -0.7158822417259216, -0.6620442867279053, -0.6082062721252441, -0.5543683171272278, -0.5005303621292114, -0.4466923773288727, -0.39285439252853394, -0.3390164077281952, -0.28517842292785645, -0.2313404679298401, -0.17750248312950134, -0.1236644983291626, -0.06982654333114624, -0.015988558530807495, 0.0378495454788208, 0.09168752282857895, 0.1455255001783371, 0.19936347007751465, 0.2532014548778534, 0.30703943967819214, 0.3608773946762085, 0.41471537947654724, 0.468553364276886, 0.5223913192749023, 0.5762293338775635, 0.6300672888755798, 0.6839052438735962, 0.7377432584762573, 0.7915812134742737, 0.84541916847229, 0.8992571830749512, 0.9530951380729675, 1.0069330930709839, 1.060771107673645, 1.1146091222763062, 1.1684470176696777, 1.2222850322723389, 1.276123046875, 1.3299610614776611, 1.3837990760803223, 1.4376369714736938, 1.491474986076355, 1.5453130006790161, 1.5991508960723877, 1.6529889106750488, 1.70682692527771, 1.7606648206710815]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 5.0, 5.0, 11.0, 17.0, 20.0, 23.0, 24.0, 17.0, 33.0, 35.0, 43.0, 42.0, 45.0, 49.0, 48.0, 57.0, 60.0, 53.0, 52.0, 47.0, 26.0, 44.0, 30.0, 28.0, 21.0, 22.0, 35.0, 16.0, 12.0, 11.0, 12.0, 9.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9726780652999878, -0.9380478858947754, -0.903417706489563, -0.8687874674797058, -0.8341572880744934, -0.799527108669281, -0.7648968696594238, -0.7302666902542114, -0.695636510848999, -0.6610063314437866, -0.6263761520385742, -0.591745913028717, -0.5571157336235046, -0.5224855542182922, -0.48785534501075745, -0.45322513580322266, -0.41859495639801025, -0.38396477699279785, -0.34933456778526306, -0.31470435857772827, -0.28007417917251587, -0.24544398486614227, -0.21081379055976868, -0.17618359625339508, -0.14155340194702148, -0.10692320764064789, -0.07229301333427429, -0.037662819027900696, -0.0030326247215270996, 0.0315975695848465, 0.06622776389122009, 0.10085795819759369, 0.13548815250396729, 0.17011834681034088, 0.20474854111671448, 0.23937873542308807, 0.27400892972946167, 0.3086391091346741, 0.34326931834220886, 0.37789952754974365, 0.41252970695495605, 0.44715988636016846, 0.48179009556770325, 0.516420304775238, 0.5510504841804504, 0.5856806635856628, 0.62031090259552, 0.6549410820007324, 0.6895712614059448, 0.7242014408111572, 0.7588316202163696, 0.7934618592262268, 0.8280920386314392, 0.8627222180366516, 0.8973524570465088, 0.9319826364517212, 0.9666128158569336, 1.001242995262146, 1.0358731746673584, 1.0705033540725708, 1.1051335334777832, 1.1397638320922852, 1.1743940114974976, 1.20902419090271, 1.2436543703079224]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 4.0, 11.0, 4.0, 17.0, 22.0, 29.0, 49.0, 44.0, 67.0, 121.0, 173.0, 299.0, 450.0, 811.0, 1467.0, 2864.0, 5878.0, 13789.0, 36316.0, 145395.0, 630537.0, 147493.0, 36434.0, 13689.0, 6064.0, 2866.0, 1504.0, 810.0, 462.0, 311.0, 193.0, 140.0, 65.0, 61.0, 33.0, 28.0, 14.0, 10.0, 8.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6796875, -1.6227569580078125, -1.565826416015625, -1.5088958740234375, -1.45196533203125, -1.3950347900390625, -1.338104248046875, -1.2811737060546875, -1.2242431640625, -1.1673126220703125, -1.110382080078125, -1.0534515380859375, -0.99652099609375, -0.9395904541015625, -0.882659912109375, -0.8257293701171875, -0.768798828125, -0.7118682861328125, -0.654937744140625, -0.5980072021484375, -0.54107666015625, -0.4841461181640625, -0.427215576171875, -0.3702850341796875, -0.3133544921875, -0.2564239501953125, -0.199493408203125, -0.1425628662109375, -0.08563232421875, -0.0287017822265625, 0.028228759765625, 0.0851593017578125, 0.14208984375, 0.1990203857421875, 0.255950927734375, 0.3128814697265625, 0.36981201171875, 0.4267425537109375, 0.483673095703125, 0.5406036376953125, 0.5975341796875, 0.6544647216796875, 0.711395263671875, 0.7683258056640625, 0.82525634765625, 0.8821868896484375, 0.939117431640625, 0.9960479736328125, 1.052978515625, 1.1099090576171875, 1.166839599609375, 1.2237701416015625, 1.28070068359375, 1.3376312255859375, 1.394561767578125, 1.4514923095703125, 1.5084228515625, 1.5653533935546875, 1.622283935546875, 1.6792144775390625, 1.73614501953125, 1.7930755615234375, 1.850006103515625, 1.9069366455078125, 1.9638671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 9.0, 6.0, 12.0, 19.0, 21.0, 15.0, 28.0, 28.0, 33.0, 31.0, 38.0, 57.0, 57.0, 59.0, 52.0, 58.0, 49.0, 47.0, 50.0, 49.0, 30.0, 38.0, 28.0, 29.0, 26.0, 29.0, 23.0, 11.0, 5.0, 12.0, 5.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.34765625, -2.267669677734375, -2.18768310546875, -2.107696533203125, -2.0277099609375, -1.947723388671875, -1.86773681640625, -1.787750244140625, -1.707763671875, -1.627777099609375, -1.54779052734375, -1.467803955078125, -1.3878173828125, -1.307830810546875, -1.22784423828125, -1.147857666015625, -1.06787109375, -0.987884521484375, -0.90789794921875, -0.827911376953125, -0.7479248046875, -0.667938232421875, -0.58795166015625, -0.507965087890625, -0.427978515625, -0.347991943359375, -0.26800537109375, -0.188018798828125, -0.1080322265625, -0.028045654296875, 0.05194091796875, 0.131927490234375, 0.2119140625, 0.291900634765625, 0.37188720703125, 0.451873779296875, 0.5318603515625, 0.611846923828125, 0.69183349609375, 0.771820068359375, 0.851806640625, 0.931793212890625, 1.01177978515625, 1.091766357421875, 1.1717529296875, 1.251739501953125, 1.33172607421875, 1.411712646484375, 1.49169921875, 1.571685791015625, 1.65167236328125, 1.731658935546875, 1.8116455078125, 1.891632080078125, 1.97161865234375, 2.051605224609375, 2.131591796875, 2.211578369140625, 2.29156494140625, 2.371551513671875, 2.4515380859375, 2.531524658203125, 2.61151123046875, 2.691497802734375, 2.771484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 6.0, 12.0, 20.0, 20.0, 42.0, 70.0, 107.0, 222.0, 548.0, 1752.0, 7510.0, 42669.0, 760811.0, 208594.0, 20208.0, 4091.0, 1091.0, 363.0, 157.0, 92.0, 46.0, 40.0, 24.0, 14.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.28125, -4.173675537109375, -4.06610107421875, -3.958526611328125, -3.8509521484375, -3.743377685546875, -3.63580322265625, -3.528228759765625, -3.420654296875, -3.313079833984375, -3.20550537109375, -3.097930908203125, -2.9903564453125, -2.882781982421875, -2.77520751953125, -2.667633056640625, -2.56005859375, -2.452484130859375, -2.34490966796875, -2.237335205078125, -2.1297607421875, -2.022186279296875, -1.91461181640625, -1.807037353515625, -1.699462890625, -1.591888427734375, -1.48431396484375, -1.376739501953125, -1.2691650390625, -1.161590576171875, -1.05401611328125, -0.946441650390625, -0.8388671875, -0.731292724609375, -0.62371826171875, -0.516143798828125, -0.4085693359375, -0.300994873046875, -0.19342041015625, -0.085845947265625, 0.021728515625, 0.129302978515625, 0.23687744140625, 0.344451904296875, 0.4520263671875, 0.559600830078125, 0.66717529296875, 0.774749755859375, 0.88232421875, 0.989898681640625, 1.09747314453125, 1.205047607421875, 1.3126220703125, 1.420196533203125, 1.52777099609375, 1.635345458984375, 1.742919921875, 1.850494384765625, 1.95806884765625, 2.065643310546875, 2.1732177734375, 2.280792236328125, 2.38836669921875, 2.495941162109375, 2.603515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 7.0, 11.0, 15.0, 24.0, 16.0, 19.0, 18.0, 15.0, 17.0, 47.0, 40.0, 41.0, 45.0, 50.0, 66.0, 60.0, 69.0, 52.0, 43.0, 46.0, 49.0, 34.0, 38.0, 32.0, 24.0, 18.0, 15.0, 11.0, 15.0, 11.0, 6.0, 4.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.74609375, -3.634857177734375, -3.52362060546875, -3.412384033203125, -3.3011474609375, -3.189910888671875, -3.07867431640625, -2.967437744140625, -2.856201171875, -2.744964599609375, -2.63372802734375, -2.522491455078125, -2.4112548828125, -2.300018310546875, -2.18878173828125, -2.077545166015625, -1.96630859375, -1.855072021484375, -1.74383544921875, -1.632598876953125, -1.5213623046875, -1.410125732421875, -1.29888916015625, -1.187652587890625, -1.076416015625, -0.965179443359375, -0.85394287109375, -0.742706298828125, -0.6314697265625, -0.520233154296875, -0.40899658203125, -0.297760009765625, -0.1865234375, -0.075286865234375, 0.03594970703125, 0.147186279296875, 0.2584228515625, 0.369659423828125, 0.48089599609375, 0.592132568359375, 0.703369140625, 0.814605712890625, 0.92584228515625, 1.037078857421875, 1.1483154296875, 1.259552001953125, 1.37078857421875, 1.482025146484375, 1.59326171875, 1.704498291015625, 1.81573486328125, 1.926971435546875, 2.0382080078125, 2.149444580078125, 2.26068115234375, 2.371917724609375, 2.483154296875, 2.594390869140625, 2.70562744140625, 2.816864013671875, 2.9281005859375, 3.039337158203125, 3.15057373046875, 3.261810302734375, 3.373046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 4.0, 18.0, 21.0, 29.0, 45.0, 96.0, 204.0, 644.0, 2165.0, 9775.0, 61268.0, 773860.0, 174144.0, 20389.0, 4136.0, 1048.0, 349.0, 142.0, 91.0, 32.0, 24.0, 18.0, 9.0, 6.0, 4.0, 10.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90576171875, -0.8788986206054688, -0.8520355224609375, -0.8251724243164062, -0.798309326171875, -0.7714462280273438, -0.7445831298828125, -0.7177200317382812, -0.69085693359375, -0.6639938354492188, -0.6371307373046875, -0.6102676391601562, -0.583404541015625, -0.5565414428710938, -0.5296783447265625, -0.5028152465820312, -0.4759521484375, -0.44908905029296875, -0.4222259521484375, -0.39536285400390625, -0.368499755859375, -0.34163665771484375, -0.3147735595703125, -0.28791046142578125, -0.26104736328125, -0.23418426513671875, -0.2073211669921875, -0.18045806884765625, -0.153594970703125, -0.12673187255859375, -0.0998687744140625, -0.07300567626953125, -0.046142578125, -0.01927947998046875, 0.0075836181640625, 0.03444671630859375, 0.061309814453125, 0.08817291259765625, 0.1150360107421875, 0.14189910888671875, 0.16876220703125, 0.19562530517578125, 0.2224884033203125, 0.24935150146484375, 0.276214599609375, 0.30307769775390625, 0.3299407958984375, 0.35680389404296875, 0.3836669921875, 0.41053009033203125, 0.4373931884765625, 0.46425628662109375, 0.491119384765625, 0.5179824829101562, 0.5448455810546875, 0.5717086791992188, 0.59857177734375, 0.6254348754882812, 0.6522979736328125, 0.6791610717773438, 0.706024169921875, 0.7328872680664062, 0.7597503662109375, 0.7866134643554688, 0.8134765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 12.0, 7.0, 10.0, 15.0, 26.0, 29.0, 45.0, 71.0, 78.0, 189.0, 171.0, 105.0, 62.0, 48.0, 32.0, 27.0, 22.0, 18.0, 4.0, 11.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001310110092163086, -0.000127376988530159, -0.0001237429678440094, -0.0001201089471578598, -0.0001164749264717102, -0.00011284090578556061, -0.00010920688509941101, -0.00010557286441326141, -0.00010193884372711182, -9.830482304096222e-05, -9.467080235481262e-05, -9.103678166866302e-05, -8.740276098251343e-05, -8.376874029636383e-05, -8.013471961021423e-05, -7.650069892406464e-05, -7.286667823791504e-05, -6.923265755176544e-05, -6.559863686561584e-05, -6.196461617946625e-05, -5.833059549331665e-05, -5.469657480716705e-05, -5.1062554121017456e-05, -4.742853343486786e-05, -4.379451274871826e-05, -4.0160492062568665e-05, -3.652647137641907e-05, -3.289245069026947e-05, -2.9258430004119873e-05, -2.5624409317970276e-05, -2.199038863182068e-05, -1.835636794567108e-05, -1.4722347259521484e-05, -1.1088326573371887e-05, -7.45430588722229e-06, -3.820285201072693e-06, -1.862645149230957e-07, 3.4477561712265015e-06, 7.081776857376099e-06, 1.0715797543525696e-05, 1.4349818229675293e-05, 1.798383891582489e-05, 2.1617859601974487e-05, 2.5251880288124084e-05, 2.888590097427368e-05, 3.251992166042328e-05, 3.6153942346572876e-05, 3.978796303272247e-05, 4.342198371887207e-05, 4.705600440502167e-05, 5.0690025091171265e-05, 5.432404577732086e-05, 5.795806646347046e-05, 6.159208714962006e-05, 6.522610783576965e-05, 6.886012852191925e-05, 7.249414920806885e-05, 7.612816989421844e-05, 7.976219058036804e-05, 8.339621126651764e-05, 8.703023195266724e-05, 9.066425263881683e-05, 9.429827332496643e-05, 9.793229401111603e-05, 0.00010156631469726562]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 14.0, 20.0, 24.0, 36.0, 61.0, 103.0, 178.0, 280.0, 611.0, 1197.0, 3072.0, 8887.0, 30303.0, 149372.0, 700751.0, 115535.0, 25411.0, 7645.0, 2739.0, 1142.0, 491.0, 280.0, 153.0, 84.0, 50.0, 31.0, 26.0, 21.0, 17.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55419921875, -0.533233642578125, -0.51226806640625, -0.491302490234375, -0.4703369140625, -0.449371337890625, -0.42840576171875, -0.407440185546875, -0.386474609375, -0.365509033203125, -0.34454345703125, -0.323577880859375, -0.3026123046875, -0.281646728515625, -0.26068115234375, -0.239715576171875, -0.21875, -0.197784423828125, -0.17681884765625, -0.155853271484375, -0.1348876953125, -0.113922119140625, -0.09295654296875, -0.071990966796875, -0.051025390625, -0.030059814453125, -0.00909423828125, 0.011871337890625, 0.0328369140625, 0.053802490234375, 0.07476806640625, 0.095733642578125, 0.11669921875, 0.137664794921875, 0.15863037109375, 0.179595947265625, 0.2005615234375, 0.221527099609375, 0.24249267578125, 0.263458251953125, 0.284423828125, 0.305389404296875, 0.32635498046875, 0.347320556640625, 0.3682861328125, 0.389251708984375, 0.41021728515625, 0.431182861328125, 0.4521484375, 0.473114013671875, 0.49407958984375, 0.515045166015625, 0.5360107421875, 0.556976318359375, 0.57794189453125, 0.598907470703125, 0.619873046875, 0.640838623046875, 0.66180419921875, 0.682769775390625, 0.7037353515625, 0.724700927734375, 0.74566650390625, 0.766632080078125, 0.78759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 10.0, 10.0, 10.0, 6.0, 15.0, 23.0, 21.0, 27.0, 31.0, 44.0, 76.0, 122.0, 161.0, 132.0, 99.0, 45.0, 39.0, 24.0, 24.0, 13.0, 11.0, 12.0, 14.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.425048828125, -0.41400909423828125, -0.4029693603515625, -0.39192962646484375, -0.380889892578125, -0.36985015869140625, -0.3588104248046875, -0.34777069091796875, -0.33673095703125, -0.32569122314453125, -0.3146514892578125, -0.30361175537109375, -0.292572021484375, -0.28153228759765625, -0.2704925537109375, -0.25945281982421875, -0.2484130859375, -0.23737335205078125, -0.2263336181640625, -0.21529388427734375, -0.204254150390625, -0.19321441650390625, -0.1821746826171875, -0.17113494873046875, -0.16009521484375, -0.14905548095703125, -0.1380157470703125, -0.12697601318359375, -0.115936279296875, -0.10489654541015625, -0.0938568115234375, -0.08281707763671875, -0.07177734375, -0.06073760986328125, -0.0496978759765625, -0.03865814208984375, -0.027618408203125, -0.01657867431640625, -0.0055389404296875, 0.00550079345703125, 0.01654052734375, 0.02758026123046875, 0.0386199951171875, 0.04965972900390625, 0.060699462890625, 0.07173919677734375, 0.0827789306640625, 0.09381866455078125, 0.1048583984375, 0.11589813232421875, 0.1269378662109375, 0.13797760009765625, 0.149017333984375, 0.16005706787109375, 0.1710968017578125, 0.18213653564453125, 0.19317626953125, 0.20421600341796875, 0.2152557373046875, 0.22629547119140625, 0.237335205078125, 0.24837493896484375, 0.2594146728515625, 0.27045440673828125, 0.281494140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 15.0, 42.0, 66.0, 129.0, 176.0, 192.0, 164.0, 96.0, 53.0, 25.0, 19.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.952287197113037, -2.713155508041382, -2.4740238189697266, -2.234891891479492, -1.9957603216171265, -1.7566286325454712, -1.5174968242645264, -1.278365135192871, -1.0392334461212158, -0.8001017570495605, -0.5609700083732605, -0.32183825969696045, -0.08270657062530518, 0.1564251184463501, 0.3955569267272949, 0.6346886157989502, 0.8738203048706055, 1.1129519939422607, 1.352083683013916, 1.5912154912948608, 1.8303471803665161, 2.069478988647461, 2.308610677719116, 2.5477423667907715, 2.7868740558624268, 3.026005744934082, 3.2651374340057373, 3.5042691230773926, 3.743401050567627, 3.982532501220703, 4.2216644287109375, 4.460796356201172, 4.699928283691406, 4.939060211181641, 5.178191661834717, 5.417323589324951, 5.656455039978027, 5.895586967468262, 6.134718894958496, 6.373850345611572, 6.612981796264648, 6.852113723754883, 7.091245174407959, 7.330377101898193, 7.5695085525512695, 7.808640480041504, 8.047772407531738, 8.286903381347656, 8.52603530883789, 8.765167236328125, 9.00429916381836, 9.243430137634277, 9.482562065124512, 9.721693992614746, 9.96082592010498, 10.199956893920898, 10.43908977508545, 10.678221702575684, 10.917353630065918, 11.156484603881836, 11.39561653137207, 11.634748458862305, 11.873880386352539, 12.113012313842773, 12.352143287658691]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 5.0, 13.0, 4.0, 18.0, 16.0, 14.0, 24.0, 31.0, 20.0, 28.0, 31.0, 35.0, 39.0, 41.0, 48.0, 37.0, 30.0, 43.0, 40.0, 42.0, 40.0, 39.0, 30.0, 38.0, 33.0, 33.0, 35.0, 26.0, 18.0, 22.0, 18.0, 18.0, 12.0, 18.0, 9.0, 10.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.527335166931152, -6.350761413574219, -6.174187660217285, -5.997613906860352, -5.821040630340576, -5.644466876983643, -5.467893123626709, -5.291319370269775, -5.11474609375, -4.938172340393066, -4.761598587036133, -4.585024833679199, -4.408451557159424, -4.23187780380249, -4.055304050445557, -3.878730297088623, -3.7021565437316895, -3.525582790374756, -3.3490092754364014, -3.1724355220794678, -2.9958620071411133, -2.8192882537841797, -2.642714500427246, -2.4661407470703125, -2.289567232131958, -2.1129934787750244, -1.93641996383667, -1.7598462104797363, -1.5832725763320923, -1.4066989421844482, -1.2301251888275146, -1.0535515546798706, -0.8769774436950684, -0.7004038095474243, -0.5238301157951355, -0.3472564220428467, -0.17068278789520264, 0.005890846252441406, 0.182464599609375, 0.35903823375701904, 0.5356118679046631, 0.7121855020523071, 0.888759195804596, 1.0653328895568848, 1.2419065237045288, 1.4184801578521729, 1.5950539112091064, 1.7716275453567505, 1.9482011795043945, 2.124774932861328, 2.3013484477996826, 2.477922201156616, 2.6544957160949707, 2.8310694694519043, 3.007643222808838, 3.1842169761657715, 3.360790491104126, 3.5373642444610596, 3.713937759399414, 3.8905115127563477, 4.067085266113281, 4.243659019470215, 4.420232772827148, 4.596806049346924, 4.773379802703857]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 9.0, 7.0, 21.0, 22.0, 16.0, 45.0, 50.0, 84.0, 116.0, 184.0, 370.0, 703.0, 1854.0, 5358.0, 21717.0, 269852.0, 3773701.0, 99776.0, 13849.0, 3799.0, 1354.0, 578.0, 280.0, 147.0, 94.0, 66.0, 53.0, 36.0, 27.0, 21.0, 16.0, 17.0, 11.0, 7.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.13360595703125, -4.0133056640625, -3.89300537109375, -3.772705078125, -3.65240478515625, -3.5321044921875, -3.41180419921875, -3.29150390625, -3.17120361328125, -3.0509033203125, -2.93060302734375, -2.810302734375, -2.69000244140625, -2.5697021484375, -2.44940185546875, -2.3291015625, -2.20880126953125, -2.0885009765625, -1.96820068359375, -1.847900390625, -1.72760009765625, -1.6072998046875, -1.48699951171875, -1.36669921875, -1.24639892578125, -1.1260986328125, -1.00579833984375, -0.885498046875, -0.76519775390625, -0.6448974609375, -0.52459716796875, -0.404296875, -0.28399658203125, -0.1636962890625, -0.04339599609375, 0.076904296875, 0.19720458984375, 0.3175048828125, 0.43780517578125, 0.55810546875, 0.67840576171875, 0.7987060546875, 0.91900634765625, 1.039306640625, 1.15960693359375, 1.2799072265625, 1.40020751953125, 1.5205078125, 1.64080810546875, 1.7611083984375, 1.88140869140625, 2.001708984375, 2.12200927734375, 2.2423095703125, 2.36260986328125, 2.48291015625, 2.60321044921875, 2.7235107421875, 2.84381103515625, 2.964111328125, 3.08441162109375, 3.2047119140625, 3.32501220703125, 3.4453125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 8.0, 9.0, 16.0, 18.0, 28.0, 28.0, 33.0, 37.0, 31.0, 42.0, 56.0, 34.0, 61.0, 62.0, 71.0, 73.0, 55.0, 41.0, 40.0, 38.0, 35.0, 29.0, 18.0, 20.0, 25.0, 18.0, 14.0, 10.0, 4.0, 10.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8184661865234375, -0.784393310546875, -0.7503204345703125, -0.71624755859375, -0.6821746826171875, -0.648101806640625, -0.6140289306640625, -0.5799560546875, -0.5458831787109375, -0.511810302734375, -0.4777374267578125, -0.44366455078125, -0.4095916748046875, -0.375518798828125, -0.3414459228515625, -0.307373046875, -0.2733001708984375, -0.239227294921875, -0.2051544189453125, -0.17108154296875, -0.1370086669921875, -0.102935791015625, -0.0688629150390625, -0.0347900390625, -0.0007171630859375, 0.033355712890625, 0.0674285888671875, 0.10150146484375, 0.1355743408203125, 0.169647216796875, 0.2037200927734375, 0.23779296875, 0.2718658447265625, 0.305938720703125, 0.3400115966796875, 0.37408447265625, 0.4081573486328125, 0.442230224609375, 0.4763031005859375, 0.5103759765625, 0.5444488525390625, 0.578521728515625, 0.6125946044921875, 0.64666748046875, 0.6807403564453125, 0.714813232421875, 0.7488861083984375, 0.782958984375, 0.8170318603515625, 0.851104736328125, 0.8851776123046875, 0.91925048828125, 0.9533233642578125, 0.987396240234375, 1.0214691162109375, 1.0555419921875, 1.0896148681640625, 1.123687744140625, 1.1577606201171875, 1.19183349609375, 1.2259063720703125, 1.259979248046875, 1.2940521240234375, 1.328125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 11.0, 8.0, 7.0, 11.0, 5.0, 17.0, 27.0, 33.0, 54.0, 57.0, 82.0, 152.0, 232.0, 524.0, 1387.0, 4825.0, 22037.0, 179211.0, 3489294.0, 447359.0, 38078.0, 7330.0, 1964.0, 714.0, 309.0, 167.0, 105.0, 76.0, 42.0, 36.0, 27.0, 25.0, 14.0, 14.0, 6.0, 8.0, 4.0, 9.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.84375, -2.747833251953125, -2.65191650390625, -2.555999755859375, -2.4600830078125, -2.364166259765625, -2.26824951171875, -2.172332763671875, -2.076416015625, -1.980499267578125, -1.88458251953125, -1.788665771484375, -1.6927490234375, -1.596832275390625, -1.50091552734375, -1.404998779296875, -1.30908203125, -1.213165283203125, -1.11724853515625, -1.021331787109375, -0.9254150390625, -0.829498291015625, -0.73358154296875, -0.637664794921875, -0.541748046875, -0.445831298828125, -0.34991455078125, -0.253997802734375, -0.1580810546875, -0.062164306640625, 0.03375244140625, 0.129669189453125, 0.2255859375, 0.321502685546875, 0.41741943359375, 0.513336181640625, 0.6092529296875, 0.705169677734375, 0.80108642578125, 0.897003173828125, 0.992919921875, 1.088836669921875, 1.18475341796875, 1.280670166015625, 1.3765869140625, 1.472503662109375, 1.56842041015625, 1.664337158203125, 1.76025390625, 1.856170654296875, 1.95208740234375, 2.048004150390625, 2.1439208984375, 2.239837646484375, 2.33575439453125, 2.431671142578125, 2.527587890625, 2.623504638671875, 2.71942138671875, 2.815338134765625, 2.9112548828125, 3.007171630859375, 3.10308837890625, 3.199005126953125, 3.294921875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 8.0, 15.0, 18.0, 16.0, 27.0, 43.0, 46.0, 65.0, 77.0, 127.0, 191.0, 270.0, 416.0, 586.0, 632.0, 463.0, 317.0, 216.0, 142.0, 102.0, 63.0, 58.0, 34.0, 34.0, 26.0, 13.0, 14.0, 13.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.673828125, -0.6547012329101562, -0.6355743408203125, -0.6164474487304688, -0.597320556640625, -0.5781936645507812, -0.5590667724609375, -0.5399398803710938, -0.52081298828125, -0.5016860961914062, -0.4825592041015625, -0.46343231201171875, -0.444305419921875, -0.42517852783203125, -0.4060516357421875, -0.38692474365234375, -0.3677978515625, -0.34867095947265625, -0.3295440673828125, -0.31041717529296875, -0.291290283203125, -0.27216339111328125, -0.2530364990234375, -0.23390960693359375, -0.21478271484375, -0.19565582275390625, -0.1765289306640625, -0.15740203857421875, -0.138275146484375, -0.11914825439453125, -0.1000213623046875, -0.08089447021484375, -0.061767578125, -0.04264068603515625, -0.0235137939453125, -0.00438690185546875, 0.014739990234375, 0.03386688232421875, 0.0529937744140625, 0.07212066650390625, 0.09124755859375, 0.11037445068359375, 0.1295013427734375, 0.14862823486328125, 0.167755126953125, 0.18688201904296875, 0.2060089111328125, 0.22513580322265625, 0.2442626953125, 0.26338958740234375, 0.2825164794921875, 0.30164337158203125, 0.320770263671875, 0.33989715576171875, 0.3590240478515625, 0.37815093994140625, 0.39727783203125, 0.41640472412109375, 0.4355316162109375, 0.45465850830078125, 0.473785400390625, 0.49291229248046875, 0.5120391845703125, 0.5311660766601562, 0.55029296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 11.0, 22.0, 24.0, 39.0, 53.0, 73.0, 77.0, 107.0, 102.0, 105.0, 90.0, 75.0, 67.0, 51.0, 37.0, 24.0, 12.0, 15.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5456047058105469, -1.4555232524871826, -1.3654416799545288, -1.2753602266311646, -1.1852786540985107, -1.0951972007751465, -1.0051157474517822, -0.9150342345237732, -0.8249527215957642, -0.7348712086677551, -0.6447896957397461, -0.5547082424163818, -0.4646267294883728, -0.37454521656036377, -0.2844637632369995, -0.19438225030899048, -0.10430073738098145, -0.014219239354133606, 0.07586225867271423, 0.16594374179840088, 0.2560252547264099, 0.34610676765441895, 0.4361882209777832, 0.5262697339057922, 0.6163512468338013, 0.7064327597618103, 0.7965142726898193, 0.8865957260131836, 0.9766772389411926, 1.0667587518692017, 1.156840205192566, 1.2469217777252197, 1.337003231048584, 1.4270846843719482, 1.517166256904602, 1.6072477102279663, 1.6973292827606201, 1.7874107360839844, 1.8774921894073486, 1.967573642730713, 2.0576553344726562, 2.1477367877960205, 2.2378182411193848, 2.327899932861328, 2.4179813861846924, 2.5080628395080566, 2.598144292831421, 2.688225746154785, 2.7783071994781494, 2.8683886528015137, 2.958470106124878, 3.048551559448242, 3.1386332511901855, 3.22871470451355, 3.318796157836914, 3.4088776111602783, 3.4989590644836426, 3.589040517807007, 3.679121971130371, 3.7692036628723145, 3.8592851161956787, 3.949366569519043, 4.039447784423828, 4.1295294761657715, 4.219611167907715]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 3.0, 1.0, 14.0, 12.0, 10.0, 13.0, 16.0, 19.0, 25.0, 20.0, 32.0, 24.0, 42.0, 35.0, 34.0, 37.0, 49.0, 35.0, 45.0, 43.0, 32.0, 37.0, 40.0, 44.0, 48.0, 36.0, 26.0, 23.0, 21.0, 28.0, 21.0, 21.0, 14.0, 20.0, 19.0, 9.0, 9.0, 9.0, 4.0, 5.0, 4.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3104372024536133, -1.2676371335983276, -1.224837064743042, -1.182037115097046, -1.1392370462417603, -1.0964369773864746, -1.053636908531189, -1.0108368396759033, -0.9680368304252625, -0.9252367615699768, -0.8824367523193359, -0.8396366834640503, -0.7968366146087646, -0.7540366053581238, -0.7112365365028381, -0.6684365272521973, -0.6256364583969116, -0.582836389541626, -0.5400363802909851, -0.49723631143569946, -0.4544362723827362, -0.41163623332977295, -0.3688361644744873, -0.32603612542152405, -0.2832360863685608, -0.24043604731559753, -0.19763599336147308, -0.15483593940734863, -0.11203590035438538, -0.06923586130142212, -0.026435792446136475, 0.016364246606826782, 0.05916416645050049, 0.10196421295404434, 0.1447642594575882, 0.18756431341171265, 0.2303643524646759, 0.27316439151763916, 0.3159644603729248, 0.35876449942588806, 0.4015645384788513, 0.4443645775318146, 0.48716461658477783, 0.5299646854400635, 0.5727647542953491, 0.61556476354599, 0.6583648324012756, 0.7011648416519165, 0.7439649105072021, 0.7867649793624878, 0.8295649886131287, 0.8723650574684143, 0.9151650667190552, 0.9579651355743408, 1.0007652044296265, 1.043565273284912, 1.0863652229309082, 1.1291652917861938, 1.1719653606414795, 1.2147653102874756, 1.2575653791427612, 1.3003654479980469, 1.3431655168533325, 1.3859655857086182, 1.4287656545639038]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 5.0, 9.0, 18.0, 31.0, 26.0, 42.0, 50.0, 84.0, 120.0, 201.0, 353.0, 904.0, 2613.0, 11545.0, 219890.0, 767297.0, 37614.0, 4966.0, 1484.0, 558.0, 258.0, 150.0, 99.0, 63.0, 57.0, 33.0, 21.0, 15.0, 12.0, 6.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47509765625, -0.45465850830078125, -0.4342193603515625, -0.41378021240234375, -0.393341064453125, -0.37290191650390625, -0.3524627685546875, -0.33202362060546875, -0.31158447265625, -0.29114532470703125, -0.2707061767578125, -0.25026702880859375, -0.229827880859375, -0.20938873291015625, -0.1889495849609375, -0.16851043701171875, -0.1480712890625, -0.12763214111328125, -0.1071929931640625, -0.08675384521484375, -0.066314697265625, -0.04587554931640625, -0.0254364013671875, -0.00499725341796875, 0.01544189453125, 0.03588104248046875, 0.0563201904296875, 0.07675933837890625, 0.097198486328125, 0.11763763427734375, 0.1380767822265625, 0.15851593017578125, 0.178955078125, 0.19939422607421875, 0.2198333740234375, 0.24027252197265625, 0.260711669921875, 0.28115081787109375, 0.3015899658203125, 0.32202911376953125, 0.34246826171875, 0.36290740966796875, 0.3833465576171875, 0.40378570556640625, 0.424224853515625, 0.44466400146484375, 0.4651031494140625, 0.48554229736328125, 0.5059814453125, 0.5264205932617188, 0.5468597412109375, 0.5672988891601562, 0.587738037109375, 0.6081771850585938, 0.6286163330078125, 0.6490554809570312, 0.66949462890625, 0.6899337768554688, 0.7103729248046875, 0.7308120727539062, 0.751251220703125, 0.7716903686523438, 0.7921295166015625, 0.8125686645507812, 0.8330078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 6.0, 9.0, 16.0, 16.0, 22.0, 21.0, 29.0, 46.0, 42.0, 48.0, 59.0, 61.0, 61.0, 61.0, 54.0, 54.0, 47.0, 54.0, 52.0, 40.0, 39.0, 26.0, 29.0, 20.0, 19.0, 21.0, 15.0, 7.0, 6.0, 8.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.70703125, -1.6634521484375, -1.619873046875, -1.5762939453125, -1.53271484375, -1.4891357421875, -1.445556640625, -1.4019775390625, -1.3583984375, -1.3148193359375, -1.271240234375, -1.2276611328125, -1.18408203125, -1.1405029296875, -1.096923828125, -1.0533447265625, -1.009765625, -0.9661865234375, -0.922607421875, -0.8790283203125, -0.83544921875, -0.7918701171875, -0.748291015625, -0.7047119140625, -0.6611328125, -0.6175537109375, -0.573974609375, -0.5303955078125, -0.48681640625, -0.4432373046875, -0.399658203125, -0.3560791015625, -0.3125, -0.2689208984375, -0.225341796875, -0.1817626953125, -0.13818359375, -0.0946044921875, -0.051025390625, -0.0074462890625, 0.0361328125, 0.0797119140625, 0.123291015625, 0.1668701171875, 0.21044921875, 0.2540283203125, 0.297607421875, 0.3411865234375, 0.384765625, 0.4283447265625, 0.471923828125, 0.5155029296875, 0.55908203125, 0.6026611328125, 0.646240234375, 0.6898193359375, 0.7333984375, 0.7769775390625, 0.820556640625, 0.8641357421875, 0.90771484375, 0.9512939453125, 0.994873046875, 1.0384521484375, 1.08203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 9.0, 10.0, 7.0, 17.0, 20.0, 32.0, 47.0, 57.0, 80.0, 111.0, 158.0, 266.0, 463.0, 849.0, 1633.0, 3487.0, 10094.0, 42902.0, 256105.0, 545857.0, 147708.0, 26215.0, 6728.0, 2609.0, 1244.0, 675.0, 410.0, 248.0, 166.0, 94.0, 73.0, 35.0, 57.0, 19.0, 11.0, 12.0, 5.0, 5.0, 10.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2534294128417969, -0.24416351318359375, -0.23489761352539062, -0.2256317138671875, -0.21636581420898438, -0.20709991455078125, -0.19783401489257812, -0.188568115234375, -0.17930221557617188, -0.17003631591796875, -0.16077041625976562, -0.1515045166015625, -0.14223861694335938, -0.13297271728515625, -0.12370681762695312, -0.11444091796875, -0.10517501831054688, -0.09590911865234375, -0.08664321899414062, -0.0773773193359375, -0.06811141967773438, -0.05884552001953125, -0.049579620361328125, -0.040313720703125, -0.031047821044921875, -0.02178192138671875, -0.012516021728515625, -0.0032501220703125, 0.006015777587890625, 0.01528167724609375, 0.024547576904296875, 0.0338134765625, 0.043079376220703125, 0.05234527587890625, 0.061611175537109375, 0.0708770751953125, 0.08014297485351562, 0.08940887451171875, 0.09867477416992188, 0.107940673828125, 0.11720657348632812, 0.12647247314453125, 0.13573837280273438, 0.1450042724609375, 0.15427017211914062, 0.16353607177734375, 0.17280197143554688, 0.18206787109375, 0.19133377075195312, 0.20059967041015625, 0.20986557006835938, 0.2191314697265625, 0.22839736938476562, 0.23766326904296875, 0.24692916870117188, 0.256195068359375, 0.2654609680175781, 0.27472686767578125, 0.2839927673339844, 0.2932586669921875, 0.3025245666503906, 0.31179046630859375, 0.3210563659667969, 0.330322265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 12.0, 9.0, 31.0, 26.0, 32.0, 43.0, 44.0, 57.0, 43.0, 61.0, 41.0, 42.0, 59.0, 52.0, 65.0, 41.0, 49.0, 42.0, 33.0, 40.0, 25.0, 20.0, 22.0, 20.0, 16.0, 10.0, 5.0, 10.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.64453125, -3.545074462890625, -3.44561767578125, -3.346160888671875, -3.2467041015625, -3.147247314453125, -3.04779052734375, -2.948333740234375, -2.848876953125, -2.749420166015625, -2.64996337890625, -2.550506591796875, -2.4510498046875, -2.351593017578125, -2.25213623046875, -2.152679443359375, -2.05322265625, -1.953765869140625, -1.85430908203125, -1.754852294921875, -1.6553955078125, -1.555938720703125, -1.45648193359375, -1.357025146484375, -1.257568359375, -1.158111572265625, -1.05865478515625, -0.959197998046875, -0.8597412109375, -0.760284423828125, -0.66082763671875, -0.561370849609375, -0.4619140625, -0.362457275390625, -0.26300048828125, -0.163543701171875, -0.0640869140625, 0.035369873046875, 0.13482666015625, 0.234283447265625, 0.333740234375, 0.433197021484375, 0.53265380859375, 0.632110595703125, 0.7315673828125, 0.831024169921875, 0.93048095703125, 1.029937744140625, 1.12939453125, 1.228851318359375, 1.32830810546875, 1.427764892578125, 1.5272216796875, 1.626678466796875, 1.72613525390625, 1.825592041015625, 1.925048828125, 2.024505615234375, 2.12396240234375, 2.223419189453125, 2.3228759765625, 2.422332763671875, 2.52178955078125, 2.621246337890625, 2.720703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 5.0, 7.0, 2.0, 4.0, 8.0, 24.0, 30.0, 63.0, 130.0, 289.0, 738.0, 1888.0, 7004.0, 41825.0, 737265.0, 235658.0, 17740.0, 3798.0, 1213.0, 456.0, 193.0, 96.0, 65.0, 27.0, 13.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.20801162719726562, -0.20166778564453125, -0.19532394409179688, -0.1889801025390625, -0.18263626098632812, -0.17629241943359375, -0.16994857788085938, -0.163604736328125, -0.15726089477539062, -0.15091705322265625, -0.14457321166992188, -0.1382293701171875, -0.13188552856445312, -0.12554168701171875, -0.11919784545898438, -0.11285400390625, -0.10651016235351562, -0.10016632080078125, -0.09382247924804688, -0.0874786376953125, -0.08113479614257812, -0.07479095458984375, -0.06844711303710938, -0.062103271484375, -0.055759429931640625, -0.04941558837890625, -0.043071746826171875, -0.0367279052734375, -0.030384063720703125, -0.02404022216796875, -0.017696380615234375, -0.0113525390625, -0.005008697509765625, 0.00133514404296875, 0.007678985595703125, 0.0140228271484375, 0.020366668701171875, 0.02671051025390625, 0.033054351806640625, 0.039398193359375, 0.045742034912109375, 0.05208587646484375, 0.058429718017578125, 0.0647735595703125, 0.07111740112304688, 0.07746124267578125, 0.08380508422851562, 0.09014892578125, 0.09649276733398438, 0.10283660888671875, 0.10918045043945312, 0.1155242919921875, 0.12186813354492188, 0.12821197509765625, 0.13455581665039062, 0.140899658203125, 0.14724349975585938, 0.15358734130859375, 0.15993118286132812, 0.1662750244140625, 0.17261886596679688, 0.17896270751953125, 0.18530654907226562, 0.191650390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 5.0, 13.0, 8.0, 22.0, 19.0, 31.0, 56.0, 71.0, 92.0, 117.0, 117.0, 109.0, 96.0, 83.0, 51.0, 31.0, 24.0, 17.0, 11.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.192922592163086e-05, -5.942676216363907e-05, -5.692429840564728e-05, -5.442183464765549e-05, -5.1919370889663696e-05, -4.9416907131671906e-05, -4.6914443373680115e-05, -4.4411979615688324e-05, -4.190951585769653e-05, -3.940705209970474e-05, -3.690458834171295e-05, -3.440212458372116e-05, -3.189966082572937e-05, -2.939719706773758e-05, -2.689473330974579e-05, -2.4392269551753998e-05, -2.1889805793762207e-05, -1.9387342035770416e-05, -1.6884878277778625e-05, -1.4382414519786835e-05, -1.1879950761795044e-05, -9.377487003803253e-06, -6.875023245811462e-06, -4.372559487819672e-06, -1.8700957298278809e-06, 6.323680281639099e-07, 3.1348317861557007e-06, 5.6372955441474915e-06, 8.139759302139282e-06, 1.0642223060131073e-05, 1.3144686818122864e-05, 1.5647150576114655e-05, 1.8149614334106445e-05, 2.0652078092098236e-05, 2.3154541850090027e-05, 2.5657005608081818e-05, 2.815946936607361e-05, 3.06619331240654e-05, 3.316439688205719e-05, 3.566686064004898e-05, 3.816932439804077e-05, 4.067178815603256e-05, 4.317425191402435e-05, 4.5676715672016144e-05, 4.8179179430007935e-05, 5.0681643187999725e-05, 5.3184106945991516e-05, 5.568657070398331e-05, 5.81890344619751e-05, 6.069149821996689e-05, 6.319396197795868e-05, 6.569642573595047e-05, 6.819888949394226e-05, 7.070135325193405e-05, 7.320381700992584e-05, 7.570628076791763e-05, 7.820874452590942e-05, 8.071120828390121e-05, 8.3213672041893e-05, 8.57161357998848e-05, 8.821859955787659e-05, 9.072106331586838e-05, 9.322352707386017e-05, 9.572599083185196e-05, 9.822845458984375e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 15.0, 22.0, 28.0, 51.0, 89.0, 170.0, 272.0, 522.0, 912.0, 1582.0, 3029.0, 5911.0, 12022.0, 29141.0, 90231.0, 340112.0, 393616.0, 109150.0, 33951.0, 13763.0, 6556.0, 3344.0, 1811.0, 993.0, 541.0, 277.0, 173.0, 109.0, 66.0, 28.0, 12.0, 18.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08135986328125, -0.07882308959960938, -0.07628631591796875, -0.07374954223632812, -0.0712127685546875, -0.06867599487304688, -0.06613922119140625, -0.06360244750976562, -0.061065673828125, -0.058528900146484375, -0.05599212646484375, -0.053455352783203125, -0.0509185791015625, -0.048381805419921875, -0.04584503173828125, -0.043308258056640625, -0.040771484375, -0.038234710693359375, -0.03569793701171875, -0.033161163330078125, -0.0306243896484375, -0.028087615966796875, -0.02555084228515625, -0.023014068603515625, -0.020477294921875, -0.017940521240234375, -0.01540374755859375, -0.012866973876953125, -0.0103302001953125, -0.007793426513671875, -0.00525665283203125, -0.002719879150390625, -0.00018310546875, 0.002353668212890625, 0.00489044189453125, 0.007427215576171875, 0.0099639892578125, 0.012500762939453125, 0.01503753662109375, 0.017574310302734375, 0.020111083984375, 0.022647857666015625, 0.02518463134765625, 0.027721405029296875, 0.0302581787109375, 0.032794952392578125, 0.03533172607421875, 0.037868499755859375, 0.0404052734375, 0.042942047119140625, 0.04547882080078125, 0.048015594482421875, 0.0505523681640625, 0.053089141845703125, 0.05562591552734375, 0.058162689208984375, 0.060699462890625, 0.06323623657226562, 0.06577301025390625, 0.06830978393554688, 0.0708465576171875, 0.07338333129882812, 0.07592010498046875, 0.07845687866210938, 0.08099365234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 11.0, 21.0, 30.0, 42.0, 60.0, 94.0, 125.0, 152.0, 123.0, 110.0, 53.0, 35.0, 37.0, 22.0, 7.0, 11.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036590576171875, -0.035463809967041016, -0.03433704376220703, -0.03321027755737305, -0.03208351135253906, -0.030956745147705078, -0.029829978942871094, -0.02870321273803711, -0.027576446533203125, -0.02644968032836914, -0.025322914123535156, -0.024196147918701172, -0.023069381713867188, -0.021942615509033203, -0.02081584930419922, -0.019689083099365234, -0.01856231689453125, -0.017435550689697266, -0.01630878448486328, -0.015182018280029297, -0.014055252075195312, -0.012928485870361328, -0.011801719665527344, -0.01067495346069336, -0.009548187255859375, -0.00842142105102539, -0.007294654846191406, -0.006167888641357422, -0.0050411224365234375, -0.003914356231689453, -0.0027875900268554688, -0.0016608238220214844, -0.0005340576171875, 0.0005927085876464844, 0.0017194747924804688, 0.002846240997314453, 0.0039730072021484375, 0.005099773406982422, 0.006226539611816406, 0.007353305816650391, 0.008480072021484375, 0.00960683822631836, 0.010733604431152344, 0.011860370635986328, 0.012987136840820312, 0.014113903045654297, 0.015240669250488281, 0.016367435455322266, 0.01749420166015625, 0.018620967864990234, 0.01974773406982422, 0.020874500274658203, 0.022001266479492188, 0.023128032684326172, 0.024254798889160156, 0.02538156509399414, 0.026508331298828125, 0.02763509750366211, 0.028761863708496094, 0.029888629913330078, 0.031015396118164062, 0.03214216232299805, 0.03326892852783203, 0.034395694732666016, 0.0355224609375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 20.0, 24.0, 22.0, 51.0, 66.0, 71.0, 82.0, 101.0, 103.0, 96.0, 95.0, 64.0, 56.0, 47.0, 33.0, 17.0, 21.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0808062553405762, -1.0233845710754395, -0.9659629464149475, -0.9085413217544556, -0.8511196970939636, -0.7936980724334717, -0.736276388168335, -0.678854763507843, -0.6214331388473511, -0.5640115141868591, -0.5065898299217224, -0.44916820526123047, -0.3917465806007385, -0.3343249261379242, -0.27690327167510986, -0.21948164701461792, -0.1620599627494812, -0.10463832318782806, -0.04721667617559433, 0.010204970836639404, 0.06762661039829254, 0.12504824995994568, 0.18246990442276, 0.23989152908325195, 0.2973131835460663, 0.3547348380088806, 0.41215646266937256, 0.4695781171321869, 0.5269997715950012, 0.5844213962554932, 0.6418430805206299, 0.699264645576477, 0.7566863298416138, 0.8141079545021057, 0.8715296387672424, 0.9289512634277344, 0.9863728880882263, 1.0437945127487183, 1.101216197013855, 1.1586377620697021, 1.2160594463348389, 1.2734811305999756, 1.3309026956558228, 1.3883243799209595, 1.4457460641860962, 1.5031676292419434, 1.56058931350708, 1.6180109977722168, 1.6754326820373535, 1.7328543663024902, 1.7902759313583374, 1.8476976156234741, 1.9051192998886108, 1.962540864944458, 2.0199625492095947, 2.0773842334747314, 2.134805679321289, 2.192227363586426, 2.2496490478515625, 2.307070732116699, 2.364492177963257, 2.4219138622283936, 2.4793355464935303, 2.536757230758667, 2.5941789150238037]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 16.0, 14.0, 13.0, 21.0, 25.0, 32.0, 42.0, 39.0, 55.0, 43.0, 51.0, 55.0, 67.0, 53.0, 58.0, 58.0, 52.0, 49.0, 33.0, 35.0, 31.0, 37.0, 21.0, 27.0, 16.0, 10.0, 12.0, 3.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3500936031341553, -1.3102937936782837, -1.2704938650131226, -1.230694055557251, -1.1908942461013794, -1.1510944366455078, -1.1112945079803467, -1.071494698524475, -1.0316948890686035, -0.9918950200080872, -0.9520952105522156, -0.9122953414916992, -0.8724955320358276, -0.8326956629753113, -0.7928957939147949, -0.7530959844589233, -0.713296115398407, -0.6734962463378906, -0.633696436882019, -0.5938965678215027, -0.5540967583656311, -0.5142968893051147, -0.4744970500469208, -0.4346972107887268, -0.39489737153053284, -0.35509753227233887, -0.3152976930141449, -0.2754978537559509, -0.23569799959659576, -0.1958981603384018, -0.15609830617904663, -0.11629846692085266, -0.07649862766265869, -0.03669878467917442, 0.003101058304309845, 0.04290090501308441, 0.08270074427127838, 0.12250058352947235, 0.16230043768882751, 0.20210027694702148, 0.24190011620521545, 0.2816999554634094, 0.3214997947216034, 0.36129963397979736, 0.4010995030403137, 0.4408993124961853, 0.48069918155670166, 0.5204989910125732, 0.5602988600730896, 0.600098729133606, 0.6398985385894775, 0.6796984076499939, 0.7194982171058655, 0.7592980861663818, 0.7990978956222534, 0.8388977646827698, 0.8786976337432861, 0.9184975028038025, 0.9582973122596741, 0.9980971813201904, 1.037896990776062, 1.0776968002319336, 1.1174967288970947, 1.1572965383529663, 1.197096347808838]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 8.0, 16.0, 28.0, 46.0, 50.0, 87.0, 141.0, 222.0, 403.0, 721.0, 1463.0, 2760.0, 5858.0, 12809.0, 33046.0, 104302.0, 421887.0, 332861.0, 82939.0, 27581.0, 10859.0, 5055.0, 2532.0, 1291.0, 647.0, 374.0, 215.0, 133.0, 59.0, 53.0, 37.0, 19.0, 14.0, 17.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.9732666015625, -1.909423828125, -1.8455810546875, -1.78173828125, -1.7178955078125, -1.654052734375, -1.5902099609375, -1.5263671875, -1.4625244140625, -1.398681640625, -1.3348388671875, -1.27099609375, -1.2071533203125, -1.143310546875, -1.0794677734375, -1.015625, -0.9517822265625, -0.887939453125, -0.8240966796875, -0.76025390625, -0.6964111328125, -0.632568359375, -0.5687255859375, -0.5048828125, -0.4410400390625, -0.377197265625, -0.3133544921875, -0.24951171875, -0.1856689453125, -0.121826171875, -0.0579833984375, 0.005859375, 0.0697021484375, 0.133544921875, 0.1973876953125, 0.26123046875, 0.3250732421875, 0.388916015625, 0.4527587890625, 0.5166015625, 0.5804443359375, 0.644287109375, 0.7081298828125, 0.77197265625, 0.8358154296875, 0.899658203125, 0.9635009765625, 1.02734375, 1.0911865234375, 1.155029296875, 1.2188720703125, 1.28271484375, 1.3465576171875, 1.410400390625, 1.4742431640625, 1.5380859375, 1.6019287109375, 1.665771484375, 1.7296142578125, 1.79345703125, 1.8572998046875, 1.921142578125, 1.9849853515625, 2.048828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 10.0, 18.0, 15.0, 21.0, 14.0, 31.0, 38.0, 35.0, 30.0, 34.0, 35.0, 42.0, 56.0, 48.0, 57.0, 51.0, 50.0, 50.0, 39.0, 39.0, 35.0, 27.0, 35.0, 31.0, 28.0, 24.0, 15.0, 10.0, 15.0, 13.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.90234375, -1.8438720703125, -1.785400390625, -1.7269287109375, -1.66845703125, -1.6099853515625, -1.551513671875, -1.4930419921875, -1.4345703125, -1.3760986328125, -1.317626953125, -1.2591552734375, -1.20068359375, -1.1422119140625, -1.083740234375, -1.0252685546875, -0.966796875, -0.9083251953125, -0.849853515625, -0.7913818359375, -0.73291015625, -0.6744384765625, -0.615966796875, -0.5574951171875, -0.4990234375, -0.4405517578125, -0.382080078125, -0.3236083984375, -0.26513671875, -0.2066650390625, -0.148193359375, -0.0897216796875, -0.03125, 0.0272216796875, 0.085693359375, 0.1441650390625, 0.20263671875, 0.2611083984375, 0.319580078125, 0.3780517578125, 0.4365234375, 0.4949951171875, 0.553466796875, 0.6119384765625, 0.67041015625, 0.7288818359375, 0.787353515625, 0.8458251953125, 0.904296875, 0.9627685546875, 1.021240234375, 1.0797119140625, 1.13818359375, 1.1966552734375, 1.255126953125, 1.3135986328125, 1.3720703125, 1.4305419921875, 1.489013671875, 1.5474853515625, 1.60595703125, 1.6644287109375, 1.722900390625, 1.7813720703125, 1.83984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 11.0, 15.0, 31.0, 28.0, 37.0, 67.0, 90.0, 129.0, 194.0, 351.0, 582.0, 1036.0, 1824.0, 3382.0, 6636.0, 13280.0, 29826.0, 74041.0, 218096.0, 425043.0, 166631.0, 59080.0, 24607.0, 11236.0, 5474.0, 2933.0, 1572.0, 879.0, 526.0, 319.0, 219.0, 125.0, 76.0, 63.0, 36.0, 32.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7001953125, -1.6521453857421875, -1.604095458984375, -1.5560455322265625, -1.50799560546875, -1.4599456787109375, -1.411895751953125, -1.3638458251953125, -1.3157958984375, -1.2677459716796875, -1.219696044921875, -1.1716461181640625, -1.12359619140625, -1.0755462646484375, -1.027496337890625, -0.9794464111328125, -0.931396484375, -0.8833465576171875, -0.835296630859375, -0.7872467041015625, -0.73919677734375, -0.6911468505859375, -0.643096923828125, -0.5950469970703125, -0.5469970703125, -0.4989471435546875, -0.450897216796875, -0.4028472900390625, -0.35479736328125, -0.3067474365234375, -0.258697509765625, -0.2106475830078125, -0.16259765625, -0.1145477294921875, -0.066497802734375, -0.0184478759765625, 0.02960205078125, 0.0776519775390625, 0.125701904296875, 0.1737518310546875, 0.2218017578125, 0.2698516845703125, 0.317901611328125, 0.3659515380859375, 0.41400146484375, 0.4620513916015625, 0.510101318359375, 0.5581512451171875, 0.606201171875, 0.6542510986328125, 0.702301025390625, 0.7503509521484375, 0.79840087890625, 0.8464508056640625, 0.894500732421875, 0.9425506591796875, 0.9906005859375, 1.0386505126953125, 1.086700439453125, 1.1347503662109375, 1.18280029296875, 1.2308502197265625, 1.278900146484375, 1.3269500732421875, 1.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 2.0, 12.0, 7.0, 11.0, 15.0, 14.0, 23.0, 28.0, 19.0, 30.0, 25.0, 36.0, 30.0, 31.0, 39.0, 41.0, 40.0, 46.0, 50.0, 56.0, 36.0, 52.0, 48.0, 42.0, 34.0, 30.0, 26.0, 25.0, 20.0, 20.0, 15.0, 12.0, 12.0, 8.0, 7.0, 11.0, 3.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0], "bins": [-2.8359375, -2.759490966796875, -2.68304443359375, -2.606597900390625, -2.5301513671875, -2.453704833984375, -2.37725830078125, -2.300811767578125, -2.224365234375, -2.147918701171875, -2.07147216796875, -1.995025634765625, -1.9185791015625, -1.842132568359375, -1.76568603515625, -1.689239501953125, -1.61279296875, -1.536346435546875, -1.45989990234375, -1.383453369140625, -1.3070068359375, -1.230560302734375, -1.15411376953125, -1.077667236328125, -1.001220703125, -0.924774169921875, -0.84832763671875, -0.771881103515625, -0.6954345703125, -0.618988037109375, -0.54254150390625, -0.466094970703125, -0.3896484375, -0.313201904296875, -0.23675537109375, -0.160308837890625, -0.0838623046875, -0.007415771484375, 0.06903076171875, 0.145477294921875, 0.221923828125, 0.298370361328125, 0.37481689453125, 0.451263427734375, 0.5277099609375, 0.604156494140625, 0.68060302734375, 0.757049560546875, 0.83349609375, 0.909942626953125, 0.98638916015625, 1.062835693359375, 1.1392822265625, 1.215728759765625, 1.29217529296875, 1.368621826171875, 1.445068359375, 1.521514892578125, 1.59796142578125, 1.674407958984375, 1.7508544921875, 1.827301025390625, 1.90374755859375, 1.980194091796875, 2.056640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 3.0, 8.0, 14.0, 23.0, 30.0, 31.0, 60.0, 111.0, 145.0, 258.0, 412.0, 548.0, 1043.0, 1696.0, 2798.0, 4905.0, 8576.0, 15474.0, 28666.0, 53365.0, 100313.0, 192965.0, 312652.0, 151032.0, 79202.0, 42182.0, 22788.0, 12500.0, 6848.0, 3914.0, 2297.0, 1383.0, 873.0, 523.0, 310.0, 191.0, 133.0, 89.0, 65.0, 27.0, 32.0, 24.0, 12.0, 5.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.271484375, -0.26357269287109375, -0.2556610107421875, -0.24774932861328125, -0.239837646484375, -0.23192596435546875, -0.2240142822265625, -0.21610260009765625, -0.20819091796875, -0.20027923583984375, -0.1923675537109375, -0.18445587158203125, -0.176544189453125, -0.16863250732421875, -0.1607208251953125, -0.15280914306640625, -0.1448974609375, -0.13698577880859375, -0.1290740966796875, -0.12116241455078125, -0.113250732421875, -0.10533905029296875, -0.0974273681640625, -0.08951568603515625, -0.08160400390625, -0.07369232177734375, -0.0657806396484375, -0.05786895751953125, -0.049957275390625, -0.04204559326171875, -0.0341339111328125, -0.02622222900390625, -0.018310546875, -0.01039886474609375, -0.0024871826171875, 0.00542449951171875, 0.013336181640625, 0.02124786376953125, 0.0291595458984375, 0.03707122802734375, 0.04498291015625, 0.05289459228515625, 0.0608062744140625, 0.06871795654296875, 0.076629638671875, 0.08454132080078125, 0.0924530029296875, 0.10036468505859375, 0.1082763671875, 0.11618804931640625, 0.1240997314453125, 0.13201141357421875, 0.139923095703125, 0.14783477783203125, 0.1557464599609375, 0.16365814208984375, 0.17156982421875, 0.17948150634765625, 0.1873931884765625, 0.19530487060546875, 0.203216552734375, 0.21112823486328125, 0.2190399169921875, 0.22695159912109375, 0.23486328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 8.0, 8.0, 22.0, 26.0, 21.0, 31.0, 31.0, 41.0, 46.0, 61.0, 67.0, 100.0, 116.0, 68.0, 62.0, 53.0, 42.0, 32.0, 28.0, 29.0, 18.0, 12.0, 16.0, 5.0, 11.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.00012564659118652344, -0.00012251641601324081, -0.00011938624083995819, -0.00011625606566667557, -0.00011312589049339294, -0.00010999571532011032, -0.0001068655401468277, -0.00010373536497354507, -0.00010060518980026245, -9.747501462697983e-05, -9.43448394536972e-05, -9.121466428041458e-05, -8.808448910713196e-05, -8.495431393384933e-05, -8.182413876056671e-05, -7.869396358728409e-05, -7.556378841400146e-05, -7.243361324071884e-05, -6.930343806743622e-05, -6.61732628941536e-05, -6.304308772087097e-05, -5.991291254758835e-05, -5.6782737374305725e-05, -5.36525622010231e-05, -5.052238702774048e-05, -4.7392211854457855e-05, -4.426203668117523e-05, -4.113186150789261e-05, -3.8001686334609985e-05, -3.487151116132736e-05, -3.174133598804474e-05, -2.8611160814762115e-05, -2.5480985641479492e-05, -2.235081046819687e-05, -1.9220635294914246e-05, -1.6090460121631622e-05, -1.2960284948348999e-05, -9.830109775066376e-06, -6.6999346017837524e-06, -3.569759428501129e-06, -4.3958425521850586e-07, 2.6905909180641174e-06, 5.820766091346741e-06, 8.950941264629364e-06, 1.2081116437911987e-05, 1.521129161119461e-05, 1.8341466784477234e-05, 2.1471641957759857e-05, 2.460181713104248e-05, 2.7731992304325104e-05, 3.086216747760773e-05, 3.399234265089035e-05, 3.7122517824172974e-05, 4.02526929974556e-05, 4.338286817073822e-05, 4.6513043344020844e-05, 4.964321851730347e-05, 5.277339369058609e-05, 5.590356886386871e-05, 5.903374403715134e-05, 6.216391921043396e-05, 6.529409438371658e-05, 6.84242695569992e-05, 7.155444473028183e-05, 7.468461990356445e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 10.0, 7.0, 12.0, 15.0, 24.0, 33.0, 46.0, 82.0, 108.0, 157.0, 202.0, 355.0, 536.0, 876.0, 1399.0, 2320.0, 4059.0, 7350.0, 14228.0, 28981.0, 62387.0, 139447.0, 351544.0, 235351.0, 103814.0, 46820.0, 22561.0, 11237.0, 5835.0, 3473.0, 1944.0, 1170.0, 754.0, 467.0, 344.0, 202.0, 121.0, 88.0, 52.0, 48.0, 36.0, 26.0, 14.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.393310546875, -0.3820152282714844, -0.37071990966796875, -0.3594245910644531, -0.3481292724609375, -0.3368339538574219, -0.32553863525390625, -0.3142433166503906, -0.302947998046875, -0.2916526794433594, -0.28035736083984375, -0.2690620422363281, -0.2577667236328125, -0.24647140502929688, -0.23517608642578125, -0.22388076782226562, -0.21258544921875, -0.20129013061523438, -0.18999481201171875, -0.17869949340820312, -0.1674041748046875, -0.15610885620117188, -0.14481353759765625, -0.13351821899414062, -0.122222900390625, -0.11092758178710938, -0.09963226318359375, -0.08833694458007812, -0.0770416259765625, -0.06574630737304688, -0.05445098876953125, -0.043155670166015625, -0.0318603515625, -0.020565032958984375, -0.00926971435546875, 0.002025604248046875, 0.0133209228515625, 0.024616241455078125, 0.03591156005859375, 0.047206878662109375, 0.058502197265625, 0.06979751586914062, 0.08109283447265625, 0.09238815307617188, 0.1036834716796875, 0.11497879028320312, 0.12627410888671875, 0.13756942749023438, 0.14886474609375, 0.16016006469726562, 0.17145538330078125, 0.18275070190429688, 0.1940460205078125, 0.20534133911132812, 0.21663665771484375, 0.22793197631835938, 0.239227294921875, 0.2505226135253906, 0.26181793212890625, 0.2731132507324219, 0.2844085693359375, 0.2957038879394531, 0.30699920654296875, 0.3182945251464844, 0.32958984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 11.0, 10.0, 10.0, 15.0, 18.0, 22.0, 31.0, 33.0, 36.0, 42.0, 50.0, 72.0, 96.0, 93.0, 82.0, 51.0, 52.0, 49.0, 36.0, 29.0, 29.0, 28.0, 22.0, 15.0, 17.0, 9.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.2469940185546875, -0.238616943359375, -0.2302398681640625, -0.22186279296875, -0.2134857177734375, -0.205108642578125, -0.1967315673828125, -0.1883544921875, -0.1799774169921875, -0.171600341796875, -0.1632232666015625, -0.15484619140625, -0.1464691162109375, -0.138092041015625, -0.1297149658203125, -0.121337890625, -0.1129608154296875, -0.104583740234375, -0.0962066650390625, -0.08782958984375, -0.0794525146484375, -0.071075439453125, -0.0626983642578125, -0.0543212890625, -0.0459442138671875, -0.037567138671875, -0.0291900634765625, -0.02081298828125, -0.0124359130859375, -0.004058837890625, 0.0043182373046875, 0.0126953125, 0.0210723876953125, 0.029449462890625, 0.0378265380859375, 0.04620361328125, 0.0545806884765625, 0.062957763671875, 0.0713348388671875, 0.0797119140625, 0.0880889892578125, 0.096466064453125, 0.1048431396484375, 0.11322021484375, 0.1215972900390625, 0.129974365234375, 0.1383514404296875, 0.146728515625, 0.1551055908203125, 0.163482666015625, 0.1718597412109375, 0.18023681640625, 0.1886138916015625, 0.196990966796875, 0.2053680419921875, 0.2137451171875, 0.2221221923828125, 0.230499267578125, 0.2388763427734375, 0.24725341796875, 0.2556304931640625, 0.264007568359375, 0.2723846435546875, 0.28076171875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 13.0, 13.0, 28.0, 29.0, 78.0, 78.0, 95.0, 138.0, 93.0, 126.0, 104.0, 70.0, 48.0, 36.0, 17.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.894886016845703, -4.7289509773254395, -4.563016414642334, -4.39708137512207, -4.231146812438965, -4.065211772918701, -3.8992769718170166, -3.733342170715332, -3.5674073696136475, -3.401472568511963, -3.2355377674102783, -3.0696029663085938, -2.90366792678833, -2.7377333641052246, -2.571798324584961, -2.4058635234832764, -2.239928722381592, -2.0739939212799072, -1.9080591201782227, -1.7421241998672485, -1.576189398765564, -1.4102545976638794, -1.2443196773529053, -1.0783848762512207, -0.9124500751495361, -0.7465152740478516, -0.5805804133415222, -0.41464558243751526, -0.2487107515335083, -0.08277595043182373, 0.08315891027450562, 0.24909377098083496, 0.41502904891967773, 0.5809638500213623, 0.7468987107276917, 0.912833571434021, 1.0787683725357056, 1.2447031736373901, 1.4106380939483643, 1.5765728950500488, 1.7425076961517334, 1.908442497253418, 2.0743772983551025, 2.240312099456787, 2.406247138977051, 2.5721817016601562, 2.73811674118042, 2.9040515422821045, 3.069986343383789, 3.2359211444854736, 3.401855945587158, 3.5677907466888428, 3.7337255477905273, 3.899660587310791, 4.0655951499938965, 4.23153018951416, 4.397464752197266, 4.563399791717529, 4.729334354400635, 4.895269393920898, 5.061203956604004, 5.227138996124268, 5.393073558807373, 5.559008598327637, 5.7249436378479]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 7.0, 3.0, 6.0, 7.0, 8.0, 12.0, 15.0, 15.0, 17.0, 23.0, 16.0, 20.0, 14.0, 19.0, 28.0, 31.0, 39.0, 40.0, 29.0, 37.0, 44.0, 30.0, 37.0, 52.0, 32.0, 41.0, 35.0, 31.0, 30.0, 25.0, 28.0, 26.0, 24.0, 25.0, 22.0, 21.0, 17.0, 16.0, 17.0, 10.0, 17.0, 9.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.084555625915527, -3.9525306224823, -3.8205056190490723, -3.6884806156158447, -3.556455612182617, -3.4244308471679688, -3.292405843734741, -3.1603808403015137, -3.028355836868286, -2.8963308334350586, -2.764305830001831, -2.6322808265686035, -2.500256061553955, -2.3682308197021484, -2.2362060546875, -2.1041810512542725, -1.972156047821045, -1.8401310443878174, -1.7081060409545898, -1.5760811567306519, -1.4440561532974243, -1.3120311498641968, -1.1800062656402588, -1.0479812622070312, -0.9159562587738037, -0.7839312553405762, -0.6519063115119934, -0.5198813676834106, -0.3878563642501831, -0.25583136081695557, -0.1238064169883728, 0.008218526840209961, 0.1402430534362793, 0.27226802706718445, 0.4042930006980896, 0.5363179445266724, 0.6683429479598999, 0.8003679513931274, 0.9323928952217102, 1.064417839050293, 1.1964428424835205, 1.328467845916748, 1.4604928493499756, 1.5925177335739136, 1.7245427370071411, 1.8565677404403687, 1.9885926246643066, 2.120617628097534, 2.2526426315307617, 2.3846676349639893, 2.516692638397217, 2.6487176418304443, 2.780742645263672, 2.9127674102783203, 3.044792413711548, 3.1768174171447754, 3.308842420578003, 3.4408674240112305, 3.572892427444458, 3.7049174308776855, 3.836942195892334, 3.9689674377441406, 4.100992202758789, 4.2330169677734375, 4.365042209625244]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 6.0, 12.0, 9.0, 12.0, 21.0, 31.0, 37.0, 42.0, 68.0, 77.0, 113.0, 129.0, 164.0, 212.0, 235.0, 313.0, 372.0, 431.0, 512.0, 587.0, 785.0, 1167.0, 1040670.0, 929.0, 670.0, 561.0, 449.0, 399.0, 323.0, 243.0, 193.0, 190.0, 122.0, 121.0, 97.0, 75.0, 55.0, 33.0, 28.0, 29.0, 19.0, 19.0, 9.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-4.427000045776367, -4.280395984649658, -4.133791923522949, -3.9871878623962402, -3.8405838012695312, -3.6939797401428223, -3.5473756790161133, -3.4007716178894043, -3.2541675567626953, -3.1075634956359863, -2.9609594345092773, -2.8143553733825684, -2.6677513122558594, -2.5211472511291504, -2.3745431900024414, -2.2279391288757324, -2.0813350677490234, -1.9347310066223145, -1.7881269454956055, -1.6415228843688965, -1.4949188232421875, -1.3483147621154785, -1.2017107009887695, -1.0551066398620605, -0.9085025787353516, -0.7618985176086426, -0.6152944564819336, -0.4686903953552246, -0.3220863342285156, -0.17548227310180664, -0.028878211975097656, 0.11772584915161133, 0.2643303871154785, 0.4109344482421875, 0.5575385093688965, 0.7041425704956055, 0.8507466316223145, 0.9973506927490234, 1.1439547538757324, 1.2905588150024414, 1.4371628761291504, 1.5837669372558594, 1.7303709983825684, 1.8769750595092773, 2.0235791206359863, 2.1701831817626953, 2.3167872428894043, 2.4633913040161133, 2.6099953651428223, 2.7565994262695312, 2.9032034873962402, 3.049807548522949, 3.196411609649658, 3.343015670776367, 3.489619731903076, 3.636223793029785, 3.782827854156494, 3.929431915283203, 4.076035976409912, 4.222640037536621, 4.36924409866333, 4.515848159790039, 4.662452220916748, 4.809056282043457, 4.955660343170166]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 8.0, 11.0, 15.0, 35.0, 80.0, 155.0, 393.0, 1144.0, 3213.0, 9693.0, 51413792.0, 31560.0, 7211.0, 2556.0, 858.0, 317.0, 132.0, 63.0, 26.0, 21.0, 10.0, 7.0, 8.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.18787384033203, -20.453519821166992, -19.719165802001953, -18.984811782836914, -18.250457763671875, -17.516103744506836, -16.781749725341797, -16.047395706176758, -15.313041687011719, -14.57868766784668, -13.84433364868164, -13.109979629516602, -12.375625610351562, -11.641271591186523, -10.906917572021484, -10.172563552856445, -9.438210487365723, -8.703856468200684, -7.9695024490356445, -7.2351484298706055, -6.500794410705566, -5.766440391540527, -5.0320868492126465, -4.297732830047607, -3.5633788108825684, -2.8290247917175293, -2.0946707725524902, -1.3603169918060303, -0.6259629726409912, 0.10839104652404785, 0.8427448272705078, 1.5770988464355469, 2.311452865600586, 3.045806884765625, 3.780160903930664, 4.514514923095703, 5.248868942260742, 5.983222961425781, 6.717576503753662, 7.451930522918701, 8.186285018920898, 8.920639038085938, 9.654993057250977, 10.389347076416016, 11.123701095581055, 11.858055114746094, 12.592409133911133, 13.326763153076172, 14.061116218566895, 14.795470237731934, 15.529824256896973, 16.264177322387695, 16.998531341552734, 17.732885360717773, 18.467239379882812, 19.20159339904785, 19.93594741821289, 20.67030143737793, 21.40465545654297, 22.139009475708008, 22.873363494873047, 23.607717514038086, 24.342071533203125, 25.076425552368164, 25.810779571533203]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 14.0, 6.0, 27.0, 35.0, 66.0, 69.0, 86.0, 151.0, 186.0, 302.0, 484.0, 759.0, 1212.0, 2023.0, 3615.0, 6101.0, 10912.0, 19809.0, 36960.0, 68946.0, 125730.0, 217430.0, 346115.0, 597760.0, 3375342.0, 621559.0, 349673.0, 222420.0, 127958.0, 70477.0, 37910.0, 20382.0, 11366.0, 6269.0, 3647.0, 2022.0, 1304.0, 796.0, 509.0, 339.0, 196.0, 129.0, 111.0, 83.0, 45.0, 31.0, 28.0, 15.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.810546875, -0.7848281860351562, -0.7591094970703125, -0.7333908081054688, -0.707672119140625, -0.6819534301757812, -0.6562347412109375, -0.6305160522460938, -0.60479736328125, -0.5790786743164062, -0.5533599853515625, -0.5276412963867188, -0.501922607421875, -0.47620391845703125, -0.4504852294921875, -0.42476654052734375, -0.3990478515625, -0.37332916259765625, -0.3476104736328125, -0.32189178466796875, -0.296173095703125, -0.27045440673828125, -0.2447357177734375, -0.21901702880859375, -0.19329833984375, -0.16757965087890625, -0.1418609619140625, -0.11614227294921875, -0.090423583984375, -0.06470489501953125, -0.0389862060546875, -0.01326751708984375, 0.012451171875, 0.03816986083984375, 0.0638885498046875, 0.08960723876953125, 0.115325927734375, 0.14104461669921875, 0.1667633056640625, 0.19248199462890625, 0.21820068359375, 0.24391937255859375, 0.2696380615234375, 0.29535675048828125, 0.321075439453125, 0.34679412841796875, 0.3725128173828125, 0.39823150634765625, 0.4239501953125, 0.44966888427734375, 0.4753875732421875, 0.5011062622070312, 0.526824951171875, 0.5525436401367188, 0.5782623291015625, 0.6039810180664062, 0.62969970703125, 0.6554183959960938, 0.6811370849609375, 0.7068557739257812, 0.732574462890625, 0.7582931518554688, 0.7840118408203125, 0.8097305297851562, 0.83544921875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 3.0, 5.0, 9.0, 18.0, 14.0, 16.0, 20.0, 15.0, 32.0, 33.0, 34.0, 51.0, 27.0, 46.0, 50.0, 35.0, 75.0, 956.0, 110.0, 48.0, 38.0, 48.0, 36.0, 26.0, 42.0, 33.0, 28.0, 14.0, 31.0, 22.0, 12.0, 18.0, 9.0, 7.0, 11.0, 7.0, 6.0, 4.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9296875, -12.5203857421875, -12.111083984375, -11.7017822265625, -11.29248046875, -10.8831787109375, -10.473876953125, -10.0645751953125, -9.6552734375, -9.2459716796875, -8.836669921875, -8.4273681640625, -8.01806640625, -7.6087646484375, -7.199462890625, -6.7901611328125, -6.380859375, -5.9715576171875, -5.562255859375, -5.1529541015625, -4.74365234375, -4.3343505859375, -3.925048828125, -3.5157470703125, -3.1064453125, -2.6971435546875, -2.287841796875, -1.8785400390625, -1.46923828125, -1.0599365234375, -0.650634765625, -0.2413330078125, 0.16796875, 0.5772705078125, 0.986572265625, 1.3958740234375, 1.80517578125, 2.2144775390625, 2.623779296875, 3.0330810546875, 3.4423828125, 3.8516845703125, 4.260986328125, 4.6702880859375, 5.07958984375, 5.4888916015625, 5.898193359375, 6.3074951171875, 6.716796875, 7.1260986328125, 7.535400390625, 7.9447021484375, 8.35400390625, 8.7633056640625, 9.172607421875, 9.5819091796875, 9.9912109375, 10.4005126953125, 10.809814453125, 11.2191162109375, 11.62841796875, 12.0377197265625, 12.447021484375, 12.8563232421875, 13.265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 6.0, 7.0, 15.0, 15.0, 26.0, 38.0, 63.0, 111.0, 217.0, 471.0, 1082.0, 2590.0, 7117.0, 18970.0, 51129.0, 129822.0, 289793.0, 530696.0, 3646687.0, 845763.0, 419395.0, 207161.0, 87072.0, 33396.0, 12120.0, 4436.0, 1755.0, 774.0, 326.0, 160.0, 92.0, 58.0, 26.0, 16.0, 16.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.1201171875, -1.09393310546875, -1.0677490234375, -1.04156494140625, -1.015380859375, -0.98919677734375, -0.9630126953125, -0.93682861328125, -0.91064453125, -0.88446044921875, -0.8582763671875, -0.83209228515625, -0.805908203125, -0.77972412109375, -0.7535400390625, -0.72735595703125, -0.701171875, -0.67498779296875, -0.6488037109375, -0.62261962890625, -0.596435546875, -0.57025146484375, -0.5440673828125, -0.51788330078125, -0.49169921875, -0.46551513671875, -0.4393310546875, -0.41314697265625, -0.386962890625, -0.36077880859375, -0.3345947265625, -0.30841064453125, -0.2822265625, -0.25604248046875, -0.2298583984375, -0.20367431640625, -0.177490234375, -0.15130615234375, -0.1251220703125, -0.09893798828125, -0.07275390625, -0.04656982421875, -0.0203857421875, 0.00579833984375, 0.031982421875, 0.05816650390625, 0.0843505859375, 0.11053466796875, 0.13671875, 0.16290283203125, 0.1890869140625, 0.21527099609375, 0.241455078125, 0.26763916015625, 0.2938232421875, 0.32000732421875, 0.34619140625, 0.37237548828125, 0.3985595703125, 0.42474365234375, 0.450927734375, 0.47711181640625, 0.5032958984375, 0.52947998046875, 0.5556640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 14.0, 14.0, 20.0, 23.0, 23.0, 33.0, 31.0, 34.0, 41.0, 47.0, 49.0, 46.0, 56.0, 729.0, 399.0, 42.0, 54.0, 48.0, 54.0, 42.0, 34.0, 34.0, 23.0, 24.0, 15.0, 23.0, 14.0, 17.0, 13.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -9.926025390625, -9.49267578125, -9.059326171875, -8.6259765625, -8.192626953125, -7.75927734375, -7.325927734375, -6.892578125, -6.459228515625, -6.02587890625, -5.592529296875, -5.1591796875, -4.725830078125, -4.29248046875, -3.859130859375, -3.42578125, -2.992431640625, -2.55908203125, -2.125732421875, -1.6923828125, -1.259033203125, -0.82568359375, -0.392333984375, 0.041015625, 0.474365234375, 0.90771484375, 1.341064453125, 1.7744140625, 2.207763671875, 2.64111328125, 3.074462890625, 3.5078125, 3.941162109375, 4.37451171875, 4.807861328125, 5.2412109375, 5.674560546875, 6.10791015625, 6.541259765625, 6.974609375, 7.407958984375, 7.84130859375, 8.274658203125, 8.7080078125, 9.141357421875, 9.57470703125, 10.008056640625, 10.44140625, 10.874755859375, 11.30810546875, 11.741455078125, 12.1748046875, 12.608154296875, 13.04150390625, 13.474853515625, 13.908203125, 14.341552734375, 14.77490234375, 15.208251953125, 15.6416015625, 16.074951171875, 16.50830078125, 16.941650390625, 17.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 8.0, 10.0, 13.0, 25.0, 43.0, 63.0, 90.0, 163.0, 203.0, 336.0, 553.0, 822.0, 1378.0, 2734.0, 5518.0, 14007.0, 44053.0, 204353.0, 4574113.0, 1228844.0, 155472.0, 36119.0, 11836.0, 4856.0, 2367.0, 1269.0, 780.0, 485.0, 311.0, 207.0, 133.0, 81.0, 50.0, 37.0, 26.0, 23.0, 5.0, 17.0, 6.0, 5.0, 8.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5712890625, -1.5129241943359375, -1.454559326171875, -1.3961944580078125, -1.33782958984375, -1.2794647216796875, -1.221099853515625, -1.1627349853515625, -1.1043701171875, -1.0460052490234375, -0.987640380859375, -0.9292755126953125, -0.87091064453125, -0.8125457763671875, -0.754180908203125, -0.6958160400390625, -0.637451171875, -0.5790863037109375, -0.520721435546875, -0.4623565673828125, -0.40399169921875, -0.3456268310546875, -0.287261962890625, -0.2288970947265625, -0.1705322265625, -0.1121673583984375, -0.053802490234375, 0.0045623779296875, 0.06292724609375, 0.1212921142578125, 0.179656982421875, 0.2380218505859375, 0.29638671875, 0.3547515869140625, 0.413116455078125, 0.4714813232421875, 0.52984619140625, 0.5882110595703125, 0.646575927734375, 0.7049407958984375, 0.7633056640625, 0.8216705322265625, 0.880035400390625, 0.9384002685546875, 0.99676513671875, 1.0551300048828125, 1.113494873046875, 1.1718597412109375, 1.230224609375, 1.2885894775390625, 1.346954345703125, 1.4053192138671875, 1.46368408203125, 1.5220489501953125, 1.580413818359375, 1.6387786865234375, 1.6971435546875, 1.7555084228515625, 1.813873291015625, 1.8722381591796875, 1.93060302734375, 1.9889678955078125, 2.047332763671875, 2.1056976318359375, 2.1640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 7.0, 9.0, 6.0, 10.0, 9.0, 24.0, 27.0, 28.0, 33.0, 41.0, 36.0, 54.0, 56.0, 43.0, 40.0, 150.0, 986.0, 61.0, 49.0, 37.0, 49.0, 40.0, 35.0, 26.0, 29.0, 27.0, 28.0, 13.0, 19.0, 13.0, 5.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5078125, -12.07861328125, -11.6494140625, -11.22021484375, -10.791015625, -10.36181640625, -9.9326171875, -9.50341796875, -9.07421875, -8.64501953125, -8.2158203125, -7.78662109375, -7.357421875, -6.92822265625, -6.4990234375, -6.06982421875, -5.640625, -5.21142578125, -4.7822265625, -4.35302734375, -3.923828125, -3.49462890625, -3.0654296875, -2.63623046875, -2.20703125, -1.77783203125, -1.3486328125, -0.91943359375, -0.490234375, -0.06103515625, 0.3681640625, 0.79736328125, 1.2265625, 1.65576171875, 2.0849609375, 2.51416015625, 2.943359375, 3.37255859375, 3.8017578125, 4.23095703125, 4.66015625, 5.08935546875, 5.5185546875, 5.94775390625, 6.376953125, 6.80615234375, 7.2353515625, 7.66455078125, 8.09375, 8.52294921875, 8.9521484375, 9.38134765625, 9.810546875, 10.23974609375, 10.6689453125, 11.09814453125, 11.52734375, 11.95654296875, 12.3857421875, 12.81494140625, 13.244140625, 13.67333984375, 14.1025390625, 14.53173828125, 14.9609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 10.0, 27.0, 58.0, 290.0, 361.0, 179.0, 45.0, 18.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.83673858642578, -38.67256164550781, -37.508384704589844, -36.34421157836914, -35.18003463745117, -34.0158576965332, -32.8516845703125, -31.68750762939453, -30.523330688476562, -29.359153747558594, -28.194978713989258, -27.030803680419922, -25.866626739501953, -24.702449798583984, -23.53827476501465, -22.374099731445312, -21.209922790527344, -20.045745849609375, -18.88157081604004, -17.717395782470703, -16.553218841552734, -15.389042854309082, -14.22486686706543, -13.060690879821777, -11.896514892578125, -10.732338905334473, -9.56816291809082, -8.403986930847168, -7.239810943603516, -6.075634956359863, -4.911458969116211, -3.7472829818725586, -2.583110809326172, -1.4189348220825195, -0.2547588348388672, 0.9094171524047852, 2.0735931396484375, 3.23776912689209, 4.401945114135742, 5.5661211013793945, 6.730297088623047, 7.894473075866699, 9.058649063110352, 10.222825050354004, 11.387001037597656, 12.551177024841309, 13.715353012084961, 14.879528999328613, 16.043704986572266, 17.207881927490234, 18.37205696105957, 19.536231994628906, 20.700408935546875, 21.864585876464844, 23.02876091003418, 24.192935943603516, 25.357112884521484, 26.521289825439453, 27.68546485900879, 28.849639892578125, 30.013816833496094, 31.177993774414062, 32.34217071533203, 33.506343841552734, 34.6705207824707]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 13.0, 10.0, 19.0, 16.0, 39.0, 56.0, 54.0, 71.0, 96.0, 88.0, 103.0, 81.0, 83.0, 62.0, 45.0, 30.0, 33.0, 24.0, 17.0, 11.0, 14.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.75379180908203, -34.51516342163086, -33.27653121948242, -32.03790283203125, -30.799270629882812, -29.56064224243164, -28.322011947631836, -27.08338165283203, -25.844751358032227, -24.606121063232422, -23.367490768432617, -22.128860473632812, -20.89023208618164, -19.651599884033203, -18.41297149658203, -17.174341201782227, -15.935710906982422, -14.697080612182617, -13.458450317382812, -12.219820976257324, -10.98119068145752, -9.742560386657715, -8.503931045532227, -7.265300750732422, -6.026670455932617, -4.7880401611328125, -3.549410343170166, -2.3107802867889404, -1.0721502304077148, 0.16648006439208984, 1.4051098823547363, 2.643739700317383, 3.882373809814453, 5.121004104614258, 6.359633922576904, 7.598263740539551, 8.836894035339355, 10.07552433013916, 11.314153671264648, 12.552783966064453, 13.791414260864258, 15.030044555664062, 16.268674850463867, 17.507305145263672, 18.745933532714844, 19.98456573486328, 21.223194122314453, 22.461824417114258, 23.700454711914062, 24.939085006713867, 26.177715301513672, 27.416345596313477, 28.65497589111328, 29.893604278564453, 31.132234573364258, 32.37086486816406, 33.6094970703125, 34.84812545776367, 36.08675765991211, 37.32538604736328, 38.56401824951172, 39.80264663696289, 41.04127883911133, 42.2799072265625, 43.51853561401367]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 10.0, 20.0, 892.0, 1817.0, 2797.0, 6540.0, 39773.0, 3110763.0, 1000234.0, 25372.0, 3689.0, 1995.0, 295.0, 26.0, 18.0, 10.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.1486968994140625, -0.142730712890625, -0.1367645263671875, -0.13079833984375, -0.1248321533203125, -0.118865966796875, -0.1128997802734375, -0.10693359375, -0.1009674072265625, -0.095001220703125, -0.0890350341796875, -0.08306884765625, -0.0771026611328125, -0.071136474609375, -0.0651702880859375, -0.0592041015625, -0.0532379150390625, -0.047271728515625, -0.0413055419921875, -0.03533935546875, -0.0293731689453125, -0.023406982421875, -0.0174407958984375, -0.011474609375, -0.0055084228515625, 0.000457763671875, 0.0064239501953125, 0.01239013671875, 0.0183563232421875, 0.024322509765625, 0.0302886962890625, 0.0362548828125, 0.0422210693359375, 0.048187255859375, 0.0541534423828125, 0.06011962890625, 0.0660858154296875, 0.072052001953125, 0.0780181884765625, 0.083984375, 0.0899505615234375, 0.095916748046875, 0.1018829345703125, 0.10784912109375, 0.1138153076171875, 0.119781494140625, 0.1257476806640625, 0.1317138671875, 0.1376800537109375, 0.143646240234375, 0.1496124267578125, 0.15557861328125, 0.1615447998046875, 0.167510986328125, 0.1734771728515625, 0.179443359375, 0.1854095458984375, 0.191375732421875, 0.1973419189453125, 0.20330810546875, 0.2092742919921875, 0.215240478515625, 0.2212066650390625, 0.2271728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 9.0, 12.0, 18.0, 35.0, 41.0, 81.0, 147.0, 339.0, 132.0, 71.0, 40.0, 18.0, 16.0, 9.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1600341796875, -0.15440750122070312, -0.14878082275390625, -0.14315414428710938, -0.1375274658203125, -0.13190078735351562, -0.12627410888671875, -0.12064743041992188, -0.115020751953125, -0.10939407348632812, -0.10376739501953125, -0.09814071655273438, -0.0925140380859375, -0.08688735961914062, -0.08126068115234375, -0.07563400268554688, -0.07000732421875, -0.06438064575195312, -0.05875396728515625, -0.053127288818359375, -0.0475006103515625, -0.041873931884765625, -0.03624725341796875, -0.030620574951171875, -0.024993896484375, -0.019367218017578125, -0.01374053955078125, -0.008113861083984375, -0.0024871826171875, 0.003139495849609375, 0.00876617431640625, 0.014392852783203125, 0.02001953125, 0.025646209716796875, 0.03127288818359375, 0.036899566650390625, 0.0425262451171875, 0.048152923583984375, 0.05377960205078125, 0.059406280517578125, 0.065032958984375, 0.07065963745117188, 0.07628631591796875, 0.08191299438476562, 0.0875396728515625, 0.09316635131835938, 0.09879302978515625, 0.10441970825195312, 0.11004638671875, 0.11567306518554688, 0.12129974365234375, 0.12692642211914062, 0.1325531005859375, 0.13817977905273438, 0.14380645751953125, 0.14943313598632812, 0.155059814453125, 0.16068649291992188, 0.16631317138671875, 0.17193984985351562, 0.1775665283203125, 0.18319320678710938, 0.18881988525390625, 0.19444656372070312, 0.2000732421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 23.0, 32.0, 35.0, 48.0, 132.0, 408.0, 3295.0, 4181872.0, 7511.0, 567.0, 160.0, 70.0, 44.0, 22.0, 21.0, 8.0, 6.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.29569244384765625, -0.2813262939453125, -0.26696014404296875, -0.252593994140625, -0.23822784423828125, -0.2238616943359375, -0.20949554443359375, -0.19512939453125, -0.18076324462890625, -0.1663970947265625, -0.15203094482421875, -0.137664794921875, -0.12329864501953125, -0.1089324951171875, -0.09456634521484375, -0.0802001953125, -0.06583404541015625, -0.0514678955078125, -0.03710174560546875, -0.022735595703125, -0.00836944580078125, 0.0059967041015625, 0.02036285400390625, 0.03472900390625, 0.04909515380859375, 0.0634613037109375, 0.07782745361328125, 0.092193603515625, 0.10655975341796875, 0.1209259033203125, 0.13529205322265625, 0.149658203125, 0.16402435302734375, 0.1783905029296875, 0.19275665283203125, 0.207122802734375, 0.22148895263671875, 0.2358551025390625, 0.25022125244140625, 0.26458740234375, 0.27895355224609375, 0.2933197021484375, 0.30768585205078125, 0.322052001953125, 0.33641815185546875, 0.3507843017578125, 0.36515045166015625, 0.3795166015625, 0.39388275146484375, 0.4082489013671875, 0.42261505126953125, 0.436981201171875, 0.45134735107421875, 0.4657135009765625, 0.48007965087890625, 0.49444580078125, 0.5088119506835938, 0.5231781005859375, 0.5375442504882812, 0.551910400390625, 0.5662765502929688, 0.5806427001953125, 0.5950088500976562, 0.609375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 10.0, 18.0, 28.0, 34.0, 28.0, 102.0, 217.0, 567.0, 1280.0, 960.0, 470.0, 168.0, 69.0, 41.0, 28.0, 23.0, 13.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06317138671875, -0.060128211975097656, -0.05708503723144531, -0.05404186248779297, -0.050998687744140625, -0.04795551300048828, -0.04491233825683594, -0.041869163513183594, -0.03882598876953125, -0.035782814025878906, -0.03273963928222656, -0.02969646453857422, -0.026653289794921875, -0.02361011505126953, -0.020566940307617188, -0.017523765563964844, -0.0144805908203125, -0.011437416076660156, -0.008394241333007812, -0.005351066589355469, -0.002307891845703125, 0.0007352828979492188, 0.0037784576416015625, 0.006821632385253906, 0.00986480712890625, 0.012907981872558594, 0.015951156616210938, 0.01899433135986328, 0.022037506103515625, 0.02508068084716797, 0.028123855590820312, 0.031167030334472656, 0.034210205078125, 0.037253379821777344, 0.04029655456542969, 0.04333972930908203, 0.046382904052734375, 0.04942607879638672, 0.05246925354003906, 0.055512428283691406, 0.05855560302734375, 0.061598777770996094, 0.06464195251464844, 0.06768512725830078, 0.07072830200195312, 0.07377147674560547, 0.07681465148925781, 0.07985782623291016, 0.0829010009765625, 0.08594417572021484, 0.08898735046386719, 0.09203052520751953, 0.09507369995117188, 0.09811687469482422, 0.10116004943847656, 0.1042032241821289, 0.10724639892578125, 0.1102895736694336, 0.11333274841308594, 0.11637592315673828, 0.11941909790039062, 0.12246227264404297, 0.1255054473876953, 0.12854862213134766, 0.131591796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 25.0, 848.0, 142.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.639014720916748, -2.5812911987304688, -2.5235679149627686, -2.4658443927764893, -2.40812087059021, -2.3503975868225098, -2.2926740646362305, -2.234950542449951, -2.177227258682251, -2.1195037364959717, -2.0617804527282715, -2.004056930541992, -1.9463335275650024, -1.8886101245880127, -1.8308866024017334, -1.7731631994247437, -1.7154396772384644, -1.6577162742614746, -1.5999927520751953, -1.5422693490982056, -1.4845459461212158, -1.4268224239349365, -1.3690990209579468, -1.311375617980957, -1.2536520957946777, -1.195928692817688, -1.1382051706314087, -1.080481767654419, -1.0227583646774292, -0.9650349020957947, -0.9073114395141602, -0.8495880365371704, -0.7918646335601807, -0.7341411709785461, -0.6764177680015564, -0.6186943054199219, -0.5609709024429321, -0.5032474398612976, -0.4455239772796631, -0.38780054450035095, -0.3300771117210388, -0.2723536789417267, -0.21463023126125336, -0.15690678358078003, -0.0991833508014679, -0.04145991802215576, 0.01626354455947876, 0.0739869773387909, 0.13171041011810303, 0.18943384289741516, 0.2471572905778885, 0.3048807382583618, 0.36260417103767395, 0.4203276038169861, 0.4780510663986206, 0.5357744693756104, 0.5934979319572449, 0.6512213945388794, 0.7089447975158691, 0.7666682600975037, 0.8243917226791382, 0.8821151256561279, 0.9398385882377625, 0.997562050819397, 1.0552854537963867]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 17.0, 24.0, 20.0, 34.0, 28.0, 43.0, 38.0, 39.0, 48.0, 46.0, 41.0, 46.0, 47.0, 53.0, 44.0, 44.0, 46.0, 51.0, 37.0, 23.0, 34.0, 20.0, 20.0, 18.0, 15.0, 14.0, 14.0, 12.0, 12.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1742118000984192, -0.16894155740737915, -0.1636713296175003, -0.15840108692646027, -0.15313085913658142, -0.14786061644554138, -0.14259037375450134, -0.1373201459646225, -0.13204991817474365, -0.1267796754837036, -0.12150944769382477, -0.11623920500278473, -0.11096897721290588, -0.10569873452186584, -0.1004284992814064, -0.09515826404094696, -0.08988802134990692, -0.08461778610944748, -0.07934755086898804, -0.074077308177948, -0.06880708038806915, -0.06353683769702911, -0.05826660245656967, -0.05299636721611023, -0.04772613197565079, -0.042455896735191345, -0.0371856614947319, -0.03191542252898216, -0.02664518728852272, -0.021374952048063278, -0.016104713082313538, -0.010834477841854095, -0.005564242601394653, -0.00029400642961263657, 0.00497622974216938, 0.010246466845273972, 0.015516702085733414, 0.020786937326192856, 0.026057176291942596, 0.03132741153240204, 0.03659764677286148, 0.04186788201332092, 0.047138117253780365, 0.052408356219530106, 0.05767859145998955, 0.06294882297515869, 0.06821906566619873, 0.07348930090665817, 0.07875953614711761, 0.08402977138757706, 0.0893000066280365, 0.09457024931907654, 0.09984047710895538, 0.10511071979999542, 0.11038095504045486, 0.1156511902809143, 0.12092142552137375, 0.1261916607618332, 0.13146190345287323, 0.13673213124275208, 0.14200237393379211, 0.14727260172367096, 0.152542844414711, 0.15781307220458984, 0.16308331489562988]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 20.0, 6.0, 13.0, 13.0, 28.0, 33.0, 42.0, 61.0, 70.0, 110.0, 183.0, 232.0, 443.0, 848.0, 1980.0, 5429.0, 26903.0, 918887.0, 78919.0, 8975.0, 2687.0, 1090.0, 566.0, 355.0, 203.0, 119.0, 91.0, 63.0, 42.0, 26.0, 28.0, 14.0, 15.0, 11.0, 9.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.935546875, -0.9029388427734375, -0.870330810546875, -0.8377227783203125, -0.80511474609375, -0.7725067138671875, -0.739898681640625, -0.7072906494140625, -0.6746826171875, -0.6420745849609375, -0.609466552734375, -0.5768585205078125, -0.54425048828125, -0.5116424560546875, -0.479034423828125, -0.4464263916015625, -0.413818359375, -0.3812103271484375, -0.348602294921875, -0.3159942626953125, -0.28338623046875, -0.2507781982421875, -0.218170166015625, -0.1855621337890625, -0.1529541015625, -0.1203460693359375, -0.087738037109375, -0.0551300048828125, -0.02252197265625, 0.0100860595703125, 0.042694091796875, 0.0753021240234375, 0.10791015625, 0.1405181884765625, 0.173126220703125, 0.2057342529296875, 0.23834228515625, 0.2709503173828125, 0.303558349609375, 0.3361663818359375, 0.3687744140625, 0.4013824462890625, 0.433990478515625, 0.4665985107421875, 0.49920654296875, 0.5318145751953125, 0.564422607421875, 0.5970306396484375, 0.629638671875, 0.6622467041015625, 0.694854736328125, 0.7274627685546875, 0.76007080078125, 0.7926788330078125, 0.825286865234375, 0.8578948974609375, 0.8905029296875, 0.9231109619140625, 0.955718994140625, 0.9883270263671875, 1.02093505859375, 1.0535430908203125, 1.086151123046875, 1.1187591552734375, 1.1513671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 15.0, 16.0, 33.0, 45.0, 71.0, 148.0, 349.0, 130.0, 74.0, 43.0, 16.0, 13.0, 9.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16455078125, -0.1587677001953125, -0.152984619140625, -0.1472015380859375, -0.14141845703125, -0.1356353759765625, -0.129852294921875, -0.1240692138671875, -0.1182861328125, -0.1125030517578125, -0.106719970703125, -0.1009368896484375, -0.09515380859375, -0.0893707275390625, -0.083587646484375, -0.0778045654296875, -0.072021484375, -0.0662384033203125, -0.060455322265625, -0.0546722412109375, -0.04888916015625, -0.0431060791015625, -0.037322998046875, -0.0315399169921875, -0.0257568359375, -0.0199737548828125, -0.014190673828125, -0.0084075927734375, -0.00262451171875, 0.0031585693359375, 0.008941650390625, 0.0147247314453125, 0.0205078125, 0.0262908935546875, 0.032073974609375, 0.0378570556640625, 0.04364013671875, 0.0494232177734375, 0.055206298828125, 0.0609893798828125, 0.0667724609375, 0.0725555419921875, 0.078338623046875, 0.0841217041015625, 0.08990478515625, 0.0956878662109375, 0.101470947265625, 0.1072540283203125, 0.113037109375, 0.1188201904296875, 0.124603271484375, 0.1303863525390625, 0.13616943359375, 0.1419525146484375, 0.147735595703125, 0.1535186767578125, 0.1593017578125, 0.1650848388671875, 0.170867919921875, 0.1766510009765625, 0.18243408203125, 0.1882171630859375, 0.194000244140625, 0.1997833251953125, 0.20556640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 10.0, 5.0, 9.0, 10.0, 11.0, 19.0, 25.0, 19.0, 24.0, 42.0, 58.0, 60.0, 74.0, 99.0, 129.0, 158.0, 298.0, 502.0, 1082.0, 3567.0, 17496.0, 118066.0, 580559.0, 276644.0, 39093.0, 6949.0, 1672.0, 678.0, 325.0, 215.0, 143.0, 117.0, 79.0, 64.0, 55.0, 32.0, 36.0, 26.0, 23.0, 11.0, 16.0, 7.0, 15.0, 7.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.2249755859375, -0.2176513671875, -0.2103271484375, -0.2030029296875, -0.1956787109375, -0.1883544921875, -0.1810302734375, -0.1737060546875, -0.1663818359375, -0.1590576171875, -0.1517333984375, -0.1444091796875, -0.1370849609375, -0.1297607421875, -0.1224365234375, -0.1151123046875, -0.1077880859375, -0.1004638671875, -0.0931396484375, -0.0858154296875, -0.0784912109375, -0.0711669921875, -0.0638427734375, -0.0565185546875, -0.0491943359375, -0.0418701171875, -0.0345458984375, -0.0272216796875, -0.0198974609375, -0.0125732421875, -0.0052490234375, 0.0020751953125, 0.0093994140625, 0.0167236328125, 0.0240478515625, 0.0313720703125, 0.0386962890625, 0.0460205078125, 0.0533447265625, 0.0606689453125, 0.0679931640625, 0.0753173828125, 0.0826416015625, 0.0899658203125, 0.0972900390625, 0.1046142578125, 0.1119384765625, 0.1192626953125, 0.1265869140625, 0.1339111328125, 0.1412353515625, 0.1485595703125, 0.1558837890625, 0.1632080078125, 0.1705322265625, 0.1778564453125, 0.1851806640625, 0.1925048828125, 0.1998291015625, 0.2071533203125, 0.2144775390625, 0.2218017578125, 0.2291259765625, 0.2364501953125, 0.2437744140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 3.0, 1.0, 7.0, 3.0, 9.0, 15.0, 13.0, 21.0, 20.0, 20.0, 15.0, 34.0, 25.0, 34.0, 28.0, 39.0, 34.0, 41.0, 40.0, 38.0, 28.0, 36.0, 57.0, 38.0, 39.0, 25.0, 37.0, 31.0, 29.0, 38.0, 32.0, 33.0, 25.0, 18.0, 17.0, 11.0, 16.0, 12.0, 7.0, 9.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1937255859375, -0.18821144104003906, -0.18269729614257812, -0.1771831512451172, -0.17166900634765625, -0.1661548614501953, -0.16064071655273438, -0.15512657165527344, -0.1496124267578125, -0.14409828186035156, -0.13858413696289062, -0.1330699920654297, -0.12755584716796875, -0.12204170227050781, -0.11652755737304688, -0.11101341247558594, -0.105499267578125, -0.09998512268066406, -0.09447097778320312, -0.08895683288574219, -0.08344268798828125, -0.07792854309082031, -0.07241439819335938, -0.06690025329589844, -0.0613861083984375, -0.05587196350097656, -0.050357818603515625, -0.04484367370605469, -0.03932952880859375, -0.03381538391113281, -0.028301239013671875, -0.022787094116210938, -0.01727294921875, -0.011758804321289062, -0.006244659423828125, -0.0007305145263671875, 0.00478363037109375, 0.010297775268554688, 0.015811920166015625, 0.021326065063476562, 0.0268402099609375, 0.03235435485839844, 0.037868499755859375, 0.04338264465332031, 0.04889678955078125, 0.05441093444824219, 0.059925079345703125, 0.06543922424316406, 0.070953369140625, 0.07646751403808594, 0.08198165893554688, 0.08749580383300781, 0.09300994873046875, 0.09852409362792969, 0.10403823852539062, 0.10955238342285156, 0.1150665283203125, 0.12058067321777344, 0.12609481811523438, 0.1316089630126953, 0.13712310791015625, 0.1426372528076172, 0.14815139770507812, 0.15366554260253906, 0.1591796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 8.0, 13.0, 12.0, 13.0, 31.0, 31.0, 40.0, 74.0, 95.0, 155.0, 246.0, 317.0, 531.0, 806.0, 1286.0, 2280.0, 4024.0, 7766.0, 16500.0, 40266.0, 116127.0, 370705.0, 320975.0, 99847.0, 35391.0, 14918.0, 7134.0, 3678.0, 1959.0, 1146.0, 740.0, 448.0, 312.0, 202.0, 141.0, 82.0, 56.0, 53.0, 42.0, 34.0, 8.0, 14.0, 11.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06536865234375, -0.06325531005859375, -0.0611419677734375, -0.05902862548828125, -0.056915283203125, -0.05480194091796875, -0.0526885986328125, -0.05057525634765625, -0.0484619140625, -0.04634857177734375, -0.0442352294921875, -0.04212188720703125, -0.040008544921875, -0.03789520263671875, -0.0357818603515625, -0.03366851806640625, -0.03155517578125, -0.02944183349609375, -0.0273284912109375, -0.02521514892578125, -0.023101806640625, -0.02098846435546875, -0.0188751220703125, -0.01676177978515625, -0.0146484375, -0.01253509521484375, -0.0104217529296875, -0.00830841064453125, -0.006195068359375, -0.00408172607421875, -0.0019683837890625, 0.00014495849609375, 0.00225830078125, 0.00437164306640625, 0.0064849853515625, 0.00859832763671875, 0.010711669921875, 0.01282501220703125, 0.0149383544921875, 0.01705169677734375, 0.0191650390625, 0.02127838134765625, 0.0233917236328125, 0.02550506591796875, 0.027618408203125, 0.02973175048828125, 0.0318450927734375, 0.03395843505859375, 0.03607177734375, 0.03818511962890625, 0.0402984619140625, 0.04241180419921875, 0.044525146484375, 0.04663848876953125, 0.0487518310546875, 0.05086517333984375, 0.052978515625, 0.05509185791015625, 0.0572052001953125, 0.05931854248046875, 0.061431884765625, 0.06354522705078125, 0.0656585693359375, 0.06777191162109375, 0.06988525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 5.0, 6.0, 8.0, 9.0, 14.0, 24.0, 19.0, 33.0, 37.0, 52.0, 54.0, 63.0, 92.0, 67.0, 110.0, 81.0, 82.0, 54.0, 43.0, 37.0, 14.0, 29.0, 15.0, 10.0, 4.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1298805475234985e-05, -1.0974705219268799e-05, -1.0650604963302612e-05, -1.0326504707336426e-05, -1.000240445137024e-05, -9.678304195404053e-06, -9.354203939437866e-06, -9.03010368347168e-06, -8.706003427505493e-06, -8.381903171539307e-06, -8.05780291557312e-06, -7.733702659606934e-06, -7.409602403640747e-06, -7.0855021476745605e-06, -6.761401891708374e-06, -6.4373016357421875e-06, -6.113201379776001e-06, -5.7891011238098145e-06, -5.465000867843628e-06, -5.140900611877441e-06, -4.816800355911255e-06, -4.492700099945068e-06, -4.168599843978882e-06, -3.844499588012695e-06, -3.520399332046509e-06, -3.1962990760803223e-06, -2.8721988201141357e-06, -2.5480985641479492e-06, -2.2239983081817627e-06, -1.8998980522155762e-06, -1.5757977962493896e-06, -1.2516975402832031e-06, -9.275972843170166e-07, -6.034970283508301e-07, -2.7939677238464355e-07, 4.470348358154297e-08, 3.688037395477295e-07, 6.92903995513916e-07, 1.0170042514801025e-06, 1.341104507446289e-06, 1.6652047634124756e-06, 1.989305019378662e-06, 2.3134052753448486e-06, 2.637505531311035e-06, 2.9616057872772217e-06, 3.285706043243408e-06, 3.6098062992095947e-06, 3.933906555175781e-06, 4.258006811141968e-06, 4.582107067108154e-06, 4.906207323074341e-06, 5.230307579040527e-06, 5.554407835006714e-06, 5.8785080909729e-06, 6.202608346939087e-06, 6.5267086029052734e-06, 6.85080885887146e-06, 7.1749091148376465e-06, 7.499009370803833e-06, 7.82310962677002e-06, 8.147209882736206e-06, 8.471310138702393e-06, 8.795410394668579e-06, 9.119510650634766e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 11.0, 11.0, 13.0, 26.0, 21.0, 31.0, 55.0, 106.0, 131.0, 220.0, 399.0, 779.0, 1422.0, 2902.0, 6949.0, 20941.0, 82015.0, 404445.0, 410161.0, 83400.0, 21181.0, 7127.0, 2952.0, 1452.0, 725.0, 402.0, 242.0, 154.0, 85.0, 51.0, 45.0, 33.0, 20.0, 12.0, 7.0, 7.0, 7.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09063720703125, -0.08804798126220703, -0.08545875549316406, -0.0828695297241211, -0.08028030395507812, -0.07769107818603516, -0.07510185241699219, -0.07251262664794922, -0.06992340087890625, -0.06733417510986328, -0.06474494934082031, -0.062155723571777344, -0.059566497802734375, -0.056977272033691406, -0.05438804626464844, -0.05179882049560547, -0.0492095947265625, -0.04662036895751953, -0.04403114318847656, -0.041441917419433594, -0.038852691650390625, -0.036263465881347656, -0.03367424011230469, -0.03108501434326172, -0.02849578857421875, -0.02590656280517578, -0.023317337036132812, -0.020728111267089844, -0.018138885498046875, -0.015549659729003906, -0.012960433959960938, -0.010371208190917969, -0.007781982421875, -0.005192756652832031, -0.0026035308837890625, -1.430511474609375e-05, 0.002574920654296875, 0.005164146423339844, 0.0077533721923828125, 0.010342597961425781, 0.01293182373046875, 0.015521049499511719, 0.018110275268554688, 0.020699501037597656, 0.023288726806640625, 0.025877952575683594, 0.028467178344726562, 0.03105640411376953, 0.0336456298828125, 0.03623485565185547, 0.03882408142089844, 0.041413307189941406, 0.044002532958984375, 0.046591758728027344, 0.04918098449707031, 0.05177021026611328, 0.05435943603515625, 0.05694866180419922, 0.05953788757324219, 0.062127113342285156, 0.06471633911132812, 0.0673055648803711, 0.06989479064941406, 0.07248401641845703, 0.0750732421875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 11.0, 12.0, 16.0, 21.0, 28.0, 39.0, 35.0, 39.0, 55.0, 54.0, 62.0, 69.0, 88.0, 80.0, 60.0, 50.0, 46.0, 34.0, 38.0, 28.0, 26.0, 19.0, 11.0, 9.0, 7.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0458984375, -0.04403400421142578, -0.04216957092285156, -0.040305137634277344, -0.038440704345703125, -0.036576271057128906, -0.03471183776855469, -0.03284740447998047, -0.03098297119140625, -0.02911853790283203, -0.027254104614257812, -0.025389671325683594, -0.023525238037109375, -0.021660804748535156, -0.019796371459960938, -0.01793193817138672, -0.0160675048828125, -0.014203071594238281, -0.012338638305664062, -0.010474205017089844, -0.008609771728515625, -0.006745338439941406, -0.0048809051513671875, -0.0030164718627929688, -0.00115203857421875, 0.0007123947143554688, 0.0025768280029296875, 0.004441261291503906, 0.006305694580078125, 0.008170127868652344, 0.010034561157226562, 0.011898994445800781, 0.013763427734375, 0.01562786102294922, 0.017492294311523438, 0.019356727600097656, 0.021221160888671875, 0.023085594177246094, 0.024950027465820312, 0.02681446075439453, 0.02867889404296875, 0.03054332733154297, 0.03240776062011719, 0.034272193908691406, 0.036136627197265625, 0.038001060485839844, 0.03986549377441406, 0.04172992706298828, 0.0435943603515625, 0.04545879364013672, 0.04732322692871094, 0.049187660217285156, 0.051052093505859375, 0.052916526794433594, 0.05478096008300781, 0.05664539337158203, 0.05850982666015625, 0.06037425994873047, 0.06223869323730469, 0.0641031265258789, 0.06596755981445312, 0.06783199310302734, 0.06969642639160156, 0.07156085968017578, 0.07342529296875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 10.0, 29.0, 60.0, 167.0, 390.0, 261.0, 68.0, 17.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.976993560791016, -4.872744560241699, -4.768496036529541, -4.664247035980225, -4.559998512268066, -4.45574951171875, -4.351500988006592, -4.247251987457275, -4.143003463745117, -4.038754463195801, -3.9345059394836426, -3.8302571773529053, -3.726008415222168, -3.6217594146728516, -3.5175106525421143, -3.413261890411377, -3.3090128898620605, -3.2047641277313232, -3.100515365600586, -2.9962666034698486, -2.8920178413391113, -2.787768840789795, -2.6835200786590576, -2.5792713165283203, -2.475022554397583, -2.3707737922668457, -2.2665250301361084, -2.162276268005371, -2.0580272674560547, -1.953778624534607, -1.84952974319458, -1.7452809810638428, -1.6410322189331055, -1.5367834568023682, -1.4325346946716309, -1.328285813331604, -1.2240370512008667, -1.1197882890701294, -1.0155394077301025, -0.9112906455993652, -0.8070418834686279, -0.7027931213378906, -0.5985442996025085, -0.49429550766944885, -0.39004671573638916, -0.28579795360565186, -0.18154913187026978, -0.0773003101348877, 0.02694845199584961, 0.1311972439289093, 0.235446035861969, 0.3396948277950287, 0.4439436197280884, 0.5481923818588257, 0.6524412035942078, 0.7566900253295898, 0.8609387874603271, 0.9651875495910645, 1.0694363117218018, 1.1736851930618286, 1.277933955192566, 1.3821827173233032, 1.48643159866333, 1.5906803607940674, 1.6949291229248047]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 7.0, 17.0, 22.0, 26.0, 25.0, 46.0, 32.0, 39.0, 42.0, 48.0, 53.0, 54.0, 62.0, 46.0, 51.0, 56.0, 43.0, 51.0, 42.0, 33.0, 34.0, 34.0, 36.0, 21.0, 25.0, 14.0, 18.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8114482164382935, -1.7571368217468262, -1.7028255462646484, -1.6485141515731812, -1.5942028760910034, -1.5398914813995361, -1.4855802059173584, -1.4312688112258911, -1.3769574165344238, -1.3226460218429565, -1.2683347463607788, -1.2140233516693115, -1.1597120761871338, -1.1054006814956665, -1.0510892868041992, -0.9967780113220215, -0.9424667358398438, -0.8881554007530212, -0.8338440656661987, -0.7795326709747314, -0.7252213954925537, -0.6709100008010864, -0.6165986657142639, -0.5622873306274414, -0.5079759955406189, -0.4536646604537964, -0.3993533253669739, -0.345041960477829, -0.29073062539100647, -0.23641929030418396, -0.18210792541503906, -0.12779659032821655, -0.0734853744506836, -0.019174031913280487, 0.03513731062412262, 0.08944866061210632, 0.14375999569892883, 0.19807133078575134, 0.25238269567489624, 0.30669403076171875, 0.36100536584854126, 0.41531670093536377, 0.4696280360221863, 0.5239393711090088, 0.5782507658004761, 0.6325620412826538, 0.6868734359741211, 0.7411847710609436, 0.7954961061477661, 0.8498074412345886, 0.9041187763214111, 0.9584301710128784, 1.0127414464950562, 1.0670528411865234, 1.1213641166687012, 1.1756755113601685, 1.2299869060516357, 1.284298300743103, 1.3386095762252808, 1.392920970916748, 1.4472322463989258, 1.501543641090393, 1.5558550357818604, 1.610166311264038, 1.6644775867462158]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 7.0, 2.0, 1.0, 8.0, 14.0, 15.0, 22.0, 36.0, 56.0, 164.0, 915.0, 1450033.0, 2741716.0, 927.0, 178.0, 75.0, 44.0, 21.0, 17.0, 9.0, 9.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.908203125, -0.87188720703125, -0.8355712890625, -0.79925537109375, -0.762939453125, -0.72662353515625, -0.6903076171875, -0.65399169921875, -0.61767578125, -0.58135986328125, -0.5450439453125, -0.50872802734375, -0.472412109375, -0.43609619140625, -0.3997802734375, -0.36346435546875, -0.3271484375, -0.29083251953125, -0.2545166015625, -0.21820068359375, -0.181884765625, -0.14556884765625, -0.1092529296875, -0.07293701171875, -0.03662109375, -0.00030517578125, 0.0360107421875, 0.07232666015625, 0.108642578125, 0.14495849609375, 0.1812744140625, 0.21759033203125, 0.25390625, 0.29022216796875, 0.3265380859375, 0.36285400390625, 0.399169921875, 0.43548583984375, 0.4718017578125, 0.50811767578125, 0.54443359375, 0.58074951171875, 0.6170654296875, 0.65338134765625, 0.689697265625, 0.72601318359375, 0.7623291015625, 0.79864501953125, 0.8349609375, 0.87127685546875, 0.9075927734375, 0.94390869140625, 0.980224609375, 1.01654052734375, 1.0528564453125, 1.08917236328125, 1.12548828125, 1.16180419921875, 1.1981201171875, 1.23443603515625, 1.270751953125, 1.30706787109375, 1.3433837890625, 1.37969970703125, 1.416015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 16.0, 24.0, 33.0, 49.0, 105.0, 147.0, 187.0, 160.0, 97.0, 59.0, 37.0, 15.0, 19.0, 6.0, 15.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1231689453125, -0.11816215515136719, -0.11315536499023438, -0.10814857482910156, -0.10314178466796875, -0.09813499450683594, -0.09312820434570312, -0.08812141418457031, -0.0831146240234375, -0.07810783386230469, -0.07310104370117188, -0.06809425354003906, -0.06308746337890625, -0.05808067321777344, -0.053073883056640625, -0.04806709289550781, -0.043060302734375, -0.03805351257324219, -0.033046722412109375, -0.028039932250976562, -0.02303314208984375, -0.018026351928710938, -0.013019561767578125, -0.008012771606445312, -0.0030059814453125, 0.0020008087158203125, 0.007007598876953125, 0.012014389038085938, 0.01702117919921875, 0.022027969360351562, 0.027034759521484375, 0.03204154968261719, 0.03704833984375, 0.04205513000488281, 0.047061920166015625, 0.05206871032714844, 0.05707550048828125, 0.06208229064941406, 0.06708908081054688, 0.07209587097167969, 0.0771026611328125, 0.08210945129394531, 0.08711624145507812, 0.09212303161621094, 0.09712982177734375, 0.10213661193847656, 0.10714340209960938, 0.11215019226074219, 0.117156982421875, 0.12216377258300781, 0.12717056274414062, 0.13217735290527344, 0.13718414306640625, 0.14219093322753906, 0.14719772338867188, 0.1522045135498047, 0.1572113037109375, 0.1622180938720703, 0.16722488403320312, 0.17223167419433594, 0.17723846435546875, 0.18224525451660156, 0.18725204467773438, 0.1922588348388672, 0.197265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 18.0, 25.0, 30.0, 37.0, 54.0, 75.0, 161.0, 299.0, 1011.0, 4042.0, 24739.0, 423824.0, 3622569.0, 102968.0, 11047.0, 2188.0, 612.0, 235.0, 118.0, 63.0, 27.0, 25.0, 14.0, 11.0, 14.0, 8.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.439453125, -0.42930030822753906, -0.4191474914550781, -0.4089946746826172, -0.39884185791015625, -0.3886890411376953, -0.3785362243652344, -0.36838340759277344, -0.3582305908203125, -0.34807777404785156, -0.3379249572753906, -0.3277721405029297, -0.31761932373046875, -0.3074665069580078, -0.2973136901855469, -0.28716087341308594, -0.277008056640625, -0.26685523986816406, -0.2567024230957031, -0.2465496063232422, -0.23639678955078125, -0.2262439727783203, -0.21609115600585938, -0.20593833923339844, -0.1957855224609375, -0.18563270568847656, -0.17547988891601562, -0.1653270721435547, -0.15517425537109375, -0.1450214385986328, -0.13486862182617188, -0.12471580505371094, -0.11456298828125, -0.10441017150878906, -0.09425735473632812, -0.08410453796386719, -0.07395172119140625, -0.06379890441894531, -0.053646087646484375, -0.04349327087402344, -0.0333404541015625, -0.023187637329101562, -0.013034820556640625, -0.0028820037841796875, 0.00727081298828125, 0.017423629760742188, 0.027576446533203125, 0.03772926330566406, 0.047882080078125, 0.05803489685058594, 0.06818771362304688, 0.07834053039550781, 0.08849334716796875, 0.09864616394042969, 0.10879898071289062, 0.11895179748535156, 0.1291046142578125, 0.13925743103027344, 0.14941024780273438, 0.1595630645751953, 0.16971588134765625, 0.1798686981201172, 0.19002151489257812, 0.20017433166503906, 0.2103271484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 7.0, 8.0, 14.0, 13.0, 11.0, 22.0, 34.0, 21.0, 42.0, 53.0, 62.0, 102.0, 144.0, 209.0, 411.0, 739.0, 946.0, 510.0, 295.0, 165.0, 76.0, 61.0, 33.0, 19.0, 15.0, 10.0, 6.0, 5.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1312255859375, -0.1279773712158203, -0.12472915649414062, -0.12148094177246094, -0.11823272705078125, -0.11498451232910156, -0.11173629760742188, -0.10848808288574219, -0.1052398681640625, -0.10199165344238281, -0.09874343872070312, -0.09549522399902344, -0.09224700927734375, -0.08899879455566406, -0.08575057983398438, -0.08250236511230469, -0.079254150390625, -0.07600593566894531, -0.07275772094726562, -0.06950950622558594, -0.06626129150390625, -0.06301307678222656, -0.059764862060546875, -0.05651664733886719, -0.0532684326171875, -0.05002021789550781, -0.046772003173828125, -0.04352378845214844, -0.04027557373046875, -0.03702735900878906, -0.033779144287109375, -0.030530929565429688, -0.02728271484375, -0.024034500122070312, -0.020786285400390625, -0.017538070678710938, -0.01428985595703125, -0.011041641235351562, -0.007793426513671875, -0.0045452117919921875, -0.0012969970703125, 0.0019512176513671875, 0.005199432373046875, 0.008447647094726562, 0.01169586181640625, 0.014944076538085938, 0.018192291259765625, 0.021440505981445312, 0.024688720703125, 0.027936935424804688, 0.031185150146484375, 0.03443336486816406, 0.03768157958984375, 0.04092979431152344, 0.044178009033203125, 0.04742622375488281, 0.0506744384765625, 0.05392265319824219, 0.057170867919921875, 0.06041908264160156, 0.06366729736328125, 0.06691551208496094, 0.07016372680664062, 0.07341194152832031, 0.07666015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 697.0, 310.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.005799770355225, -3.782850980758667, -3.5599021911621094, -3.3369534015655518, -3.114004611968994, -2.8910558223724365, -2.668107032775879, -2.4451582431793213, -2.2222094535827637, -1.999260663986206, -1.7763118743896484, -1.5533630847930908, -1.3304142951965332, -1.1074655055999756, -0.884516716003418, -0.6615679264068604, -0.43861913681030273, -0.21567034721374512, 0.0072784423828125, 0.23022723197937012, 0.45317602157592773, 0.6761248111724854, 0.899073600769043, 1.1220223903656006, 1.3449711799621582, 1.5679199695587158, 1.7908687591552734, 2.013817548751831, 2.2367663383483887, 2.4597151279449463, 2.682663917541504, 2.9056127071380615, 3.1285619735717773, 3.351510763168335, 3.5744595527648926, 3.79740834236145, 4.020357131958008, 4.2433061599731445, 4.466254711151123, 4.689203262329102, 4.912152290344238, 5.135101318359375, 5.3580498695373535, 5.580998420715332, 5.803947448730469, 6.0268964767456055, 6.249845027923584, 6.4727935791015625, 6.695742607116699, 6.918691635131836, 7.1416401863098145, 7.364588737487793, 7.58753776550293, 7.810486793518066, 8.033435821533203, 8.256383895874023, 8.47933292388916, 8.702281951904297, 8.925230026245117, 9.148179054260254, 9.37112808227539, 9.594077110290527, 9.817026138305664, 10.039974212646484, 10.262923240661621]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 8.0, 12.0, 11.0, 15.0, 19.0, 32.0, 45.0, 34.0, 52.0, 55.0, 60.0, 60.0, 64.0, 52.0, 56.0, 53.0, 52.0, 49.0, 42.0, 47.0, 38.0, 37.0, 34.0, 16.0, 15.0, 11.0, 7.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4416899085044861, -0.42432186007499695, -0.4069538116455078, -0.3895857632160187, -0.37221771478652954, -0.3548496663570404, -0.33748161792755127, -0.32011356949806213, -0.302745521068573, -0.28537747263908386, -0.2680094242095947, -0.2506413757801056, -0.23327332735061646, -0.21590527892112732, -0.19853723049163818, -0.18116918206214905, -0.1638011336326599, -0.14643308520317078, -0.12906503677368164, -0.1116969883441925, -0.09432893991470337, -0.07696089148521423, -0.0595928430557251, -0.04222479462623596, -0.024856746196746826, -0.00748869776725769, 0.009879350662231445, 0.02724739909172058, 0.04461544752120972, 0.06198349595069885, 0.07935154438018799, 0.09671959280967712, 0.11408764123916626, 0.1314556896686554, 0.14882373809814453, 0.16619178652763367, 0.1835598349571228, 0.20092788338661194, 0.21829593181610107, 0.2356639802455902, 0.25303202867507935, 0.2704000771045685, 0.2877681255340576, 0.30513617396354675, 0.3225042223930359, 0.339872270822525, 0.35724031925201416, 0.3746083676815033, 0.39197641611099243, 0.40934446454048157, 0.4267125129699707, 0.44408056139945984, 0.461448609828949, 0.4788166582584381, 0.49618470668792725, 0.5135527849197388, 0.5309208035469055, 0.5482888221740723, 0.5656569004058838, 0.5830249786376953, 0.6003929972648621, 0.6177610158920288, 0.6351290941238403, 0.6524971723556519, 0.6698651909828186]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 8.0, 26.0, 26.0, 35.0, 63.0, 78.0, 147.0, 199.0, 373.0, 739.0, 1745.0, 5872.0, 30044.0, 298410.0, 639332.0, 57376.0, 9481.0, 2513.0, 938.0, 424.0, 260.0, 139.0, 103.0, 61.0, 40.0, 29.0, 17.0, 7.0, 12.0, 14.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.27724456787109375, -0.2666473388671875, -0.25605010986328125, -0.245452880859375, -0.23485565185546875, -0.2242584228515625, -0.21366119384765625, -0.20306396484375, -0.19246673583984375, -0.1818695068359375, -0.17127227783203125, -0.160675048828125, -0.15007781982421875, -0.1394805908203125, -0.12888336181640625, -0.1182861328125, -0.10768890380859375, -0.0970916748046875, -0.08649444580078125, -0.075897216796875, -0.06529998779296875, -0.0547027587890625, -0.04410552978515625, -0.03350830078125, -0.02291107177734375, -0.0123138427734375, -0.00171661376953125, 0.008880615234375, 0.01947784423828125, 0.0300750732421875, 0.04067230224609375, 0.05126953125, 0.06186676025390625, 0.0724639892578125, 0.08306121826171875, 0.093658447265625, 0.10425567626953125, 0.1148529052734375, 0.12545013427734375, 0.13604736328125, 0.14664459228515625, 0.1572418212890625, 0.16783905029296875, 0.178436279296875, 0.18903350830078125, 0.1996307373046875, 0.21022796630859375, 0.2208251953125, 0.23142242431640625, 0.2420196533203125, 0.25261688232421875, 0.263214111328125, 0.27381134033203125, 0.2844085693359375, 0.29500579833984375, 0.30560302734375, 0.31620025634765625, 0.3267974853515625, 0.33739471435546875, 0.347991943359375, 0.35858917236328125, 0.3691864013671875, 0.37978363037109375, 0.390380859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 7.0, 10.0, 7.0, 22.0, 29.0, 29.0, 49.0, 91.0, 119.0, 169.0, 158.0, 117.0, 66.0, 43.0, 21.0, 19.0, 20.0, 9.0, 9.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11322021484375, -0.10846805572509766, -0.10371589660644531, -0.09896373748779297, -0.09421157836914062, -0.08945941925048828, -0.08470726013183594, -0.0799551010131836, -0.07520294189453125, -0.0704507827758789, -0.06569862365722656, -0.06094646453857422, -0.056194305419921875, -0.05144214630126953, -0.04668998718261719, -0.041937828063964844, -0.0371856689453125, -0.032433509826660156, -0.027681350708007812, -0.02292919158935547, -0.018177032470703125, -0.013424873352050781, -0.008672714233398438, -0.003920555114746094, 0.00083160400390625, 0.005583763122558594, 0.010335922241210938, 0.015088081359863281, 0.019840240478515625, 0.02459239959716797, 0.029344558715820312, 0.034096717834472656, 0.038848876953125, 0.043601036071777344, 0.04835319519042969, 0.05310535430908203, 0.057857513427734375, 0.06260967254638672, 0.06736183166503906, 0.0721139907836914, 0.07686614990234375, 0.0816183090209961, 0.08637046813964844, 0.09112262725830078, 0.09587478637695312, 0.10062694549560547, 0.10537910461425781, 0.11013126373291016, 0.1148834228515625, 0.11963558197021484, 0.12438774108886719, 0.12913990020751953, 0.13389205932617188, 0.13864421844482422, 0.14339637756347656, 0.1481485366821289, 0.15290069580078125, 0.1576528549194336, 0.16240501403808594, 0.16715717315673828, 0.17190933227539062, 0.17666149139404297, 0.1814136505126953, 0.18616580963134766, 0.19091796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 7.0, 6.0, 8.0, 18.0, 13.0, 15.0, 14.0, 20.0, 20.0, 29.0, 23.0, 36.0, 34.0, 43.0, 45.0, 55.0, 127.0, 554.0, 9230.0, 890338.0, 145033.0, 2181.0, 295.0, 84.0, 58.0, 43.0, 22.0, 31.0, 33.0, 18.0, 22.0, 22.0, 13.0, 13.0, 11.0, 11.0, 6.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8560028076171875, -0.826263427734375, -0.7965240478515625, -0.76678466796875, -0.7370452880859375, -0.707305908203125, -0.6775665283203125, -0.6478271484375, -0.6180877685546875, -0.588348388671875, -0.5586090087890625, -0.52886962890625, -0.4991302490234375, -0.469390869140625, -0.4396514892578125, -0.409912109375, -0.3801727294921875, -0.350433349609375, -0.3206939697265625, -0.29095458984375, -0.2612152099609375, -0.231475830078125, -0.2017364501953125, -0.1719970703125, -0.1422576904296875, -0.112518310546875, -0.0827789306640625, -0.05303955078125, -0.0233001708984375, 0.006439208984375, 0.0361785888671875, 0.06591796875, 0.0956573486328125, 0.125396728515625, 0.1551361083984375, 0.18487548828125, 0.2146148681640625, 0.244354248046875, 0.2740936279296875, 0.3038330078125, 0.3335723876953125, 0.363311767578125, 0.3930511474609375, 0.42279052734375, 0.4525299072265625, 0.482269287109375, 0.5120086669921875, 0.541748046875, 0.5714874267578125, 0.601226806640625, 0.6309661865234375, 0.66070556640625, 0.6904449462890625, 0.720184326171875, 0.7499237060546875, 0.7796630859375, 0.8094024658203125, 0.839141845703125, 0.8688812255859375, 0.89862060546875, 0.9283599853515625, 0.958099365234375, 0.9878387451171875, 1.017578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 12.0, 10.0, 18.0, 14.0, 16.0, 19.0, 23.0, 24.0, 30.0, 41.0, 30.0, 43.0, 38.0, 38.0, 33.0, 46.0, 43.0, 43.0, 48.0, 41.0, 39.0, 36.0, 56.0, 30.0, 26.0, 27.0, 27.0, 28.0, 26.0, 12.0, 12.0, 13.0, 16.0, 7.0, 2.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15545082092285156, -0.15001296997070312, -0.1445751190185547, -0.13913726806640625, -0.1336994171142578, -0.12826156616210938, -0.12282371520996094, -0.1173858642578125, -0.11194801330566406, -0.10651016235351562, -0.10107231140136719, -0.09563446044921875, -0.09019660949707031, -0.08475875854492188, -0.07932090759277344, -0.073883056640625, -0.06844520568847656, -0.06300735473632812, -0.05756950378417969, -0.05213165283203125, -0.04669380187988281, -0.041255950927734375, -0.03581809997558594, -0.0303802490234375, -0.024942398071289062, -0.019504547119140625, -0.014066696166992188, -0.00862884521484375, -0.0031909942626953125, 0.002246856689453125, 0.0076847076416015625, 0.01312255859375, 0.018560409545898438, 0.023998260498046875, 0.029436111450195312, 0.03487396240234375, 0.04031181335449219, 0.045749664306640625, 0.05118751525878906, 0.0566253662109375, 0.06206321716308594, 0.06750106811523438, 0.07293891906738281, 0.07837677001953125, 0.08381462097167969, 0.08925247192382812, 0.09469032287597656, 0.100128173828125, 0.10556602478027344, 0.11100387573242188, 0.11644172668457031, 0.12187957763671875, 0.1273174285888672, 0.13275527954101562, 0.13819313049316406, 0.1436309814453125, 0.14906883239746094, 0.15450668334960938, 0.1599445343017578, 0.16538238525390625, 0.1708202362060547, 0.17625808715820312, 0.18169593811035156, 0.1871337890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 11.0, 12.0, 17.0, 27.0, 32.0, 52.0, 91.0, 163.0, 271.0, 475.0, 923.0, 1896.0, 4327.0, 11128.0, 36516.0, 182085.0, 632592.0, 132465.0, 29001.0, 9235.0, 3681.0, 1720.0, 826.0, 431.0, 205.0, 116.0, 88.0, 40.0, 36.0, 22.0, 22.0, 11.0, 13.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1361083984375, -0.1322650909423828, -0.12842178344726562, -0.12457847595214844, -0.12073516845703125, -0.11689186096191406, -0.11304855346679688, -0.10920524597167969, -0.1053619384765625, -0.10151863098144531, -0.09767532348632812, -0.09383201599121094, -0.08998870849609375, -0.08614540100097656, -0.08230209350585938, -0.07845878601074219, -0.074615478515625, -0.07077217102050781, -0.06692886352539062, -0.06308555603027344, -0.05924224853515625, -0.05539894104003906, -0.051555633544921875, -0.04771232604980469, -0.0438690185546875, -0.04002571105957031, -0.036182403564453125, -0.03233909606933594, -0.02849578857421875, -0.024652481079101562, -0.020809173583984375, -0.016965866088867188, -0.01312255859375, -0.009279251098632812, -0.005435943603515625, -0.0015926361083984375, 0.00225067138671875, 0.0060939788818359375, 0.009937286376953125, 0.013780593872070312, 0.0176239013671875, 0.021467208862304688, 0.025310516357421875, 0.029153823852539062, 0.03299713134765625, 0.03684043884277344, 0.040683746337890625, 0.04452705383300781, 0.048370361328125, 0.05221366882324219, 0.056056976318359375, 0.05990028381347656, 0.06374359130859375, 0.06758689880371094, 0.07143020629882812, 0.07527351379394531, 0.0791168212890625, 0.08296012878417969, 0.08680343627929688, 0.09064674377441406, 0.09449005126953125, 0.09833335876464844, 0.10217666625976562, 0.10601997375488281, 0.10986328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 9.0, 10.0, 9.0, 12.0, 13.0, 11.0, 22.0, 22.0, 36.0, 43.0, 57.0, 48.0, 78.0, 66.0, 86.0, 62.0, 80.0, 83.0, 51.0, 45.0, 27.0, 40.0, 12.0, 13.0, 19.0, 9.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.046627044677734e-06, -7.783062756061554e-06, -7.5194984674453735e-06, -7.255934178829193e-06, -6.992369890213013e-06, -6.728805601596832e-06, -6.465241312980652e-06, -6.2016770243644714e-06, -5.938112735748291e-06, -5.674548447132111e-06, -5.41098415851593e-06, -5.14741986989975e-06, -4.883855581283569e-06, -4.620291292667389e-06, -4.3567270040512085e-06, -4.093162715435028e-06, -3.829598426818848e-06, -3.5660341382026672e-06, -3.302469849586487e-06, -3.0389055609703064e-06, -2.775341272354126e-06, -2.5117769837379456e-06, -2.248212695121765e-06, -1.9846484065055847e-06, -1.7210841178894043e-06, -1.4575198292732239e-06, -1.1939555406570435e-06, -9.30391252040863e-07, -6.668269634246826e-07, -4.032626748085022e-07, -1.3969838619232178e-07, 1.2386590242385864e-07, 3.8743019104003906e-07, 6.509944796562195e-07, 9.145587682723999e-07, 1.1781230568885803e-06, 1.4416873455047607e-06, 1.7052516341209412e-06, 1.9688159227371216e-06, 2.232380211353302e-06, 2.4959444999694824e-06, 2.759508788585663e-06, 3.0230730772018433e-06, 3.2866373658180237e-06, 3.550201654434204e-06, 3.8137659430503845e-06, 4.077330231666565e-06, 4.340894520282745e-06, 4.604458808898926e-06, 4.868023097515106e-06, 5.131587386131287e-06, 5.395151674747467e-06, 5.6587159633636475e-06, 5.922280251979828e-06, 6.185844540596008e-06, 6.449408829212189e-06, 6.712973117828369e-06, 6.9765374064445496e-06, 7.24010169506073e-06, 7.50366598367691e-06, 7.76723027229309e-06, 8.030794560909271e-06, 8.294358849525452e-06, 8.557923138141632e-06, 8.821487426757812e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 4.0, 6.0, 8.0, 13.0, 14.0, 15.0, 30.0, 27.0, 41.0, 68.0, 104.0, 264.0, 1770.0, 162067.0, 878428.0, 4883.0, 382.0, 146.0, 62.0, 44.0, 37.0, 28.0, 24.0, 18.0, 18.0, 14.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3330078125, -0.3219642639160156, -0.31092071533203125, -0.2998771667480469, -0.2888336181640625, -0.2777900695800781, -0.26674652099609375, -0.2557029724121094, -0.244659423828125, -0.23361587524414062, -0.22257232666015625, -0.21152877807617188, -0.2004852294921875, -0.18944168090820312, -0.17839813232421875, -0.16735458374023438, -0.15631103515625, -0.14526748657226562, -0.13422393798828125, -0.12318038940429688, -0.1121368408203125, -0.10109329223632812, -0.09004974365234375, -0.07900619506835938, -0.067962646484375, -0.056919097900390625, -0.04587554931640625, -0.034832000732421875, -0.0237884521484375, -0.012744903564453125, -0.00170135498046875, 0.009342193603515625, 0.0203857421875, 0.031429290771484375, 0.04247283935546875, 0.053516387939453125, 0.0645599365234375, 0.07560348510742188, 0.08664703369140625, 0.09769058227539062, 0.108734130859375, 0.11977767944335938, 0.13082122802734375, 0.14186477661132812, 0.1529083251953125, 0.16395187377929688, 0.17499542236328125, 0.18603897094726562, 0.19708251953125, 0.20812606811523438, 0.21916961669921875, 0.23021316528320312, 0.2412567138671875, 0.2523002624511719, 0.26334381103515625, 0.2743873596191406, 0.285430908203125, 0.2964744567871094, 0.30751800537109375, 0.3185615539550781, 0.3296051025390625, 0.3406486511230469, 0.35169219970703125, 0.3627357482910156, 0.373779296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 5.0, 10.0, 14.0, 16.0, 19.0, 23.0, 26.0, 36.0, 46.0, 71.0, 59.0, 99.0, 85.0, 86.0, 76.0, 67.0, 46.0, 31.0, 34.0, 23.0, 23.0, 20.0, 16.0, 17.0, 11.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060638427734375, -0.05871772766113281, -0.056797027587890625, -0.05487632751464844, -0.05295562744140625, -0.05103492736816406, -0.049114227294921875, -0.04719352722167969, -0.0452728271484375, -0.04335212707519531, -0.041431427001953125, -0.03951072692871094, -0.03759002685546875, -0.03566932678222656, -0.033748626708984375, -0.03182792663574219, -0.0299072265625, -0.027986526489257812, -0.026065826416015625, -0.024145126342773438, -0.02222442626953125, -0.020303726196289062, -0.018383026123046875, -0.016462326049804688, -0.0145416259765625, -0.012620925903320312, -0.010700225830078125, -0.008779525756835938, -0.00685882568359375, -0.0049381256103515625, -0.003017425537109375, -0.0010967254638671875, 0.000823974609375, 0.0027446746826171875, 0.004665374755859375, 0.0065860748291015625, 0.00850677490234375, 0.010427474975585938, 0.012348175048828125, 0.014268875122070312, 0.0161895751953125, 0.018110275268554688, 0.020030975341796875, 0.021951675415039062, 0.02387237548828125, 0.025793075561523438, 0.027713775634765625, 0.029634475708007812, 0.03155517578125, 0.03347587585449219, 0.035396575927734375, 0.03731727600097656, 0.03923797607421875, 0.04115867614746094, 0.043079376220703125, 0.04500007629394531, 0.0469207763671875, 0.04884147644042969, 0.050762176513671875, 0.05268287658691406, 0.05460357666015625, 0.05652427673339844, 0.058444976806640625, 0.06036567687988281, 0.062286376953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 25.0, 444.0, 489.0, 44.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.230231285095215, -8.071907997131348, -7.913585662841797, -7.755262851715088, -7.596940040588379, -7.438616752624512, -7.280294418334961, -7.121971130371094, -6.963648319244385, -6.805325508117676, -6.647002696990967, -6.488679885864258, -6.330357074737549, -6.17203426361084, -6.013710975646973, -5.855388164520264, -5.697065353393555, -5.538742542266846, -5.380419731140137, -5.222096920013428, -5.063774108886719, -4.905450820922852, -4.747128486633301, -4.588805198669434, -4.430482864379883, -4.272160053253174, -4.113837242126465, -3.955514430999756, -3.7971913814544678, -3.638868570327759, -3.48054575920105, -3.3222227096557617, -3.163900136947632, -3.005577325820923, -2.847254514694214, -2.688931465148926, -2.530608654022217, -2.372285842895508, -2.213963031768799, -2.05564022064209, -1.8973172903060913, -1.7389944791793823, -1.5806715488433838, -1.4223487377166748, -1.2640259265899658, -1.1057029962539673, -0.9473801851272583, -0.7890572547912598, -0.6307344436645508, -0.472411572933197, -0.31408873200416565, -0.15576589107513428, 0.0025569796562194824, 0.16087985038757324, 0.3192026615142822, 0.47752559185028076, 0.6358484029769897, 0.7941712737083435, 0.9524941444396973, 1.1108169555664062, 1.2691397666931152, 1.4274626970291138, 1.5857855081558228, 1.7441084384918213, 1.9024312496185303]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 5.0, 5.0, 5.0, 7.0, 8.0, 12.0, 11.0, 15.0, 11.0, 24.0, 28.0, 16.0, 40.0, 45.0, 43.0, 42.0, 34.0, 35.0, 50.0, 51.0, 39.0, 41.0, 41.0, 45.0, 41.0, 34.0, 29.0, 29.0, 30.0, 30.0, 26.0, 21.0, 20.0, 21.0, 15.0, 15.0, 11.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8964300751686096, -0.8689583539962769, -0.8414866328239441, -0.8140149116516113, -0.7865432500839233, -0.7590715289115906, -0.7315998077392578, -0.704128086566925, -0.6766563653945923, -0.6491846442222595, -0.6217129230499268, -0.5942412614822388, -0.566769540309906, -0.5392978191375732, -0.5118260979652405, -0.4843543767929077, -0.45688268542289734, -0.4294109642505646, -0.4019392728805542, -0.37446755170822144, -0.34699583053588867, -0.3195241093635559, -0.29205241799354553, -0.26458069682121277, -0.2371089905500412, -0.20963728427886963, -0.18216556310653687, -0.1546938568353653, -0.12722215056419373, -0.09975042939186096, -0.07227872312068939, -0.04480700194835663, -0.01733529567718506, 0.010136416181921959, 0.037608128041028976, 0.06507983803749084, 0.09255155175924301, 0.12002326548099518, 0.14749497175216675, 0.1749666929244995, 0.20243839919567108, 0.22991010546684265, 0.2573818266391754, 0.2848535180091858, 0.31232523918151855, 0.3397969603538513, 0.3672686815261841, 0.39474040269851685, 0.4222120940685272, 0.44968381524086, 0.47715550661087036, 0.5046272277832031, 0.5320989489555359, 0.5595706701278687, 0.5870423316955566, 0.6145141124725342, 0.6419857740402222, 0.6694574952125549, 0.6969292163848877, 0.7244008779525757, 0.7518725991249084, 0.7793443202972412, 0.806816041469574, 0.8342877626419067, 0.8617594838142395]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 14.0, 22.0, 27.0, 37.0, 70.0, 90.0, 196.0, 368.0, 915.0, 3181.0, 14448.0, 261187.0, 3862930.0, 43225.0, 4818.0, 1323.0, 565.0, 319.0, 175.0, 115.0, 68.0, 37.0, 32.0, 19.0, 17.0, 15.0, 14.0, 7.0, 6.0, 4.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.27197265625, -0.2616233825683594, -0.25127410888671875, -0.24092483520507812, -0.2305755615234375, -0.22022628784179688, -0.20987701416015625, -0.19952774047851562, -0.189178466796875, -0.17882919311523438, -0.16847991943359375, -0.15813064575195312, -0.1477813720703125, -0.13743209838867188, -0.12708282470703125, -0.11673355102539062, -0.10638427734375, -0.09603500366210938, -0.08568572998046875, -0.07533645629882812, -0.0649871826171875, -0.054637908935546875, -0.04428863525390625, -0.033939361572265625, -0.023590087890625, -0.013240814208984375, -0.00289154052734375, 0.007457733154296875, 0.0178070068359375, 0.028156280517578125, 0.03850555419921875, 0.048854827880859375, 0.0592041015625, 0.06955337524414062, 0.07990264892578125, 0.09025192260742188, 0.1006011962890625, 0.11095046997070312, 0.12129974365234375, 0.13164901733398438, 0.141998291015625, 0.15234756469726562, 0.16269683837890625, 0.17304611206054688, 0.1833953857421875, 0.19374465942382812, 0.20409393310546875, 0.21444320678710938, 0.22479248046875, 0.23514175415039062, 0.24549102783203125, 0.2558403015136719, 0.2661895751953125, 0.2765388488769531, 0.28688812255859375, 0.2972373962402344, 0.307586669921875, 0.3179359436035156, 0.32828521728515625, 0.3386344909667969, 0.3489837646484375, 0.3593330383300781, 0.36968231201171875, 0.3800315856933594, 0.390380859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 14.0, 16.0, 17.0, 22.0, 37.0, 60.0, 98.0, 158.0, 184.0, 155.0, 74.0, 76.0, 24.0, 20.0, 18.0, 16.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.11033344268798828, -0.10561561584472656, -0.10089778900146484, -0.09617996215820312, -0.0914621353149414, -0.08674430847167969, -0.08202648162841797, -0.07730865478515625, -0.07259082794189453, -0.06787300109863281, -0.0631551742553711, -0.058437347412109375, -0.053719520568847656, -0.04900169372558594, -0.04428386688232422, -0.0395660400390625, -0.03484821319580078, -0.030130386352539062, -0.025412559509277344, -0.020694732666015625, -0.015976905822753906, -0.011259078979492188, -0.006541252136230469, -0.00182342529296875, 0.0028944015502929688, 0.0076122283935546875, 0.012330055236816406, 0.017047882080078125, 0.021765708923339844, 0.026483535766601562, 0.03120136260986328, 0.035919189453125, 0.04063701629638672, 0.04535484313964844, 0.050072669982910156, 0.054790496826171875, 0.059508323669433594, 0.06422615051269531, 0.06894397735595703, 0.07366180419921875, 0.07837963104248047, 0.08309745788574219, 0.0878152847290039, 0.09253311157226562, 0.09725093841552734, 0.10196876525878906, 0.10668659210205078, 0.1114044189453125, 0.11612224578857422, 0.12084007263183594, 0.12555789947509766, 0.13027572631835938, 0.1349935531616211, 0.1397113800048828, 0.14442920684814453, 0.14914703369140625, 0.15386486053466797, 0.1585826873779297, 0.1633005142211914, 0.16801834106445312, 0.17273616790771484, 0.17745399475097656, 0.18217182159423828, 0.1868896484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 23.0, 50.0, 115.0, 342.0, 1097.0, 11155.0, 1627359.0, 2539088.0, 13303.0, 1140.0, 306.0, 140.0, 58.0, 33.0, 29.0, 6.0, 5.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4560279846191406, -0.43915557861328125, -0.4222831726074219, -0.4054107666015625, -0.3885383605957031, -0.37166595458984375, -0.3547935485839844, -0.337921142578125, -0.3210487365722656, -0.30417633056640625, -0.2873039245605469, -0.2704315185546875, -0.2535591125488281, -0.23668670654296875, -0.21981430053710938, -0.20294189453125, -0.18606948852539062, -0.16919708251953125, -0.15232467651367188, -0.1354522705078125, -0.11857986450195312, -0.10170745849609375, -0.08483505249023438, -0.067962646484375, -0.051090240478515625, -0.03421783447265625, -0.017345428466796875, -0.0004730224609375, 0.016399383544921875, 0.03327178955078125, 0.050144195556640625, 0.0670166015625, 0.08388900756835938, 0.10076141357421875, 0.11763381958007812, 0.1345062255859375, 0.15137863159179688, 0.16825103759765625, 0.18512344360351562, 0.201995849609375, 0.21886825561523438, 0.23574066162109375, 0.2526130676269531, 0.2694854736328125, 0.2863578796386719, 0.30323028564453125, 0.3201026916503906, 0.33697509765625, 0.3538475036621094, 0.37071990966796875, 0.3875923156738281, 0.4044647216796875, 0.4213371276855469, 0.43820953369140625, 0.4550819396972656, 0.471954345703125, 0.4888267517089844, 0.5056991577148438, 0.5225715637207031, 0.5394439697265625, 0.5563163757324219, 0.5731887817382812, 0.5900611877441406, 0.60693359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 12.0, 8.0, 21.0, 41.0, 86.0, 158.0, 406.0, 752.0, 1302.0, 648.0, 283.0, 147.0, 96.0, 47.0, 31.0, 16.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.188446044921875, -0.18243408203125, -0.176422119140625, -0.17041015625, -0.164398193359375, -0.15838623046875, -0.152374267578125, -0.1463623046875, -0.140350341796875, -0.13433837890625, -0.128326416015625, -0.122314453125, -0.116302490234375, -0.11029052734375, -0.104278564453125, -0.0982666015625, -0.092254638671875, -0.08624267578125, -0.080230712890625, -0.07421875, -0.068206787109375, -0.06219482421875, -0.056182861328125, -0.0501708984375, -0.044158935546875, -0.03814697265625, -0.032135009765625, -0.026123046875, -0.020111083984375, -0.01409912109375, -0.008087158203125, -0.0020751953125, 0.003936767578125, 0.00994873046875, 0.015960693359375, 0.02197265625, 0.027984619140625, 0.03399658203125, 0.040008544921875, 0.0460205078125, 0.052032470703125, 0.05804443359375, 0.064056396484375, 0.070068359375, 0.076080322265625, 0.08209228515625, 0.088104248046875, 0.0941162109375, 0.100128173828125, 0.10614013671875, 0.112152099609375, 0.1181640625, 0.124176025390625, 0.13018798828125, 0.136199951171875, 0.1422119140625, 0.148223876953125, 0.15423583984375, 0.160247802734375, 0.166259765625, 0.172271728515625, 0.17828369140625, 0.184295654296875, 0.1903076171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 841.0, 172.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.509147644042969, -13.248595237731934, -12.988042831420898, -12.727490425109863, -12.466938018798828, -12.20638656616211, -11.945834159851074, -11.685281753540039, -11.424729347229004, -11.164176940917969, -10.903624534606934, -10.643072128295898, -10.38252067565918, -10.121968269348145, -9.86141586303711, -9.600863456726074, -9.340311050415039, -9.079758644104004, -8.819206237792969, -8.558653831481934, -8.298101425170898, -8.03754997253418, -7.7769975662231445, -7.516445159912109, -7.255892753601074, -6.995340347290039, -6.734787940979004, -6.474236011505127, -6.213683605194092, -5.953131198883057, -5.69257926940918, -5.4320268630981445, -5.171474933624268, -4.910922527313232, -4.6503705978393555, -4.38981819152832, -4.129265785217285, -3.86871337890625, -3.608161211013794, -3.347609043121338, -3.0870566368103027, -2.8265042304992676, -2.5659520626068115, -2.3053998947143555, -2.0448474884033203, -1.7842952013015747, -1.523742914199829, -1.2631906270980835, -1.002638339996338, -0.7420860528945923, -0.4815337657928467, -0.22098147869110107, 0.03957080841064453, 0.30012309551239014, 0.5606753826141357, 0.8212276697158813, 1.081779956817627, 1.3423322439193726, 1.6028845310211182, 1.8634368181228638, 2.1239891052246094, 2.3845415115356445, 2.6450936794281006, 2.9056458473205566, 3.166198253631592]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 14.0, 11.0, 20.0, 15.0, 24.0, 37.0, 39.0, 52.0, 50.0, 57.0, 70.0, 69.0, 76.0, 51.0, 63.0, 53.0, 55.0, 55.0, 39.0, 31.0, 28.0, 17.0, 16.0, 19.0, 15.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0], "bins": [-0.7734193801879883, -0.7562493681907654, -0.7390792965888977, -0.7219092845916748, -0.7047392725944519, -0.687569260597229, -0.6703991889953613, -0.6532291769981384, -0.6360591650009155, -0.6188891530036926, -0.601719081401825, -0.584549069404602, -0.5673790574073792, -0.5502090454101562, -0.5330389738082886, -0.5158689618110657, -0.498698890209198, -0.4815288484096527, -0.4643588364124298, -0.4471887946128845, -0.4300187826156616, -0.41284874081611633, -0.39567869901657104, -0.37850868701934814, -0.36133864521980286, -0.34416860342025757, -0.32699859142303467, -0.3098285496234894, -0.2926585078239441, -0.2754884958267212, -0.2583184540271759, -0.2411484271287918, -0.2239784598350525, -0.2068084329366684, -0.1896384060382843, -0.172468364238739, -0.15529833734035492, -0.13812831044197083, -0.12095827609300613, -0.10378824174404144, -0.08661821484565735, -0.06944818794727325, -0.05227815359830856, -0.03510812297463417, -0.017938092350959778, -0.0007680654525756836, 0.016401968896389008, 0.0335720032453537, 0.05074203014373779, 0.06791205704212189, 0.08508209139108658, 0.10225212574005127, 0.11942215263843536, 0.13659217953681946, 0.15376222133636475, 0.17093224823474884, 0.18810227513313293, 0.20527230203151703, 0.22244232892990112, 0.2396123707294464, 0.2567824125289917, 0.2739524245262146, 0.2911224663257599, 0.3082925081253052, 0.3254625201225281]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 8.0, 16.0, 25.0, 31.0, 33.0, 41.0, 70.0, 92.0, 137.0, 169.0, 268.0, 496.0, 953.0, 2153.0, 6210.0, 24996.0, 215567.0, 707223.0, 70408.0, 12782.0, 3628.0, 1432.0, 624.0, 366.0, 217.0, 155.0, 107.0, 66.0, 45.0, 40.0, 32.0, 30.0, 15.0, 18.0, 13.0, 9.0, 7.0, 9.0, 5.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4086418151855469, -0.39418792724609375, -0.3797340393066406, -0.3652801513671875, -0.3508262634277344, -0.33637237548828125, -0.3219184875488281, -0.307464599609375, -0.2930107116699219, -0.27855682373046875, -0.2641029357910156, -0.2496490478515625, -0.23519515991210938, -0.22074127197265625, -0.20628738403320312, -0.19183349609375, -0.17737960815429688, -0.16292572021484375, -0.14847183227539062, -0.1340179443359375, -0.11956405639648438, -0.10511016845703125, -0.09065628051757812, -0.076202392578125, -0.061748504638671875, -0.04729461669921875, -0.032840728759765625, -0.0183868408203125, -0.003932952880859375, 0.01052093505859375, 0.024974822998046875, 0.0394287109375, 0.053882598876953125, 0.06833648681640625, 0.08279037475585938, 0.0972442626953125, 0.11169815063476562, 0.12615203857421875, 0.14060592651367188, 0.155059814453125, 0.16951370239257812, 0.18396759033203125, 0.19842147827148438, 0.2128753662109375, 0.22732925415039062, 0.24178314208984375, 0.2562370300292969, 0.27069091796875, 0.2851448059082031, 0.29959869384765625, 0.3140525817871094, 0.3285064697265625, 0.3429603576660156, 0.35741424560546875, 0.3718681335449219, 0.386322021484375, 0.4007759094238281, 0.41522979736328125, 0.4296836853027344, 0.4441375732421875, 0.4585914611816406, 0.47304534912109375, 0.4874992370605469, 0.501953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 10.0, 8.0, 14.0, 21.0, 35.0, 39.0, 78.0, 121.0, 188.0, 184.0, 120.0, 72.0, 39.0, 26.0, 18.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.117919921875, -0.11318397521972656, -0.10844802856445312, -0.10371208190917969, -0.09897613525390625, -0.09424018859863281, -0.08950424194335938, -0.08476829528808594, -0.0800323486328125, -0.07529640197753906, -0.07056045532226562, -0.06582450866699219, -0.06108856201171875, -0.05635261535644531, -0.051616668701171875, -0.04688072204589844, -0.042144775390625, -0.03740882873535156, -0.032672882080078125, -0.027936935424804688, -0.02320098876953125, -0.018465042114257812, -0.013729095458984375, -0.008993148803710938, -0.0042572021484375, 0.0004787445068359375, 0.005214691162109375, 0.009950637817382812, 0.01468658447265625, 0.019422531127929688, 0.024158477783203125, 0.028894424438476562, 0.03363037109375, 0.03836631774902344, 0.043102264404296875, 0.04783821105957031, 0.05257415771484375, 0.05731010437011719, 0.062046051025390625, 0.06678199768066406, 0.0715179443359375, 0.07625389099121094, 0.08098983764648438, 0.08572578430175781, 0.09046173095703125, 0.09519767761230469, 0.09993362426757812, 0.10466957092285156, 0.109405517578125, 0.11414146423339844, 0.11887741088867188, 0.12361335754394531, 0.12834930419921875, 0.1330852508544922, 0.13782119750976562, 0.14255714416503906, 0.1472930908203125, 0.15202903747558594, 0.15676498413085938, 0.1615009307861328, 0.16623687744140625, 0.1709728240966797, 0.17570877075195312, 0.18044471740722656, 0.1851806640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 5.0, 2.0, 11.0, 11.0, 10.0, 14.0, 15.0, 21.0, 30.0, 55.0, 48.0, 64.0, 87.0, 108.0, 177.0, 267.0, 580.0, 1453.0, 4693.0, 19233.0, 130061.0, 667440.0, 189855.0, 25072.0, 5812.0, 1739.0, 614.0, 347.0, 201.0, 126.0, 91.0, 83.0, 39.0, 45.0, 35.0, 26.0, 14.0, 14.0, 18.0, 9.0, 4.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.447998046875, -0.4350433349609375, -0.422088623046875, -0.4091339111328125, -0.39617919921875, -0.3832244873046875, -0.370269775390625, -0.3573150634765625, -0.3443603515625, -0.3314056396484375, -0.318450927734375, -0.3054962158203125, -0.29254150390625, -0.2795867919921875, -0.266632080078125, -0.2536773681640625, -0.24072265625, -0.2277679443359375, -0.214813232421875, -0.2018585205078125, -0.18890380859375, -0.1759490966796875, -0.162994384765625, -0.1500396728515625, -0.1370849609375, -0.1241302490234375, -0.111175537109375, -0.0982208251953125, -0.08526611328125, -0.0723114013671875, -0.059356689453125, -0.0464019775390625, -0.033447265625, -0.0204925537109375, -0.007537841796875, 0.0054168701171875, 0.01837158203125, 0.0313262939453125, 0.044281005859375, 0.0572357177734375, 0.0701904296875, 0.0831451416015625, 0.096099853515625, 0.1090545654296875, 0.12200927734375, 0.1349639892578125, 0.147918701171875, 0.1608734130859375, 0.173828125, 0.1867828369140625, 0.199737548828125, 0.2126922607421875, 0.22564697265625, 0.2386016845703125, 0.251556396484375, 0.2645111083984375, 0.2774658203125, 0.2904205322265625, 0.303375244140625, 0.3163299560546875, 0.32928466796875, 0.3422393798828125, 0.355194091796875, 0.3681488037109375, 0.381103515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 5.0, 18.0, 17.0, 14.0, 22.0, 24.0, 29.0, 28.0, 32.0, 46.0, 52.0, 45.0, 41.0, 42.0, 55.0, 47.0, 50.0, 52.0, 44.0, 42.0, 38.0, 39.0, 36.0, 36.0, 16.0, 16.0, 16.0, 12.0, 8.0, 11.0, 5.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.14111328125, -0.13638687133789062, -0.13166046142578125, -0.12693405151367188, -0.1222076416015625, -0.11748123168945312, -0.11275482177734375, -0.10802841186523438, -0.103302001953125, -0.09857559204101562, -0.09384918212890625, -0.08912277221679688, -0.0843963623046875, -0.07966995239257812, -0.07494354248046875, -0.07021713256835938, -0.06549072265625, -0.060764312744140625, -0.05603790283203125, -0.051311492919921875, -0.0465850830078125, -0.041858673095703125, -0.03713226318359375, -0.032405853271484375, -0.027679443359375, -0.022953033447265625, -0.01822662353515625, -0.013500213623046875, -0.0087738037109375, -0.004047393798828125, 0.00067901611328125, 0.005405426025390625, 0.0101318359375, 0.014858245849609375, 0.01958465576171875, 0.024311065673828125, 0.0290374755859375, 0.033763885498046875, 0.03849029541015625, 0.043216705322265625, 0.047943115234375, 0.052669525146484375, 0.05739593505859375, 0.062122344970703125, 0.0668487548828125, 0.07157516479492188, 0.07630157470703125, 0.08102798461914062, 0.08575439453125, 0.09048080444335938, 0.09520721435546875, 0.09993362426757812, 0.1046600341796875, 0.10938644409179688, 0.11411285400390625, 0.11883926391601562, 0.123565673828125, 0.12829208374023438, 0.13301849365234375, 0.13774490356445312, 0.1424713134765625, 0.14719772338867188, 0.15192413330078125, 0.15665054321289062, 0.161376953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 6.0, 9.0, 15.0, 23.0, 33.0, 41.0, 63.0, 99.0, 137.0, 174.0, 301.0, 422.0, 664.0, 1098.0, 1791.0, 3217.0, 5830.0, 12057.0, 31040.0, 121802.0, 478653.0, 290933.0, 61233.0, 19482.0, 8559.0, 4406.0, 2479.0, 1490.0, 888.0, 504.0, 376.0, 244.0, 128.0, 84.0, 81.0, 41.0, 40.0, 29.0, 16.0, 10.0, 9.0, 9.0, 14.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1444091796875, -0.1395587921142578, -0.13470840454101562, -0.12985801696777344, -0.12500762939453125, -0.12015724182128906, -0.11530685424804688, -0.11045646667480469, -0.1056060791015625, -0.10075569152832031, -0.09590530395507812, -0.09105491638183594, -0.08620452880859375, -0.08135414123535156, -0.07650375366210938, -0.07165336608886719, -0.066802978515625, -0.06195259094238281, -0.057102203369140625, -0.05225181579589844, -0.04740142822265625, -0.04255104064941406, -0.037700653076171875, -0.03285026550292969, -0.0279998779296875, -0.023149490356445312, -0.018299102783203125, -0.013448715209960938, -0.00859832763671875, -0.0037479400634765625, 0.001102447509765625, 0.0059528350830078125, 0.01080322265625, 0.015653610229492188, 0.020503997802734375, 0.025354385375976562, 0.03020477294921875, 0.03505516052246094, 0.039905548095703125, 0.04475593566894531, 0.0496063232421875, 0.05445671081542969, 0.059307098388671875, 0.06415748596191406, 0.06900787353515625, 0.07385826110839844, 0.07870864868164062, 0.08355903625488281, 0.088409423828125, 0.09325981140136719, 0.09811019897460938, 0.10296058654785156, 0.10781097412109375, 0.11266136169433594, 0.11751174926757812, 0.12236213684082031, 0.1272125244140625, 0.1320629119873047, 0.13691329956054688, 0.14176368713378906, 0.14661407470703125, 0.15146446228027344, 0.15631484985351562, 0.1611652374267578, 0.166015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 20.0, 40.0, 78.0, 142.0, 215.0, 219.0, 131.0, 55.0, 23.0, 15.0, 11.0, 9.0, 1.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.713369369506836e-05, -3.606826066970825e-05, -3.5002827644348145e-05, -3.393739461898804e-05, -3.287196159362793e-05, -3.180652856826782e-05, -3.0741095542907715e-05, -2.9675662517547607e-05, -2.86102294921875e-05, -2.7544796466827393e-05, -2.6479363441467285e-05, -2.5413930416107178e-05, -2.434849739074707e-05, -2.3283064365386963e-05, -2.2217631340026855e-05, -2.1152198314666748e-05, -2.008676528930664e-05, -1.9021332263946533e-05, -1.7955899238586426e-05, -1.689046621322632e-05, -1.582503318786621e-05, -1.4759600162506104e-05, -1.3694167137145996e-05, -1.2628734111785889e-05, -1.1563301086425781e-05, -1.0497868061065674e-05, -9.432435035705566e-06, -8.367002010345459e-06, -7.3015689849853516e-06, -6.236135959625244e-06, -5.170702934265137e-06, -4.105269908905029e-06, -3.039836883544922e-06, -1.9744038581848145e-06, -9.08970832824707e-07, 1.564621925354004e-07, 1.2218952178955078e-06, 2.2873282432556152e-06, 3.3527612686157227e-06, 4.41819429397583e-06, 5.4836273193359375e-06, 6.549060344696045e-06, 7.614493370056152e-06, 8.67992639541626e-06, 9.745359420776367e-06, 1.0810792446136475e-05, 1.1876225471496582e-05, 1.294165849685669e-05, 1.4007091522216797e-05, 1.5072524547576904e-05, 1.6137957572937012e-05, 1.720339059829712e-05, 1.8268823623657227e-05, 1.9334256649017334e-05, 2.039968967437744e-05, 2.146512269973755e-05, 2.2530555725097656e-05, 2.3595988750457764e-05, 2.466142177581787e-05, 2.572685480117798e-05, 2.6792287826538086e-05, 2.7857720851898193e-05, 2.89231538772583e-05, 2.9988586902618408e-05, 3.1054019927978516e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 7.0, 14.0, 13.0, 20.0, 32.0, 39.0, 78.0, 96.0, 174.0, 306.0, 591.0, 1506.0, 4144.0, 16810.0, 118648.0, 670849.0, 201692.0, 24309.0, 5645.0, 1888.0, 749.0, 383.0, 191.0, 118.0, 66.0, 49.0, 32.0, 28.0, 16.0, 9.0, 11.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1845703125, -0.1785411834716797, -0.17251205444335938, -0.16648292541503906, -0.16045379638671875, -0.15442466735839844, -0.14839553833007812, -0.1423664093017578, -0.1363372802734375, -0.1303081512451172, -0.12427902221679688, -0.11824989318847656, -0.11222076416015625, -0.10619163513183594, -0.10016250610351562, -0.09413337707519531, -0.088104248046875, -0.08207511901855469, -0.07604598999023438, -0.07001686096191406, -0.06398773193359375, -0.05795860290527344, -0.051929473876953125, -0.04590034484863281, -0.0398712158203125, -0.03384208679199219, -0.027812957763671875, -0.021783828735351562, -0.01575469970703125, -0.009725570678710938, -0.003696441650390625, 0.0023326873779296875, 0.00836181640625, 0.014390945434570312, 0.020420074462890625, 0.026449203491210938, 0.03247833251953125, 0.03850746154785156, 0.044536590576171875, 0.05056571960449219, 0.0565948486328125, 0.06262397766113281, 0.06865310668945312, 0.07468223571777344, 0.08071136474609375, 0.08674049377441406, 0.09276962280273438, 0.09879875183105469, 0.104827880859375, 0.11085700988769531, 0.11688613891601562, 0.12291526794433594, 0.12894439697265625, 0.13497352600097656, 0.14100265502929688, 0.1470317840576172, 0.1530609130859375, 0.1590900421142578, 0.16511917114257812, 0.17114830017089844, 0.17717742919921875, 0.18320655822753906, 0.18923568725585938, 0.1952648162841797, 0.2012939453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 7.0, 14.0, 20.0, 12.0, 21.0, 33.0, 35.0, 56.0, 42.0, 54.0, 69.0, 71.0, 76.0, 80.0, 73.0, 76.0, 40.0, 44.0, 37.0, 27.0, 18.0, 18.0, 13.0, 6.0, 7.0, 5.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06829833984375, -0.06624031066894531, -0.06418228149414062, -0.06212425231933594, -0.06006622314453125, -0.05800819396972656, -0.055950164794921875, -0.05389213562011719, -0.0518341064453125, -0.04977607727050781, -0.047718048095703125, -0.04566001892089844, -0.04360198974609375, -0.04154396057128906, -0.039485931396484375, -0.03742790222167969, -0.035369873046875, -0.03331184387207031, -0.031253814697265625, -0.029195785522460938, -0.02713775634765625, -0.025079727172851562, -0.023021697998046875, -0.020963668823242188, -0.0189056396484375, -0.016847610473632812, -0.014789581298828125, -0.012731552124023438, -0.01067352294921875, -0.008615493774414062, -0.006557464599609375, -0.0044994354248046875, -0.00244140625, -0.0003833770751953125, 0.001674652099609375, 0.0037326812744140625, 0.00579071044921875, 0.007848739624023438, 0.009906768798828125, 0.011964797973632812, 0.0140228271484375, 0.016080856323242188, 0.018138885498046875, 0.020196914672851562, 0.02225494384765625, 0.024312973022460938, 0.026371002197265625, 0.028429031372070312, 0.030487060546875, 0.03254508972167969, 0.034603118896484375, 0.03666114807128906, 0.03871917724609375, 0.04077720642089844, 0.042835235595703125, 0.04489326477050781, 0.0469512939453125, 0.04900932312011719, 0.051067352294921875, 0.05312538146972656, 0.05518341064453125, 0.05724143981933594, 0.059299468994140625, 0.06135749816894531, 0.06341552734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 30.0, 91.0, 225.0, 288.0, 203.0, 98.0, 29.0, 17.0, 7.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.949930191040039, -1.9041064977645874, -1.8582826852798462, -1.8124589920043945, -1.7666351795196533, -1.7208114862442017, -1.67498779296875, -1.6291639804840088, -1.5833401679992676, -1.537516474723816, -1.4916926622390747, -1.445868968963623, -1.4000451564788818, -1.3542214632034302, -1.3083977699279785, -1.2625739574432373, -1.2167502641677856, -1.170926570892334, -1.1251027584075928, -1.0792790651321411, -1.0334552526474, -0.9876315593719482, -0.9418078064918518, -0.8959840536117554, -0.8501603007316589, -0.8043365478515625, -0.7585127949714661, -0.7126890420913696, -0.666865348815918, -0.6210415363311768, -0.5752178430557251, -0.5293940901756287, -0.48357027769088745, -0.437746524810791, -0.3919227719306946, -0.34609904885292053, -0.3002752959728241, -0.25445154309272766, -0.2086278200149536, -0.16280406713485718, -0.11698031425476074, -0.0711565688252449, -0.025332823395729065, 0.020490914583206177, 0.06631466746330261, 0.11213842034339905, 0.1579621434211731, 0.20378589630126953, 0.24960964918136597, 0.2954334020614624, 0.34125715494155884, 0.3870808780193329, 0.4329046308994293, 0.47872838377952576, 0.5245521068572998, 0.5703758597373962, 0.6161996126174927, 0.6620233654975891, 0.7078471183776855, 0.7536708116531372, 0.7994946241378784, 0.8453183174133301, 0.8911420702934265, 0.936965823173523, 0.9827895760536194]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 12.0, 9.0, 14.0, 12.0, 16.0, 21.0, 25.0, 28.0, 41.0, 33.0, 40.0, 36.0, 53.0, 57.0, 51.0, 47.0, 60.0, 43.0, 50.0, 42.0, 51.0, 48.0, 37.0, 31.0, 29.0, 24.0, 24.0, 14.0, 16.0, 10.0, 8.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46683305501937866, -0.4494871497154236, -0.4321412742137909, -0.4147953689098358, -0.3974494934082031, -0.38010358810424805, -0.36275768280029297, -0.3454118072986603, -0.3280659317970276, -0.3107200264930725, -0.2933741509914398, -0.27602824568748474, -0.25868237018585205, -0.24133646488189697, -0.2239905744791031, -0.2066446840763092, -0.18929877877235413, -0.17195288836956024, -0.15460699796676636, -0.13726109266281128, -0.11991520971059799, -0.10256931930780411, -0.08522342145442963, -0.06787753105163574, -0.05053164064884186, -0.033185750246047974, -0.01583985611796379, 0.0015060380101203918, 0.018851928412914276, 0.03619781881570816, 0.05354371666908264, 0.07088960707187653, 0.08823549747467041, 0.1055813878774643, 0.12292727828025818, 0.14027318358421326, 0.15761905908584595, 0.17496496438980103, 0.1923108547925949, 0.2096567451953888, 0.22700263559818268, 0.24434852600097656, 0.26169443130493164, 0.27904030680656433, 0.2963862121105194, 0.3137320876121521, 0.3310779929161072, 0.34842389822006226, 0.36576977372169495, 0.38311567902565, 0.4004615545272827, 0.4178074598312378, 0.4351533353328705, 0.45249924063682556, 0.46984511613845825, 0.48719102144241333, 0.5045369267463684, 0.5218828320503235, 0.5392287373542786, 0.5565745830535889, 0.573920488357544, 0.591266393661499, 0.6086122989654541, 0.6259582042694092, 0.6433040499687195]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 7.0, 11.0, 19.0, 32.0, 48.0, 114.0, 201.0, 434.0, 1074.0, 3338.0, 8619.0, 32320.0, 686462.0, 3356012.0, 89788.0, 10549.0, 2668.0, 990.0, 542.0, 350.0, 182.0, 128.0, 96.0, 69.0, 52.0, 38.0, 34.0, 18.0, 11.0, 15.0, 13.0, 5.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.1614990234375, -0.1548328399658203, -0.14816665649414062, -0.14150047302246094, -0.13483428955078125, -0.12816810607910156, -0.12150192260742188, -0.11483573913574219, -0.1081695556640625, -0.10150337219238281, -0.09483718872070312, -0.08817100524902344, -0.08150482177734375, -0.07483863830566406, -0.06817245483398438, -0.06150627136230469, -0.054840087890625, -0.04817390441894531, -0.041507720947265625, -0.03484153747558594, -0.02817535400390625, -0.021509170532226562, -0.014842987060546875, -0.008176803588867188, -0.0015106201171875, 0.0051555633544921875, 0.011821746826171875, 0.018487930297851562, 0.02515411376953125, 0.03182029724121094, 0.038486480712890625, 0.04515266418457031, 0.05181884765625, 0.05848503112792969, 0.06515121459960938, 0.07181739807128906, 0.07848358154296875, 0.08514976501464844, 0.09181594848632812, 0.09848213195800781, 0.1051483154296875, 0.11181449890136719, 0.11848068237304688, 0.12514686584472656, 0.13181304931640625, 0.13847923278808594, 0.14514541625976562, 0.1518115997314453, 0.158477783203125, 0.1651439666748047, 0.17181015014648438, 0.17847633361816406, 0.18514251708984375, 0.19180870056152344, 0.19847488403320312, 0.2051410675048828, 0.2118072509765625, 0.2184734344482422, 0.22513961791992188, 0.23180580139160156, 0.23847198486328125, 0.24513816833496094, 0.2518043518066406, 0.2584705352783203, 0.26513671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 20.0, 5.0, 31.0, 33.0, 44.0, 103.0, 148.0, 164.0, 174.0, 99.0, 69.0, 39.0, 21.0, 18.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1083984375, -0.10380744934082031, -0.09921646118164062, -0.09462547302246094, -0.09003448486328125, -0.08544349670410156, -0.08085250854492188, -0.07626152038574219, -0.0716705322265625, -0.06707954406738281, -0.062488555908203125, -0.05789756774902344, -0.05330657958984375, -0.04871559143066406, -0.044124603271484375, -0.03953361511230469, -0.034942626953125, -0.030351638793945312, -0.025760650634765625, -0.021169662475585938, -0.01657867431640625, -0.011987686157226562, -0.007396697998046875, -0.0028057098388671875, 0.0017852783203125, 0.0063762664794921875, 0.010967254638671875, 0.015558242797851562, 0.02014923095703125, 0.024740219116210938, 0.029331207275390625, 0.03392219543457031, 0.03851318359375, 0.04310417175292969, 0.047695159912109375, 0.05228614807128906, 0.05687713623046875, 0.06146812438964844, 0.06605911254882812, 0.07065010070800781, 0.0752410888671875, 0.07983207702636719, 0.08442306518554688, 0.08901405334472656, 0.09360504150390625, 0.09819602966308594, 0.10278701782226562, 0.10737800598144531, 0.111968994140625, 0.11655998229980469, 0.12115097045898438, 0.12574195861816406, 0.13033294677734375, 0.13492393493652344, 0.13951492309570312, 0.1441059112548828, 0.1486968994140625, 0.1532878875732422, 0.15787887573242188, 0.16246986389160156, 0.16706085205078125, 0.17165184020996094, 0.17624282836914062, 0.1808338165283203, 0.1854248046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 9.0, 22.0, 15.0, 50.0, 41.0, 80.0, 127.0, 198.0, 339.0, 659.0, 1361.0, 3634.0, 12804.0, 64373.0, 485962.0, 2799461.0, 713415.0, 87696.0, 16391.0, 4299.0, 1605.0, 754.0, 358.0, 204.0, 145.0, 86.0, 50.0, 32.0, 34.0, 12.0, 12.0, 11.0, 9.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13652992248535156, -0.13158035278320312, -0.1266307830810547, -0.12168121337890625, -0.11673164367675781, -0.11178207397460938, -0.10683250427246094, -0.1018829345703125, -0.09693336486816406, -0.09198379516601562, -0.08703422546386719, -0.08208465576171875, -0.07713508605957031, -0.07218551635742188, -0.06723594665527344, -0.062286376953125, -0.05733680725097656, -0.052387237548828125, -0.04743766784667969, -0.04248809814453125, -0.03753852844238281, -0.032588958740234375, -0.027639389038085938, -0.0226898193359375, -0.017740249633789062, -0.012790679931640625, -0.007841110229492188, -0.00289154052734375, 0.0020580291748046875, 0.007007598876953125, 0.011957168579101562, 0.01690673828125, 0.021856307983398438, 0.026805877685546875, 0.03175544738769531, 0.03670501708984375, 0.04165458679199219, 0.046604156494140625, 0.05155372619628906, 0.0565032958984375, 0.06145286560058594, 0.06640243530273438, 0.07135200500488281, 0.07630157470703125, 0.08125114440917969, 0.08620071411132812, 0.09115028381347656, 0.096099853515625, 0.10104942321777344, 0.10599899291992188, 0.11094856262207031, 0.11589813232421875, 0.12084770202636719, 0.12579727172851562, 0.13074684143066406, 0.1356964111328125, 0.14064598083496094, 0.14559555053710938, 0.1505451202392578, 0.15549468994140625, 0.1604442596435547, 0.16539382934570312, 0.17034339904785156, 0.17529296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 12.0, 5.0, 14.0, 12.0, 22.0, 49.0, 43.0, 80.0, 111.0, 134.0, 161.0, 251.0, 304.0, 396.0, 424.0, 461.0, 406.0, 299.0, 215.0, 155.0, 138.0, 109.0, 56.0, 46.0, 38.0, 29.0, 21.0, 24.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.1123046875, -0.10935401916503906, -0.10640335083007812, -0.10345268249511719, -0.10050201416015625, -0.09755134582519531, -0.09460067749023438, -0.09165000915527344, -0.0886993408203125, -0.08574867248535156, -0.08279800415039062, -0.07984733581542969, -0.07689666748046875, -0.07394599914550781, -0.07099533081054688, -0.06804466247558594, -0.065093994140625, -0.06214332580566406, -0.059192657470703125, -0.05624198913574219, -0.05329132080078125, -0.05034065246582031, -0.047389984130859375, -0.04443931579589844, -0.0414886474609375, -0.03853797912597656, -0.035587310791015625, -0.03263664245605469, -0.02968597412109375, -0.026735305786132812, -0.023784637451171875, -0.020833969116210938, -0.01788330078125, -0.014932632446289062, -0.011981964111328125, -0.009031295776367188, -0.00608062744140625, -0.0031299591064453125, -0.000179290771484375, 0.0027713775634765625, 0.0057220458984375, 0.008672714233398438, 0.011623382568359375, 0.014574050903320312, 0.01752471923828125, 0.020475387573242188, 0.023426055908203125, 0.026376724243164062, 0.029327392578125, 0.03227806091308594, 0.035228729248046875, 0.03817939758300781, 0.04113006591796875, 0.04408073425292969, 0.047031402587890625, 0.04998207092285156, 0.0529327392578125, 0.05588340759277344, 0.058834075927734375, 0.06178474426269531, 0.06473541259765625, 0.06768608093261719, 0.07063674926757812, 0.07358741760253906, 0.0765380859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 23.0, 52.0, 147.0, 253.0, 249.0, 147.0, 65.0, 42.0, 13.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4258193373680115, -0.393331378698349, -0.36084339022636414, -0.32835543155670166, -0.2958674430847168, -0.2633794844150543, -0.23089152574539185, -0.19840355217456818, -0.1659155786037445, -0.13342760503292084, -0.10093963891267776, -0.06845167279243469, -0.03596369922161102, -0.0034757256507873535, 0.029012233018875122, 0.06150020658969879, 0.09398818016052246, 0.12647615373134613, 0.1589641273021698, 0.19145208597183228, 0.22394005954265594, 0.2564280331134796, 0.2889159917831421, 0.32140398025512695, 0.35389193892478943, 0.3863798975944519, 0.41886788606643677, 0.45135584473609924, 0.4838438034057617, 0.5163317918777466, 0.5488197803497314, 0.5813077092170715, 0.6137956380844116, 0.6462836265563965, 0.6787715554237366, 0.7112595438957214, 0.7437475323677063, 0.7762354612350464, 0.8087234497070312, 0.8412114381790161, 0.873699426651001, 0.9061874151229858, 0.9386753439903259, 0.9711633324623108, 1.0036512613296509, 1.0361392498016357, 1.0686272382736206, 1.1011152267456055, 1.1336030960083008, 1.1660910844802856, 1.1985790729522705, 1.2310669422149658, 1.2635549306869507, 1.2960429191589355, 1.3285309076309204, 1.3610188961029053, 1.3935068845748901, 1.425994873046875, 1.4584828615188599, 1.4909708499908447, 1.52345871925354, 1.555946707725525, 1.5884346961975098, 1.6209226846694946, 1.6534106731414795]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 8.0, 13.0, 14.0, 14.0, 16.0, 23.0, 25.0, 26.0, 40.0, 33.0, 29.0, 41.0, 33.0, 45.0, 45.0, 60.0, 48.0, 44.0, 34.0, 43.0, 32.0, 39.0, 33.0, 31.0, 24.0, 31.0, 21.0, 18.0, 16.0, 18.0, 12.0, 16.0, 15.0, 6.0, 10.0, 7.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31851905584335327, -0.30708131194114685, -0.29564356803894043, -0.284205824136734, -0.2727680802345276, -0.26133033633232117, -0.24989260733127594, -0.23845486342906952, -0.2270171195268631, -0.21557937562465668, -0.20414163172245026, -0.19270390272140503, -0.1812661588191986, -0.1698284149169922, -0.15839067101478577, -0.14695292711257935, -0.13551518321037292, -0.1240774393081665, -0.11263969540596008, -0.10120195895433426, -0.08976421505212784, -0.07832647114992142, -0.0668887346982956, -0.05545099079608917, -0.04401324689388275, -0.03257550299167633, -0.021137762814760208, -0.009700022637844086, 0.0017377212643623352, 0.013175465166568756, 0.02461320161819458, 0.036050945520401, 0.04748868942260742, 0.05892643332481384, 0.07036417722702026, 0.08180191367864609, 0.09323965758085251, 0.10467740148305893, 0.11611513793468475, 0.12755288183689117, 0.1389906257390976, 0.15042836964130402, 0.16186611354351044, 0.17330384254455566, 0.18474158644676208, 0.1961793303489685, 0.20761707425117493, 0.21905481815338135, 0.23049256205558777, 0.2419303059577942, 0.2533680498600006, 0.26480579376220703, 0.27624353766441345, 0.2876812815666199, 0.2991189956665039, 0.3105567693710327, 0.32199448347091675, 0.33343222737312317, 0.3448699712753296, 0.356307715177536, 0.36774545907974243, 0.37918320298194885, 0.3906209468841553, 0.4020586609840393, 0.4134964346885681]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 4.0, 9.0, 10.0, 8.0, 23.0, 14.0, 26.0, 43.0, 66.0, 80.0, 125.0, 211.0, 361.0, 665.0, 1801.0, 6431.0, 42057.0, 555519.0, 401795.0, 30946.0, 5328.0, 1447.0, 589.0, 349.0, 192.0, 134.0, 92.0, 56.0, 56.0, 34.0, 19.0, 11.0, 14.0, 13.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.49462127685546875, -0.4775238037109375, -0.46042633056640625, -0.443328857421875, -0.42623138427734375, -0.4091339111328125, -0.39203643798828125, -0.37493896484375, -0.35784149169921875, -0.3407440185546875, -0.32364654541015625, -0.306549072265625, -0.28945159912109375, -0.2723541259765625, -0.25525665283203125, -0.2381591796875, -0.22106170654296875, -0.2039642333984375, -0.18686676025390625, -0.169769287109375, -0.15267181396484375, -0.1355743408203125, -0.11847686767578125, -0.10137939453125, -0.08428192138671875, -0.0671844482421875, -0.05008697509765625, -0.032989501953125, -0.01589202880859375, 0.0012054443359375, 0.01830291748046875, 0.035400390625, 0.05249786376953125, 0.0695953369140625, 0.08669281005859375, 0.103790283203125, 0.12088775634765625, 0.1379852294921875, 0.15508270263671875, 0.17218017578125, 0.18927764892578125, 0.2063751220703125, 0.22347259521484375, 0.240570068359375, 0.25766754150390625, 0.2747650146484375, 0.29186248779296875, 0.3089599609375, 0.32605743408203125, 0.3431549072265625, 0.36025238037109375, 0.377349853515625, 0.39444732666015625, 0.4115447998046875, 0.42864227294921875, 0.44573974609375, 0.46283721923828125, 0.4799346923828125, 0.49703216552734375, 0.514129638671875, 0.5312271118164062, 0.5483245849609375, 0.5654220581054688, 0.58251953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 10.0, 12.0, 13.0, 21.0, 37.0, 55.0, 112.0, 126.0, 202.0, 155.0, 99.0, 72.0, 39.0, 20.0, 12.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10060787200927734, -0.09593009948730469, -0.09125232696533203, -0.08657455444335938, -0.08189678192138672, -0.07721900939941406, -0.0725412368774414, -0.06786346435546875, -0.0631856918334961, -0.05850791931152344, -0.05383014678955078, -0.049152374267578125, -0.04447460174560547, -0.03979682922363281, -0.035119056701660156, -0.0304412841796875, -0.025763511657714844, -0.021085739135742188, -0.01640796661376953, -0.011730194091796875, -0.007052421569824219, -0.0023746490478515625, 0.0023031234741210938, 0.00698089599609375, 0.011658668518066406, 0.016336441040039062, 0.02101421356201172, 0.025691986083984375, 0.03036975860595703, 0.03504753112792969, 0.039725303649902344, 0.044403076171875, 0.049080848693847656, 0.05375862121582031, 0.05843639373779297, 0.06311416625976562, 0.06779193878173828, 0.07246971130371094, 0.0771474838256836, 0.08182525634765625, 0.0865030288696289, 0.09118080139160156, 0.09585857391357422, 0.10053634643554688, 0.10521411895751953, 0.10989189147949219, 0.11456966400146484, 0.1192474365234375, 0.12392520904541016, 0.1286029815673828, 0.13328075408935547, 0.13795852661132812, 0.14263629913330078, 0.14731407165527344, 0.1519918441772461, 0.15666961669921875, 0.1613473892211914, 0.16602516174316406, 0.17070293426513672, 0.17538070678710938, 0.18005847930908203, 0.1847362518310547, 0.18941402435302734, 0.194091796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 8.0, 5.0, 11.0, 19.0, 12.0, 21.0, 35.0, 62.0, 59.0, 163.0, 284.0, 807.0, 2726.0, 12499.0, 78452.0, 454383.0, 414094.0, 69446.0, 11419.0, 2416.0, 813.0, 365.0, 144.0, 96.0, 57.0, 50.0, 19.0, 18.0, 16.0, 9.0, 10.0, 7.0, 6.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.467041015625, -0.45195770263671875, -0.4368743896484375, -0.42179107666015625, -0.406707763671875, -0.39162445068359375, -0.3765411376953125, -0.36145782470703125, -0.34637451171875, -0.33129119873046875, -0.3162078857421875, -0.30112457275390625, -0.286041259765625, -0.27095794677734375, -0.2558746337890625, -0.24079132080078125, -0.2257080078125, -0.21062469482421875, -0.1955413818359375, -0.18045806884765625, -0.165374755859375, -0.15029144287109375, -0.1352081298828125, -0.12012481689453125, -0.10504150390625, -0.08995819091796875, -0.0748748779296875, -0.05979156494140625, -0.044708251953125, -0.02962493896484375, -0.0145416259765625, 0.00054168701171875, 0.015625, 0.03070831298828125, 0.0457916259765625, 0.06087493896484375, 0.075958251953125, 0.09104156494140625, 0.1061248779296875, 0.12120819091796875, 0.13629150390625, 0.15137481689453125, 0.1664581298828125, 0.18154144287109375, 0.196624755859375, 0.21170806884765625, 0.2267913818359375, 0.24187469482421875, 0.2569580078125, 0.27204132080078125, 0.2871246337890625, 0.30220794677734375, 0.317291259765625, 0.33237457275390625, 0.3474578857421875, 0.36254119873046875, 0.37762451171875, 0.39270782470703125, 0.4077911376953125, 0.42287445068359375, 0.437957763671875, 0.45304107666015625, 0.4681243896484375, 0.48320770263671875, 0.498291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 6.0, 11.0, 14.0, 23.0, 21.0, 28.0, 29.0, 29.0, 30.0, 38.0, 60.0, 38.0, 56.0, 57.0, 43.0, 61.0, 42.0, 63.0, 56.0, 50.0, 43.0, 40.0, 32.0, 29.0, 17.0, 13.0, 10.0, 7.0, 5.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2274169921875, -0.2210540771484375, -0.214691162109375, -0.2083282470703125, -0.20196533203125, -0.1956024169921875, -0.189239501953125, -0.1828765869140625, -0.176513671875, -0.1701507568359375, -0.163787841796875, -0.1574249267578125, -0.15106201171875, -0.1446990966796875, -0.138336181640625, -0.1319732666015625, -0.1256103515625, -0.1192474365234375, -0.112884521484375, -0.1065216064453125, -0.10015869140625, -0.0937957763671875, -0.087432861328125, -0.0810699462890625, -0.07470703125, -0.0683441162109375, -0.061981201171875, -0.0556182861328125, -0.04925537109375, -0.0428924560546875, -0.036529541015625, -0.0301666259765625, -0.0238037109375, -0.0174407958984375, -0.011077880859375, -0.0047149658203125, 0.00164794921875, 0.0080108642578125, 0.014373779296875, 0.0207366943359375, 0.027099609375, 0.0334625244140625, 0.039825439453125, 0.0461883544921875, 0.05255126953125, 0.0589141845703125, 0.065277099609375, 0.0716400146484375, 0.0780029296875, 0.0843658447265625, 0.090728759765625, 0.0970916748046875, 0.10345458984375, 0.1098175048828125, 0.116180419921875, 0.1225433349609375, 0.12890625, 0.1352691650390625, 0.141632080078125, 0.1479949951171875, 0.15435791015625, 0.1607208251953125, 0.167083740234375, 0.1734466552734375, 0.1798095703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 4.0, 10.0, 9.0, 11.0, 24.0, 46.0, 52.0, 77.0, 135.0, 154.0, 268.0, 432.0, 786.0, 1602.0, 3421.0, 8504.0, 25990.0, 100697.0, 374362.0, 383738.0, 105080.0, 27347.0, 8659.0, 3482.0, 1599.0, 808.0, 449.0, 292.0, 167.0, 126.0, 56.0, 52.0, 36.0, 24.0, 14.0, 11.0, 1.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1605224609375, -0.15517425537109375, -0.1498260498046875, -0.14447784423828125, -0.139129638671875, -0.13378143310546875, -0.1284332275390625, -0.12308502197265625, -0.11773681640625, -0.11238861083984375, -0.1070404052734375, -0.10169219970703125, -0.096343994140625, -0.09099578857421875, -0.0856475830078125, -0.08029937744140625, -0.074951171875, -0.06960296630859375, -0.0642547607421875, -0.05890655517578125, -0.053558349609375, -0.04821014404296875, -0.0428619384765625, -0.03751373291015625, -0.03216552734375, -0.02681732177734375, -0.0214691162109375, -0.01612091064453125, -0.010772705078125, -0.00542449951171875, -7.62939453125e-05, 0.00527191162109375, 0.0106201171875, 0.01596832275390625, 0.0213165283203125, 0.02666473388671875, 0.032012939453125, 0.03736114501953125, 0.0427093505859375, 0.04805755615234375, 0.05340576171875, 0.05875396728515625, 0.0641021728515625, 0.06945037841796875, 0.074798583984375, 0.08014678955078125, 0.0854949951171875, 0.09084320068359375, 0.09619140625, 0.10153961181640625, 0.1068878173828125, 0.11223602294921875, 0.117584228515625, 0.12293243408203125, 0.1282806396484375, 0.13362884521484375, 0.13897705078125, 0.14432525634765625, 0.1496734619140625, 0.15502166748046875, 0.160369873046875, 0.16571807861328125, 0.1710662841796875, 0.17641448974609375, 0.1817626953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 9.0, 4.0, 11.0, 13.0, 20.0, 24.0, 29.0, 58.0, 85.0, 116.0, 166.0, 120.0, 98.0, 66.0, 54.0, 37.0, 29.0, 19.0, 13.0, 15.0, 4.0, 3.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.15522775053978e-05, -3.06200236082077e-05, -2.968776971101761e-05, -2.8755515813827515e-05, -2.782326191663742e-05, -2.6891008019447327e-05, -2.5958754122257233e-05, -2.502650022506714e-05, -2.4094246327877045e-05, -2.316199243068695e-05, -2.2229738533496857e-05, -2.1297484636306763e-05, -2.036523073911667e-05, -1.9432976841926575e-05, -1.850072294473648e-05, -1.7568469047546387e-05, -1.6636215150356293e-05, -1.57039612531662e-05, -1.4771707355976105e-05, -1.383945345878601e-05, -1.2907199561595917e-05, -1.1974945664405823e-05, -1.1042691767215729e-05, -1.0110437870025635e-05, -9.17818397283554e-06, -8.245930075645447e-06, -7.313676178455353e-06, -6.381422281265259e-06, -5.449168384075165e-06, -4.516914486885071e-06, -3.584660589694977e-06, -2.652406692504883e-06, -1.7201527953147888e-06, -7.878988981246948e-07, 1.4435499906539917e-07, 1.0766088962554932e-06, 2.008862793445587e-06, 2.941116690635681e-06, 3.873370587825775e-06, 4.805624485015869e-06, 5.737878382205963e-06, 6.670132279396057e-06, 7.602386176586151e-06, 8.534640073776245e-06, 9.466893970966339e-06, 1.0399147868156433e-05, 1.1331401765346527e-05, 1.2263655662536621e-05, 1.3195909559726715e-05, 1.4128163456916809e-05, 1.5060417354106903e-05, 1.5992671251296997e-05, 1.692492514848709e-05, 1.7857179045677185e-05, 1.878943294286728e-05, 1.9721686840057373e-05, 2.0653940737247467e-05, 2.158619463443756e-05, 2.2518448531627655e-05, 2.345070242881775e-05, 2.4382956326007843e-05, 2.5315210223197937e-05, 2.624746412038803e-05, 2.7179718017578125e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 8.0, 8.0, 14.0, 15.0, 23.0, 32.0, 51.0, 84.0, 149.0, 328.0, 1174.0, 5718.0, 60304.0, 786295.0, 179703.0, 11739.0, 1875.0, 517.0, 204.0, 107.0, 57.0, 47.0, 23.0, 10.0, 16.0, 7.0, 10.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.390380859375, -0.3794364929199219, -0.36849212646484375, -0.3575477600097656, -0.3466033935546875, -0.3356590270996094, -0.32471466064453125, -0.3137702941894531, -0.302825927734375, -0.2918815612792969, -0.28093719482421875, -0.2699928283691406, -0.2590484619140625, -0.24810409545898438, -0.23715972900390625, -0.22621536254882812, -0.21527099609375, -0.20432662963867188, -0.19338226318359375, -0.18243789672851562, -0.1714935302734375, -0.16054916381835938, -0.14960479736328125, -0.13866043090820312, -0.127716064453125, -0.11677169799804688, -0.10582733154296875, -0.09488296508789062, -0.0839385986328125, -0.07299423217773438, -0.06204986572265625, -0.051105499267578125, -0.0401611328125, -0.029216766357421875, -0.01827239990234375, -0.007328033447265625, 0.0036163330078125, 0.014560699462890625, 0.02550506591796875, 0.036449432373046875, 0.047393798828125, 0.058338165283203125, 0.06928253173828125, 0.08022689819335938, 0.0911712646484375, 0.10211563110351562, 0.11305999755859375, 0.12400436401367188, 0.13494873046875, 0.14589309692382812, 0.15683746337890625, 0.16778182983398438, 0.1787261962890625, 0.18967056274414062, 0.20061492919921875, 0.21155929565429688, 0.222503662109375, 0.23344802856445312, 0.24439239501953125, 0.2553367614746094, 0.2662811279296875, 0.2772254943847656, 0.28816986083984375, 0.2991142272949219, 0.31005859375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 13.0, 13.0, 25.0, 25.0, 34.0, 53.0, 74.0, 110.0, 124.0, 125.0, 102.0, 76.0, 65.0, 52.0, 29.0, 21.0, 13.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13134765625, -0.1266918182373047, -0.12203598022460938, -0.11738014221191406, -0.11272430419921875, -0.10806846618652344, -0.10341262817382812, -0.09875679016113281, -0.0941009521484375, -0.08944511413574219, -0.08478927612304688, -0.08013343811035156, -0.07547760009765625, -0.07082176208496094, -0.06616592407226562, -0.06151008605957031, -0.056854248046875, -0.05219841003417969, -0.047542572021484375, -0.04288673400878906, -0.03823089599609375, -0.03357505798339844, -0.028919219970703125, -0.024263381958007812, -0.0196075439453125, -0.014951705932617188, -0.010295867919921875, -0.0056400299072265625, -0.00098419189453125, 0.0036716461181640625, 0.008327484130859375, 0.012983322143554688, 0.01763916015625, 0.022294998168945312, 0.026950836181640625, 0.03160667419433594, 0.03626251220703125, 0.04091835021972656, 0.045574188232421875, 0.05023002624511719, 0.0548858642578125, 0.05954170227050781, 0.06419754028320312, 0.06885337829589844, 0.07350921630859375, 0.07816505432128906, 0.08282089233398438, 0.08747673034667969, 0.092132568359375, 0.09678840637207031, 0.10144424438476562, 0.10610008239746094, 0.11075592041015625, 0.11541175842285156, 0.12006759643554688, 0.12472343444824219, 0.1293792724609375, 0.1340351104736328, 0.13869094848632812, 0.14334678649902344, 0.14800262451171875, 0.15265846252441406, 0.15731430053710938, 0.1619701385498047, 0.1666259765625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 11.0, 68.0, 278.0, 428.0, 179.0, 36.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.753924369812012, -4.651325702667236, -4.548727512359619, -4.446128845214844, -4.343530178070068, -4.240931510925293, -4.138333320617676, -4.0357346534729, -3.933135986328125, -3.8305375576019287, -3.7279388904571533, -3.625340461730957, -3.5227417945861816, -3.4201433658599854, -3.317544937133789, -3.2149462699890137, -3.1123478412628174, -3.009749412536621, -2.9071507453918457, -2.8045523166656494, -2.701953649520874, -2.5993552207946777, -2.4967565536499023, -2.394158124923706, -2.2915596961975098, -2.1889612674713135, -2.086362600326538, -1.9837641716003418, -1.8811655044555664, -1.7785670757293701, -1.6759685277938843, -1.5733699798583984, -1.4707715511322021, -1.3681730031967163, -1.2655744552612305, -1.1629760265350342, -1.0603773593902588, -0.9577788710594177, -0.8551803827285767, -0.7525818347930908, -0.649983286857605, -0.5473847389221191, -0.4447862207889557, -0.34218770265579224, -0.2395891547203064, -0.13699060678482056, -0.03439211845397949, 0.06820642948150635, 0.1708049774169922, 0.273403525352478, 0.3760020434856415, 0.47860056161880493, 0.5811991095542908, 0.6837976574897766, 0.7863961458206177, 0.8889946937561035, 0.9915932416915894, 1.0941917896270752, 1.196790337562561, 1.2993888854980469, 1.4019873142242432, 1.5045859813690186, 1.6071844100952148, 1.7097829580307007, 1.8123815059661865]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 2.0, 6.0, 14.0, 22.0, 25.0, 29.0, 32.0, 45.0, 55.0, 59.0, 67.0, 84.0, 71.0, 60.0, 66.0, 59.0, 56.0, 54.0, 39.0, 33.0, 27.0, 15.0, 23.0, 13.0, 8.0, 7.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8294411301612854, -0.7996581196784973, -0.7698750495910645, -0.7400920391082764, -0.7103090286254883, -0.6805259585380554, -0.6507429480552673, -0.6209598779678345, -0.5911768674850464, -0.5613938570022583, -0.5316107869148254, -0.5018277764320374, -0.4720447361469269, -0.4422616958618164, -0.4124786853790283, -0.38269564509391785, -0.3529126048088074, -0.3231295645236969, -0.2933465242385864, -0.26356351375579834, -0.23378047347068787, -0.2039974331855774, -0.1742144078016281, -0.14443138241767883, -0.11464834213256836, -0.08486530929803848, -0.055082276463508606, -0.02529924362897873, 0.0044837892055511475, 0.03426682949066162, 0.0640498548746109, 0.09383288025856018, 0.12361598014831543, 0.1533990204334259, 0.18318204581737518, 0.21296507120132446, 0.24274811148643494, 0.2725311517715454, 0.3023141622543335, 0.33209720253944397, 0.36188024282455444, 0.3916632831096649, 0.4214463233947754, 0.4512293338775635, 0.48101237416267395, 0.5107954144477844, 0.5405784249305725, 0.5703614950180054, 0.6001445055007935, 0.6299275159835815, 0.6597105860710144, 0.6894935965538025, 0.7192766666412354, 0.7490596771240234, 0.7788426876068115, 0.8086256980895996, 0.8384087681770325, 0.8681917786598206, 0.8979748487472534, 0.9277578592300415, 0.9575408697128296, 0.9873239398002625, 1.0171070098876953, 1.0468900203704834, 1.0766730308532715]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 12.0, 26.0, 51.0, 82.0, 168.0, 527.0, 3113.0, 31601.0, 3978354.0, 174098.0, 4535.0, 1035.0, 333.0, 169.0, 64.0, 44.0, 26.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2981986999511719, -0.28560638427734375, -0.2730140686035156, -0.2604217529296875, -0.24782943725585938, -0.23523712158203125, -0.22264480590820312, -0.210052490234375, -0.19746017456054688, -0.18486785888671875, -0.17227554321289062, -0.1596832275390625, -0.14709091186523438, -0.13449859619140625, -0.12190628051757812, -0.10931396484375, -0.09672164916992188, -0.08412933349609375, -0.07153701782226562, -0.0589447021484375, -0.046352386474609375, -0.03376007080078125, -0.021167755126953125, -0.008575439453125, 0.004016876220703125, 0.01660919189453125, 0.029201507568359375, 0.0417938232421875, 0.054386138916015625, 0.06697845458984375, 0.07957077026367188, 0.0921630859375, 0.10475540161132812, 0.11734771728515625, 0.12994003295898438, 0.1425323486328125, 0.15512466430664062, 0.16771697998046875, 0.18030929565429688, 0.192901611328125, 0.20549392700195312, 0.21808624267578125, 0.23067855834960938, 0.2432708740234375, 0.2558631896972656, 0.26845550537109375, 0.2810478210449219, 0.29364013671875, 0.3062324523925781, 0.31882476806640625, 0.3314170837402344, 0.3440093994140625, 0.3566017150878906, 0.36919403076171875, 0.3817863464355469, 0.394378662109375, 0.4069709777832031, 0.41956329345703125, 0.4321556091308594, 0.4447479248046875, 0.4573402404785156, 0.46993255615234375, 0.4825248718261719, 0.4951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 12.0, 10.0, 17.0, 23.0, 32.0, 62.0, 93.0, 107.0, 137.0, 144.0, 123.0, 93.0, 52.0, 40.0, 27.0, 12.0, 6.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.08414745330810547, -0.07973289489746094, -0.0753183364868164, -0.07090377807617188, -0.06648921966552734, -0.06207466125488281, -0.05766010284423828, -0.05324554443359375, -0.04883098602294922, -0.04441642761230469, -0.040001869201660156, -0.035587310791015625, -0.031172752380371094, -0.026758193969726562, -0.02234363555908203, -0.0179290771484375, -0.013514518737792969, -0.009099960327148438, -0.004685401916503906, -0.000270843505859375, 0.004143714904785156, 0.008558273315429688, 0.012972831726074219, 0.01738739013671875, 0.02180194854736328, 0.026216506958007812, 0.030631065368652344, 0.035045623779296875, 0.039460182189941406, 0.04387474060058594, 0.04828929901123047, 0.052703857421875, 0.05711841583251953, 0.06153297424316406, 0.0659475326538086, 0.07036209106445312, 0.07477664947509766, 0.07919120788574219, 0.08360576629638672, 0.08802032470703125, 0.09243488311767578, 0.09684944152832031, 0.10126399993896484, 0.10567855834960938, 0.1100931167602539, 0.11450767517089844, 0.11892223358154297, 0.1233367919921875, 0.12775135040283203, 0.13216590881347656, 0.1365804672241211, 0.14099502563476562, 0.14540958404541016, 0.1498241424560547, 0.15423870086669922, 0.15865325927734375, 0.16306781768798828, 0.1674823760986328, 0.17189693450927734, 0.17631149291992188, 0.1807260513305664, 0.18514060974121094, 0.18955516815185547, 0.1939697265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 8.0, 9.0, 11.0, 21.0, 30.0, 44.0, 60.0, 82.0, 112.0, 206.0, 377.0, 641.0, 1441.0, 3959.0, 14831.0, 81786.0, 714980.0, 2744558.0, 546899.0, 65702.0, 12191.0, 3436.0, 1285.0, 624.0, 350.0, 216.0, 112.0, 104.0, 59.0, 37.0, 30.0, 25.0, 14.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14310073852539062, -0.13788604736328125, -0.13267135620117188, -0.1274566650390625, -0.12224197387695312, -0.11702728271484375, -0.11181259155273438, -0.106597900390625, -0.10138320922851562, -0.09616851806640625, -0.09095382690429688, -0.0857391357421875, -0.08052444458007812, -0.07530975341796875, -0.07009506225585938, -0.06488037109375, -0.059665679931640625, -0.05445098876953125, -0.049236297607421875, -0.0440216064453125, -0.038806915283203125, -0.03359222412109375, -0.028377532958984375, -0.023162841796875, -0.017948150634765625, -0.01273345947265625, -0.007518768310546875, -0.0023040771484375, 0.002910614013671875, 0.00812530517578125, 0.013339996337890625, 0.0185546875, 0.023769378662109375, 0.02898406982421875, 0.034198760986328125, 0.0394134521484375, 0.044628143310546875, 0.04984283447265625, 0.055057525634765625, 0.060272216796875, 0.06548690795898438, 0.07070159912109375, 0.07591629028320312, 0.0811309814453125, 0.08634567260742188, 0.09156036376953125, 0.09677505493164062, 0.10198974609375, 0.10720443725585938, 0.11241912841796875, 0.11763381958007812, 0.1228485107421875, 0.12806320190429688, 0.13327789306640625, 0.13849258422851562, 0.143707275390625, 0.14892196655273438, 0.15413665771484375, 0.15935134887695312, 0.1645660400390625, 0.16978073120117188, 0.17499542236328125, 0.18021011352539062, 0.1854248046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 10.0, 17.0, 21.0, 22.0, 38.0, 37.0, 55.0, 71.0, 93.0, 155.0, 181.0, 246.0, 280.0, 359.0, 403.0, 406.0, 403.0, 296.0, 228.0, 213.0, 142.0, 105.0, 76.0, 62.0, 41.0, 27.0, 19.0, 25.0, 11.0, 12.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11114501953125, -0.10807609558105469, -0.10500717163085938, -0.10193824768066406, -0.09886932373046875, -0.09580039978027344, -0.09273147583007812, -0.08966255187988281, -0.0865936279296875, -0.08352470397949219, -0.08045578002929688, -0.07738685607910156, -0.07431793212890625, -0.07124900817871094, -0.06818008422851562, -0.06511116027832031, -0.062042236328125, -0.05897331237792969, -0.055904388427734375, -0.05283546447753906, -0.04976654052734375, -0.04669761657714844, -0.043628692626953125, -0.04055976867675781, -0.0374908447265625, -0.03442192077636719, -0.031352996826171875, -0.028284072875976562, -0.02521514892578125, -0.022146224975585938, -0.019077301025390625, -0.016008377075195312, -0.012939453125, -0.009870529174804688, -0.006801605224609375, -0.0037326812744140625, -0.00066375732421875, 0.0024051666259765625, 0.005474090576171875, 0.008543014526367188, 0.0116119384765625, 0.014680862426757812, 0.017749786376953125, 0.020818710327148438, 0.02388763427734375, 0.026956558227539062, 0.030025482177734375, 0.03309440612792969, 0.036163330078125, 0.03923225402832031, 0.042301177978515625, 0.04537010192871094, 0.04843902587890625, 0.05150794982910156, 0.054576873779296875, 0.05764579772949219, 0.0607147216796875, 0.06378364562988281, 0.06685256958007812, 0.06992149353027344, 0.07299041748046875, 0.07605934143066406, 0.07912826538085938, 0.08219718933105469, 0.08526611328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 33.0, 131.0, 400.0, 327.0, 100.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4440441131591797, -1.3808889389038086, -1.3177337646484375, -1.2545785903930664, -1.1914234161376953, -1.1282682418823242, -1.0651129484176636, -1.0019577741622925, -0.9388025999069214, -0.8756474256515503, -0.8124922513961792, -0.7493370175361633, -0.6861818432807922, -0.6230266690254211, -0.5598714351654053, -0.4967162609100342, -0.4335610866546631, -0.370405912399292, -0.3072507083415985, -0.24409551918506622, -0.18094033002853394, -0.11778515577316284, -0.05462995171546936, 0.008525252342224121, 0.07168042659759521, 0.1348356157541275, 0.1979908049106598, 0.26114600896835327, 0.32430118322372437, 0.38745635747909546, 0.45061156153678894, 0.5137667655944824, 0.5769219398498535, 0.6400771141052246, 0.7032322883605957, 0.7663875222206116, 0.8295426964759827, 0.8926978707313538, 0.9558531045913696, 1.0190082788467407, 1.0821634531021118, 1.145318627357483, 1.208473801612854, 1.271628975868225, 1.3347842693328857, 1.3979394435882568, 1.461094617843628, 1.524249792098999, 1.5874049663543701, 1.6505601406097412, 1.7137153148651123, 1.7768704891204834, 1.8400256633758545, 1.9031808376312256, 1.9663361310958862, 2.029491424560547, 2.092646598815918, 2.155801773071289, 2.21895694732666, 2.2821121215820312, 2.3452672958374023, 2.4084224700927734, 2.4715776443481445, 2.5347328186035156, 2.5978879928588867]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 6.0, 8.0, 10.0, 17.0, 22.0, 24.0, 26.0, 26.0, 25.0, 31.0, 35.0, 46.0, 40.0, 38.0, 35.0, 43.0, 50.0, 42.0, 40.0, 57.0, 46.0, 39.0, 28.0, 34.0, 25.0, 27.0, 30.0, 20.0, 17.0, 18.0, 14.0, 18.0, 8.0, 13.0, 8.0, 6.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33290839195251465, -0.32202205061912537, -0.31113573908805847, -0.3002493977546692, -0.2893630862236023, -0.278476744890213, -0.26759040355682373, -0.25670409202575684, -0.24581775069236755, -0.23493142426013947, -0.22404509782791138, -0.2131587564945221, -0.202272430062294, -0.19138610363006592, -0.18049977719783783, -0.16961345076560974, -0.15872712433338165, -0.14784079790115356, -0.13695447146892548, -0.1260681450366974, -0.1151818037033081, -0.10429547727108002, -0.09340915083885193, -0.08252281695604324, -0.07163649052381516, -0.06075016036629677, -0.04986383020877838, -0.03897750377655029, -0.028091173619031906, -0.01720484346151352, -0.006318517029285431, 0.004567816853523254, 0.015454143285751343, 0.02634047344326973, 0.037226803600788116, 0.048113130033016205, 0.05899946019053459, 0.06988579034805298, 0.08077211678028107, 0.09165845066308975, 0.10254477709531784, 0.11343110352754593, 0.12431743741035461, 0.1352037638425827, 0.1460900902748108, 0.15697643160820007, 0.16786274313926697, 0.17874908447265625, 0.18963541090488434, 0.20052173733711243, 0.21140806376934052, 0.2222943902015686, 0.23318073153495789, 0.24406705796718597, 0.25495338439941406, 0.26583972573280334, 0.27672603726387024, 0.2876123785972595, 0.2984986901283264, 0.3093850314617157, 0.3202713429927826, 0.3311576843261719, 0.34204399585723877, 0.35293033719062805, 0.36381667852401733]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 6.0, 13.0, 15.0, 23.0, 27.0, 35.0, 51.0, 70.0, 93.0, 145.0, 233.0, 375.0, 696.0, 1471.0, 3641.0, 11696.0, 55979.0, 409135.0, 476497.0, 67381.0, 13377.0, 3994.0, 1632.0, 787.0, 383.0, 255.0, 165.0, 101.0, 76.0, 56.0, 53.0, 17.0, 11.0, 16.0, 5.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.373046875, -0.3617591857910156, -0.35047149658203125, -0.3391838073730469, -0.3278961181640625, -0.3166084289550781, -0.30532073974609375, -0.2940330505371094, -0.282745361328125, -0.2714576721191406, -0.26016998291015625, -0.24888229370117188, -0.2375946044921875, -0.22630691528320312, -0.21501922607421875, -0.20373153686523438, -0.19244384765625, -0.18115615844726562, -0.16986846923828125, -0.15858078002929688, -0.1472930908203125, -0.13600540161132812, -0.12471771240234375, -0.11343002319335938, -0.102142333984375, -0.09085464477539062, -0.07956695556640625, -0.06827926635742188, -0.0569915771484375, -0.045703887939453125, -0.03441619873046875, -0.023128509521484375, -0.0118408203125, -0.000553131103515625, 0.01073455810546875, 0.022022247314453125, 0.0333099365234375, 0.044597625732421875, 0.05588531494140625, 0.06717300415039062, 0.078460693359375, 0.08974838256835938, 0.10103607177734375, 0.11232376098632812, 0.1236114501953125, 0.13489913940429688, 0.14618682861328125, 0.15747451782226562, 0.16876220703125, 0.18004989624023438, 0.19133758544921875, 0.20262527465820312, 0.2139129638671875, 0.22520065307617188, 0.23648834228515625, 0.24777603149414062, 0.259063720703125, 0.2703514099121094, 0.28163909912109375, 0.2929267883300781, 0.3042144775390625, 0.3155021667480469, 0.32678985595703125, 0.3380775451660156, 0.349365234375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 18.0, 22.0, 22.0, 56.0, 78.0, 122.0, 121.0, 158.0, 134.0, 92.0, 71.0, 39.0, 25.0, 14.0, 5.0, 9.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09075927734375, -0.08629131317138672, -0.08182334899902344, -0.07735538482666016, -0.07288742065429688, -0.0684194564819336, -0.06395149230957031, -0.05948352813720703, -0.05501556396484375, -0.05054759979248047, -0.04607963562011719, -0.041611671447753906, -0.037143707275390625, -0.032675743103027344, -0.028207778930664062, -0.02373981475830078, -0.0192718505859375, -0.014803886413574219, -0.010335922241210938, -0.005867958068847656, -0.001399993896484375, 0.0030679702758789062, 0.0075359344482421875, 0.012003898620605469, 0.01647186279296875, 0.02093982696533203, 0.025407791137695312, 0.029875755310058594, 0.034343719482421875, 0.038811683654785156, 0.04327964782714844, 0.04774761199951172, 0.052215576171875, 0.05668354034423828, 0.06115150451660156, 0.06561946868896484, 0.07008743286132812, 0.0745553970336914, 0.07902336120605469, 0.08349132537841797, 0.08795928955078125, 0.09242725372314453, 0.09689521789550781, 0.1013631820678711, 0.10583114624023438, 0.11029911041259766, 0.11476707458496094, 0.11923503875732422, 0.1237030029296875, 0.12817096710205078, 0.13263893127441406, 0.13710689544677734, 0.14157485961914062, 0.1460428237915039, 0.1505107879638672, 0.15497875213623047, 0.15944671630859375, 0.16391468048095703, 0.1683826446533203, 0.1728506088256836, 0.17731857299804688, 0.18178653717041016, 0.18625450134277344, 0.19072246551513672, 0.1951904296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 10.0, 21.0, 22.0, 27.0, 41.0, 52.0, 91.0, 149.0, 271.0, 472.0, 1161.0, 3772.0, 18512.0, 109749.0, 501297.0, 339513.0, 58777.0, 10344.0, 2403.0, 869.0, 381.0, 188.0, 115.0, 106.0, 59.0, 31.0, 21.0, 24.0, 16.0, 14.0, 10.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.37744140625, -0.3666038513183594, -0.35576629638671875, -0.3449287414550781, -0.3340911865234375, -0.3232536315917969, -0.31241607666015625, -0.3015785217285156, -0.290740966796875, -0.2799034118652344, -0.26906585693359375, -0.2582283020019531, -0.2473907470703125, -0.23655319213867188, -0.22571563720703125, -0.21487808227539062, -0.20404052734375, -0.19320297241210938, -0.18236541748046875, -0.17152786254882812, -0.1606903076171875, -0.14985275268554688, -0.13901519775390625, -0.12817764282226562, -0.117340087890625, -0.10650253295898438, -0.09566497802734375, -0.08482742309570312, -0.0739898681640625, -0.06315231323242188, -0.05231475830078125, -0.041477203369140625, -0.0306396484375, -0.019802093505859375, -0.00896453857421875, 0.001873016357421875, 0.0127105712890625, 0.023548126220703125, 0.03438568115234375, 0.045223236083984375, 0.056060791015625, 0.06689834594726562, 0.07773590087890625, 0.08857345581054688, 0.0994110107421875, 0.11024856567382812, 0.12108612060546875, 0.13192367553710938, 0.14276123046875, 0.15359878540039062, 0.16443634033203125, 0.17527389526367188, 0.1861114501953125, 0.19694900512695312, 0.20778656005859375, 0.21862411499023438, 0.229461669921875, 0.24029922485351562, 0.25113677978515625, 0.2619743347167969, 0.2728118896484375, 0.2836494445800781, 0.29448699951171875, 0.3053245544433594, 0.316162109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 7.0, 9.0, 8.0, 12.0, 23.0, 19.0, 24.0, 39.0, 22.0, 34.0, 36.0, 33.0, 40.0, 43.0, 40.0, 55.0, 47.0, 34.0, 48.0, 42.0, 44.0, 35.0, 44.0, 33.0, 26.0, 32.0, 23.0, 26.0, 20.0, 10.0, 16.0, 17.0, 15.0, 12.0, 5.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.17919921875, -0.1738739013671875, -0.168548583984375, -0.1632232666015625, -0.15789794921875, -0.1525726318359375, -0.147247314453125, -0.1419219970703125, -0.1365966796875, -0.1312713623046875, -0.125946044921875, -0.1206207275390625, -0.11529541015625, -0.1099700927734375, -0.104644775390625, -0.0993194580078125, -0.093994140625, -0.0886688232421875, -0.083343505859375, -0.0780181884765625, -0.07269287109375, -0.0673675537109375, -0.062042236328125, -0.0567169189453125, -0.0513916015625, -0.0460662841796875, -0.040740966796875, -0.0354156494140625, -0.03009033203125, -0.0247650146484375, -0.019439697265625, -0.0141143798828125, -0.0087890625, -0.0034637451171875, 0.001861572265625, 0.0071868896484375, 0.01251220703125, 0.0178375244140625, 0.023162841796875, 0.0284881591796875, 0.0338134765625, 0.0391387939453125, 0.044464111328125, 0.0497894287109375, 0.05511474609375, 0.0604400634765625, 0.065765380859375, 0.0710906982421875, 0.076416015625, 0.0817413330078125, 0.087066650390625, 0.0923919677734375, 0.09771728515625, 0.1030426025390625, 0.108367919921875, 0.1136932373046875, 0.1190185546875, 0.1243438720703125, 0.129669189453125, 0.1349945068359375, 0.14031982421875, 0.1456451416015625, 0.150970458984375, 0.1562957763671875, 0.16162109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 5.0, 13.0, 27.0, 35.0, 46.0, 83.0, 136.0, 212.0, 453.0, 794.0, 1534.0, 3304.0, 7192.0, 16570.0, 41067.0, 106411.0, 245007.0, 318242.0, 183463.0, 73492.0, 28252.0, 11893.0, 5127.0, 2466.0, 1243.0, 591.0, 349.0, 193.0, 136.0, 69.0, 50.0, 25.0, 23.0, 15.0, 7.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07794189453125, -0.07560157775878906, -0.07326126098632812, -0.07092094421386719, -0.06858062744140625, -0.06624031066894531, -0.06389999389648438, -0.06155967712402344, -0.0592193603515625, -0.05687904357910156, -0.054538726806640625, -0.05219841003417969, -0.04985809326171875, -0.04751777648925781, -0.045177459716796875, -0.04283714294433594, -0.040496826171875, -0.03815650939941406, -0.035816192626953125, -0.03347587585449219, -0.03113555908203125, -0.028795242309570312, -0.026454925537109375, -0.024114608764648438, -0.0217742919921875, -0.019433975219726562, -0.017093658447265625, -0.014753341674804688, -0.01241302490234375, -0.010072708129882812, -0.007732391357421875, -0.0053920745849609375, -0.0030517578125, -0.0007114410400390625, 0.001628875732421875, 0.0039691925048828125, 0.00630950927734375, 0.008649826049804688, 0.010990142822265625, 0.013330459594726562, 0.0156707763671875, 0.018011093139648438, 0.020351409912109375, 0.022691726684570312, 0.02503204345703125, 0.027372360229492188, 0.029712677001953125, 0.03205299377441406, 0.034393310546875, 0.03673362731933594, 0.039073944091796875, 0.04141426086425781, 0.04375457763671875, 0.04609489440917969, 0.048435211181640625, 0.05077552795410156, 0.0531158447265625, 0.05545616149902344, 0.057796478271484375, 0.06013679504394531, 0.06247711181640625, 0.06481742858886719, 0.06715774536132812, 0.06949806213378906, 0.07183837890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 10.0, 2.0, 12.0, 8.0, 17.0, 21.0, 26.0, 25.0, 33.0, 46.0, 47.0, 72.0, 68.0, 81.0, 72.0, 81.0, 75.0, 52.0, 52.0, 31.0, 27.0, 23.0, 17.0, 17.0, 17.0, 10.0, 9.0, 7.0, 6.0, 2.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1026859283447266e-05, -1.0662712156772614e-05, -1.0298565030097961e-05, -9.93441790342331e-06, -9.570270776748657e-06, -9.206123650074005e-06, -8.841976523399353e-06, -8.477829396724701e-06, -8.113682270050049e-06, -7.749535143375397e-06, -7.385388016700745e-06, -7.0212408900260925e-06, -6.6570937633514404e-06, -6.292946636676788e-06, -5.928799510002136e-06, -5.564652383327484e-06, -5.200505256652832e-06, -4.83635812997818e-06, -4.472211003303528e-06, -4.108063876628876e-06, -3.7439167499542236e-06, -3.3797696232795715e-06, -3.0156224966049194e-06, -2.6514753699302673e-06, -2.2873282432556152e-06, -1.923181116580963e-06, -1.559033989906311e-06, -1.194886863231659e-06, -8.307397365570068e-07, -4.6659260988235474e-07, -1.0244548320770264e-07, 2.6170164346694946e-07, 6.258487701416016e-07, 9.899958968162537e-07, 1.3541430234909058e-06, 1.7182901501655579e-06, 2.08243727684021e-06, 2.446584403514862e-06, 2.810731530189514e-06, 3.1748786568641663e-06, 3.5390257835388184e-06, 3.9031729102134705e-06, 4.2673200368881226e-06, 4.631467163562775e-06, 4.995614290237427e-06, 5.359761416912079e-06, 5.723908543586731e-06, 6.088055670261383e-06, 6.452202796936035e-06, 6.816349923610687e-06, 7.180497050285339e-06, 7.5446441769599915e-06, 7.908791303634644e-06, 8.272938430309296e-06, 8.637085556983948e-06, 9.0012326836586e-06, 9.365379810333252e-06, 9.729526937007904e-06, 1.0093674063682556e-05, 1.0457821190357208e-05, 1.082196831703186e-05, 1.1186115443706512e-05, 1.1550262570381165e-05, 1.1914409697055817e-05, 1.2278556823730469e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 13.0, 9.0, 15.0, 24.0, 38.0, 62.0, 85.0, 131.0, 203.0, 361.0, 646.0, 1145.0, 2124.0, 4651.0, 10447.0, 26266.0, 69712.0, 187128.0, 340697.0, 246031.0, 96999.0, 35499.0, 14101.0, 6135.0, 2764.0, 1383.0, 754.0, 403.0, 236.0, 161.0, 97.0, 64.0, 31.0, 23.0, 27.0, 20.0, 15.0, 6.0, 9.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0728759765625, -0.07033348083496094, -0.06779098510742188, -0.06524848937988281, -0.06270599365234375, -0.06016349792480469, -0.057621002197265625, -0.05507850646972656, -0.0525360107421875, -0.04999351501464844, -0.047451019287109375, -0.04490852355957031, -0.04236602783203125, -0.03982353210449219, -0.037281036376953125, -0.03473854064941406, -0.032196044921875, -0.029653549194335938, -0.027111053466796875, -0.024568557739257812, -0.02202606201171875, -0.019483566284179688, -0.016941070556640625, -0.014398574829101562, -0.0118560791015625, -0.009313583374023438, -0.006771087646484375, -0.0042285919189453125, -0.00168609619140625, 0.0008563995361328125, 0.003398895263671875, 0.0059413909912109375, 0.00848388671875, 0.011026382446289062, 0.013568878173828125, 0.016111373901367188, 0.01865386962890625, 0.021196365356445312, 0.023738861083984375, 0.026281356811523438, 0.0288238525390625, 0.03136634826660156, 0.033908843994140625, 0.03645133972167969, 0.03899383544921875, 0.04153633117675781, 0.044078826904296875, 0.04662132263183594, 0.049163818359375, 0.05170631408691406, 0.054248809814453125, 0.05679130554199219, 0.05933380126953125, 0.06187629699707031, 0.06441879272460938, 0.06696128845214844, 0.0695037841796875, 0.07204627990722656, 0.07458877563476562, 0.07713127136230469, 0.07967376708984375, 0.08221626281738281, 0.08475875854492188, 0.08730125427246094, 0.08984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 13.0, 8.0, 9.0, 12.0, 12.0, 14.0, 19.0, 28.0, 21.0, 31.0, 56.0, 45.0, 64.0, 62.0, 51.0, 56.0, 59.0, 62.0, 49.0, 54.0, 40.0, 40.0, 40.0, 31.0, 25.0, 15.0, 9.0, 17.0, 18.0, 7.0, 8.0, 5.0, 8.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.0625448226928711, -0.06075859069824219, -0.05897235870361328, -0.057186126708984375, -0.05539989471435547, -0.05361366271972656, -0.051827430725097656, -0.05004119873046875, -0.048254966735839844, -0.04646873474121094, -0.04468250274658203, -0.042896270751953125, -0.04111003875732422, -0.03932380676269531, -0.037537574768066406, -0.0357513427734375, -0.033965110778808594, -0.03217887878417969, -0.03039264678955078, -0.028606414794921875, -0.02682018280029297, -0.025033950805664062, -0.023247718811035156, -0.02146148681640625, -0.019675254821777344, -0.017889022827148438, -0.01610279083251953, -0.014316558837890625, -0.012530326843261719, -0.010744094848632812, -0.008957862854003906, -0.007171630859375, -0.005385398864746094, -0.0035991668701171875, -0.0018129348754882812, -2.6702880859375e-05, 0.0017595291137695312, 0.0035457611083984375, 0.005331993103027344, 0.00711822509765625, 0.008904457092285156, 0.010690689086914062, 0.012476921081542969, 0.014263153076171875, 0.01604938507080078, 0.017835617065429688, 0.019621849060058594, 0.0214080810546875, 0.023194313049316406, 0.024980545043945312, 0.02676677703857422, 0.028553009033203125, 0.03033924102783203, 0.03212547302246094, 0.033911705017089844, 0.03569793701171875, 0.037484169006347656, 0.03927040100097656, 0.04105663299560547, 0.042842864990234375, 0.04462909698486328, 0.04641532897949219, 0.048201560974121094, 0.04998779296875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 357.0, 504.0, 93.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.004016399383545, -3.883042097091675, -3.762068033218384, -3.6410937309265137, -3.5201194286346436, -3.3991451263427734, -3.2781710624694824, -3.1571967601776123, -3.036222457885742, -2.915248155593872, -2.794274091720581, -2.673299789428711, -2.552325487136841, -2.4313511848449707, -2.3103771209716797, -2.1894028186798096, -2.0684285163879395, -1.9474543333053589, -1.8264800310134888, -1.7055058479309082, -1.584531545639038, -1.4635573625564575, -1.342583179473877, -1.2216088771820068, -1.1006348133087158, -0.9796605706214905, -0.8586863279342651, -0.7377121448516846, -0.6167378425598145, -0.4957636594772339, -0.37478941679000854, -0.2538151741027832, -0.13284087181091309, -0.011866636574268341, 0.1091075986623764, 0.23008182644844055, 0.3510560691356659, 0.47203028202056885, 0.5930045247077942, 0.7139787673950195, 0.8349530100822449, 0.9559272527694702, 1.0769014358520508, 1.197875738143921, 1.3188499212265015, 1.439824104309082, 1.5607984066009521, 1.6817727088928223, 1.8027468919754028, 1.9237210750579834, 2.0446953773498535, 2.1656696796417236, 2.2866437435150146, 2.4076180458068848, 2.528592348098755, 2.649566650390625, 2.770540714263916, 2.891515016555786, 3.012489080429077, 3.1334633827209473, 3.2544376850128174, 3.3754119873046875, 3.4963860511779785, 3.6173603534698486, 3.7383346557617188]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 13.0, 12.0, 16.0, 15.0, 30.0, 18.0, 35.0, 39.0, 41.0, 44.0, 45.0, 55.0, 56.0, 52.0, 64.0, 51.0, 51.0, 53.0, 56.0, 41.0, 36.0, 38.0, 27.0, 23.0, 15.0, 16.0, 11.0, 9.0, 8.0, 2.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7837508320808411, -0.7629237771034241, -0.7420967221260071, -0.7212697267532349, -0.7004426717758179, -0.6796156167984009, -0.6587885618209839, -0.6379615068435669, -0.6171344518661499, -0.5963073968887329, -0.5754803419113159, -0.5546533465385437, -0.5338262915611267, -0.5129992365837097, -0.4921721816062927, -0.47134512662887573, -0.4505181312561035, -0.4296910762786865, -0.4088640511035919, -0.3880369961261749, -0.3672099709510803, -0.34638291597366333, -0.32555586099624634, -0.30472880601882935, -0.28390178084373474, -0.26307472586631775, -0.24224770069122314, -0.22142064571380615, -0.20059360563755035, -0.17976656556129456, -0.15893951058387756, -0.13811247050762177, -0.11728537082672119, -0.0964583307504654, -0.075631283223629, -0.0548042394220829, -0.033977195620536804, -0.013150155544281006, 0.007676891982555389, 0.028503939509391785, 0.04933097958564758, 0.07015801966190338, 0.09098506718873978, 0.11181211471557617, 0.13263915479183197, 0.15346619486808777, 0.17429324984550476, 0.19512028992176056, 0.21594732999801636, 0.23677437007427216, 0.25760141015052795, 0.27842846512794495, 0.29925549030303955, 0.32008254528045654, 0.34090960025787354, 0.3617366552352905, 0.38256368041038513, 0.4033907353878021, 0.42421776056289673, 0.4450448155403137, 0.4658718705177307, 0.4866988956928253, 0.5075259208679199, 0.5283529758453369, 0.5491800308227539]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 14.0, 33.0, 54.0, 99.0, 192.0, 416.0, 1143.0, 3229.0, 9828.0, 46373.0, 1173593.0, 2859380.0, 83436.0, 10671.0, 3096.0, 1195.0, 578.0, 305.0, 179.0, 144.0, 90.0, 74.0, 48.0, 25.0, 17.0, 18.0, 12.0, 5.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15703201293945312, -0.15024566650390625, -0.14345932006835938, -0.1366729736328125, -0.12988662719726562, -0.12310028076171875, -0.11631393432617188, -0.109527587890625, -0.10274124145507812, -0.09595489501953125, -0.08916854858398438, -0.0823822021484375, -0.07559585571289062, -0.06880950927734375, -0.062023162841796875, -0.05523681640625, -0.048450469970703125, -0.04166412353515625, -0.034877777099609375, -0.0280914306640625, -0.021305084228515625, -0.01451873779296875, -0.007732391357421875, -0.000946044921875, 0.005840301513671875, 0.01262664794921875, 0.019412994384765625, 0.0261993408203125, 0.032985687255859375, 0.03977203369140625, 0.046558380126953125, 0.0533447265625, 0.060131072998046875, 0.06691741943359375, 0.07370376586914062, 0.0804901123046875, 0.08727645874023438, 0.09406280517578125, 0.10084915161132812, 0.107635498046875, 0.11442184448242188, 0.12120819091796875, 0.12799453735351562, 0.1347808837890625, 0.14156723022460938, 0.14835357666015625, 0.15513992309570312, 0.16192626953125, 0.16871261596679688, 0.17549896240234375, 0.18228530883789062, 0.1890716552734375, 0.19585800170898438, 0.20264434814453125, 0.20943069458007812, 0.216217041015625, 0.22300338745117188, 0.22978973388671875, 0.23657608032226562, 0.2433624267578125, 0.2501487731933594, 0.25693511962890625, 0.2637214660644531, 0.2705078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 9.0, 28.0, 26.0, 42.0, 80.0, 113.0, 109.0, 130.0, 134.0, 112.0, 84.0, 52.0, 31.0, 20.0, 12.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0772705078125, -0.07289886474609375, -0.0685272216796875, -0.06415557861328125, -0.059783935546875, -0.05541229248046875, -0.0510406494140625, -0.04666900634765625, -0.04229736328125, -0.03792572021484375, -0.0335540771484375, -0.02918243408203125, -0.024810791015625, -0.02043914794921875, -0.0160675048828125, -0.01169586181640625, -0.00732421875, -0.00295257568359375, 0.0014190673828125, 0.00579071044921875, 0.010162353515625, 0.01453399658203125, 0.0189056396484375, 0.02327728271484375, 0.02764892578125, 0.03202056884765625, 0.0363922119140625, 0.04076385498046875, 0.045135498046875, 0.04950714111328125, 0.0538787841796875, 0.05825042724609375, 0.0626220703125, 0.06699371337890625, 0.0713653564453125, 0.07573699951171875, 0.080108642578125, 0.08448028564453125, 0.0888519287109375, 0.09322357177734375, 0.09759521484375, 0.10196685791015625, 0.1063385009765625, 0.11071014404296875, 0.115081787109375, 0.11945343017578125, 0.1238250732421875, 0.12819671630859375, 0.132568359375, 0.13694000244140625, 0.1413116455078125, 0.14568328857421875, 0.150054931640625, 0.15442657470703125, 0.1587982177734375, 0.16316986083984375, 0.16754150390625, 0.17191314697265625, 0.1762847900390625, 0.18065643310546875, 0.185028076171875, 0.18939971923828125, 0.1937713623046875, 0.19814300537109375, 0.2025146484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 10.0, 11.0, 28.0, 21.0, 29.0, 52.0, 73.0, 102.0, 241.0, 472.0, 1287.0, 5757.0, 41387.0, 566595.0, 3230046.0, 314735.0, 27281.0, 4104.0, 1038.0, 388.0, 223.0, 121.0, 81.0, 50.0, 42.0, 29.0, 14.0, 11.0, 11.0, 5.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.22705078125, -0.22004318237304688, -0.21303558349609375, -0.20602798461914062, -0.1990203857421875, -0.19201278686523438, -0.18500518798828125, -0.17799758911132812, -0.170989990234375, -0.16398239135742188, -0.15697479248046875, -0.14996719360351562, -0.1429595947265625, -0.13595199584960938, -0.12894439697265625, -0.12193679809570312, -0.11492919921875, -0.10792160034179688, -0.10091400146484375, -0.09390640258789062, -0.0868988037109375, -0.07989120483398438, -0.07288360595703125, -0.06587600708007812, -0.058868408203125, -0.051860809326171875, -0.04485321044921875, -0.037845611572265625, -0.0308380126953125, -0.023830413818359375, -0.01682281494140625, -0.009815216064453125, -0.0028076171875, 0.004199981689453125, 0.01120758056640625, 0.018215179443359375, 0.0252227783203125, 0.032230377197265625, 0.03923797607421875, 0.046245574951171875, 0.053253173828125, 0.060260772705078125, 0.06726837158203125, 0.07427597045898438, 0.0812835693359375, 0.08829116821289062, 0.09529876708984375, 0.10230636596679688, 0.10931396484375, 0.11632156372070312, 0.12332916259765625, 0.13033676147460938, 0.1373443603515625, 0.14435195922851562, 0.15135955810546875, 0.15836715698242188, 0.165374755859375, 0.17238235473632812, 0.17938995361328125, 0.18639755249023438, 0.1934051513671875, 0.20041275024414062, 0.20742034912109375, 0.21442794799804688, 0.221435546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 14.0, 10.0, 22.0, 17.0, 32.0, 46.0, 55.0, 76.0, 115.0, 167.0, 205.0, 280.0, 389.0, 540.0, 496.0, 449.0, 340.0, 244.0, 172.0, 117.0, 88.0, 58.0, 43.0, 30.0, 22.0, 11.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.11379051208496094, -0.11045455932617188, -0.10711860656738281, -0.10378265380859375, -0.10044670104980469, -0.09711074829101562, -0.09377479553222656, -0.0904388427734375, -0.08710289001464844, -0.08376693725585938, -0.08043098449707031, -0.07709503173828125, -0.07375907897949219, -0.07042312622070312, -0.06708717346191406, -0.063751220703125, -0.06041526794433594, -0.057079315185546875, -0.05374336242675781, -0.05040740966796875, -0.04707145690917969, -0.043735504150390625, -0.04039955139160156, -0.0370635986328125, -0.03372764587402344, -0.030391693115234375, -0.027055740356445312, -0.02371978759765625, -0.020383834838867188, -0.017047882080078125, -0.013711929321289062, -0.0103759765625, -0.0070400238037109375, -0.003704071044921875, -0.0003681182861328125, 0.00296783447265625, 0.0063037872314453125, 0.009639739990234375, 0.012975692749023438, 0.0163116455078125, 0.019647598266601562, 0.022983551025390625, 0.026319503784179688, 0.02965545654296875, 0.03299140930175781, 0.036327362060546875, 0.03966331481933594, 0.042999267578125, 0.04633522033691406, 0.049671173095703125, 0.05300712585449219, 0.05634307861328125, 0.05967903137207031, 0.06301498413085938, 0.06635093688964844, 0.0696868896484375, 0.07302284240722656, 0.07635879516601562, 0.07969474792480469, 0.08303070068359375, 0.08636665344238281, 0.08970260620117188, 0.09303855895996094, 0.09637451171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 9.0, 33.0, 93.0, 195.0, 256.0, 219.0, 122.0, 57.0, 16.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2261666059494019, -1.187685251235962, -1.1492037773132324, -1.1107224225997925, -1.0722410678863525, -1.033759593963623, -0.9952782392501831, -0.9567968249320984, -0.9183154106140137, -0.879833996295929, -0.8413525819778442, -0.8028712272644043, -0.7643898129463196, -0.7259083986282349, -0.6874270439147949, -0.6489456295967102, -0.6104642152786255, -0.5719828009605408, -0.533501386642456, -0.4950200319290161, -0.4565386176109314, -0.4180572032928467, -0.37957581877708435, -0.341094434261322, -0.3026130199432373, -0.2641316056251526, -0.22565022110939026, -0.18716882169246674, -0.1486874222755432, -0.11020602285861969, -0.07172462344169617, -0.03324323892593384, 0.00523829460144043, 0.04371969401836395, 0.08220109343528748, 0.120682492852211, 0.15916389226913452, 0.19764529168605804, 0.23612669110298157, 0.2746080756187439, 0.3130894899368286, 0.35157090425491333, 0.39005228877067566, 0.428533673286438, 0.4670150876045227, 0.5054965019226074, 0.5439778566360474, 0.5824592709541321, 0.6209406852722168, 0.6594220995903015, 0.6979035139083862, 0.7363848686218262, 0.7748662829399109, 0.8133476972579956, 0.8518290519714355, 0.8903104662895203, 0.928791880607605, 0.9672732949256897, 1.0057547092437744, 1.0442360639572144, 1.0827174186706543, 1.1211988925933838, 1.1596802473068237, 1.1981616020202637, 1.2366430759429932]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 9.0, 15.0, 8.0, 16.0, 20.0, 18.0, 32.0, 29.0, 30.0, 42.0, 42.0, 35.0, 52.0, 49.0, 42.0, 41.0, 48.0, 44.0, 40.0, 42.0, 37.0, 47.0, 35.0, 30.0, 19.0, 19.0, 19.0, 18.0, 15.0, 14.0, 12.0, 12.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3093070983886719, -0.2985919117927551, -0.287876695394516, -0.27716150879859924, -0.2664463222026825, -0.25573110580444336, -0.2450159192085266, -0.23430071771144867, -0.22358551621437073, -0.21287031471729279, -0.20215512812137604, -0.1914399266242981, -0.18072472512722015, -0.1700095236301422, -0.15929433703422546, -0.14857913553714752, -0.13786394894123077, -0.12714874744415283, -0.11643355339765549, -0.10571835935115814, -0.0950031578540802, -0.08428796380758286, -0.07357276976108551, -0.06285756826400757, -0.05214237421751022, -0.04142717644572258, -0.030711980536580086, -0.01999678462743759, -0.009281586855649948, 0.0014336109161376953, 0.01214880496263504, 0.022864006459712982, 0.03357920050621033, 0.04429439827799797, 0.055009596049785614, 0.06572479009628296, 0.0764399915933609, 0.08715518563985825, 0.09787037968635559, 0.10858558118343353, 0.11930077522993088, 0.13001596927642822, 0.14073117077350616, 0.1514463722705841, 0.16216155886650085, 0.1728767603635788, 0.18359196186065674, 0.1943071484565735, 0.20502234995365143, 0.21573755145072937, 0.22645273804664612, 0.23716793954372406, 0.247883141040802, 0.25859832763671875, 0.2693135142326355, 0.28002873063087463, 0.2907439172267914, 0.30145910382270813, 0.31217432022094727, 0.322889506816864, 0.33360469341278076, 0.3443199098110199, 0.35503509640693665, 0.3657503128051758, 0.37646549940109253]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 11.0, 9.0, 17.0, 13.0, 25.0, 22.0, 37.0, 36.0, 66.0, 69.0, 120.0, 169.0, 238.0, 301.0, 555.0, 1005.0, 2229.0, 6175.0, 21780.0, 99264.0, 474266.0, 350124.0, 67401.0, 15609.0, 4646.0, 1879.0, 893.0, 491.0, 288.0, 218.0, 154.0, 94.0, 91.0, 61.0, 41.0, 42.0, 25.0, 19.0, 14.0, 14.0, 11.0, 8.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28271484375, -0.2735595703125, -0.264404296875, -0.2552490234375, -0.24609375, -0.2369384765625, -0.227783203125, -0.2186279296875, -0.20947265625, -0.2003173828125, -0.191162109375, -0.1820068359375, -0.1728515625, -0.1636962890625, -0.154541015625, -0.1453857421875, -0.13623046875, -0.1270751953125, -0.117919921875, -0.1087646484375, -0.099609375, -0.0904541015625, -0.081298828125, -0.0721435546875, -0.06298828125, -0.0538330078125, -0.044677734375, -0.0355224609375, -0.0263671875, -0.0172119140625, -0.008056640625, 0.0010986328125, 0.01025390625, 0.0194091796875, 0.028564453125, 0.0377197265625, 0.046875, 0.0560302734375, 0.065185546875, 0.0743408203125, 0.08349609375, 0.0926513671875, 0.101806640625, 0.1109619140625, 0.1201171875, 0.1292724609375, 0.138427734375, 0.1475830078125, 0.15673828125, 0.1658935546875, 0.175048828125, 0.1842041015625, 0.193359375, 0.2025146484375, 0.211669921875, 0.2208251953125, 0.22998046875, 0.2391357421875, 0.248291015625, 0.2574462890625, 0.2666015625, 0.2757568359375, 0.284912109375, 0.2940673828125, 0.30322265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 8.0, 16.0, 19.0, 39.0, 58.0, 92.0, 104.0, 124.0, 115.0, 134.0, 100.0, 80.0, 38.0, 32.0, 20.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06597900390625, -0.06169414520263672, -0.05740928649902344, -0.053124427795410156, -0.048839569091796875, -0.044554710388183594, -0.04026985168457031, -0.03598499298095703, -0.03170013427734375, -0.02741527557373047, -0.023130416870117188, -0.018845558166503906, -0.014560699462890625, -0.010275840759277344, -0.0059909820556640625, -0.0017061233520507812, 0.0025787353515625, 0.006863594055175781, 0.011148452758789062, 0.015433311462402344, 0.019718170166015625, 0.024003028869628906, 0.028287887573242188, 0.03257274627685547, 0.03685760498046875, 0.04114246368408203, 0.04542732238769531, 0.049712181091308594, 0.053997039794921875, 0.058281898498535156, 0.06256675720214844, 0.06685161590576172, 0.071136474609375, 0.07542133331298828, 0.07970619201660156, 0.08399105072021484, 0.08827590942382812, 0.0925607681274414, 0.09684562683105469, 0.10113048553466797, 0.10541534423828125, 0.10970020294189453, 0.11398506164550781, 0.1182699203491211, 0.12255477905273438, 0.12683963775634766, 0.13112449645996094, 0.13540935516357422, 0.1396942138671875, 0.14397907257080078, 0.14826393127441406, 0.15254878997802734, 0.15683364868164062, 0.1611185073852539, 0.1654033660888672, 0.16968822479248047, 0.17397308349609375, 0.17825794219970703, 0.1825428009033203, 0.1868276596069336, 0.19111251831054688, 0.19539737701416016, 0.19968223571777344, 0.20396709442138672, 0.208251953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 14.0, 13.0, 10.0, 20.0, 28.0, 45.0, 54.0, 85.0, 163.0, 318.0, 614.0, 1283.0, 2821.0, 6644.0, 14733.0, 33626.0, 77522.0, 175133.0, 301757.0, 236427.0, 110328.0, 48714.0, 21112.0, 9239.0, 4200.0, 1867.0, 827.0, 394.0, 204.0, 110.0, 73.0, 50.0, 29.0, 21.0, 18.0, 12.0, 13.0, 11.0, 5.0, 9.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.156005859375, -0.15108680725097656, -0.14616775512695312, -0.1412487030029297, -0.13632965087890625, -0.1314105987548828, -0.12649154663085938, -0.12157249450683594, -0.1166534423828125, -0.11173439025878906, -0.10681533813476562, -0.10189628601074219, -0.09697723388671875, -0.09205818176269531, -0.08713912963867188, -0.08222007751464844, -0.077301025390625, -0.07238197326660156, -0.06746292114257812, -0.06254386901855469, -0.05762481689453125, -0.05270576477050781, -0.047786712646484375, -0.04286766052246094, -0.0379486083984375, -0.03302955627441406, -0.028110504150390625, -0.023191452026367188, -0.01827239990234375, -0.013353347778320312, -0.008434295654296875, -0.0035152435302734375, 0.00140380859375, 0.0063228607177734375, 0.011241912841796875, 0.016160964965820312, 0.02108001708984375, 0.025999069213867188, 0.030918121337890625, 0.03583717346191406, 0.0407562255859375, 0.04567527770996094, 0.050594329833984375, 0.05551338195800781, 0.06043243408203125, 0.06535148620605469, 0.07027053833007812, 0.07518959045410156, 0.080108642578125, 0.08502769470214844, 0.08994674682617188, 0.09486579895019531, 0.09978485107421875, 0.10470390319824219, 0.10962295532226562, 0.11454200744628906, 0.1194610595703125, 0.12438011169433594, 0.12929916381835938, 0.1342182159423828, 0.13913726806640625, 0.1440563201904297, 0.14897537231445312, 0.15389442443847656, 0.1588134765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 14.0, 8.0, 10.0, 15.0, 17.0, 21.0, 18.0, 22.0, 20.0, 28.0, 30.0, 30.0, 31.0, 36.0, 35.0, 35.0, 34.0, 37.0, 53.0, 52.0, 38.0, 46.0, 35.0, 27.0, 36.0, 27.0, 30.0, 28.0, 24.0, 18.0, 24.0, 25.0, 14.0, 14.0, 11.0, 10.0, 8.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1485595703125, -0.14398574829101562, -0.13941192626953125, -0.13483810424804688, -0.1302642822265625, -0.12569046020507812, -0.12111663818359375, -0.11654281616210938, -0.111968994140625, -0.10739517211914062, -0.10282135009765625, -0.09824752807617188, -0.0936737060546875, -0.08909988403320312, -0.08452606201171875, -0.07995223999023438, -0.07537841796875, -0.07080459594726562, -0.06623077392578125, -0.061656951904296875, -0.0570831298828125, -0.052509307861328125, -0.04793548583984375, -0.043361663818359375, -0.038787841796875, -0.034214019775390625, -0.02964019775390625, -0.025066375732421875, -0.0204925537109375, -0.015918731689453125, -0.01134490966796875, -0.006771087646484375, -0.002197265625, 0.002376556396484375, 0.00695037841796875, 0.011524200439453125, 0.0160980224609375, 0.020671844482421875, 0.02524566650390625, 0.029819488525390625, 0.034393310546875, 0.038967132568359375, 0.04354095458984375, 0.048114776611328125, 0.0526885986328125, 0.057262420654296875, 0.06183624267578125, 0.06641006469726562, 0.07098388671875, 0.07555770874023438, 0.08013153076171875, 0.08470535278320312, 0.0892791748046875, 0.09385299682617188, 0.09842681884765625, 0.10300064086914062, 0.107574462890625, 0.11214828491210938, 0.11672210693359375, 0.12129592895507812, 0.1258697509765625, 0.13044357299804688, 0.13501739501953125, 0.13959121704101562, 0.1441650390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 9.0, 5.0, 14.0, 15.0, 26.0, 45.0, 52.0, 90.0, 124.0, 193.0, 298.0, 477.0, 797.0, 1338.0, 2209.0, 3813.0, 6872.0, 12364.0, 22535.0, 42138.0, 75914.0, 130672.0, 189900.0, 202611.0, 151155.0, 91252.0, 50881.0, 27751.0, 15182.0, 8377.0, 4614.0, 2644.0, 1586.0, 1010.0, 609.0, 380.0, 197.0, 145.0, 83.0, 59.0, 41.0, 27.0, 18.0, 13.0, 14.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.03803300857543945, -0.036728858947753906, -0.03542470932006836, -0.03412055969238281, -0.032816410064697266, -0.03151226043701172, -0.030208110809326172, -0.028903961181640625, -0.027599811553955078, -0.02629566192626953, -0.024991512298583984, -0.023687362670898438, -0.02238321304321289, -0.021079063415527344, -0.019774913787841797, -0.01847076416015625, -0.017166614532470703, -0.015862464904785156, -0.01455831527709961, -0.013254165649414062, -0.011950016021728516, -0.010645866394042969, -0.009341716766357422, -0.008037567138671875, -0.006733417510986328, -0.005429267883300781, -0.004125118255615234, -0.0028209686279296875, -0.0015168190002441406, -0.00021266937255859375, 0.0010914802551269531, 0.0023956298828125, 0.003699779510498047, 0.005003929138183594, 0.006308078765869141, 0.0076122283935546875, 0.008916378021240234, 0.010220527648925781, 0.011524677276611328, 0.012828826904296875, 0.014132976531982422, 0.015437126159667969, 0.016741275787353516, 0.018045425415039062, 0.01934957504272461, 0.020653724670410156, 0.021957874298095703, 0.02326202392578125, 0.024566173553466797, 0.025870323181152344, 0.02717447280883789, 0.028478622436523438, 0.029782772064208984, 0.03108692169189453, 0.03239107131958008, 0.033695220947265625, 0.03499937057495117, 0.03630352020263672, 0.037607669830322266, 0.03891181945800781, 0.04021596908569336, 0.041520118713378906, 0.04282426834106445, 0.04412841796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 4.0, 2.0, 7.0, 11.0, 13.0, 13.0, 14.0, 16.0, 30.0, 42.0, 30.0, 37.0, 48.0, 71.0, 94.0, 106.0, 88.0, 82.0, 55.0, 51.0, 32.0, 34.0, 21.0, 12.0, 20.0, 12.0, 17.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0311603546142578e-05, -9.922310709953308e-06, -9.533017873764038e-06, -9.143725037574768e-06, -8.754432201385498e-06, -8.365139365196228e-06, -7.975846529006958e-06, -7.586553692817688e-06, -7.197260856628418e-06, -6.807968020439148e-06, -6.418675184249878e-06, -6.029382348060608e-06, -5.640089511871338e-06, -5.250796675682068e-06, -4.861503839492798e-06, -4.472211003303528e-06, -4.082918167114258e-06, -3.693625330924988e-06, -3.3043324947357178e-06, -2.9150396585464478e-06, -2.5257468223571777e-06, -2.1364539861679077e-06, -1.7471611499786377e-06, -1.3578683137893677e-06, -9.685754776000977e-07, -5.792826414108276e-07, -1.8998980522155762e-07, 1.993030309677124e-07, 5.885958671569824e-07, 9.778887033462524e-07, 1.3671815395355225e-06, 1.7564743757247925e-06, 2.1457672119140625e-06, 2.5350600481033325e-06, 2.9243528842926025e-06, 3.3136457204818726e-06, 3.7029385566711426e-06, 4.092231392860413e-06, 4.481524229049683e-06, 4.870817065238953e-06, 5.260109901428223e-06, 5.649402737617493e-06, 6.038695573806763e-06, 6.427988409996033e-06, 6.817281246185303e-06, 7.206574082374573e-06, 7.595866918563843e-06, 7.985159754753113e-06, 8.374452590942383e-06, 8.763745427131653e-06, 9.153038263320923e-06, 9.542331099510193e-06, 9.931623935699463e-06, 1.0320916771888733e-05, 1.0710209608078003e-05, 1.1099502444267273e-05, 1.1488795280456543e-05, 1.1878088116645813e-05, 1.2267380952835083e-05, 1.2656673789024353e-05, 1.3045966625213623e-05, 1.3435259461402893e-05, 1.3824552297592163e-05, 1.4213845133781433e-05, 1.4603137969970703e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 10.0, 8.0, 11.0, 22.0, 40.0, 57.0, 93.0, 164.0, 275.0, 458.0, 737.0, 1391.0, 2565.0, 4519.0, 8424.0, 16059.0, 29954.0, 56291.0, 101819.0, 168137.0, 215763.0, 184466.0, 116313.0, 65387.0, 35174.0, 18725.0, 9743.0, 5262.0, 2886.0, 1667.0, 945.0, 445.0, 294.0, 186.0, 100.0, 59.0, 29.0, 25.0, 10.0, 8.0, 10.0, 7.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.03835916519165039, -0.03710651397705078, -0.03585386276245117, -0.03460121154785156, -0.03334856033325195, -0.032095909118652344, -0.030843257904052734, -0.029590606689453125, -0.028337955474853516, -0.027085304260253906, -0.025832653045654297, -0.024580001831054688, -0.023327350616455078, -0.02207469940185547, -0.02082204818725586, -0.01956939697265625, -0.01831674575805664, -0.01706409454345703, -0.015811443328857422, -0.014558792114257812, -0.013306140899658203, -0.012053489685058594, -0.010800838470458984, -0.009548187255859375, -0.008295536041259766, -0.007042884826660156, -0.005790233612060547, -0.0045375823974609375, -0.003284931182861328, -0.0020322799682617188, -0.0007796287536621094, 0.0004730224609375, 0.0017256736755371094, 0.0029783248901367188, 0.004230976104736328, 0.0054836273193359375, 0.006736278533935547, 0.007988929748535156, 0.009241580963134766, 0.010494232177734375, 0.011746883392333984, 0.012999534606933594, 0.014252185821533203, 0.015504837036132812, 0.016757488250732422, 0.01801013946533203, 0.01926279067993164, 0.02051544189453125, 0.02176809310913086, 0.02302074432373047, 0.024273395538330078, 0.025526046752929688, 0.026778697967529297, 0.028031349182128906, 0.029284000396728516, 0.030536651611328125, 0.031789302825927734, 0.033041954040527344, 0.03429460525512695, 0.03554725646972656, 0.03679990768432617, 0.03805255889892578, 0.03930521011352539, 0.040557861328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 3.0, 8.0, 13.0, 16.0, 18.0, 18.0, 23.0, 20.0, 35.0, 35.0, 49.0, 36.0, 48.0, 44.0, 70.0, 64.0, 61.0, 56.0, 49.0, 39.0, 44.0, 42.0, 38.0, 18.0, 20.0, 27.0, 17.0, 16.0, 11.0, 13.0, 10.0, 3.0, 3.0, 2.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.040924072265625, -0.03970623016357422, -0.03848838806152344, -0.037270545959472656, -0.036052703857421875, -0.034834861755371094, -0.03361701965332031, -0.03239917755126953, -0.03118133544921875, -0.02996349334716797, -0.028745651245117188, -0.027527809143066406, -0.026309967041015625, -0.025092124938964844, -0.023874282836914062, -0.02265644073486328, -0.0214385986328125, -0.02022075653076172, -0.019002914428710938, -0.017785072326660156, -0.016567230224609375, -0.015349388122558594, -0.014131546020507812, -0.012913703918457031, -0.01169586181640625, -0.010478019714355469, -0.009260177612304688, -0.008042335510253906, -0.006824493408203125, -0.005606651306152344, -0.0043888092041015625, -0.0031709671020507812, -0.001953125, -0.0007352828979492188, 0.0004825592041015625, 0.0017004013061523438, 0.002918243408203125, 0.004136085510253906, 0.0053539276123046875, 0.006571769714355469, 0.00778961181640625, 0.009007453918457031, 0.010225296020507812, 0.011443138122558594, 0.012660980224609375, 0.013878822326660156, 0.015096664428710938, 0.01631450653076172, 0.0175323486328125, 0.01875019073486328, 0.019968032836914062, 0.021185874938964844, 0.022403717041015625, 0.023621559143066406, 0.024839401245117188, 0.02605724334716797, 0.02727508544921875, 0.02849292755126953, 0.029710769653320312, 0.030928611755371094, 0.032146453857421875, 0.033364295959472656, 0.03458213806152344, 0.03579998016357422, 0.037017822265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 53.0, 159.0, 280.0, 319.0, 130.0, 43.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.192502021789551, -2.1280267238616943, -2.063551187515259, -1.9990758895874023, -1.934600591659546, -1.8701251745224, -1.805649757385254, -1.7411744594573975, -1.6766990423202515, -1.6122236251831055, -1.547748327255249, -1.483272910118103, -1.418797492980957, -1.3543221950531006, -1.2898467779159546, -1.2253713607788086, -1.1608960628509521, -1.0964206457138062, -1.0319453477859497, -0.9674699306488037, -0.9029945731163025, -0.8385192155838013, -0.7740437984466553, -0.709568440914154, -0.6450930833816528, -0.5806177258491516, -0.5161423683166504, -0.4516669511795044, -0.3871915936470032, -0.32271623611450195, -0.25824084877967834, -0.19376546144485474, -0.12928986549377441, -0.064814493060112, -0.00033912062644958496, 0.06413625180721283, 0.12861162424087524, 0.19308698177337646, 0.2575623691082001, 0.3220377564430237, 0.3865131139755249, 0.4509884715080261, 0.5154638290405273, 0.5799392461776733, 0.6444146037101746, 0.7088899612426758, 0.7733653783798218, 0.837840735912323, 0.9023160934448242, 0.9667914509773254, 1.0312668085098267, 1.0957422256469727, 1.160217523574829, 1.224692940711975, 1.289168357849121, 1.3536436557769775, 1.4181190729141235, 1.4825944900512695, 1.547069787979126, 1.611545205116272, 1.676020622253418, 1.7404959201812744, 1.8049713373184204, 1.8694467544555664, 1.9339220523834229]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 10.0, 10.0, 7.0, 11.0, 12.0, 18.0, 20.0, 28.0, 29.0, 26.0, 35.0, 44.0, 36.0, 30.0, 49.0, 51.0, 54.0, 43.0, 46.0, 39.0, 65.0, 43.0, 35.0, 35.0, 44.0, 18.0, 28.0, 24.0, 24.0, 24.0, 14.0, 13.0, 6.0, 9.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6124780774116516, -0.5935313701629639, -0.5745847225189209, -0.5556380152702332, -0.5366913080215454, -0.5177446007728577, -0.4987979233264923, -0.47985124588012695, -0.4609045386314392, -0.44195783138275146, -0.4230111539363861, -0.40406447649002075, -0.385117769241333, -0.36617106199264526, -0.3472243845462799, -0.32827770709991455, -0.3093309998512268, -0.29038429260253906, -0.2714376151561737, -0.25249093770980835, -0.2335442304611206, -0.21459753811359406, -0.1956508457660675, -0.17670415341854095, -0.1577574610710144, -0.13881076872348785, -0.1198640763759613, -0.10091738402843475, -0.0819706916809082, -0.06302399933338165, -0.0440773069858551, -0.025130614638328552, -0.006183981895446777, 0.012762710452079773, 0.03170940279960632, 0.050656095147132874, 0.06960278749465942, 0.08854947984218597, 0.10749617218971252, 0.12644286453723907, 0.14538955688476562, 0.16433624923229218, 0.18328294157981873, 0.20222963392734528, 0.22117632627487183, 0.24012301862239838, 0.2590697109699249, 0.2780163884162903, 0.296963095664978, 0.31590980291366577, 0.33485648036003113, 0.3538031578063965, 0.37274986505508423, 0.391696572303772, 0.41064324975013733, 0.4295899271965027, 0.44853663444519043, 0.4674833416938782, 0.48643001914024353, 0.5053766965866089, 0.5243234038352966, 0.5432701110839844, 0.5622167587280273, 0.5811634659767151, 0.6001101732254028]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 14.0, 10.0, 24.0, 35.0, 53.0, 111.0, 183.0, 428.0, 1108.0, 3002.0, 10149.0, 47117.0, 785882.0, 3193055.0, 128576.0, 16213.0, 4401.0, 1731.0, 836.0, 482.0, 299.0, 171.0, 125.0, 88.0, 51.0, 30.0, 29.0, 21.0, 21.0, 14.0, 8.0, 7.0, 0.0, 1.0, 4.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.15855026245117188, -0.15108489990234375, -0.14361953735351562, -0.1361541748046875, -0.12868881225585938, -0.12122344970703125, -0.11375808715820312, -0.106292724609375, -0.09882736206054688, -0.09136199951171875, -0.08389663696289062, -0.0764312744140625, -0.06896591186523438, -0.06150054931640625, -0.054035186767578125, -0.04656982421875, -0.039104461669921875, -0.03163909912109375, -0.024173736572265625, -0.0167083740234375, -0.009243011474609375, -0.00177764892578125, 0.005687713623046875, 0.013153076171875, 0.020618438720703125, 0.02808380126953125, 0.035549163818359375, 0.0430145263671875, 0.050479888916015625, 0.05794525146484375, 0.06541061401367188, 0.0728759765625, 0.08034133911132812, 0.08780670166015625, 0.09527206420898438, 0.1027374267578125, 0.11020278930664062, 0.11766815185546875, 0.12513351440429688, 0.132598876953125, 0.14006423950195312, 0.14752960205078125, 0.15499496459960938, 0.1624603271484375, 0.16992568969726562, 0.17739105224609375, 0.18485641479492188, 0.19232177734375, 0.19978713989257812, 0.20725250244140625, 0.21471786499023438, 0.2221832275390625, 0.22964859008789062, 0.23711395263671875, 0.24457931518554688, 0.252044677734375, 0.2595100402832031, 0.26697540283203125, 0.2744407653808594, 0.2819061279296875, 0.2893714904785156, 0.29683685302734375, 0.3043022155761719, 0.311767578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 5.0, 22.0, 36.0, 46.0, 66.0, 95.0, 90.0, 111.0, 125.0, 105.0, 106.0, 61.0, 45.0, 32.0, 16.0, 16.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06329345703125, -0.05913066864013672, -0.05496788024902344, -0.050805091857910156, -0.046642303466796875, -0.042479515075683594, -0.03831672668457031, -0.03415393829345703, -0.02999114990234375, -0.02582836151123047, -0.021665573120117188, -0.017502784729003906, -0.013339996337890625, -0.009177207946777344, -0.0050144195556640625, -0.0008516311645507812, 0.0033111572265625, 0.007473945617675781, 0.011636734008789062, 0.015799522399902344, 0.019962310791015625, 0.024125099182128906, 0.028287887573242188, 0.03245067596435547, 0.03661346435546875, 0.04077625274658203, 0.04493904113769531, 0.049101829528808594, 0.053264617919921875, 0.057427406311035156, 0.06159019470214844, 0.06575298309326172, 0.069915771484375, 0.07407855987548828, 0.07824134826660156, 0.08240413665771484, 0.08656692504882812, 0.0907297134399414, 0.09489250183105469, 0.09905529022216797, 0.10321807861328125, 0.10738086700439453, 0.11154365539550781, 0.1157064437866211, 0.11986923217773438, 0.12403202056884766, 0.12819480895996094, 0.13235759735107422, 0.1365203857421875, 0.14068317413330078, 0.14484596252441406, 0.14900875091552734, 0.15317153930664062, 0.1573343276977539, 0.1614971160888672, 0.16565990447998047, 0.16982269287109375, 0.17398548126220703, 0.1781482696533203, 0.1823110580444336, 0.18647384643554688, 0.19063663482666016, 0.19479942321777344, 0.19896221160888672, 0.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 8.0, 17.0, 13.0, 21.0, 28.0, 43.0, 57.0, 123.0, 179.0, 367.0, 991.0, 3211.0, 15148.0, 125987.0, 1916748.0, 1980006.0, 130343.0, 15855.0, 3220.0, 957.0, 400.0, 172.0, 113.0, 78.0, 62.0, 38.0, 23.0, 15.0, 19.0, 5.0, 8.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2003173828125, -0.19364166259765625, -0.1869659423828125, -0.18029022216796875, -0.173614501953125, -0.16693878173828125, -0.1602630615234375, -0.15358734130859375, -0.14691162109375, -0.14023590087890625, -0.1335601806640625, -0.12688446044921875, -0.120208740234375, -0.11353302001953125, -0.1068572998046875, -0.10018157958984375, -0.093505859375, -0.08683013916015625, -0.0801544189453125, -0.07347869873046875, -0.066802978515625, -0.06012725830078125, -0.0534515380859375, -0.04677581787109375, -0.04010009765625, -0.03342437744140625, -0.0267486572265625, -0.02007293701171875, -0.013397216796875, -0.00672149658203125, -4.57763671875e-05, 0.00662994384765625, 0.0133056640625, 0.01998138427734375, 0.0266571044921875, 0.03333282470703125, 0.040008544921875, 0.04668426513671875, 0.0533599853515625, 0.06003570556640625, 0.06671142578125, 0.07338714599609375, 0.0800628662109375, 0.08673858642578125, 0.093414306640625, 0.10009002685546875, 0.1067657470703125, 0.11344146728515625, 0.1201171875, 0.12679290771484375, 0.1334686279296875, 0.14014434814453125, 0.146820068359375, 0.15349578857421875, 0.1601715087890625, 0.16684722900390625, 0.17352294921875, 0.18019866943359375, 0.1868743896484375, 0.19355010986328125, 0.200225830078125, 0.20690155029296875, 0.2135772705078125, 0.22025299072265625, 0.2269287109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 13.0, 18.0, 27.0, 38.0, 46.0, 76.0, 88.0, 145.0, 222.0, 282.0, 401.0, 494.0, 564.0, 484.0, 365.0, 248.0, 170.0, 113.0, 93.0, 56.0, 30.0, 20.0, 18.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129638671875, -0.12615394592285156, -0.12266921997070312, -0.11918449401855469, -0.11569976806640625, -0.11221504211425781, -0.10873031616210938, -0.10524559020996094, -0.1017608642578125, -0.09827613830566406, -0.09479141235351562, -0.09130668640136719, -0.08782196044921875, -0.08433723449707031, -0.08085250854492188, -0.07736778259277344, -0.073883056640625, -0.07039833068847656, -0.06691360473632812, -0.06342887878417969, -0.05994415283203125, -0.05645942687988281, -0.052974700927734375, -0.04948997497558594, -0.0460052490234375, -0.04252052307128906, -0.039035797119140625, -0.03555107116699219, -0.03206634521484375, -0.028581619262695312, -0.025096893310546875, -0.021612167358398438, -0.01812744140625, -0.014642715454101562, -0.011157989501953125, -0.0076732635498046875, -0.00418853759765625, -0.0007038116455078125, 0.002780914306640625, 0.0062656402587890625, 0.0097503662109375, 0.013235092163085938, 0.016719818115234375, 0.020204544067382812, 0.02368927001953125, 0.027173995971679688, 0.030658721923828125, 0.03414344787597656, 0.037628173828125, 0.04111289978027344, 0.044597625732421875, 0.04808235168457031, 0.05156707763671875, 0.05505180358886719, 0.058536529541015625, 0.06202125549316406, 0.0655059814453125, 0.06899070739746094, 0.07247543334960938, 0.07596015930175781, 0.07944488525390625, 0.08292961120605469, 0.08641433715820312, 0.08989906311035156, 0.0933837890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 20.0, 38.0, 95.0, 168.0, 215.0, 212.0, 127.0, 80.0, 24.0, 13.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359740138053894, -1.3247348070144653, -1.2897295951843262, -1.2547242641448975, -1.2197190523147583, -1.1847137212753296, -1.1497085094451904, -1.1147031784057617, -1.079697847366333, -1.0446925163269043, -1.0096873044967651, -0.9746820330619812, -0.9396767616271973, -0.9046714305877686, -0.8696661591529846, -0.8346608877182007, -0.7996556758880615, -0.7646504044532776, -0.7296451330184937, -0.6946398615837097, -0.6596345901489258, -0.6246292591094971, -0.5896239876747131, -0.5546187162399292, -0.5196134448051453, -0.48460817337036133, -0.4496029019355774, -0.41459760069847107, -0.37959232926368713, -0.3445870578289032, -0.3095817565917969, -0.27457648515701294, -0.23957133293151855, -0.20456606149673462, -0.1695607751607895, -0.13455548882484436, -0.09955021739006042, -0.06454494595527649, -0.02953965961933136, 0.0054656267166137695, 0.040470898151397705, 0.07547617703676224, 0.11048145592212677, 0.1454867422580719, 0.18049201369285583, 0.21549728512763977, 0.2505025863647461, 0.28550785779953003, 0.32051312923431396, 0.3555184006690979, 0.39052367210388184, 0.42552897334098816, 0.4605342447757721, 0.49553951621055603, 0.5305448174476624, 0.5655500888824463, 0.6005553603172302, 0.6355606317520142, 0.6705659031867981, 0.705571174621582, 0.7405765056610107, 0.7755817174911499, 0.8105870485305786, 0.8455923199653625, 0.8805975914001465]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 8.0, 11.0, 18.0, 15.0, 20.0, 23.0, 28.0, 22.0, 25.0, 38.0, 40.0, 60.0, 53.0, 52.0, 48.0, 50.0, 49.0, 40.0, 49.0, 40.0, 40.0, 30.0, 32.0, 41.0, 24.0, 28.0, 17.0, 22.0, 13.0, 11.0, 15.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3257802128791809, -0.31436967849731445, -0.3029591143131256, -0.29154857993125916, -0.2801380157470703, -0.26872748136520386, -0.2573169469833374, -0.24590638279914856, -0.2344958335161209, -0.22308528423309326, -0.2116747349500656, -0.20026418566703796, -0.1888536512851715, -0.17744308710098267, -0.1660325527191162, -0.15462200343608856, -0.1432114541530609, -0.13180090487003326, -0.12039035558700562, -0.10897981375455856, -0.09756926447153091, -0.08615871518850327, -0.07474817335605621, -0.06333762407302856, -0.051927074790000916, -0.04051652550697327, -0.029105979949235916, -0.017695434391498566, -0.006284885108470917, 0.005125664174556732, 0.016536206007003784, 0.027946755290031433, 0.03935730457305908, 0.05076785385608673, 0.06217839941382408, 0.07358894497156143, 0.08499949425458908, 0.09641004353761673, 0.10782058537006378, 0.11923113465309143, 0.13064168393611908, 0.14205223321914673, 0.15346278250217438, 0.16487333178520203, 0.17628386616706848, 0.18769443035125732, 0.19910496473312378, 0.21051551401615143, 0.22192606329917908, 0.23333661258220673, 0.24474716186523438, 0.25615769624710083, 0.2675682604312897, 0.27897879481315613, 0.29038935899734497, 0.3017998933792114, 0.3132104277610779, 0.32462096214294434, 0.3360315263271332, 0.34744206070899963, 0.3588526248931885, 0.37026315927505493, 0.3816736936569214, 0.39308425784111023, 0.4044948220252991]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 17.0, 15.0, 21.0, 32.0, 41.0, 66.0, 95.0, 128.0, 170.0, 258.0, 408.0, 709.0, 1400.0, 3532.0, 10784.0, 45827.0, 246227.0, 546444.0, 150271.0, 29143.0, 7573.0, 2608.0, 1108.0, 602.0, 356.0, 212.0, 138.0, 100.0, 77.0, 48.0, 39.0, 21.0, 21.0, 18.0, 9.0, 8.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.470458984375, -0.45676422119140625, -0.4430694580078125, -0.42937469482421875, -0.415679931640625, -0.40198516845703125, -0.3882904052734375, -0.37459564208984375, -0.36090087890625, -0.34720611572265625, -0.3335113525390625, -0.31981658935546875, -0.306121826171875, -0.29242706298828125, -0.2787322998046875, -0.26503753662109375, -0.2513427734375, -0.23764801025390625, -0.2239532470703125, -0.21025848388671875, -0.196563720703125, -0.18286895751953125, -0.1691741943359375, -0.15547943115234375, -0.14178466796875, -0.12808990478515625, -0.1143951416015625, -0.10070037841796875, -0.087005615234375, -0.07331085205078125, -0.0596160888671875, -0.04592132568359375, -0.0322265625, -0.01853179931640625, -0.0048370361328125, 0.00885772705078125, 0.022552490234375, 0.03624725341796875, 0.0499420166015625, 0.06363677978515625, 0.07733154296875, 0.09102630615234375, 0.1047210693359375, 0.11841583251953125, 0.132110595703125, 0.14580535888671875, 0.1595001220703125, 0.17319488525390625, 0.1868896484375, 0.20058441162109375, 0.2142791748046875, 0.22797393798828125, 0.241668701171875, 0.25536346435546875, 0.2690582275390625, 0.28275299072265625, 0.29644775390625, 0.31014251708984375, 0.3238372802734375, 0.33753204345703125, 0.351226806640625, 0.36492156982421875, 0.3786163330078125, 0.39231109619140625, 0.406005859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 7.0, 10.0, 22.0, 30.0, 59.0, 77.0, 105.0, 87.0, 127.0, 129.0, 121.0, 80.0, 56.0, 31.0, 31.0, 7.0, 11.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0634765625, -0.059200286865234375, -0.05492401123046875, -0.050647735595703125, -0.0463714599609375, -0.042095184326171875, -0.03781890869140625, -0.033542633056640625, -0.029266357421875, -0.024990081787109375, -0.02071380615234375, -0.016437530517578125, -0.0121612548828125, -0.007884979248046875, -0.00360870361328125, 0.000667572021484375, 0.00494384765625, 0.009220123291015625, 0.01349639892578125, 0.017772674560546875, 0.0220489501953125, 0.026325225830078125, 0.03060150146484375, 0.034877777099609375, 0.039154052734375, 0.043430328369140625, 0.04770660400390625, 0.051982879638671875, 0.0562591552734375, 0.060535430908203125, 0.06481170654296875, 0.06908798217773438, 0.0733642578125, 0.07764053344726562, 0.08191680908203125, 0.08619308471679688, 0.0904693603515625, 0.09474563598632812, 0.09902191162109375, 0.10329818725585938, 0.107574462890625, 0.11185073852539062, 0.11612701416015625, 0.12040328979492188, 0.1246795654296875, 0.12895584106445312, 0.13323211669921875, 0.13750839233398438, 0.14178466796875, 0.14606094360351562, 0.15033721923828125, 0.15461349487304688, 0.1588897705078125, 0.16316604614257812, 0.16744232177734375, 0.17171859741210938, 0.175994873046875, 0.18027114868164062, 0.18454742431640625, 0.18882369995117188, 0.1930999755859375, 0.19737625122070312, 0.20165252685546875, 0.20592880249023438, 0.210205078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 13.0, 9.0, 10.0, 23.0, 21.0, 27.0, 40.0, 53.0, 103.0, 136.0, 250.0, 408.0, 695.0, 1255.0, 2365.0, 4827.0, 9957.0, 21860.0, 48510.0, 105215.0, 199007.0, 262620.0, 197652.0, 103702.0, 47756.0, 21872.0, 9970.0, 4841.0, 2402.0, 1170.0, 675.0, 408.0, 265.0, 131.0, 91.0, 72.0, 51.0, 20.0, 19.0, 21.0, 15.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.1976318359375, -0.19190216064453125, -0.1861724853515625, -0.18044281005859375, -0.174713134765625, -0.16898345947265625, -0.1632537841796875, -0.15752410888671875, -0.15179443359375, -0.14606475830078125, -0.1403350830078125, -0.13460540771484375, -0.128875732421875, -0.12314605712890625, -0.1174163818359375, -0.11168670654296875, -0.10595703125, -0.10022735595703125, -0.0944976806640625, -0.08876800537109375, -0.083038330078125, -0.07730865478515625, -0.0715789794921875, -0.06584930419921875, -0.06011962890625, -0.05438995361328125, -0.0486602783203125, -0.04293060302734375, -0.037200927734375, -0.03147125244140625, -0.0257415771484375, -0.02001190185546875, -0.0142822265625, -0.00855255126953125, -0.0028228759765625, 0.00290679931640625, 0.008636474609375, 0.01436614990234375, 0.0200958251953125, 0.02582550048828125, 0.03155517578125, 0.03728485107421875, 0.0430145263671875, 0.04874420166015625, 0.054473876953125, 0.06020355224609375, 0.0659332275390625, 0.07166290283203125, 0.077392578125, 0.08312225341796875, 0.0888519287109375, 0.09458160400390625, 0.100311279296875, 0.10604095458984375, 0.1117706298828125, 0.11750030517578125, 0.12322998046875, 0.12895965576171875, 0.1346893310546875, 0.14041900634765625, 0.146148681640625, 0.15187835693359375, 0.1576080322265625, 0.16333770751953125, 0.1690673828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 9.0, 10.0, 10.0, 17.0, 15.0, 22.0, 31.0, 22.0, 32.0, 42.0, 27.0, 39.0, 52.0, 45.0, 67.0, 49.0, 50.0, 52.0, 38.0, 53.0, 37.0, 47.0, 29.0, 30.0, 30.0, 26.0, 23.0, 18.0, 16.0, 18.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1910400390625, -0.1848888397216797, -0.17873764038085938, -0.17258644104003906, -0.16643524169921875, -0.16028404235839844, -0.15413284301757812, -0.1479816436767578, -0.1418304443359375, -0.1356792449951172, -0.12952804565429688, -0.12337684631347656, -0.11722564697265625, -0.11107444763183594, -0.10492324829101562, -0.09877204895019531, -0.092620849609375, -0.08646965026855469, -0.08031845092773438, -0.07416725158691406, -0.06801605224609375, -0.06186485290527344, -0.055713653564453125, -0.04956245422363281, -0.0434112548828125, -0.03726005554199219, -0.031108856201171875, -0.024957656860351562, -0.01880645751953125, -0.012655258178710938, -0.006504058837890625, -0.0003528594970703125, 0.00579833984375, 0.011949539184570312, 0.018100738525390625, 0.024251937866210938, 0.03040313720703125, 0.03655433654785156, 0.042705535888671875, 0.04885673522949219, 0.0550079345703125, 0.06115913391113281, 0.06731033325195312, 0.07346153259277344, 0.07961273193359375, 0.08576393127441406, 0.09191513061523438, 0.09806632995605469, 0.104217529296875, 0.11036872863769531, 0.11651992797851562, 0.12267112731933594, 0.12882232666015625, 0.13497352600097656, 0.14112472534179688, 0.1472759246826172, 0.1534271240234375, 0.1595783233642578, 0.16572952270507812, 0.17188072204589844, 0.17803192138671875, 0.18418312072753906, 0.19033432006835938, 0.1964855194091797, 0.20263671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 6.0, 7.0, 17.0, 22.0, 21.0, 45.0, 54.0, 89.0, 98.0, 147.0, 236.0, 323.0, 435.0, 605.0, 894.0, 1389.0, 2141.0, 3483.0, 5842.0, 10647.0, 22104.0, 48792.0, 113417.0, 231069.0, 282487.0, 175111.0, 78045.0, 34140.0, 15938.0, 8212.0, 4519.0, 2777.0, 1702.0, 1162.0, 805.0, 502.0, 362.0, 278.0, 162.0, 138.0, 91.0, 60.0, 66.0, 37.0, 19.0, 19.0, 14.0, 9.0, 6.0, 4.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07822704315185547, -0.07564353942871094, -0.0730600357055664, -0.07047653198242188, -0.06789302825927734, -0.06530952453613281, -0.06272602081298828, -0.06014251708984375, -0.05755901336669922, -0.05497550964355469, -0.052392005920410156, -0.049808502197265625, -0.047224998474121094, -0.04464149475097656, -0.04205799102783203, -0.0394744873046875, -0.03689098358154297, -0.03430747985839844, -0.031723976135253906, -0.029140472412109375, -0.026556968688964844, -0.023973464965820312, -0.02138996124267578, -0.01880645751953125, -0.01622295379638672, -0.013639450073242188, -0.011055946350097656, -0.008472442626953125, -0.005888938903808594, -0.0033054351806640625, -0.0007219314575195312, 0.001861572265625, 0.004445075988769531, 0.0070285797119140625, 0.009612083435058594, 0.012195587158203125, 0.014779090881347656, 0.017362594604492188, 0.01994609832763672, 0.02252960205078125, 0.02511310577392578, 0.027696609497070312, 0.030280113220214844, 0.032863616943359375, 0.035447120666503906, 0.03803062438964844, 0.04061412811279297, 0.0431976318359375, 0.04578113555908203, 0.04836463928222656, 0.050948143005371094, 0.053531646728515625, 0.056115150451660156, 0.05869865417480469, 0.06128215789794922, 0.06386566162109375, 0.06644916534423828, 0.06903266906738281, 0.07161617279052734, 0.07419967651367188, 0.0767831802368164, 0.07936668395996094, 0.08195018768310547, 0.08453369140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 9.0, 12.0, 14.0, 17.0, 23.0, 59.0, 67.0, 87.0, 110.0, 129.0, 130.0, 88.0, 79.0, 44.0, 38.0, 20.0, 14.0, 10.0, 9.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.2814609110355377e-05, -2.1846964955329895e-05, -2.0879320800304413e-05, -1.991167664527893e-05, -1.894403249025345e-05, -1.7976388335227966e-05, -1.7008744180202484e-05, -1.6041100025177002e-05, -1.507345587015152e-05, -1.4105811715126038e-05, -1.3138167560100555e-05, -1.2170523405075073e-05, -1.1202879250049591e-05, -1.0235235095024109e-05, -9.267590939998627e-06, -8.299946784973145e-06, -7.332302629947662e-06, -6.36465847492218e-06, -5.397014319896698e-06, -4.429370164871216e-06, -3.4617260098457336e-06, -2.4940818548202515e-06, -1.5264376997947693e-06, -5.587935447692871e-07, 4.0885061025619507e-07, 1.3764947652816772e-06, 2.3441389203071594e-06, 3.3117830753326416e-06, 4.279427230358124e-06, 5.247071385383606e-06, 6.214715540409088e-06, 7.18235969543457e-06, 8.150003850460052e-06, 9.117648005485535e-06, 1.0085292160511017e-05, 1.1052936315536499e-05, 1.2020580470561981e-05, 1.2988224625587463e-05, 1.3955868780612946e-05, 1.4923512935638428e-05, 1.589115709066391e-05, 1.6858801245689392e-05, 1.7826445400714874e-05, 1.8794089555740356e-05, 1.976173371076584e-05, 2.072937786579132e-05, 2.1697022020816803e-05, 2.2664666175842285e-05, 2.3632310330867767e-05, 2.459995448589325e-05, 2.556759864091873e-05, 2.6535242795944214e-05, 2.7502886950969696e-05, 2.8470531105995178e-05, 2.943817526102066e-05, 3.0405819416046143e-05, 3.1373463571071625e-05, 3.234110772609711e-05, 3.330875188112259e-05, 3.427639603614807e-05, 3.5244040191173553e-05, 3.6211684346199036e-05, 3.717932850122452e-05, 3.814697265625e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 11.0, 12.0, 24.0, 48.0, 95.0, 124.0, 209.0, 320.0, 581.0, 955.0, 1605.0, 2834.0, 5888.0, 12766.0, 34427.0, 118932.0, 365098.0, 341716.0, 107196.0, 31662.0, 11933.0, 5464.0, 2831.0, 1551.0, 935.0, 486.0, 314.0, 194.0, 116.0, 65.0, 55.0, 36.0, 26.0, 11.0, 6.0, 10.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.1267690658569336, -0.12292289733886719, -0.11907672882080078, -0.11523056030273438, -0.11138439178466797, -0.10753822326660156, -0.10369205474853516, -0.09984588623046875, -0.09599971771240234, -0.09215354919433594, -0.08830738067626953, -0.08446121215820312, -0.08061504364013672, -0.07676887512207031, -0.0729227066040039, -0.0690765380859375, -0.0652303695678711, -0.06138420104980469, -0.05753803253173828, -0.053691864013671875, -0.04984569549560547, -0.04599952697753906, -0.042153358459472656, -0.03830718994140625, -0.034461021423339844, -0.030614852905273438, -0.02676868438720703, -0.022922515869140625, -0.01907634735107422, -0.015230178833007812, -0.011384010314941406, -0.007537841796875, -0.0036916732788085938, 0.0001544952392578125, 0.004000663757324219, 0.007846832275390625, 0.011693000793457031, 0.015539169311523438, 0.019385337829589844, 0.02323150634765625, 0.027077674865722656, 0.030923843383789062, 0.03477001190185547, 0.038616180419921875, 0.04246234893798828, 0.04630851745605469, 0.050154685974121094, 0.0540008544921875, 0.057847023010253906, 0.06169319152832031, 0.06553936004638672, 0.06938552856445312, 0.07323169708251953, 0.07707786560058594, 0.08092403411865234, 0.08477020263671875, 0.08861637115478516, 0.09246253967285156, 0.09630870819091797, 0.10015487670898438, 0.10400104522705078, 0.10784721374511719, 0.1116933822631836, 0.11553955078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 7.0, 5.0, 15.0, 21.0, 30.0, 43.0, 49.0, 51.0, 65.0, 83.0, 93.0, 99.0, 105.0, 72.0, 58.0, 48.0, 33.0, 28.0, 12.0, 22.0, 19.0, 6.0, 10.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08404731750488281, -0.08105850219726562, -0.07806968688964844, -0.07508087158203125, -0.07209205627441406, -0.06910324096679688, -0.06611442565917969, -0.0631256103515625, -0.06013679504394531, -0.057147979736328125, -0.05415916442871094, -0.05117034912109375, -0.04818153381347656, -0.045192718505859375, -0.04220390319824219, -0.039215087890625, -0.03622627258300781, -0.033237457275390625, -0.030248641967773438, -0.02725982666015625, -0.024271011352539062, -0.021282196044921875, -0.018293380737304688, -0.0153045654296875, -0.012315750122070312, -0.009326934814453125, -0.0063381195068359375, -0.00334930419921875, -0.0003604888916015625, 0.002628326416015625, 0.0056171417236328125, 0.00860595703125, 0.011594772338867188, 0.014583587646484375, 0.017572402954101562, 0.02056121826171875, 0.023550033569335938, 0.026538848876953125, 0.029527664184570312, 0.0325164794921875, 0.03550529479980469, 0.038494110107421875, 0.04148292541503906, 0.04447174072265625, 0.04746055603027344, 0.050449371337890625, 0.05343818664550781, 0.056427001953125, 0.05941581726074219, 0.062404632568359375, 0.06539344787597656, 0.06838226318359375, 0.07137107849121094, 0.07435989379882812, 0.07734870910644531, 0.0803375244140625, 0.08332633972167969, 0.08631515502929688, 0.08930397033691406, 0.09229278564453125, 0.09528160095214844, 0.09827041625976562, 0.10125923156738281, 0.104248046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 47.0, 176.0, 383.0, 281.0, 101.0, 19.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578874111175537, -2.454348087310791, -2.329821825027466, -2.2052958011627197, -2.0807695388793945, -1.9562435150146484, -1.8317172527313232, -1.7071912288665771, -1.582664966583252, -1.4581388235092163, -1.3336126804351807, -1.209086537361145, -1.0845603942871094, -0.9600343108177185, -0.8355081677436829, -0.7109820246696472, -0.5864559412002563, -0.4619297981262207, -0.33740365505218506, -0.2128775417804718, -0.08835139870643616, 0.0361747145652771, 0.16070085763931274, 0.2852270007133484, 0.40975314378738403, 0.5342792868614197, 0.6588054299354553, 0.7833315134048462, 0.9078576564788818, 1.0323837995529175, 1.1569099426269531, 1.2814360857009888, 1.4059622287750244, 1.53048837184906, 1.6550145149230957, 1.7795406579971313, 1.904066801071167, 2.028592824935913, 2.1531190872192383, 2.2776451110839844, 2.4021713733673096, 2.5266973972320557, 2.651223659515381, 2.775749683380127, 2.900275945663452, 3.0248019695281982, 3.1493282318115234, 3.2738542556762695, 3.3983802795410156, 3.5229063034057617, 3.647432565689087, 3.771958589553833, 3.896484851837158, 4.021010875701904, 4.14553689956665, 4.270063400268555, 4.394589424133301, 4.519115447998047, 4.643641471862793, 4.768167972564697, 4.892693996429443, 5.0172200202941895, 5.1417460441589355, 5.26627254486084, 5.390798568725586]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 4.0, 5.0, 11.0, 3.0, 7.0, 13.0, 10.0, 19.0, 15.0, 16.0, 22.0, 24.0, 35.0, 36.0, 26.0, 33.0, 37.0, 49.0, 35.0, 40.0, 42.0, 35.0, 33.0, 33.0, 43.0, 40.0, 38.0, 35.0, 40.0, 19.0, 33.0, 16.0, 26.0, 12.0, 21.0, 17.0, 11.0, 19.0, 10.0, 4.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6638127565383911, -0.6432740688323975, -0.6227354407310486, -0.6021967530250549, -0.5816580653190613, -0.5611194372177124, -0.5405807495117188, -0.5200420618057251, -0.4995034337043762, -0.47896477580070496, -0.4584260880947113, -0.43788743019104004, -0.4173487722873688, -0.3968101143836975, -0.37627142667770386, -0.3557327687740326, -0.33519408106803894, -0.3146554231643677, -0.294116735458374, -0.27357807755470276, -0.2530394196510315, -0.23250074684619904, -0.21196207404136658, -0.1914234161376953, -0.17088474333286285, -0.1503460705280304, -0.12980741262435913, -0.10926873981952667, -0.08873007446527481, -0.06819140911102295, -0.04765273630619049, -0.027114078402519226, -0.006575405597686768, 0.013963261619210243, 0.034501928836107254, 0.055040597915649414, 0.07557926326990128, 0.09611792862415314, 0.1166566014289856, 0.13719525933265686, 0.15773393213748932, 0.17827260494232178, 0.19881126284599304, 0.2193499356508255, 0.23988860845565796, 0.2604272663593292, 0.2809659242630005, 0.30150461196899414, 0.3220432698726654, 0.34258192777633667, 0.3631206154823303, 0.3836592733860016, 0.40419793128967285, 0.4247366189956665, 0.44527527689933777, 0.46581393480300903, 0.4863526225090027, 0.5068913102149963, 0.5274299383163452, 0.5479686260223389, 0.5685073137283325, 0.5890459418296814, 0.609584629535675, 0.6301232576370239, 0.6506619453430176]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 28.0, 53.0, 132.0, 342.0, 1169.0, 5426.0, 37566.0, 1196452.0, 2884109.0, 59241.0, 6830.0, 1591.0, 626.0, 309.0, 174.0, 89.0, 52.0, 29.0, 19.0, 16.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.24665069580078125, -0.2359771728515625, -0.22530364990234375, -0.214630126953125, -0.20395660400390625, -0.1932830810546875, -0.18260955810546875, -0.17193603515625, -0.16126251220703125, -0.1505889892578125, -0.13991546630859375, -0.129241943359375, -0.11856842041015625, -0.1078948974609375, -0.09722137451171875, -0.0865478515625, -0.07587432861328125, -0.0652008056640625, -0.05452728271484375, -0.043853759765625, -0.03318023681640625, -0.0225067138671875, -0.01183319091796875, -0.00115966796875, 0.00951385498046875, 0.0201873779296875, 0.03086090087890625, 0.041534423828125, 0.05220794677734375, 0.0628814697265625, 0.07355499267578125, 0.084228515625, 0.09490203857421875, 0.1055755615234375, 0.11624908447265625, 0.126922607421875, 0.13759613037109375, 0.1482696533203125, 0.15894317626953125, 0.16961669921875, 0.18029022216796875, 0.1909637451171875, 0.20163726806640625, 0.212310791015625, 0.22298431396484375, 0.2336578369140625, 0.24433135986328125, 0.2550048828125, 0.26567840576171875, 0.2763519287109375, 0.28702545166015625, 0.297698974609375, 0.30837249755859375, 0.3190460205078125, 0.32971954345703125, 0.34039306640625, 0.35106658935546875, 0.3617401123046875, 0.37241363525390625, 0.383087158203125, 0.39376068115234375, 0.4044342041015625, 0.41510772705078125, 0.42578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 8.0, 22.0, 32.0, 37.0, 49.0, 75.0, 90.0, 117.0, 101.0, 115.0, 96.0, 71.0, 70.0, 38.0, 24.0, 19.0, 19.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.078125, -0.07344627380371094, -0.06876754760742188, -0.06408882141113281, -0.05941009521484375, -0.05473136901855469, -0.050052642822265625, -0.04537391662597656, -0.0406951904296875, -0.03601646423339844, -0.031337738037109375, -0.026659011840820312, -0.02198028564453125, -0.017301559448242188, -0.012622833251953125, -0.007944107055664062, -0.003265380859375, 0.0014133453369140625, 0.006092071533203125, 0.010770797729492188, 0.01544952392578125, 0.020128250122070312, 0.024806976318359375, 0.029485702514648438, 0.0341644287109375, 0.03884315490722656, 0.043521881103515625, 0.04820060729980469, 0.05287933349609375, 0.05755805969238281, 0.062236785888671875, 0.06691551208496094, 0.07159423828125, 0.07627296447753906, 0.08095169067382812, 0.08563041687011719, 0.09030914306640625, 0.09498786926269531, 0.09966659545898438, 0.10434532165527344, 0.1090240478515625, 0.11370277404785156, 0.11838150024414062, 0.12306022644042969, 0.12773895263671875, 0.1324176788330078, 0.13709640502929688, 0.14177513122558594, 0.146453857421875, 0.15113258361816406, 0.15581130981445312, 0.1604900360107422, 0.16516876220703125, 0.1698474884033203, 0.17452621459960938, 0.17920494079589844, 0.1838836669921875, 0.18856239318847656, 0.19324111938476562, 0.1979198455810547, 0.20259857177734375, 0.2072772979736328, 0.21195602416992188, 0.21663475036621094, 0.2213134765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 15.0, 35.0, 45.0, 64.0, 167.0, 283.0, 560.0, 1231.0, 3868.0, 15229.0, 92389.0, 1102564.0, 2728909.0, 211440.0, 27939.0, 6139.0, 1912.0, 752.0, 324.0, 157.0, 91.0, 63.0, 29.0, 21.0, 16.0, 13.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.323974609375, -0.31647300720214844, -0.3089714050292969, -0.3014698028564453, -0.29396820068359375, -0.2864665985107422, -0.2789649963378906, -0.27146339416503906, -0.2639617919921875, -0.25646018981933594, -0.24895858764648438, -0.2414569854736328, -0.23395538330078125, -0.2264537811279297, -0.21895217895507812, -0.21145057678222656, -0.203948974609375, -0.19644737243652344, -0.18894577026367188, -0.1814441680908203, -0.17394256591796875, -0.1664409637451172, -0.15893936157226562, -0.15143775939941406, -0.1439361572265625, -0.13643455505371094, -0.12893295288085938, -0.12143135070800781, -0.11392974853515625, -0.10642814636230469, -0.09892654418945312, -0.09142494201660156, -0.08392333984375, -0.07642173767089844, -0.06892013549804688, -0.06141853332519531, -0.05391693115234375, -0.04641532897949219, -0.038913726806640625, -0.03141212463378906, -0.0239105224609375, -0.016408920288085938, -0.008907318115234375, -0.0014057159423828125, 0.00609588623046875, 0.013597488403320312, 0.021099090576171875, 0.028600692749023438, 0.036102294921875, 0.04360389709472656, 0.051105499267578125, 0.05860710144042969, 0.06610870361328125, 0.07361030578613281, 0.08111190795898438, 0.08861351013183594, 0.0961151123046875, 0.10361671447753906, 0.11111831665039062, 0.11861991882324219, 0.12612152099609375, 0.1336231231689453, 0.14112472534179688, 0.14862632751464844, 0.1561279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 15.0, 29.0, 42.0, 60.0, 110.0, 175.0, 221.0, 356.0, 566.0, 753.0, 623.0, 409.0, 233.0, 194.0, 101.0, 42.0, 45.0, 33.0, 9.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12398910522460938, -0.11894989013671875, -0.11391067504882812, -0.1088714599609375, -0.10383224487304688, -0.09879302978515625, -0.09375381469726562, -0.088714599609375, -0.08367538452148438, -0.07863616943359375, -0.07359695434570312, -0.0685577392578125, -0.06351852416992188, -0.05847930908203125, -0.053440093994140625, -0.04840087890625, -0.043361663818359375, -0.03832244873046875, -0.033283233642578125, -0.0282440185546875, -0.023204803466796875, -0.01816558837890625, -0.013126373291015625, -0.008087158203125, -0.003047943115234375, 0.00199127197265625, 0.007030487060546875, 0.0120697021484375, 0.017108917236328125, 0.02214813232421875, 0.027187347412109375, 0.0322265625, 0.037265777587890625, 0.04230499267578125, 0.047344207763671875, 0.0523834228515625, 0.057422637939453125, 0.06246185302734375, 0.06750106811523438, 0.072540283203125, 0.07757949829101562, 0.08261871337890625, 0.08765792846679688, 0.0926971435546875, 0.09773635864257812, 0.10277557373046875, 0.10781478881835938, 0.11285400390625, 0.11789321899414062, 0.12293243408203125, 0.12797164916992188, 0.1330108642578125, 0.13805007934570312, 0.14308929443359375, 0.14812850952148438, 0.153167724609375, 0.15820693969726562, 0.16324615478515625, 0.16828536987304688, 0.1733245849609375, 0.17836380004882812, 0.18340301513671875, 0.18844223022460938, 0.1934814453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 11.0, 12.0, 36.0, 95.0, 147.0, 159.0, 178.0, 165.0, 92.0, 54.0, 32.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3531036376953125, -1.314698338508606, -1.2762930393218994, -1.2378876209259033, -1.1994823217391968, -1.1610770225524902, -1.1226716041564941, -1.0842663049697876, -1.045861005783081, -1.0074557065963745, -0.9690503478050232, -0.9306449890136719, -0.8922396898269653, -0.8538343906402588, -0.8154290318489075, -0.7770236730575562, -0.7386183738708496, -0.7002130746841431, -0.6618077158927917, -0.6234023571014404, -0.5849970579147339, -0.5465917587280273, -0.508186399936676, -0.4697810709476471, -0.43137574195861816, -0.39297041296958923, -0.3545650839805603, -0.31615975499153137, -0.27775442600250244, -0.2393490970134735, -0.20094376802444458, -0.16253843903541565, -0.12413322925567627, -0.08572790026664734, -0.04732257127761841, -0.008917242288589478, 0.029488086700439453, 0.06789341568946838, 0.10629874467849731, 0.14470407366752625, 0.18310940265655518, 0.2215147316455841, 0.25992006063461304, 0.29832538962364197, 0.3367307186126709, 0.37513604760169983, 0.41354137659072876, 0.4519467055797577, 0.4903520345687866, 0.5287573337554932, 0.5671626925468445, 0.6055680513381958, 0.6439733505249023, 0.6823786497116089, 0.7207840085029602, 0.7591893672943115, 0.7975946664810181, 0.8359999656677246, 0.8744053244590759, 0.9128106832504272, 0.9512159824371338, 0.9896212816238403, 1.0280265808105469, 1.066431999206543, 1.1048372983932495]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 4.0, 13.0, 13.0, 22.0, 19.0, 16.0, 26.0, 27.0, 23.0, 34.0, 36.0, 38.0, 41.0, 43.0, 36.0, 43.0, 51.0, 54.0, 36.0, 31.0, 39.0, 38.0, 42.0, 33.0, 37.0, 35.0, 24.0, 36.0, 18.0, 16.0, 7.0, 12.0, 10.0, 7.0, 7.0, 2.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3875146508216858, -0.3749905526638031, -0.362466424703598, -0.34994232654571533, -0.33741819858551025, -0.32489410042762756, -0.3123699724674225, -0.2998458743095398, -0.2873217463493347, -0.274797648191452, -0.26227352023124695, -0.24974940717220306, -0.23722529411315918, -0.2247011959552765, -0.2121770679950714, -0.19965296983718872, -0.18712885677814484, -0.17460474371910095, -0.16208063066005707, -0.14955651760101318, -0.1370324045419693, -0.12450829893350601, -0.11198418587446213, -0.09946007281541824, -0.08693595975637436, -0.07441184669733047, -0.06188773363828659, -0.049363624304533005, -0.03683951124548912, -0.024315401911735535, -0.01179128885269165, 0.0007328242063522339, 0.013256937265396118, 0.025781050324440002, 0.03830516338348389, 0.05082927271723747, 0.06335338950157166, 0.07587749511003494, 0.08840160816907883, 0.10092572122812271, 0.1134498342871666, 0.12597393989562988, 0.13849805295467377, 0.15102216601371765, 0.16354627907276154, 0.17607039213180542, 0.1885945051908493, 0.2011186182498932, 0.21364273130893707, 0.22616684436798096, 0.23869095742702484, 0.2512150704860687, 0.2637391686439514, 0.2762632966041565, 0.2887873947620392, 0.30131152272224426, 0.31383562088012695, 0.32635971903800964, 0.3388838469982147, 0.3514079451560974, 0.3639320731163025, 0.3764561712741852, 0.38898029923439026, 0.40150439739227295, 0.414028525352478]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 18.0, 17.0, 31.0, 47.0, 64.0, 81.0, 121.0, 175.0, 302.0, 532.0, 1100.0, 2935.0, 9496.0, 37285.0, 187766.0, 584412.0, 174376.0, 35357.0, 9104.0, 2810.0, 1088.0, 524.0, 306.0, 193.0, 125.0, 81.0, 65.0, 39.0, 23.0, 16.0, 12.0, 11.0, 9.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.310791015625, -0.298095703125, -0.285400390625, -0.272705078125, -0.260009765625, -0.247314453125, -0.234619140625, -0.221923828125, -0.209228515625, -0.196533203125, -0.183837890625, -0.171142578125, -0.158447265625, -0.145751953125, -0.133056640625, -0.120361328125, -0.107666015625, -0.094970703125, -0.082275390625, -0.069580078125, -0.056884765625, -0.044189453125, -0.031494140625, -0.018798828125, -0.006103515625, 0.006591796875, 0.019287109375, 0.031982421875, 0.044677734375, 0.057373046875, 0.070068359375, 0.082763671875, 0.095458984375, 0.108154296875, 0.120849609375, 0.133544921875, 0.146240234375, 0.158935546875, 0.171630859375, 0.184326171875, 0.197021484375, 0.209716796875, 0.222412109375, 0.235107421875, 0.247802734375, 0.260498046875, 0.273193359375, 0.285888671875, 0.298583984375, 0.311279296875, 0.323974609375, 0.336669921875, 0.349365234375, 0.362060546875, 0.374755859375, 0.387451171875, 0.400146484375, 0.412841796875, 0.425537109375, 0.438232421875, 0.450927734375, 0.463623046875, 0.476318359375, 0.489013671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 16.0, 21.0, 26.0, 35.0, 54.0, 92.0, 80.0, 124.0, 109.0, 123.0, 77.0, 78.0, 62.0, 39.0, 23.0, 12.0, 14.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07806396484375, -0.07333660125732422, -0.06860923767089844, -0.06388187408447266, -0.059154510498046875, -0.054427146911621094, -0.04969978332519531, -0.04497241973876953, -0.04024505615234375, -0.03551769256591797, -0.030790328979492188, -0.026062965393066406, -0.021335601806640625, -0.016608238220214844, -0.011880874633789062, -0.007153511047363281, -0.0024261474609375, 0.0023012161254882812, 0.0070285797119140625, 0.011755943298339844, 0.016483306884765625, 0.021210670471191406, 0.025938034057617188, 0.03066539764404297, 0.03539276123046875, 0.04012012481689453, 0.04484748840332031, 0.049574851989746094, 0.054302215576171875, 0.059029579162597656, 0.06375694274902344, 0.06848430633544922, 0.073211669921875, 0.07793903350830078, 0.08266639709472656, 0.08739376068115234, 0.09212112426757812, 0.0968484878540039, 0.10157585144042969, 0.10630321502685547, 0.11103057861328125, 0.11575794219970703, 0.12048530578613281, 0.1252126693725586, 0.12994003295898438, 0.13466739654541016, 0.13939476013183594, 0.14412212371826172, 0.1488494873046875, 0.15357685089111328, 0.15830421447753906, 0.16303157806396484, 0.16775894165039062, 0.1724863052368164, 0.1772136688232422, 0.18194103240966797, 0.18666839599609375, 0.19139575958251953, 0.1961231231689453, 0.2008504867553711, 0.20557785034179688, 0.21030521392822266, 0.21503257751464844, 0.21975994110107422, 0.2244873046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 18.0, 16.0, 19.0, 35.0, 49.0, 80.0, 162.0, 352.0, 1064.0, 3572.0, 14514.0, 67109.0, 354508.0, 479122.0, 99847.0, 20849.0, 5011.0, 1317.0, 412.0, 189.0, 113.0, 66.0, 37.0, 20.0, 13.0, 12.0, 7.0, 8.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353515625, -0.3425102233886719, -0.33150482177734375, -0.3204994201660156, -0.3094940185546875, -0.2984886169433594, -0.28748321533203125, -0.2764778137207031, -0.265472412109375, -0.2544670104980469, -0.24346160888671875, -0.23245620727539062, -0.2214508056640625, -0.21044540405273438, -0.19944000244140625, -0.18843460083007812, -0.17742919921875, -0.16642379760742188, -0.15541839599609375, -0.14441299438476562, -0.1334075927734375, -0.12240219116210938, -0.11139678955078125, -0.10039138793945312, -0.089385986328125, -0.07838058471679688, -0.06737518310546875, -0.056369781494140625, -0.0453643798828125, -0.034358978271484375, -0.02335357666015625, -0.012348175048828125, -0.0013427734375, 0.009662628173828125, 0.02066802978515625, 0.031673431396484375, 0.0426788330078125, 0.053684234619140625, 0.06468963623046875, 0.07569503784179688, 0.086700439453125, 0.09770584106445312, 0.10871124267578125, 0.11971664428710938, 0.1307220458984375, 0.14172744750976562, 0.15273284912109375, 0.16373825073242188, 0.17474365234375, 0.18574905395507812, 0.19675445556640625, 0.20775985717773438, 0.2187652587890625, 0.22977066040039062, 0.24077606201171875, 0.2517814636230469, 0.262786865234375, 0.2737922668457031, 0.28479766845703125, 0.2958030700683594, 0.3068084716796875, 0.3178138732910156, 0.32881927490234375, 0.3398246765136719, 0.350830078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 5.0, 14.0, 10.0, 16.0, 16.0, 21.0, 24.0, 28.0, 33.0, 32.0, 42.0, 66.0, 56.0, 59.0, 57.0, 55.0, 66.0, 46.0, 58.0, 47.0, 40.0, 40.0, 29.0, 32.0, 17.0, 15.0, 12.0, 18.0, 8.0, 9.0, 4.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2120361328125, -0.2046642303466797, -0.19729232788085938, -0.18992042541503906, -0.18254852294921875, -0.17517662048339844, -0.16780471801757812, -0.1604328155517578, -0.1530609130859375, -0.1456890106201172, -0.13831710815429688, -0.13094520568847656, -0.12357330322265625, -0.11620140075683594, -0.10882949829101562, -0.10145759582519531, -0.094085693359375, -0.08671379089355469, -0.07934188842773438, -0.07196998596191406, -0.06459808349609375, -0.05722618103027344, -0.049854278564453125, -0.04248237609863281, -0.0351104736328125, -0.027738571166992188, -0.020366668701171875, -0.012994766235351562, -0.00562286376953125, 0.0017490386962890625, 0.009120941162109375, 0.016492843627929688, 0.02386474609375, 0.031236648559570312, 0.038608551025390625, 0.04598045349121094, 0.05335235595703125, 0.06072425842285156, 0.06809616088867188, 0.07546806335449219, 0.0828399658203125, 0.09021186828613281, 0.09758377075195312, 0.10495567321777344, 0.11232757568359375, 0.11969947814941406, 0.12707138061523438, 0.1344432830810547, 0.141815185546875, 0.1491870880126953, 0.15655899047851562, 0.16393089294433594, 0.17130279541015625, 0.17867469787597656, 0.18604660034179688, 0.1934185028076172, 0.2007904052734375, 0.2081623077392578, 0.21553421020507812, 0.22290611267089844, 0.23027801513671875, 0.23764991760253906, 0.24502182006835938, 0.2523937225341797, 0.259765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 16.0, 18.0, 18.0, 30.0, 37.0, 67.0, 96.0, 137.0, 195.0, 373.0, 592.0, 1213.0, 2586.0, 6427.0, 16877.0, 47749.0, 161311.0, 447135.0, 253063.0, 71113.0, 23775.0, 8733.0, 3472.0, 1547.0, 786.0, 423.0, 237.0, 125.0, 111.0, 71.0, 55.0, 43.0, 28.0, 22.0, 9.0, 14.0, 9.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.120758056640625, -0.11639404296875, -0.112030029296875, -0.107666015625, -0.103302001953125, -0.09893798828125, -0.094573974609375, -0.0902099609375, -0.085845947265625, -0.08148193359375, -0.077117919921875, -0.07275390625, -0.068389892578125, -0.06402587890625, -0.059661865234375, -0.0552978515625, -0.050933837890625, -0.04656982421875, -0.042205810546875, -0.037841796875, -0.033477783203125, -0.02911376953125, -0.024749755859375, -0.0203857421875, -0.016021728515625, -0.01165771484375, -0.007293701171875, -0.0029296875, 0.001434326171875, 0.00579833984375, 0.010162353515625, 0.0145263671875, 0.018890380859375, 0.02325439453125, 0.027618408203125, 0.031982421875, 0.036346435546875, 0.04071044921875, 0.045074462890625, 0.0494384765625, 0.053802490234375, 0.05816650390625, 0.062530517578125, 0.06689453125, 0.071258544921875, 0.07562255859375, 0.079986572265625, 0.0843505859375, 0.088714599609375, 0.09307861328125, 0.097442626953125, 0.101806640625, 0.106170654296875, 0.11053466796875, 0.114898681640625, 0.1192626953125, 0.123626708984375, 0.12799072265625, 0.132354736328125, 0.13671875, 0.141082763671875, 0.14544677734375, 0.149810791015625, 0.1541748046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 3.0, 5.0, 7.0, 13.0, 9.0, 10.0, 11.0, 12.0, 27.0, 21.0, 42.0, 38.0, 70.0, 89.0, 93.0, 86.0, 72.0, 81.0, 68.0, 34.0, 46.0, 22.0, 21.0, 17.0, 10.0, 15.0, 10.0, 6.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.9729137420654297e-05, -1.9156374037265778e-05, -1.8583610653877258e-05, -1.801084727048874e-05, -1.743808388710022e-05, -1.68653205037117e-05, -1.629255712032318e-05, -1.5719793736934662e-05, -1.5147030353546143e-05, -1.4574266970157623e-05, -1.4001503586769104e-05, -1.3428740203380585e-05, -1.2855976819992065e-05, -1.2283213436603546e-05, -1.1710450053215027e-05, -1.1137686669826508e-05, -1.0564923286437988e-05, -9.992159903049469e-06, -9.41939651966095e-06, -8.84663313627243e-06, -8.273869752883911e-06, -7.701106369495392e-06, -7.1283429861068726e-06, -6.555579602718353e-06, -5.982816219329834e-06, -5.410052835941315e-06, -4.837289452552795e-06, -4.264526069164276e-06, -3.691762685775757e-06, -3.1189993023872375e-06, -2.5462359189987183e-06, -1.973472535610199e-06, -1.4007091522216797e-06, -8.279457688331604e-07, -2.551823854446411e-07, 3.175809979438782e-07, 8.903443813323975e-07, 1.4631077647209167e-06, 2.035871148109436e-06, 2.6086345314979553e-06, 3.1813979148864746e-06, 3.754161298274994e-06, 4.326924681663513e-06, 4.8996880650520325e-06, 5.472451448440552e-06, 6.045214831829071e-06, 6.61797821521759e-06, 7.19074159860611e-06, 7.763504981994629e-06, 8.336268365383148e-06, 8.909031748771667e-06, 9.481795132160187e-06, 1.0054558515548706e-05, 1.0627321898937225e-05, 1.1200085282325745e-05, 1.1772848665714264e-05, 1.2345612049102783e-05, 1.2918375432491302e-05, 1.3491138815879822e-05, 1.4063902199268341e-05, 1.463666558265686e-05, 1.520942896604538e-05, 1.57821923494339e-05, 1.6354955732822418e-05, 1.6927719116210938e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 7.0, 9.0, 20.0, 31.0, 38.0, 61.0, 99.0, 118.0, 187.0, 260.0, 380.0, 624.0, 972.0, 1681.0, 3217.0, 7231.0, 19961.0, 65391.0, 281705.0, 486937.0, 123669.0, 34034.0, 11458.0, 4634.0, 2278.0, 1223.0, 767.0, 522.0, 320.0, 227.0, 131.0, 103.0, 74.0, 54.0, 29.0, 28.0, 22.0, 15.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14013671875, -0.13550186157226562, -0.13086700439453125, -0.12623214721679688, -0.1215972900390625, -0.11696243286132812, -0.11232757568359375, -0.10769271850585938, -0.103057861328125, -0.09842300415039062, -0.09378814697265625, -0.08915328979492188, -0.0845184326171875, -0.07988357543945312, -0.07524871826171875, -0.07061386108398438, -0.06597900390625, -0.061344146728515625, -0.05670928955078125, -0.052074432373046875, -0.0474395751953125, -0.042804718017578125, -0.03816986083984375, -0.033535003662109375, -0.028900146484375, -0.024265289306640625, -0.01963043212890625, -0.014995574951171875, -0.0103607177734375, -0.005725860595703125, -0.00109100341796875, 0.003543853759765625, 0.0081787109375, 0.012813568115234375, 0.01744842529296875, 0.022083282470703125, 0.0267181396484375, 0.031352996826171875, 0.03598785400390625, 0.040622711181640625, 0.045257568359375, 0.049892425537109375, 0.05452728271484375, 0.059162139892578125, 0.0637969970703125, 0.06843185424804688, 0.07306671142578125, 0.07770156860351562, 0.08233642578125, 0.08697128295898438, 0.09160614013671875, 0.09624099731445312, 0.1008758544921875, 0.10551071166992188, 0.11014556884765625, 0.11478042602539062, 0.119415283203125, 0.12405014038085938, 0.12868499755859375, 0.13331985473632812, 0.1379547119140625, 0.14258956909179688, 0.14722442626953125, 0.15185928344726562, 0.156494140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 10.0, 12.0, 18.0, 17.0, 21.0, 36.0, 68.0, 113.0, 137.0, 148.0, 131.0, 83.0, 57.0, 38.0, 27.0, 16.0, 13.0, 6.0, 10.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.16699790954589844, -0.16212081909179688, -0.1572437286376953, -0.15236663818359375, -0.1474895477294922, -0.14261245727539062, -0.13773536682128906, -0.1328582763671875, -0.12798118591308594, -0.12310409545898438, -0.11822700500488281, -0.11334991455078125, -0.10847282409667969, -0.10359573364257812, -0.09871864318847656, -0.093841552734375, -0.08896446228027344, -0.08408737182617188, -0.07921028137207031, -0.07433319091796875, -0.06945610046386719, -0.06457901000976562, -0.05970191955566406, -0.0548248291015625, -0.04994773864746094, -0.045070648193359375, -0.04019355773925781, -0.03531646728515625, -0.030439376831054688, -0.025562286376953125, -0.020685195922851562, -0.01580810546875, -0.010931015014648438, -0.006053924560546875, -0.0011768341064453125, 0.00370025634765625, 0.008577346801757812, 0.013454437255859375, 0.018331527709960938, 0.0232086181640625, 0.028085708618164062, 0.032962799072265625, 0.03783988952636719, 0.04271697998046875, 0.04759407043457031, 0.052471160888671875, 0.05734825134277344, 0.062225341796875, 0.06710243225097656, 0.07197952270507812, 0.07685661315917969, 0.08173370361328125, 0.08661079406738281, 0.09148788452148438, 0.09636497497558594, 0.1012420654296875, 0.10611915588378906, 0.11099624633789062, 0.11587333679199219, 0.12075042724609375, 0.1256275177001953, 0.13050460815429688, 0.13538169860839844, 0.1402587890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 10.0, 16.0, 35.0, 115.0, 228.0, 266.0, 201.0, 91.0, 36.0, 11.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0012428760528564, -0.9278908371925354, -0.8545387983322144, -0.7811867594718933, -0.7078347206115723, -0.6344826817512512, -0.5611306428909302, -0.48777860403060913, -0.4144265651702881, -0.34107452630996704, -0.267722487449646, -0.19437044858932495, -0.1210184097290039, -0.04766637086868286, 0.025685667991638184, 0.09903770685195923, 0.17238974571228027, 0.24574178457260132, 0.31909382343292236, 0.3924458622932434, 0.46579790115356445, 0.5391499400138855, 0.6125019788742065, 0.6858540177345276, 0.7592060565948486, 0.8325580954551697, 0.9059101343154907, 0.9792621731758118, 1.0526142120361328, 1.1259663105010986, 1.199318289756775, 1.2726702690124512, 1.346022367477417, 1.4193744659423828, 1.492726445198059, 1.5660784244537354, 1.6394305229187012, 1.712782621383667, 1.7861346006393433, 1.8594865798950195, 1.9328386783599854, 2.006190776824951, 2.079542636871338, 2.1528947353363037, 2.2262468338012695, 2.2995989322662354, 2.372951030731201, 2.446302890777588, 2.5196549892425537, 2.5930070877075195, 2.6663589477539062, 2.739711046218872, 2.813063144683838, 2.8864152431488037, 2.9597673416137695, 3.0331192016601562, 3.106471300125122, 3.179823398590088, 3.2531752586364746, 3.3265273571014404, 3.3998794555664062, 3.473231554031372, 3.546583652496338, 3.6199355125427246, 3.6932876110076904]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 12.0, 12.0, 11.0, 20.0, 15.0, 24.0, 34.0, 31.0, 30.0, 27.0, 31.0, 45.0, 44.0, 54.0, 55.0, 52.0, 48.0, 60.0, 40.0, 37.0, 43.0, 33.0, 44.0, 31.0, 25.0, 22.0, 17.0, 19.0, 18.0, 15.0, 7.0, 9.0, 6.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.7667695879936218, -0.7454947829246521, -0.7242200374603271, -0.7029452323913574, -0.6816704869270325, -0.6603956818580627, -0.6391209363937378, -0.6178461313247681, -0.5965713262557983, -0.5752965211868286, -0.5540217757225037, -0.5327469706535339, -0.511472225189209, -0.49019742012023926, -0.4689226448535919, -0.4476478695869446, -0.42637309432029724, -0.4050983190536499, -0.38382354378700256, -0.3625487685203552, -0.3412739634513855, -0.31999918818473816, -0.2987244129180908, -0.2774496078491211, -0.25617486238479614, -0.2349000871181488, -0.21362529695034027, -0.19235052168369293, -0.1710757315158844, -0.14980095624923706, -0.12852618098258972, -0.10725139081478119, -0.08597660064697266, -0.06470181792974472, -0.04342703893780708, -0.022152259945869446, -0.00087747722864151, 0.020397305488586426, 0.041672080755233765, 0.0629468709230423, 0.08422164618968964, 0.10549642890691757, 0.1267712116241455, 0.14804598689079285, 0.16932076215744019, 0.19059555232524872, 0.21187032759189606, 0.2331451177597046, 0.25441989302635193, 0.27569466829299927, 0.2969694435596466, 0.31824421882629395, 0.33951902389526367, 0.360793799161911, 0.38206857442855835, 0.4033433794975281, 0.424618124961853, 0.44589290022850037, 0.4671676754951477, 0.48844248056411743, 0.5097172260284424, 0.5309920310974121, 0.5522668361663818, 0.5735415816307068, 0.5948163866996765]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 1.0, 12.0, 24.0, 45.0, 51.0, 127.0, 208.0, 376.0, 729.0, 1641.0, 3868.0, 10735.0, 39055.0, 222414.0, 2646245.0, 1133116.0, 101522.0, 21450.0, 6666.0, 2760.0, 1281.0, 686.0, 427.0, 268.0, 185.0, 97.0, 97.0, 39.0, 40.0, 24.0, 22.0, 20.0, 11.0, 6.0, 7.0, 5.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.14850997924804688, -0.14101409912109375, -0.13351821899414062, -0.1260223388671875, -0.11852645874023438, -0.11103057861328125, -0.10353469848632812, -0.096038818359375, -0.08854293823242188, -0.08104705810546875, -0.07355117797851562, -0.0660552978515625, -0.058559417724609375, -0.05106353759765625, -0.043567657470703125, -0.03607177734375, -0.028575897216796875, -0.02108001708984375, -0.013584136962890625, -0.0060882568359375, 0.001407623291015625, 0.00890350341796875, 0.016399383544921875, 0.023895263671875, 0.031391143798828125, 0.03888702392578125, 0.046382904052734375, 0.0538787841796875, 0.061374664306640625, 0.06887054443359375, 0.07636642456054688, 0.0838623046875, 0.09135818481445312, 0.09885406494140625, 0.10634994506835938, 0.1138458251953125, 0.12134170532226562, 0.12883758544921875, 0.13633346557617188, 0.143829345703125, 0.15132522583007812, 0.15882110595703125, 0.16631698608398438, 0.1738128662109375, 0.18130874633789062, 0.18880462646484375, 0.19630050659179688, 0.20379638671875, 0.21129226684570312, 0.21878814697265625, 0.22628402709960938, 0.2337799072265625, 0.24127578735351562, 0.24877166748046875, 0.2562675476074219, 0.263763427734375, 0.2712593078613281, 0.27875518798828125, 0.2862510681152344, 0.2937469482421875, 0.3012428283691406, 0.30873870849609375, 0.3162345886230469, 0.32373046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 13.0, 14.0, 21.0, 32.0, 48.0, 67.0, 84.0, 96.0, 117.0, 113.0, 105.0, 83.0, 58.0, 61.0, 36.0, 20.0, 15.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0888671875, -0.0839691162109375, -0.079071044921875, -0.0741729736328125, -0.06927490234375, -0.0643768310546875, -0.059478759765625, -0.0545806884765625, -0.0496826171875, -0.0447845458984375, -0.039886474609375, -0.0349884033203125, -0.03009033203125, -0.0251922607421875, -0.020294189453125, -0.0153961181640625, -0.010498046875, -0.0055999755859375, -0.000701904296875, 0.0041961669921875, 0.00909423828125, 0.0139923095703125, 0.018890380859375, 0.0237884521484375, 0.0286865234375, 0.0335845947265625, 0.038482666015625, 0.0433807373046875, 0.04827880859375, 0.0531768798828125, 0.058074951171875, 0.0629730224609375, 0.06787109375, 0.0727691650390625, 0.077667236328125, 0.0825653076171875, 0.08746337890625, 0.0923614501953125, 0.097259521484375, 0.1021575927734375, 0.1070556640625, 0.1119537353515625, 0.116851806640625, 0.1217498779296875, 0.12664794921875, 0.1315460205078125, 0.136444091796875, 0.1413421630859375, 0.146240234375, 0.1511383056640625, 0.156036376953125, 0.1609344482421875, 0.16583251953125, 0.1707305908203125, 0.175628662109375, 0.1805267333984375, 0.1854248046875, 0.1903228759765625, 0.195220947265625, 0.2001190185546875, 0.20501708984375, 0.2099151611328125, 0.214813232421875, 0.2197113037109375, 0.224609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 1.0, 7.0, 1.0, 3.0, 5.0, 8.0, 6.0, 5.0, 22.0, 15.0, 27.0, 39.0, 63.0, 77.0, 118.0, 158.0, 234.0, 407.0, 645.0, 1318.0, 2704.0, 6310.0, 17226.0, 59667.0, 284307.0, 1894939.0, 1605942.0, 240574.0, 52920.0, 15308.0, 5845.0, 2434.0, 1181.0, 655.0, 349.0, 235.0, 166.0, 95.0, 66.0, 48.0, 47.0, 29.0, 13.0, 17.0, 8.0, 7.0, 13.0, 10.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19504547119140625, -0.1883087158203125, -0.18157196044921875, -0.174835205078125, -0.16809844970703125, -0.1613616943359375, -0.15462493896484375, -0.14788818359375, -0.14115142822265625, -0.1344146728515625, -0.12767791748046875, -0.120941162109375, -0.11420440673828125, -0.1074676513671875, -0.10073089599609375, -0.093994140625, -0.08725738525390625, -0.0805206298828125, -0.07378387451171875, -0.067047119140625, -0.06031036376953125, -0.0535736083984375, -0.04683685302734375, -0.04010009765625, -0.03336334228515625, -0.0266265869140625, -0.01988983154296875, -0.013153076171875, -0.00641632080078125, 0.0003204345703125, 0.00705718994140625, 0.0137939453125, 0.02053070068359375, 0.0272674560546875, 0.03400421142578125, 0.040740966796875, 0.04747772216796875, 0.0542144775390625, 0.06095123291015625, 0.06768798828125, 0.07442474365234375, 0.0811614990234375, 0.08789825439453125, 0.094635009765625, 0.10137176513671875, 0.1081085205078125, 0.11484527587890625, 0.12158203125, 0.12831878662109375, 0.1350555419921875, 0.14179229736328125, 0.148529052734375, 0.15526580810546875, 0.1620025634765625, 0.16873931884765625, 0.17547607421875, 0.18221282958984375, 0.1889495849609375, 0.19568634033203125, 0.202423095703125, 0.20915985107421875, 0.2158966064453125, 0.22263336181640625, 0.2293701171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 5.0, 6.0, 23.0, 11.0, 22.0, 17.0, 42.0, 39.0, 62.0, 84.0, 126.0, 188.0, 277.0, 380.0, 522.0, 622.0, 473.0, 344.0, 253.0, 157.0, 126.0, 84.0, 57.0, 39.0, 24.0, 21.0, 20.0, 19.0, 6.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.170166015625, -0.165069580078125, -0.15997314453125, -0.154876708984375, -0.1497802734375, -0.144683837890625, -0.13958740234375, -0.134490966796875, -0.12939453125, -0.124298095703125, -0.11920166015625, -0.114105224609375, -0.1090087890625, -0.103912353515625, -0.09881591796875, -0.093719482421875, -0.088623046875, -0.083526611328125, -0.07843017578125, -0.073333740234375, -0.0682373046875, -0.063140869140625, -0.05804443359375, -0.052947998046875, -0.0478515625, -0.042755126953125, -0.03765869140625, -0.032562255859375, -0.0274658203125, -0.022369384765625, -0.01727294921875, -0.012176513671875, -0.007080078125, -0.001983642578125, 0.00311279296875, 0.008209228515625, 0.0133056640625, 0.018402099609375, 0.02349853515625, 0.028594970703125, 0.03369140625, 0.038787841796875, 0.04388427734375, 0.048980712890625, 0.0540771484375, 0.059173583984375, 0.06427001953125, 0.069366455078125, 0.074462890625, 0.079559326171875, 0.08465576171875, 0.089752197265625, 0.0948486328125, 0.099945068359375, 0.10504150390625, 0.110137939453125, 0.115234375, 0.120330810546875, 0.12542724609375, 0.130523681640625, 0.1356201171875, 0.140716552734375, 0.14581298828125, 0.150909423828125, 0.156005859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 10.0, 12.0, 25.0, 31.0, 59.0, 85.0, 89.0, 92.0, 127.0, 99.0, 95.0, 83.0, 60.0, 38.0, 32.0, 17.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.477787733078003, -1.4458448886871338, -1.413901925086975, -1.3819589614868164, -1.3500161170959473, -1.3180732727050781, -1.2861303091049194, -1.2541873455047607, -1.2222445011138916, -1.1903016567230225, -1.1583586931228638, -1.126415729522705, -1.094472885131836, -1.0625300407409668, -1.030587077140808, -0.9986441731452942, -0.9667012691497803, -0.9347583651542664, -0.9028154611587524, -0.8708725571632385, -0.8389296531677246, -0.8069867491722107, -0.7750438451766968, -0.7431009411811829, -0.711158037185669, -0.679215133190155, -0.6472722291946411, -0.6153293251991272, -0.5833864212036133, -0.5514435172080994, -0.5195006132125854, -0.48755770921707153, -0.4556148052215576, -0.4236719012260437, -0.3917289972305298, -0.35978609323501587, -0.32784318923950195, -0.29590028524398804, -0.2639573812484741, -0.2320144772529602, -0.2000715732574463, -0.16812866926193237, -0.13618576526641846, -0.10424286127090454, -0.07229995727539062, -0.04035705327987671, -0.008414149284362793, 0.023528754711151123, 0.05547165870666504, 0.08741456270217896, 0.11935746669769287, 0.1513003706932068, 0.1832432746887207, 0.21518617868423462, 0.24712908267974854, 0.27907198667526245, 0.31101489067077637, 0.3429577946662903, 0.3749006986618042, 0.4068436026573181, 0.43878650665283203, 0.47072941064834595, 0.5026723146438599, 0.5346152186393738, 0.5665581226348877]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 13.0, 19.0, 12.0, 18.0, 26.0, 30.0, 22.0, 34.0, 36.0, 33.0, 47.0, 40.0, 40.0, 53.0, 49.0, 63.0, 47.0, 47.0, 39.0, 36.0, 39.0, 35.0, 26.0, 36.0, 23.0, 34.0, 17.0, 8.0, 14.0, 15.0, 5.0, 3.0, 5.0, 5.0, 2.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6266806721687317, -0.6093015074729919, -0.5919223427772522, -0.5745431780815125, -0.5571639537811279, -0.5397847890853882, -0.5224056243896484, -0.5050264596939087, -0.48764729499816895, -0.4702681303024292, -0.45288896560668945, -0.4355097711086273, -0.4181306064128876, -0.4007514417171478, -0.3833722472190857, -0.36599308252334595, -0.3486139178276062, -0.33123475313186646, -0.3138555884361267, -0.2964763939380646, -0.27909722924232483, -0.2617180645465851, -0.24433888494968414, -0.2269597053527832, -0.20958054065704346, -0.1922013759613037, -0.17482219636440277, -0.15744301676750183, -0.14006385207176208, -0.12268467992544174, -0.1053055077791214, -0.08792633563280106, -0.07054710388183594, -0.053167931735515594, -0.03578875958919525, -0.01840958744287491, -0.0010304152965545654, 0.016348756849765778, 0.03372792899608612, 0.051107101142406464, 0.0684862732887268, 0.08586544543504715, 0.10324461758136749, 0.12062378972768784, 0.13800296187400818, 0.15538212656974792, 0.17276130616664886, 0.1901404857635498, 0.20751965045928955, 0.2248988151550293, 0.24227799475193024, 0.2596571743488312, 0.2770363390445709, 0.29441550374031067, 0.3117946982383728, 0.32917386293411255, 0.3465530276298523, 0.36393219232559204, 0.3813113570213318, 0.3986905515193939, 0.41606971621513367, 0.4334488809108734, 0.45082807540893555, 0.4682072401046753, 0.48558640480041504]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 6.0, 15.0, 16.0, 20.0, 36.0, 46.0, 67.0, 93.0, 151.0, 194.0, 317.0, 535.0, 1015.0, 2273.0, 5937.0, 16227.0, 48374.0, 152245.0, 395893.0, 286074.0, 91508.0, 29600.0, 10419.0, 3914.0, 1627.0, 728.0, 420.0, 253.0, 173.0, 95.0, 91.0, 57.0, 37.0, 26.0, 25.0, 13.0, 8.0, 3.0, 4.0, 5.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.39990234375, -0.38840484619140625, -0.3769073486328125, -0.36540985107421875, -0.353912353515625, -0.34241485595703125, -0.3309173583984375, -0.31941986083984375, -0.30792236328125, -0.29642486572265625, -0.2849273681640625, -0.27342987060546875, -0.261932373046875, -0.25043487548828125, -0.2389373779296875, -0.22743988037109375, -0.2159423828125, -0.20444488525390625, -0.1929473876953125, -0.18144989013671875, -0.169952392578125, -0.15845489501953125, -0.1469573974609375, -0.13545989990234375, -0.12396240234375, -0.11246490478515625, -0.1009674072265625, -0.08946990966796875, -0.077972412109375, -0.06647491455078125, -0.0549774169921875, -0.04347991943359375, -0.031982421875, -0.02048492431640625, -0.0089874267578125, 0.00251007080078125, 0.014007568359375, 0.02550506591796875, 0.0370025634765625, 0.04850006103515625, 0.05999755859375, 0.07149505615234375, 0.0829925537109375, 0.09449005126953125, 0.105987548828125, 0.11748504638671875, 0.1289825439453125, 0.14048004150390625, 0.1519775390625, 0.16347503662109375, 0.1749725341796875, 0.18647003173828125, 0.197967529296875, 0.20946502685546875, 0.2209625244140625, 0.23246002197265625, 0.24395751953125, 0.25545501708984375, 0.2669525146484375, 0.27845001220703125, 0.289947509765625, 0.30144500732421875, 0.3129425048828125, 0.32444000244140625, 0.3359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 17.0, 10.0, 20.0, 26.0, 39.0, 62.0, 77.0, 99.0, 98.0, 116.0, 93.0, 97.0, 68.0, 59.0, 47.0, 23.0, 25.0, 12.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07525634765625, -0.07040882110595703, -0.06556129455566406, -0.060713768005371094, -0.055866241455078125, -0.051018714904785156, -0.04617118835449219, -0.04132366180419922, -0.03647613525390625, -0.03162860870361328, -0.026781082153320312, -0.021933555603027344, -0.017086029052734375, -0.012238502502441406, -0.0073909759521484375, -0.0025434494018554688, 0.0023040771484375, 0.007151603698730469, 0.011999130249023438, 0.016846656799316406, 0.021694183349609375, 0.026541709899902344, 0.03138923645019531, 0.03623676300048828, 0.04108428955078125, 0.04593181610107422, 0.05077934265136719, 0.055626869201660156, 0.060474395751953125, 0.0653219223022461, 0.07016944885253906, 0.07501697540283203, 0.079864501953125, 0.08471202850341797, 0.08955955505371094, 0.0944070816040039, 0.09925460815429688, 0.10410213470458984, 0.10894966125488281, 0.11379718780517578, 0.11864471435546875, 0.12349224090576172, 0.1283397674560547, 0.13318729400634766, 0.13803482055664062, 0.1428823471069336, 0.14772987365722656, 0.15257740020751953, 0.1574249267578125, 0.16227245330810547, 0.16711997985839844, 0.1719675064086914, 0.17681503295898438, 0.18166255950927734, 0.1865100860595703, 0.19135761260986328, 0.19620513916015625, 0.20105266571044922, 0.2059001922607422, 0.21074771881103516, 0.21559524536132812, 0.2204427719116211, 0.22529029846191406, 0.23013782501220703, 0.2349853515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 8.0, 12.0, 32.0, 24.0, 64.0, 90.0, 144.0, 248.0, 417.0, 717.0, 1389.0, 2618.0, 4926.0, 10170.0, 20516.0, 44229.0, 102651.0, 230448.0, 306853.0, 179604.0, 76974.0, 33758.0, 15916.0, 7995.0, 4059.0, 2088.0, 1101.0, 611.0, 350.0, 200.0, 112.0, 75.0, 53.0, 43.0, 29.0, 6.0, 7.0, 9.0, 1.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1766357421875, -0.16872596740722656, -0.16081619262695312, -0.1529064178466797, -0.14499664306640625, -0.1370868682861328, -0.12917709350585938, -0.12126731872558594, -0.1133575439453125, -0.10544776916503906, -0.09753799438476562, -0.08962821960449219, -0.08171844482421875, -0.07380867004394531, -0.06589889526367188, -0.05798912048339844, -0.050079345703125, -0.04216957092285156, -0.034259796142578125, -0.026350021362304688, -0.01844024658203125, -0.010530471801757812, -0.002620697021484375, 0.0052890777587890625, 0.0131988525390625, 0.021108627319335938, 0.029018402099609375, 0.03692817687988281, 0.04483795166015625, 0.05274772644042969, 0.060657501220703125, 0.06856727600097656, 0.07647705078125, 0.08438682556152344, 0.09229660034179688, 0.10020637512207031, 0.10811614990234375, 0.11602592468261719, 0.12393569946289062, 0.13184547424316406, 0.1397552490234375, 0.14766502380371094, 0.15557479858398438, 0.1634845733642578, 0.17139434814453125, 0.1793041229248047, 0.18721389770507812, 0.19512367248535156, 0.203033447265625, 0.21094322204589844, 0.21885299682617188, 0.2267627716064453, 0.23467254638671875, 0.2425823211669922, 0.2504920959472656, 0.25840187072753906, 0.2663116455078125, 0.27422142028808594, 0.2821311950683594, 0.2900409698486328, 0.29795074462890625, 0.3058605194091797, 0.3137702941894531, 0.32168006896972656, 0.32958984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 7.0, 6.0, 5.0, 11.0, 16.0, 14.0, 14.0, 21.0, 18.0, 22.0, 21.0, 31.0, 39.0, 33.0, 45.0, 58.0, 52.0, 34.0, 44.0, 36.0, 56.0, 49.0, 47.0, 44.0, 37.0, 31.0, 34.0, 30.0, 19.0, 27.0, 25.0, 19.0, 13.0, 5.0, 7.0, 5.0, 3.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.272705078125, -0.2643585205078125, -0.256011962890625, -0.2476654052734375, -0.23931884765625, -0.2309722900390625, -0.222625732421875, -0.2142791748046875, -0.2059326171875, -0.1975860595703125, -0.189239501953125, -0.1808929443359375, -0.17254638671875, -0.1641998291015625, -0.155853271484375, -0.1475067138671875, -0.13916015625, -0.1308135986328125, -0.122467041015625, -0.1141204833984375, -0.10577392578125, -0.0974273681640625, -0.089080810546875, -0.0807342529296875, -0.0723876953125, -0.0640411376953125, -0.055694580078125, -0.0473480224609375, -0.03900146484375, -0.0306549072265625, -0.022308349609375, -0.0139617919921875, -0.005615234375, 0.0027313232421875, 0.011077880859375, 0.0194244384765625, 0.02777099609375, 0.0361175537109375, 0.044464111328125, 0.0528106689453125, 0.0611572265625, 0.0695037841796875, 0.077850341796875, 0.0861968994140625, 0.09454345703125, 0.1028900146484375, 0.111236572265625, 0.1195831298828125, 0.1279296875, 0.1362762451171875, 0.144622802734375, 0.1529693603515625, 0.16131591796875, 0.1696624755859375, 0.178009033203125, 0.1863555908203125, 0.1947021484375, 0.2030487060546875, 0.211395263671875, 0.2197418212890625, 0.22808837890625, 0.2364349365234375, 0.244781494140625, 0.2531280517578125, 0.261474609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 18.0, 27.0, 33.0, 52.0, 76.0, 125.0, 186.0, 281.0, 427.0, 714.0, 1205.0, 2161.0, 3797.0, 7985.0, 16835.0, 37662.0, 92408.0, 235600.0, 346722.0, 176920.0, 69284.0, 28971.0, 12998.0, 6289.0, 3279.0, 1731.0, 1065.0, 594.0, 390.0, 249.0, 165.0, 96.0, 65.0, 40.0, 25.0, 28.0, 9.0, 5.0, 12.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.1491374969482422, -0.14422225952148438, -0.13930702209472656, -0.13439178466796875, -0.12947654724121094, -0.12456130981445312, -0.11964607238769531, -0.1147308349609375, -0.10981559753417969, -0.10490036010742188, -0.09998512268066406, -0.09506988525390625, -0.09015464782714844, -0.08523941040039062, -0.08032417297363281, -0.075408935546875, -0.07049369812011719, -0.06557846069335938, -0.06066322326660156, -0.05574798583984375, -0.05083274841308594, -0.045917510986328125, -0.04100227355957031, -0.0360870361328125, -0.031171798706054688, -0.026256561279296875, -0.021341323852539062, -0.01642608642578125, -0.011510848999023438, -0.006595611572265625, -0.0016803741455078125, 0.00323486328125, 0.008150100708007812, 0.013065338134765625, 0.017980575561523438, 0.02289581298828125, 0.027811050415039062, 0.032726287841796875, 0.03764152526855469, 0.0425567626953125, 0.04747200012207031, 0.052387237548828125, 0.05730247497558594, 0.06221771240234375, 0.06713294982910156, 0.07204818725585938, 0.07696342468261719, 0.081878662109375, 0.08679389953613281, 0.09170913696289062, 0.09662437438964844, 0.10153961181640625, 0.10645484924316406, 0.11137008666992188, 0.11628532409667969, 0.1212005615234375, 0.1261157989501953, 0.13103103637695312, 0.13594627380371094, 0.14086151123046875, 0.14577674865722656, 0.15069198608398438, 0.1556072235107422, 0.1605224609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 5.0, 8.0, 6.0, 16.0, 16.0, 28.0, 33.0, 33.0, 51.0, 66.0, 121.0, 120.0, 113.0, 84.0, 80.0, 48.0, 39.0, 26.0, 25.0, 17.0, 15.0, 12.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1113624572753906e-05, -2.995505928993225e-05, -2.8796494007110596e-05, -2.763792872428894e-05, -2.6479363441467285e-05, -2.532079815864563e-05, -2.4162232875823975e-05, -2.300366759300232e-05, -2.1845102310180664e-05, -2.068653702735901e-05, -1.9527971744537354e-05, -1.8369406461715698e-05, -1.7210841178894043e-05, -1.6052275896072388e-05, -1.4893710613250732e-05, -1.3735145330429077e-05, -1.2576580047607422e-05, -1.1418014764785767e-05, -1.0259449481964111e-05, -9.100884199142456e-06, -7.9423189163208e-06, -6.7837536334991455e-06, -5.62518835067749e-06, -4.466623067855835e-06, -3.3080577850341797e-06, -2.1494925022125244e-06, -9.909272193908691e-07, 1.6763806343078613e-07, 1.3262033462524414e-06, 2.4847686290740967e-06, 3.643333911895752e-06, 4.801899194717407e-06, 5.9604644775390625e-06, 7.119029760360718e-06, 8.277595043182373e-06, 9.436160326004028e-06, 1.0594725608825684e-05, 1.1753290891647339e-05, 1.2911856174468994e-05, 1.407042145729065e-05, 1.5228986740112305e-05, 1.638755202293396e-05, 1.7546117305755615e-05, 1.870468258857727e-05, 1.9863247871398926e-05, 2.102181315422058e-05, 2.2180378437042236e-05, 2.333894371986389e-05, 2.4497509002685547e-05, 2.5656074285507202e-05, 2.6814639568328857e-05, 2.7973204851150513e-05, 2.9131770133972168e-05, 3.0290335416793823e-05, 3.144890069961548e-05, 3.2607465982437134e-05, 3.376603126525879e-05, 3.4924596548080444e-05, 3.60831618309021e-05, 3.7241727113723755e-05, 3.840029239654541e-05, 3.9558857679367065e-05, 4.071742296218872e-05, 4.1875988245010376e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 20.0, 18.0, 33.0, 36.0, 31.0, 89.0, 132.0, 207.0, 326.0, 552.0, 858.0, 1526.0, 2687.0, 4900.0, 9296.0, 18876.0, 41554.0, 99459.0, 246506.0, 335824.0, 162573.0, 65379.0, 28522.0, 13536.0, 6911.0, 3579.0, 2033.0, 1116.0, 775.0, 412.0, 272.0, 167.0, 113.0, 85.0, 45.0, 25.0, 20.0, 18.0, 13.0, 4.0, 5.0, 6.0, 1.0, 4.0], "bins": [-0.1884765625, -0.18367671966552734, -0.1788768768310547, -0.17407703399658203, -0.16927719116210938, -0.16447734832763672, -0.15967750549316406, -0.1548776626586914, -0.15007781982421875, -0.1452779769897461, -0.14047813415527344, -0.13567829132080078, -0.13087844848632812, -0.12607860565185547, -0.12127876281738281, -0.11647891998291016, -0.1116790771484375, -0.10687923431396484, -0.10207939147949219, -0.09727954864501953, -0.09247970581054688, -0.08767986297607422, -0.08288002014160156, -0.0780801773071289, -0.07328033447265625, -0.0684804916381836, -0.06368064880371094, -0.05888080596923828, -0.054080963134765625, -0.04928112030029297, -0.04448127746582031, -0.039681434631347656, -0.034881591796875, -0.030081748962402344, -0.025281906127929688, -0.02048206329345703, -0.015682220458984375, -0.010882377624511719, -0.0060825347900390625, -0.0012826919555664062, 0.00351715087890625, 0.008316993713378906, 0.013116836547851562, 0.01791667938232422, 0.022716522216796875, 0.02751636505126953, 0.03231620788574219, 0.037116050720214844, 0.0419158935546875, 0.046715736389160156, 0.05151557922363281, 0.05631542205810547, 0.061115264892578125, 0.06591510772705078, 0.07071495056152344, 0.0755147933959961, 0.08031463623046875, 0.0851144790649414, 0.08991432189941406, 0.09471416473388672, 0.09951400756835938, 0.10431385040283203, 0.10911369323730469, 0.11391353607177734, 0.11871337890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 3.0, 3.0, 5.0, 7.0, 14.0, 15.0, 18.0, 22.0, 23.0, 32.0, 29.0, 32.0, 61.0, 55.0, 60.0, 59.0, 81.0, 79.0, 60.0, 63.0, 43.0, 44.0, 35.0, 38.0, 17.0, 14.0, 21.0, 17.0, 8.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.1434326171875, -0.13944625854492188, -0.13545989990234375, -0.13147354125976562, -0.1274871826171875, -0.12350082397460938, -0.11951446533203125, -0.11552810668945312, -0.111541748046875, -0.10755538940429688, -0.10356903076171875, -0.09958267211914062, -0.0955963134765625, -0.09160995483398438, -0.08762359619140625, -0.08363723754882812, -0.07965087890625, -0.07566452026367188, -0.07167816162109375, -0.06769180297851562, -0.0637054443359375, -0.059719085693359375, -0.05573272705078125, -0.051746368408203125, -0.047760009765625, -0.043773651123046875, -0.03978729248046875, -0.035800933837890625, -0.0318145751953125, -0.027828216552734375, -0.02384185791015625, -0.019855499267578125, -0.015869140625, -0.011882781982421875, -0.00789642333984375, -0.003910064697265625, 7.62939453125e-05, 0.004062652587890625, 0.00804901123046875, 0.012035369873046875, 0.016021728515625, 0.020008087158203125, 0.02399444580078125, 0.027980804443359375, 0.0319671630859375, 0.035953521728515625, 0.03993988037109375, 0.043926239013671875, 0.04791259765625, 0.051898956298828125, 0.05588531494140625, 0.059871673583984375, 0.0638580322265625, 0.06784439086914062, 0.07183074951171875, 0.07581710815429688, 0.079803466796875, 0.08378982543945312, 0.08777618408203125, 0.09176254272460938, 0.0957489013671875, 0.09973526000976562, 0.10372161865234375, 0.10770797729492188, 0.1116943359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 13.0, 23.0, 40.0, 61.0, 95.0, 109.0, 140.0, 127.0, 114.0, 95.0, 76.0, 57.0, 21.0, 18.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.9995193481445312, -2.9411139488220215, -2.8827085494995117, -2.824303150177002, -2.765897750854492, -2.7074923515319824, -2.6490869522094727, -2.590681552886963, -2.532276153564453, -2.4738707542419434, -2.4154653549194336, -2.357059955596924, -2.298654556274414, -2.2402491569519043, -2.1818437576293945, -2.1234383583068848, -2.065032958984375, -2.0066275596618652, -1.9482221603393555, -1.8898167610168457, -1.831411361694336, -1.7730059623718262, -1.7146005630493164, -1.6561951637268066, -1.597790002822876, -1.5393846035003662, -1.4809792041778564, -1.4225738048553467, -1.364168405532837, -1.3057630062103271, -1.2473576068878174, -1.1889522075653076, -1.1305468082427979, -1.072141408920288, -1.0137360095977783, -0.9553306102752686, -0.8969252109527588, -0.838519811630249, -0.780114471912384, -0.7217090725898743, -0.6633037328720093, -0.6048983335494995, -0.5464929342269897, -0.48808756470680237, -0.4296821653842926, -0.37127676606178284, -0.31287139654159546, -0.2544659972190857, -0.19606059789657593, -0.13765519857406616, -0.07924981415271759, -0.02084442973136902, 0.03756096959114075, 0.09596636891365051, 0.1543717384338379, 0.21277713775634766, 0.2711825370788574, 0.3295879364013672, 0.38799333572387695, 0.44639870524406433, 0.5048041343688965, 0.5632095336914062, 0.6216148734092712, 0.680020272731781, 0.7384256720542908]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 11.0, 7.0, 10.0, 19.0, 11.0, 15.0, 30.0, 24.0, 34.0, 36.0, 34.0, 36.0, 34.0, 37.0, 37.0, 41.0, 41.0, 49.0, 46.0, 50.0, 44.0, 27.0, 36.0, 31.0, 31.0, 26.0, 25.0, 24.0, 19.0, 25.0, 13.0, 9.0, 12.0, 14.0, 9.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.6818969249725342, -0.6597164869308472, -0.6375360488891602, -0.6153556108474731, -0.5931751728057861, -0.5709947943687439, -0.5488143563270569, -0.5266339182853699, -0.5044534802436829, -0.48227304220199585, -0.46009260416030884, -0.4379121959209442, -0.4157317578792572, -0.3935513198375702, -0.37137091159820557, -0.34919047355651855, -0.32701003551483154, -0.30482959747314453, -0.2826491594314575, -0.2604687511920929, -0.23828831315040588, -0.21610787510871887, -0.19392745196819305, -0.17174702882766724, -0.14956659078598022, -0.1273861527442932, -0.1052057296037674, -0.08302529901266098, -0.060844868421554565, -0.03866443783044815, -0.016484007239341736, 0.005696415901184082, 0.02787691354751587, 0.050057344138622284, 0.0722377747297287, 0.09441820532083511, 0.11659863591194153, 0.13877907395362854, 0.16095949709415436, 0.18313992023468018, 0.2053203582763672, 0.2275007963180542, 0.24968121945858002, 0.27186164259910583, 0.29404208064079285, 0.31622251868247986, 0.3384029269218445, 0.3605833649635315, 0.3827638030052185, 0.4049442410469055, 0.42712467908859253, 0.44930508732795715, 0.47148552536964417, 0.4936659634113312, 0.5158463716506958, 0.5380268096923828, 0.5602072477340698, 0.5823876857757568, 0.6045681238174438, 0.6267485618591309, 0.6489289999008179, 0.6711093783378601, 0.6932898163795471, 0.7154702544212341, 0.7376506924629211]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 12.0, 16.0, 26.0, 40.0, 60.0, 87.0, 194.0, 350.0, 719.0, 1594.0, 4627.0, 16409.0, 78429.0, 670018.0, 3036253.0, 322869.0, 45578.0, 10587.0, 3465.0, 1366.0, 627.0, 367.0, 217.0, 132.0, 94.0, 44.0, 30.0, 31.0, 14.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.257568359375, -0.24779510498046875, -0.2380218505859375, -0.22824859619140625, -0.218475341796875, -0.20870208740234375, -0.1989288330078125, -0.18915557861328125, -0.17938232421875, -0.16960906982421875, -0.1598358154296875, -0.15006256103515625, -0.140289306640625, -0.13051605224609375, -0.1207427978515625, -0.11096954345703125, -0.1011962890625, -0.09142303466796875, -0.0816497802734375, -0.07187652587890625, -0.062103271484375, -0.05233001708984375, -0.0425567626953125, -0.03278350830078125, -0.02301025390625, -0.01323699951171875, -0.0034637451171875, 0.00630950927734375, 0.016082763671875, 0.02585601806640625, 0.0356292724609375, 0.04540252685546875, 0.05517578125, 0.06494903564453125, 0.0747222900390625, 0.08449554443359375, 0.094268798828125, 0.10404205322265625, 0.1138153076171875, 0.12358856201171875, 0.13336181640625, 0.14313507080078125, 0.1529083251953125, 0.16268157958984375, 0.172454833984375, 0.18222808837890625, 0.1920013427734375, 0.20177459716796875, 0.2115478515625, 0.22132110595703125, 0.2310943603515625, 0.24086761474609375, 0.250640869140625, 0.26041412353515625, 0.2701873779296875, 0.27996063232421875, 0.28973388671875, 0.29950714111328125, 0.3092803955078125, 0.31905364990234375, 0.328826904296875, 0.33860015869140625, 0.3483734130859375, 0.35814666748046875, 0.367919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 18.0, 15.0, 22.0, 35.0, 43.0, 47.0, 70.0, 65.0, 84.0, 98.0, 95.0, 84.0, 78.0, 57.0, 50.0, 48.0, 34.0, 20.0, 17.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08575439453125, -0.08075237274169922, -0.07575035095214844, -0.07074832916259766, -0.06574630737304688, -0.060744285583496094, -0.05574226379394531, -0.05074024200439453, -0.04573822021484375, -0.04073619842529297, -0.03573417663574219, -0.030732154846191406, -0.025730133056640625, -0.020728111267089844, -0.015726089477539062, -0.010724067687988281, -0.0057220458984375, -0.0007200241088867188, 0.0042819976806640625, 0.009284019470214844, 0.014286041259765625, 0.019288063049316406, 0.024290084838867188, 0.02929210662841797, 0.03429412841796875, 0.03929615020751953, 0.04429817199707031, 0.049300193786621094, 0.054302215576171875, 0.059304237365722656, 0.06430625915527344, 0.06930828094482422, 0.074310302734375, 0.07931232452392578, 0.08431434631347656, 0.08931636810302734, 0.09431838989257812, 0.0993204116821289, 0.10432243347167969, 0.10932445526123047, 0.11432647705078125, 0.11932849884033203, 0.12433052062988281, 0.1293325424194336, 0.13433456420898438, 0.13933658599853516, 0.14433860778808594, 0.14934062957763672, 0.1543426513671875, 0.15934467315673828, 0.16434669494628906, 0.16934871673583984, 0.17435073852539062, 0.1793527603149414, 0.1843547821044922, 0.18935680389404297, 0.19435882568359375, 0.19936084747314453, 0.2043628692626953, 0.2093648910522461, 0.21436691284179688, 0.21936893463134766, 0.22437095642089844, 0.22937297821044922, 0.234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 3.0, 9.0, 7.0, 19.0, 17.0, 23.0, 37.0, 48.0, 60.0, 110.0, 174.0, 336.0, 630.0, 1177.0, 2613.0, 6325.0, 18032.0, 63710.0, 323711.0, 2196821.0, 1320594.0, 194261.0, 43315.0, 13095.0, 4892.0, 2039.0, 994.0, 484.0, 279.0, 143.0, 111.0, 68.0, 39.0, 27.0, 26.0, 9.0, 6.0, 13.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33740234375, -0.3271331787109375, -0.316864013671875, -0.3065948486328125, -0.29632568359375, -0.2860565185546875, -0.275787353515625, -0.2655181884765625, -0.2552490234375, -0.2449798583984375, -0.234710693359375, -0.2244415283203125, -0.21417236328125, -0.2039031982421875, -0.193634033203125, -0.1833648681640625, -0.173095703125, -0.1628265380859375, -0.152557373046875, -0.1422882080078125, -0.13201904296875, -0.1217498779296875, -0.111480712890625, -0.1012115478515625, -0.0909423828125, -0.0806732177734375, -0.070404052734375, -0.0601348876953125, -0.04986572265625, -0.0395965576171875, -0.029327392578125, -0.0190582275390625, -0.0087890625, 0.0014801025390625, 0.011749267578125, 0.0220184326171875, 0.03228759765625, 0.0425567626953125, 0.052825927734375, 0.0630950927734375, 0.0733642578125, 0.0836334228515625, 0.093902587890625, 0.1041717529296875, 0.11444091796875, 0.1247100830078125, 0.134979248046875, 0.1452484130859375, 0.155517578125, 0.1657867431640625, 0.176055908203125, 0.1863250732421875, 0.19659423828125, 0.2068634033203125, 0.217132568359375, 0.2274017333984375, 0.2376708984375, 0.2479400634765625, 0.258209228515625, 0.2684783935546875, 0.27874755859375, 0.2890167236328125, 0.299285888671875, 0.3095550537109375, 0.31982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 13.0, 17.0, 18.0, 30.0, 50.0, 83.0, 109.0, 178.0, 276.0, 484.0, 682.0, 745.0, 482.0, 341.0, 186.0, 120.0, 83.0, 49.0, 30.0, 27.0, 20.0, 9.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.2869911193847656, -0.27857208251953125, -0.2701530456542969, -0.2617340087890625, -0.2533149719238281, -0.24489593505859375, -0.23647689819335938, -0.228057861328125, -0.21963882446289062, -0.21121978759765625, -0.20280075073242188, -0.1943817138671875, -0.18596267700195312, -0.17754364013671875, -0.16912460327148438, -0.16070556640625, -0.15228652954101562, -0.14386749267578125, -0.13544845581054688, -0.1270294189453125, -0.11861038208007812, -0.11019134521484375, -0.10177230834960938, -0.093353271484375, -0.08493423461914062, -0.07651519775390625, -0.06809616088867188, -0.0596771240234375, -0.051258087158203125, -0.04283905029296875, -0.034420013427734375, -0.0260009765625, -0.017581939697265625, -0.00916290283203125, -0.000743865966796875, 0.0076751708984375, 0.016094207763671875, 0.02451324462890625, 0.032932281494140625, 0.041351318359375, 0.049770355224609375, 0.05818939208984375, 0.06660842895507812, 0.0750274658203125, 0.08344650268554688, 0.09186553955078125, 0.10028457641601562, 0.10870361328125, 0.11712265014648438, 0.12554168701171875, 0.13396072387695312, 0.1423797607421875, 0.15079879760742188, 0.15921783447265625, 0.16763687133789062, 0.176055908203125, 0.18447494506835938, 0.19289398193359375, 0.20131301879882812, 0.2097320556640625, 0.21815109252929688, 0.22657012939453125, 0.23498916625976562, 0.243408203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 11.0, 3.0, 6.0, 6.0, 12.0, 25.0, 31.0, 30.0, 58.0, 57.0, 76.0, 77.0, 81.0, 73.0, 84.0, 85.0, 73.0, 51.0, 35.0, 41.0, 23.0, 17.0, 12.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0217467546463013, -0.9913377165794373, -0.9609286785125732, -0.9305196404457092, -0.9001106023788452, -0.8697015643119812, -0.8392925262451172, -0.808883547782898, -0.7784744501113892, -0.7480654120445251, -0.7176563739776611, -0.6872473359107971, -0.6568382978439331, -0.6264292597770691, -0.5960202217102051, -0.5656112432479858, -0.5352022051811218, -0.5047931671142578, -0.4743841290473938, -0.4439750909805298, -0.41356605291366577, -0.38315701484680176, -0.35274800658226013, -0.3223389685153961, -0.2919299304485321, -0.2615208923816681, -0.23111185431480408, -0.20070283114910126, -0.17029379308223724, -0.13988475501537323, -0.10947573184967041, -0.0790666937828064, -0.04865765571594238, -0.018248621374368668, 0.012160412967205048, 0.042569443583488464, 0.07297848165035248, 0.10338751971721649, 0.1337965428829193, 0.16420558094978333, 0.19461461901664734, 0.22502365708351135, 0.25543269515037537, 0.285841703414917, 0.316250741481781, 0.346659779548645, 0.37706881761550903, 0.40747785568237305, 0.43788689374923706, 0.4682959318161011, 0.4987049698829651, 0.5291140079498291, 0.5595230460166931, 0.5899320840835571, 0.6203410625457764, 0.6507501602172852, 0.6811591386795044, 0.7115681767463684, 0.7419772148132324, 0.7723862528800964, 0.8027952909469604, 0.8332043290138245, 0.8636133670806885, 0.8940223455429077, 0.9244314432144165]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 6.0, 5.0, 11.0, 15.0, 14.0, 10.0, 15.0, 20.0, 19.0, 25.0, 26.0, 41.0, 40.0, 33.0, 32.0, 50.0, 53.0, 45.0, 42.0, 37.0, 58.0, 46.0, 46.0, 27.0, 30.0, 38.0, 35.0, 32.0, 27.0, 19.0, 19.0, 11.0, 14.0, 18.0, 9.0, 5.0, 8.0, 2.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7819831371307373, -0.7594842314720154, -0.7369852662086487, -0.7144863605499268, -0.6919873952865601, -0.6694884896278381, -0.6469895839691162, -0.6244906187057495, -0.6019916534423828, -0.5794927477836609, -0.5569937825202942, -0.5344948768615723, -0.5119959115982056, -0.48949700593948364, -0.46699807047843933, -0.444499135017395, -0.4220002293586731, -0.3995012938976288, -0.3770023584365845, -0.35450345277786255, -0.33200448751449585, -0.3095055818557739, -0.2870066463947296, -0.2645077109336853, -0.242008775472641, -0.21950984001159668, -0.19701090455055237, -0.17451198399066925, -0.15201304852962494, -0.12951411306858063, -0.10701519250869751, -0.0845162570476532, -0.06201726198196411, -0.0395183302462101, -0.017019398510456085, 0.005479529500007629, 0.02797846496105194, 0.05047740042209625, 0.07297632098197937, 0.09547525644302368, 0.117974191904068, 0.1404731273651123, 0.16297206282615662, 0.18547098338603973, 0.20796991884708405, 0.23046885430812836, 0.2529677748680115, 0.2754667103290558, 0.2979656457901001, 0.3204645812511444, 0.3429635167121887, 0.36546242237091064, 0.38796138763427734, 0.41046029329299927, 0.4329592287540436, 0.4554581642150879, 0.4779570996761322, 0.5004560351371765, 0.5229549407958984, 0.5454539060592651, 0.5679528117179871, 0.5904517769813538, 0.6129506826400757, 0.6354496479034424, 0.6579485535621643]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 12.0, 5.0, 7.0, 12.0, 27.0, 37.0, 36.0, 69.0, 97.0, 184.0, 294.0, 501.0, 966.0, 2063.0, 4029.0, 8473.0, 18203.0, 43395.0, 119322.0, 313414.0, 326314.0, 127936.0, 46155.0, 19345.0, 8971.0, 4201.0, 2090.0, 1050.0, 533.0, 316.0, 189.0, 91.0, 74.0, 49.0, 23.0, 20.0, 19.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.28045654296875, -0.2711181640625, -0.26177978515625, -0.25244140625, -0.24310302734375, -0.2337646484375, -0.22442626953125, -0.215087890625, -0.20574951171875, -0.1964111328125, -0.18707275390625, -0.177734375, -0.16839599609375, -0.1590576171875, -0.14971923828125, -0.140380859375, -0.13104248046875, -0.1217041015625, -0.11236572265625, -0.10302734375, -0.09368896484375, -0.0843505859375, -0.07501220703125, -0.065673828125, -0.05633544921875, -0.0469970703125, -0.03765869140625, -0.0283203125, -0.01898193359375, -0.0096435546875, -0.00030517578125, 0.009033203125, 0.01837158203125, 0.0277099609375, 0.03704833984375, 0.04638671875, 0.05572509765625, 0.0650634765625, 0.07440185546875, 0.083740234375, 0.09307861328125, 0.1024169921875, 0.11175537109375, 0.12109375, 0.13043212890625, 0.1397705078125, 0.14910888671875, 0.158447265625, 0.16778564453125, 0.1771240234375, 0.18646240234375, 0.19580078125, 0.20513916015625, 0.2144775390625, 0.22381591796875, 0.233154296875, 0.24249267578125, 0.2518310546875, 0.26116943359375, 0.2705078125, 0.27984619140625, 0.2891845703125, 0.29852294921875, 0.307861328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 11.0, 8.0, 11.0, 27.0, 24.0, 34.0, 46.0, 47.0, 68.0, 56.0, 72.0, 94.0, 88.0, 62.0, 78.0, 80.0, 37.0, 54.0, 30.0, 32.0, 10.0, 11.0, 14.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836181640625, -0.07875633239746094, -0.07389450073242188, -0.06903266906738281, -0.06417083740234375, -0.05930900573730469, -0.054447174072265625, -0.04958534240722656, -0.0447235107421875, -0.03986167907714844, -0.034999847412109375, -0.030138015747070312, -0.02527618408203125, -0.020414352416992188, -0.015552520751953125, -0.010690689086914062, -0.005828857421875, -0.0009670257568359375, 0.003894805908203125, 0.008756637573242188, 0.01361846923828125, 0.018480300903320312, 0.023342132568359375, 0.028203964233398438, 0.0330657958984375, 0.03792762756347656, 0.042789459228515625, 0.04765129089355469, 0.05251312255859375, 0.05737495422363281, 0.062236785888671875, 0.06709861755371094, 0.07196044921875, 0.07682228088378906, 0.08168411254882812, 0.08654594421386719, 0.09140777587890625, 0.09626960754394531, 0.10113143920898438, 0.10599327087402344, 0.1108551025390625, 0.11571693420410156, 0.12057876586914062, 0.1254405975341797, 0.13030242919921875, 0.1351642608642578, 0.14002609252929688, 0.14488792419433594, 0.149749755859375, 0.15461158752441406, 0.15947341918945312, 0.1643352508544922, 0.16919708251953125, 0.1740589141845703, 0.17892074584960938, 0.18378257751464844, 0.1886444091796875, 0.19350624084472656, 0.19836807250976562, 0.2032299041748047, 0.20809173583984375, 0.2129535675048828, 0.21781539916992188, 0.22267723083496094, 0.2275390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 10.0, 18.0, 31.0, 58.0, 147.0, 267.0, 569.0, 1209.0, 2588.0, 5894.0, 13536.0, 37689.0, 154211.0, 516203.0, 232454.0, 52556.0, 17745.0, 7321.0, 3226.0, 1444.0, 658.0, 343.0, 150.0, 84.0, 49.0, 34.0, 12.0, 8.0, 12.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3935546875, -0.38027191162109375, -0.3669891357421875, -0.35370635986328125, -0.340423583984375, -0.32714080810546875, -0.3138580322265625, -0.30057525634765625, -0.28729248046875, -0.27400970458984375, -0.2607269287109375, -0.24744415283203125, -0.234161376953125, -0.22087860107421875, -0.2075958251953125, -0.19431304931640625, -0.1810302734375, -0.16774749755859375, -0.1544647216796875, -0.14118194580078125, -0.127899169921875, -0.11461639404296875, -0.1013336181640625, -0.08805084228515625, -0.07476806640625, -0.06148529052734375, -0.0482025146484375, -0.03491973876953125, -0.021636962890625, -0.00835418701171875, 0.0049285888671875, 0.01821136474609375, 0.031494140625, 0.04477691650390625, 0.0580596923828125, 0.07134246826171875, 0.084625244140625, 0.09790802001953125, 0.1111907958984375, 0.12447357177734375, 0.13775634765625, 0.15103912353515625, 0.1643218994140625, 0.17760467529296875, 0.190887451171875, 0.20417022705078125, 0.2174530029296875, 0.23073577880859375, 0.2440185546875, 0.25730133056640625, 0.2705841064453125, 0.28386688232421875, 0.297149658203125, 0.31043243408203125, 0.3237152099609375, 0.33699798583984375, 0.35028076171875, 0.36356353759765625, 0.3768463134765625, 0.39012908935546875, 0.403411865234375, 0.41669464111328125, 0.4299774169921875, 0.44326019287109375, 0.45654296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 4.0, 8.0, 16.0, 14.0, 18.0, 28.0, 29.0, 30.0, 30.0, 43.0, 49.0, 61.0, 60.0, 62.0, 67.0, 53.0, 70.0, 56.0, 39.0, 48.0, 44.0, 26.0, 31.0, 24.0, 21.0, 18.0, 11.0, 8.0, 5.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.39488983154296875, -0.3835296630859375, -0.37216949462890625, -0.360809326171875, -0.34944915771484375, -0.3380889892578125, -0.32672882080078125, -0.31536865234375, -0.30400848388671875, -0.2926483154296875, -0.28128814697265625, -0.269927978515625, -0.25856781005859375, -0.2472076416015625, -0.23584747314453125, -0.2244873046875, -0.21312713623046875, -0.2017669677734375, -0.19040679931640625, -0.179046630859375, -0.16768646240234375, -0.1563262939453125, -0.14496612548828125, -0.13360595703125, -0.12224578857421875, -0.1108856201171875, -0.09952545166015625, -0.088165283203125, -0.07680511474609375, -0.0654449462890625, -0.05408477783203125, -0.042724609375, -0.03136444091796875, -0.0200042724609375, -0.00864410400390625, 0.002716064453125, 0.01407623291015625, 0.0254364013671875, 0.03679656982421875, 0.04815673828125, 0.05951690673828125, 0.0708770751953125, 0.08223724365234375, 0.093597412109375, 0.10495758056640625, 0.1163177490234375, 0.12767791748046875, 0.1390380859375, 0.15039825439453125, 0.1617584228515625, 0.17311859130859375, 0.184478759765625, 0.19583892822265625, 0.2071990966796875, 0.21855926513671875, 0.22991943359375, 0.24127960205078125, 0.2526397705078125, 0.26399993896484375, 0.275360107421875, 0.28672027587890625, 0.2980804443359375, 0.30944061279296875, 0.32080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 1.0, 7.0, 8.0, 17.0, 29.0, 35.0, 65.0, 95.0, 200.0, 366.0, 559.0, 1087.0, 2155.0, 4454.0, 9976.0, 23890.0, 62425.0, 230100.0, 483577.0, 150036.0, 46034.0, 18185.0, 7875.0, 3568.0, 1729.0, 911.0, 503.0, 291.0, 143.0, 94.0, 56.0, 31.0, 18.0, 8.0, 13.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037353515625, -0.1967945098876953, -0.18985366821289062, -0.18291282653808594, -0.17597198486328125, -0.16903114318847656, -0.16209030151367188, -0.1551494598388672, -0.1482086181640625, -0.1412677764892578, -0.13432693481445312, -0.12738609313964844, -0.12044525146484375, -0.11350440979003906, -0.10656356811523438, -0.09962272644042969, -0.092681884765625, -0.08574104309082031, -0.07880020141601562, -0.07185935974121094, -0.06491851806640625, -0.05797767639160156, -0.051036834716796875, -0.04409599304199219, -0.0371551513671875, -0.030214309692382812, -0.023273468017578125, -0.016332626342773438, -0.00939178466796875, -0.0024509429931640625, 0.004489898681640625, 0.011430740356445312, 0.01837158203125, 0.025312423706054688, 0.032253265380859375, 0.03919410705566406, 0.04613494873046875, 0.05307579040527344, 0.060016632080078125, 0.06695747375488281, 0.0738983154296875, 0.08083915710449219, 0.08777999877929688, 0.09472084045410156, 0.10166168212890625, 0.10860252380371094, 0.11554336547851562, 0.12248420715332031, 0.129425048828125, 0.1363658905029297, 0.14330673217773438, 0.15024757385253906, 0.15718841552734375, 0.16412925720214844, 0.17107009887695312, 0.1780109405517578, 0.1849517822265625, 0.1918926239013672, 0.19883346557617188, 0.20577430725097656, 0.21271514892578125, 0.21965599060058594, 0.22659683227539062, 0.2335376739501953, 0.240478515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 14.0, 14.0, 13.0, 40.0, 41.0, 81.0, 150.0, 195.0, 152.0, 88.0, 54.0, 28.0, 30.0, 19.0, 12.0, 7.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.115436553955078e-05, -5.9567391872406006e-05, -5.798041820526123e-05, -5.6393444538116455e-05, -5.480647087097168e-05, -5.3219497203826904e-05, -5.163252353668213e-05, -5.0045549869537354e-05, -4.845857620239258e-05, -4.68716025352478e-05, -4.528462886810303e-05, -4.369765520095825e-05, -4.2110681533813477e-05, -4.05237078666687e-05, -3.8936734199523926e-05, -3.734976053237915e-05, -3.5762786865234375e-05, -3.41758131980896e-05, -3.2588839530944824e-05, -3.100186586380005e-05, -2.9414892196655273e-05, -2.7827918529510498e-05, -2.6240944862365723e-05, -2.4653971195220947e-05, -2.3066997528076172e-05, -2.1480023860931396e-05, -1.989305019378662e-05, -1.8306076526641846e-05, -1.671910285949707e-05, -1.5132129192352295e-05, -1.354515552520752e-05, -1.1958181858062744e-05, -1.0371208190917969e-05, -8.784234523773193e-06, -7.197260856628418e-06, -5.610287189483643e-06, -4.023313522338867e-06, -2.436339855194092e-06, -8.493661880493164e-07, 7.37607479095459e-07, 2.3245811462402344e-06, 3.91155481338501e-06, 5.498528480529785e-06, 7.0855021476745605e-06, 8.672475814819336e-06, 1.0259449481964111e-05, 1.1846423149108887e-05, 1.3433396816253662e-05, 1.5020370483398438e-05, 1.6607344150543213e-05, 1.8194317817687988e-05, 1.9781291484832764e-05, 2.136826515197754e-05, 2.2955238819122314e-05, 2.454221248626709e-05, 2.6129186153411865e-05, 2.771615982055664e-05, 2.9303133487701416e-05, 3.089010715484619e-05, 3.247708082199097e-05, 3.406405448913574e-05, 3.565102815628052e-05, 3.723800182342529e-05, 3.882497549057007e-05, 4.0411949157714844e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 12.0, 29.0, 27.0, 32.0, 60.0, 83.0, 118.0, 198.0, 283.0, 467.0, 810.0, 1356.0, 2462.0, 4757.0, 9826.0, 21418.0, 50857.0, 152410.0, 438092.0, 238782.0, 72236.0, 28272.0, 12579.0, 6119.0, 3086.0, 1638.0, 936.0, 575.0, 318.0, 209.0, 145.0, 104.0, 77.0, 44.0, 29.0, 28.0, 20.0, 13.0, 12.0, 4.0, 4.0, 2.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.17630958557128906, -0.17036819458007812, -0.1644268035888672, -0.15848541259765625, -0.1525440216064453, -0.14660263061523438, -0.14066123962402344, -0.1347198486328125, -0.12877845764160156, -0.12283706665039062, -0.11689567565917969, -0.11095428466796875, -0.10501289367675781, -0.09907150268554688, -0.09313011169433594, -0.087188720703125, -0.08124732971191406, -0.07530593872070312, -0.06936454772949219, -0.06342315673828125, -0.05748176574707031, -0.051540374755859375, -0.04559898376464844, -0.0396575927734375, -0.03371620178222656, -0.027774810791015625, -0.021833419799804688, -0.01589202880859375, -0.009950637817382812, -0.004009246826171875, 0.0019321441650390625, 0.00787353515625, 0.013814926147460938, 0.019756317138671875, 0.025697708129882812, 0.03163909912109375, 0.03758049011230469, 0.043521881103515625, 0.04946327209472656, 0.0554046630859375, 0.06134605407714844, 0.06728744506835938, 0.07322883605957031, 0.07917022705078125, 0.08511161804199219, 0.09105300903320312, 0.09699440002441406, 0.102935791015625, 0.10887718200683594, 0.11481857299804688, 0.12075996398925781, 0.12670135498046875, 0.1326427459716797, 0.13858413696289062, 0.14452552795410156, 0.1504669189453125, 0.15640830993652344, 0.16234970092773438, 0.1682910919189453, 0.17423248291015625, 0.1801738739013672, 0.18611526489257812, 0.19205665588378906, 0.197998046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 2.0, 5.0, 3.0, 11.0, 13.0, 22.0, 34.0, 57.0, 90.0, 121.0, 136.0, 142.0, 114.0, 70.0, 56.0, 37.0, 17.0, 10.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.288330078125, -0.28067588806152344, -0.2730216979980469, -0.2653675079345703, -0.25771331787109375, -0.2500591278076172, -0.24240493774414062, -0.23475074768066406, -0.2270965576171875, -0.21944236755371094, -0.21178817749023438, -0.2041339874267578, -0.19647979736328125, -0.1888256072998047, -0.18117141723632812, -0.17351722717285156, -0.165863037109375, -0.15820884704589844, -0.15055465698242188, -0.1429004669189453, -0.13524627685546875, -0.1275920867919922, -0.11993789672851562, -0.11228370666503906, -0.1046295166015625, -0.09697532653808594, -0.08932113647460938, -0.08166694641113281, -0.07401275634765625, -0.06635856628417969, -0.058704376220703125, -0.05105018615722656, -0.04339599609375, -0.03574180603027344, -0.028087615966796875, -0.020433425903320312, -0.01277923583984375, -0.0051250457763671875, 0.002529144287109375, 0.010183334350585938, 0.0178375244140625, 0.025491714477539062, 0.033145904541015625, 0.04080009460449219, 0.04845428466796875, 0.05610847473144531, 0.06376266479492188, 0.07141685485839844, 0.079071044921875, 0.08672523498535156, 0.09437942504882812, 0.10203361511230469, 0.10968780517578125, 0.11734199523925781, 0.12499618530273438, 0.13265037536621094, 0.1403045654296875, 0.14795875549316406, 0.15561294555664062, 0.1632671356201172, 0.17092132568359375, 0.1785755157470703, 0.18622970581054688, 0.19388389587402344, 0.2015380859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 8.0, 9.0, 22.0, 36.0, 47.0, 75.0, 99.0, 104.0, 101.0, 115.0, 95.0, 93.0, 52.0, 50.0, 30.0, 19.0, 9.0, 14.0, 6.0, 2.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6127504110336304, -1.5591074228286743, -1.5054645538330078, -1.4518215656280518, -1.3981785774230957, -1.3445355892181396, -1.2908927202224731, -1.237249732017517, -1.1836068630218506, -1.1299638748168945, -1.076321005821228, -1.022678017616272, -0.9690350294113159, -0.9153921008110046, -0.8617491722106934, -0.8081061840057373, -0.7544631958007812, -0.70082026720047, -0.6471772789955139, -0.5935343503952026, -0.5398913621902466, -0.4862484335899353, -0.432605504989624, -0.37896254658699036, -0.3253195881843567, -0.271676629781723, -0.21803368628025055, -0.16439074277877808, -0.11074778437614441, -0.05710482597351074, -0.003461897373199463, 0.050181061029434204, 0.10382401943206787, 0.15746697783470154, 0.211109921336174, 0.2647528648376465, 0.31839582324028015, 0.3720387816429138, 0.4256817102432251, 0.47932466864585876, 0.5329676270484924, 0.5866105556488037, 0.6402535438537598, 0.693896472454071, 0.7475394010543823, 0.8011823892593384, 0.8548253178596497, 0.9084682464599609, 0.962111234664917, 1.015754222869873, 1.0693970918655396, 1.1230400800704956, 1.1766830682754517, 1.2303259372711182, 1.2839689254760742, 1.3376119136810303, 1.3912549018859863, 1.4448978900909424, 1.4985407590866089, 1.552183747291565, 1.605826735496521, 1.6594696044921875, 1.7131125926971436, 1.7667555809020996, 1.8203984498977661]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 13.0, 6.0, 9.0, 10.0, 16.0, 20.0, 24.0, 18.0, 27.0, 40.0, 38.0, 30.0, 45.0, 33.0, 44.0, 34.0, 39.0, 51.0, 45.0, 47.0, 25.0, 35.0, 39.0, 31.0, 33.0, 31.0, 21.0, 27.0, 32.0, 23.0, 16.0, 21.0, 7.0, 14.0, 8.0, 9.0, 5.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8816020488739014, -0.853523313999176, -0.8254446387290955, -0.7973659038543701, -0.7692871689796448, -0.7412084341049194, -0.7131297588348389, -0.6850510239601135, -0.6569722890853882, -0.6288935542106628, -0.6008148789405823, -0.5727361440658569, -0.5446574091911316, -0.5165786743164062, -0.4884999990463257, -0.46042126417160034, -0.4323425590991974, -0.40426385402679443, -0.3761851191520691, -0.34810641407966614, -0.3200276792049408, -0.29194897413253784, -0.2638702392578125, -0.23579153418540955, -0.2077128142118454, -0.17963409423828125, -0.1515553742647171, -0.12347666174173355, -0.0953979417681694, -0.06731922924518585, -0.039240509271621704, -0.011161789298057556, 0.016916930675506592, 0.04499565064907074, 0.07307437062263489, 0.10115308314561844, 0.12923181056976318, 0.15731051564216614, 0.18538923561573029, 0.21346795558929443, 0.24154667556285858, 0.26962539553642273, 0.2977041006088257, 0.325782835483551, 0.353861540555954, 0.38194024562835693, 0.4100189805030823, 0.4380977153778076, 0.46617642045021057, 0.4942551255226135, 0.5223338603973389, 0.5504125952720642, 0.5784912705421448, 0.6065700054168701, 0.6346487402915955, 0.6627274751663208, 0.6908061504364014, 0.7188848853111267, 0.7469635605812073, 0.7750422954559326, 0.803121030330658, 0.8311997652053833, 0.8592784404754639, 0.8873571753501892, 0.9154359102249146]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 3.0, 15.0, 11.0, 27.0, 37.0, 45.0, 62.0, 124.0, 179.0, 348.0, 668.0, 1340.0, 3046.0, 8021.0, 24825.0, 102023.0, 726140.0, 2915070.0, 327792.0, 58374.0, 15902.0, 5471.0, 2260.0, 1076.0, 594.0, 292.0, 187.0, 107.0, 77.0, 45.0, 34.0, 20.0, 18.0, 14.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.31640625, -0.306304931640625, -0.29620361328125, -0.286102294921875, -0.2760009765625, -0.265899658203125, -0.25579833984375, -0.245697021484375, -0.235595703125, -0.225494384765625, -0.21539306640625, -0.205291748046875, -0.1951904296875, -0.185089111328125, -0.17498779296875, -0.164886474609375, -0.15478515625, -0.144683837890625, -0.13458251953125, -0.124481201171875, -0.1143798828125, -0.104278564453125, -0.09417724609375, -0.084075927734375, -0.073974609375, -0.063873291015625, -0.05377197265625, -0.043670654296875, -0.0335693359375, -0.023468017578125, -0.01336669921875, -0.003265380859375, 0.0068359375, 0.016937255859375, 0.02703857421875, 0.037139892578125, 0.0472412109375, 0.057342529296875, 0.06744384765625, 0.077545166015625, 0.087646484375, 0.097747802734375, 0.10784912109375, 0.117950439453125, 0.1280517578125, 0.138153076171875, 0.14825439453125, 0.158355712890625, 0.16845703125, 0.178558349609375, 0.18865966796875, 0.198760986328125, 0.2088623046875, 0.218963623046875, 0.22906494140625, 0.239166259765625, 0.249267578125, 0.259368896484375, 0.26947021484375, 0.279571533203125, 0.2896728515625, 0.299774169921875, 0.30987548828125, 0.319976806640625, 0.330078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 21.0, 32.0, 36.0, 38.0, 57.0, 63.0, 60.0, 65.0, 80.0, 67.0, 73.0, 67.0, 59.0, 59.0, 46.0, 50.0, 20.0, 21.0, 18.0, 14.0, 3.0, 9.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09344482421875, -0.08835506439208984, -0.08326530456542969, -0.07817554473876953, -0.07308578491210938, -0.06799602508544922, -0.06290626525878906, -0.057816505432128906, -0.05272674560546875, -0.047636985778808594, -0.04254722595214844, -0.03745746612548828, -0.032367706298828125, -0.02727794647216797, -0.022188186645507812, -0.017098426818847656, -0.0120086669921875, -0.006918907165527344, -0.0018291473388671875, 0.0032606124877929688, 0.008350372314453125, 0.013440132141113281, 0.018529891967773438, 0.023619651794433594, 0.02870941162109375, 0.033799171447753906, 0.03888893127441406, 0.04397869110107422, 0.049068450927734375, 0.05415821075439453, 0.05924797058105469, 0.06433773040771484, 0.069427490234375, 0.07451725006103516, 0.07960700988769531, 0.08469676971435547, 0.08978652954101562, 0.09487628936767578, 0.09996604919433594, 0.1050558090209961, 0.11014556884765625, 0.1152353286743164, 0.12032508850097656, 0.12541484832763672, 0.13050460815429688, 0.13559436798095703, 0.1406841278076172, 0.14577388763427734, 0.1508636474609375, 0.15595340728759766, 0.1610431671142578, 0.16613292694091797, 0.17122268676757812, 0.17631244659423828, 0.18140220642089844, 0.1864919662475586, 0.19158172607421875, 0.1966714859008789, 0.20176124572753906, 0.20685100555419922, 0.21194076538085938, 0.21703052520751953, 0.2221202850341797, 0.22721004486083984, 0.2322998046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 8.0, 8.0, 13.0, 12.0, 13.0, 34.0, 52.0, 93.0, 122.0, 199.0, 249.0, 451.0, 783.0, 1253.0, 2249.0, 4653.0, 10091.0, 24575.0, 71031.0, 249227.0, 1167616.0, 2062995.0, 424768.0, 111099.0, 36053.0, 13826.0, 5949.0, 2878.0, 1582.0, 900.0, 524.0, 332.0, 214.0, 146.0, 94.0, 54.0, 46.0, 28.0, 24.0, 6.0, 12.0, 10.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3359375, -0.32550048828125, -0.3150634765625, -0.30462646484375, -0.294189453125, -0.28375244140625, -0.2733154296875, -0.26287841796875, -0.25244140625, -0.24200439453125, -0.2315673828125, -0.22113037109375, -0.210693359375, -0.20025634765625, -0.1898193359375, -0.17938232421875, -0.1689453125, -0.15850830078125, -0.1480712890625, -0.13763427734375, -0.127197265625, -0.11676025390625, -0.1063232421875, -0.09588623046875, -0.08544921875, -0.07501220703125, -0.0645751953125, -0.05413818359375, -0.043701171875, -0.03326416015625, -0.0228271484375, -0.01239013671875, -0.001953125, 0.00848388671875, 0.0189208984375, 0.02935791015625, 0.039794921875, 0.05023193359375, 0.0606689453125, 0.07110595703125, 0.08154296875, 0.09197998046875, 0.1024169921875, 0.11285400390625, 0.123291015625, 0.13372802734375, 0.1441650390625, 0.15460205078125, 0.1650390625, 0.17547607421875, 0.1859130859375, 0.19635009765625, 0.206787109375, 0.21722412109375, 0.2276611328125, 0.23809814453125, 0.24853515625, 0.25897216796875, 0.2694091796875, 0.27984619140625, 0.290283203125, 0.30072021484375, 0.3111572265625, 0.32159423828125, 0.33203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 8.0, 10.0, 12.0, 22.0, 29.0, 45.0, 56.0, 95.0, 148.0, 219.0, 369.0, 587.0, 811.0, 612.0, 369.0, 224.0, 148.0, 103.0, 63.0, 35.0, 34.0, 19.0, 19.0, 12.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24821853637695312, -0.23886871337890625, -0.22951889038085938, -0.2201690673828125, -0.21081924438476562, -0.20146942138671875, -0.19211959838867188, -0.182769775390625, -0.17341995239257812, -0.16407012939453125, -0.15472030639648438, -0.1453704833984375, -0.13602066040039062, -0.12667083740234375, -0.11732101440429688, -0.10797119140625, -0.09862136840820312, -0.08927154541015625, -0.07992172241210938, -0.0705718994140625, -0.061222076416015625, -0.05187225341796875, -0.042522430419921875, -0.033172607421875, -0.023822784423828125, -0.01447296142578125, -0.005123138427734375, 0.0042266845703125, 0.013576507568359375, 0.02292633056640625, 0.032276153564453125, 0.0416259765625, 0.050975799560546875, 0.06032562255859375, 0.06967544555664062, 0.0790252685546875, 0.08837509155273438, 0.09772491455078125, 0.10707473754882812, 0.116424560546875, 0.12577438354492188, 0.13512420654296875, 0.14447402954101562, 0.1538238525390625, 0.16317367553710938, 0.17252349853515625, 0.18187332153320312, 0.19122314453125, 0.20057296752929688, 0.20992279052734375, 0.21927261352539062, 0.2286224365234375, 0.23797225952148438, 0.24732208251953125, 0.2566719055175781, 0.266021728515625, 0.2753715515136719, 0.28472137451171875, 0.2940711975097656, 0.3034210205078125, 0.3127708435058594, 0.32212066650390625, 0.3314704895019531, 0.3408203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 14.0, 15.0, 15.0, 28.0, 31.0, 42.0, 60.0, 63.0, 68.0, 81.0, 93.0, 79.0, 87.0, 74.0, 57.0, 41.0, 40.0, 27.0, 13.0, 14.0, 14.0, 12.0, 11.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2687612771987915, -1.2335816621780396, -1.198401927947998, -1.163222312927246, -1.1280426979064941, -1.0928629636764526, -1.0576833486557007, -1.0225036144256592, -0.9873239994049072, -0.9521443247795105, -0.9169646501541138, -0.8817850351333618, -0.8466053605079651, -0.8114256858825684, -0.7762460708618164, -0.7410663962364197, -0.705886721611023, -0.6707070469856262, -0.6355273723602295, -0.6003477573394775, -0.5651680827140808, -0.5299884080886841, -0.49480876326560974, -0.4596291184425354, -0.42444944381713867, -0.38926976919174194, -0.3540901243686676, -0.31891047954559326, -0.28373080492019653, -0.248551145195961, -0.21337148547172546, -0.17819182574748993, -0.1430121660232544, -0.10783250629901886, -0.07265284657478333, -0.03747318685054779, -0.002293527126312256, 0.03288613259792328, 0.06806579232215881, 0.10324545204639435, 0.13842511177062988, 0.17360477149486542, 0.20878443121910095, 0.2439640909433365, 0.279143750667572, 0.31432342529296875, 0.3495030701160431, 0.38468271493911743, 0.41986238956451416, 0.4550420641899109, 0.49022170901298523, 0.5254013538360596, 0.5605810284614563, 0.595760703086853, 0.630940318107605, 0.6661199927330017, 0.7012996673583984, 0.7364793419837952, 0.7716590166091919, 0.8068386316299438, 0.8420183062553406, 0.8771979808807373, 0.9123775959014893, 0.947557270526886, 0.9827369451522827]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 12.0, 9.0, 16.0, 13.0, 12.0, 21.0, 18.0, 30.0, 21.0, 33.0, 26.0, 35.0, 48.0, 33.0, 37.0, 30.0, 45.0, 29.0, 38.0, 51.0, 35.0, 39.0, 31.0, 34.0, 31.0, 33.0, 27.0, 15.0, 22.0, 18.0, 19.0, 19.0, 13.0, 13.0, 17.0, 13.0, 4.0, 7.0, 9.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.669475793838501, -0.6492985486984253, -0.6291213631629944, -0.6089441180229187, -0.588766872882843, -0.5685896873474121, -0.5484124422073364, -0.5282351970672607, -0.5080579519271851, -0.48788073658943176, -0.4677034914493561, -0.4475262761116028, -0.4273490309715271, -0.4071718156337738, -0.3869946002960205, -0.3668173551559448, -0.3466401696205139, -0.3264629542827606, -0.30628570914268494, -0.28610849380493164, -0.26593124866485596, -0.24575403332710266, -0.22557681798934937, -0.20539958775043488, -0.18522235751152039, -0.1650451272726059, -0.1448678970336914, -0.12469068169593811, -0.10451345145702362, -0.08433622121810913, -0.06415899842977524, -0.043981775641441345, -0.023804545402526855, -0.003627318888902664, 0.016549907624721527, 0.03672713413834572, 0.05690436065196991, 0.0770815908908844, 0.09725881367921829, 0.11743603646755219, 0.13761326670646667, 0.15779049694538116, 0.17796772718429565, 0.19814494252204895, 0.21832217276096344, 0.23849940299987793, 0.2586766183376312, 0.2788538336753845, 0.2990310788154602, 0.3192082941532135, 0.3393855392932892, 0.3595627546310425, 0.37973999977111816, 0.39991721510887146, 0.42009443044662476, 0.44027167558670044, 0.46044889092445374, 0.48062610626220703, 0.5008033514022827, 0.5209805965423584, 0.5411577820777893, 0.561335027217865, 0.5815122723579407, 0.6016894578933716, 0.6218667030334473]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 9.0, 12.0, 15.0, 19.0, 39.0, 54.0, 68.0, 96.0, 184.0, 255.0, 431.0, 699.0, 1222.0, 2014.0, 3447.0, 6186.0, 10591.0, 19058.0, 35368.0, 72722.0, 171784.0, 336910.0, 210151.0, 85837.0, 41233.0, 21480.0, 12053.0, 6846.0, 3990.0, 2298.0, 1330.0, 793.0, 458.0, 287.0, 200.0, 125.0, 95.0, 60.0, 44.0, 29.0, 20.0, 14.0, 6.0, 5.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25830078125, -0.2503795623779297, -0.24245834350585938, -0.23453712463378906, -0.22661590576171875, -0.21869468688964844, -0.21077346801757812, -0.2028522491455078, -0.1949310302734375, -0.1870098114013672, -0.17908859252929688, -0.17116737365722656, -0.16324615478515625, -0.15532493591308594, -0.14740371704101562, -0.1394824981689453, -0.131561279296875, -0.12364006042480469, -0.11571884155273438, -0.10779762268066406, -0.09987640380859375, -0.09195518493652344, -0.08403396606445312, -0.07611274719238281, -0.0681915283203125, -0.06027030944824219, -0.052349090576171875, -0.04442787170410156, -0.03650665283203125, -0.028585433959960938, -0.020664215087890625, -0.012742996215820312, -0.00482177734375, 0.0030994415283203125, 0.011020660400390625, 0.018941879272460938, 0.02686309814453125, 0.03478431701660156, 0.042705535888671875, 0.05062675476074219, 0.0585479736328125, 0.06646919250488281, 0.07439041137695312, 0.08231163024902344, 0.09023284912109375, 0.09815406799316406, 0.10607528686523438, 0.11399650573730469, 0.121917724609375, 0.1298389434814453, 0.13776016235351562, 0.14568138122558594, 0.15360260009765625, 0.16152381896972656, 0.16944503784179688, 0.1773662567138672, 0.1852874755859375, 0.1932086944580078, 0.20112991333007812, 0.20905113220214844, 0.21697235107421875, 0.22489356994628906, 0.23281478881835938, 0.2407360076904297, 0.2486572265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 14.0, 22.0, 19.0, 28.0, 27.0, 56.0, 44.0, 40.0, 53.0, 66.0, 80.0, 57.0, 68.0, 55.0, 50.0, 43.0, 62.0, 50.0, 38.0, 40.0, 16.0, 16.0, 12.0, 11.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09765625, -0.09277534484863281, -0.08789443969726562, -0.08301353454589844, -0.07813262939453125, -0.07325172424316406, -0.06837081909179688, -0.06348991394042969, -0.0586090087890625, -0.05372810363769531, -0.048847198486328125, -0.04396629333496094, -0.03908538818359375, -0.03420448303222656, -0.029323577880859375, -0.024442672729492188, -0.019561767578125, -0.014680862426757812, -0.009799957275390625, -0.0049190521240234375, -3.814697265625e-05, 0.0048427581787109375, 0.009723663330078125, 0.014604568481445312, 0.0194854736328125, 0.024366378784179688, 0.029247283935546875, 0.03412818908691406, 0.03900909423828125, 0.04388999938964844, 0.048770904541015625, 0.05365180969238281, 0.05853271484375, 0.06341361999511719, 0.06829452514648438, 0.07317543029785156, 0.07805633544921875, 0.08293724060058594, 0.08781814575195312, 0.09269905090332031, 0.0975799560546875, 0.10246086120605469, 0.10734176635742188, 0.11222267150878906, 0.11710357666015625, 0.12198448181152344, 0.12686538696289062, 0.1317462921142578, 0.136627197265625, 0.1415081024169922, 0.14638900756835938, 0.15126991271972656, 0.15615081787109375, 0.16103172302246094, 0.16591262817382812, 0.1707935333251953, 0.1756744384765625, 0.1805553436279297, 0.18543624877929688, 0.19031715393066406, 0.19519805908203125, 0.20007896423339844, 0.20495986938476562, 0.2098407745361328, 0.2147216796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 17.0, 12.0, 24.0, 25.0, 34.0, 48.0, 53.0, 105.0, 156.0, 275.0, 465.0, 963.0, 1882.0, 3600.0, 7079.0, 14442.0, 30233.0, 69648.0, 202500.0, 422429.0, 177020.0, 63079.0, 27648.0, 13194.0, 6625.0, 3257.0, 1689.0, 901.0, 452.0, 250.0, 140.0, 89.0, 56.0, 33.0, 24.0, 26.0, 14.0, 8.0, 10.0, 9.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.310302734375, -0.3004341125488281, -0.29056549072265625, -0.2806968688964844, -0.2708282470703125, -0.2609596252441406, -0.25109100341796875, -0.24122238159179688, -0.231353759765625, -0.22148513793945312, -0.21161651611328125, -0.20174789428710938, -0.1918792724609375, -0.18201065063476562, -0.17214202880859375, -0.16227340698242188, -0.15240478515625, -0.14253616333007812, -0.13266754150390625, -0.12279891967773438, -0.1129302978515625, -0.10306167602539062, -0.09319305419921875, -0.08332443237304688, -0.073455810546875, -0.06358718872070312, -0.05371856689453125, -0.043849945068359375, -0.0339813232421875, -0.024112701416015625, -0.01424407958984375, -0.004375457763671875, 0.0054931640625, 0.015361785888671875, 0.02523040771484375, 0.035099029541015625, 0.0449676513671875, 0.054836273193359375, 0.06470489501953125, 0.07457351684570312, 0.084442138671875, 0.09431076049804688, 0.10417938232421875, 0.11404800415039062, 0.1239166259765625, 0.13378524780273438, 0.14365386962890625, 0.15352249145507812, 0.16339111328125, 0.17325973510742188, 0.18312835693359375, 0.19299697875976562, 0.2028656005859375, 0.21273422241210938, 0.22260284423828125, 0.23247146606445312, 0.242340087890625, 0.2522087097167969, 0.26207733154296875, 0.2719459533691406, 0.2818145751953125, 0.2916831970214844, 0.30155181884765625, 0.3114204406738281, 0.3212890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 10.0, 18.0, 17.0, 11.0, 21.0, 29.0, 32.0, 38.0, 36.0, 48.0, 43.0, 49.0, 65.0, 48.0, 46.0, 46.0, 43.0, 45.0, 52.0, 40.0, 27.0, 20.0, 35.0, 21.0, 25.0, 12.0, 22.0, 12.0, 13.0, 12.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.34228515625, -0.33154296875, -0.32080078125, -0.31005859375, -0.29931640625, -0.28857421875, -0.27783203125, -0.26708984375, -0.25634765625, -0.24560546875, -0.23486328125, -0.22412109375, -0.21337890625, -0.20263671875, -0.19189453125, -0.18115234375, -0.17041015625, -0.15966796875, -0.14892578125, -0.13818359375, -0.12744140625, -0.11669921875, -0.10595703125, -0.09521484375, -0.08447265625, -0.07373046875, -0.06298828125, -0.05224609375, -0.04150390625, -0.03076171875, -0.02001953125, -0.00927734375, 0.00146484375, 0.01220703125, 0.02294921875, 0.03369140625, 0.04443359375, 0.05517578125, 0.06591796875, 0.07666015625, 0.08740234375, 0.09814453125, 0.10888671875, 0.11962890625, 0.13037109375, 0.14111328125, 0.15185546875, 0.16259765625, 0.17333984375, 0.18408203125, 0.19482421875, 0.20556640625, 0.21630859375, 0.22705078125, 0.23779296875, 0.24853515625, 0.25927734375, 0.27001953125, 0.28076171875, 0.29150390625, 0.30224609375, 0.31298828125, 0.32373046875, 0.33447265625, 0.34521484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 17.0, 21.0, 65.0, 89.0, 150.0, 291.0, 447.0, 843.0, 1526.0, 2642.0, 4890.0, 8557.0, 15554.0, 27801.0, 53806.0, 134353.0, 373212.0, 251194.0, 85800.0, 39418.0, 21034.0, 11755.0, 6640.0, 3705.0, 2068.0, 1122.0, 652.0, 347.0, 222.0, 118.0, 77.0, 39.0, 34.0, 18.0, 9.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129150390625, -0.12450027465820312, -0.11985015869140625, -0.11520004272460938, -0.1105499267578125, -0.10589981079101562, -0.10124969482421875, -0.09659957885742188, -0.091949462890625, -0.08729934692382812, -0.08264923095703125, -0.07799911499023438, -0.0733489990234375, -0.06869888305664062, -0.06404876708984375, -0.059398651123046875, -0.05474853515625, -0.050098419189453125, -0.04544830322265625, -0.040798187255859375, -0.0361480712890625, -0.031497955322265625, -0.02684783935546875, -0.022197723388671875, -0.017547607421875, -0.012897491455078125, -0.00824737548828125, -0.003597259521484375, 0.0010528564453125, 0.005702972412109375, 0.01035308837890625, 0.015003204345703125, 0.0196533203125, 0.024303436279296875, 0.02895355224609375, 0.033603668212890625, 0.0382537841796875, 0.042903900146484375, 0.04755401611328125, 0.052204132080078125, 0.056854248046875, 0.061504364013671875, 0.06615447998046875, 0.07080459594726562, 0.0754547119140625, 0.08010482788085938, 0.08475494384765625, 0.08940505981445312, 0.09405517578125, 0.09870529174804688, 0.10335540771484375, 0.10800552368164062, 0.1126556396484375, 0.11730575561523438, 0.12195587158203125, 0.12660598754882812, 0.131256103515625, 0.13590621948242188, 0.14055633544921875, 0.14520645141601562, 0.1498565673828125, 0.15450668334960938, 0.15915679931640625, 0.16380691528320312, 0.16845703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 3.0, 8.0, 14.0, 10.0, 28.0, 26.0, 48.0, 51.0, 106.0, 174.0, 170.0, 117.0, 60.0, 54.0, 27.0, 26.0, 12.0, 10.0, 7.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.601478576660156e-05, -4.463084042072296e-05, -4.324689507484436e-05, -4.186294972896576e-05, -4.047900438308716e-05, -3.909505903720856e-05, -3.7711113691329956e-05, -3.6327168345451355e-05, -3.4943222999572754e-05, -3.355927765369415e-05, -3.217533230781555e-05, -3.079138696193695e-05, -2.940744161605835e-05, -2.802349627017975e-05, -2.6639550924301147e-05, -2.5255605578422546e-05, -2.3871660232543945e-05, -2.2487714886665344e-05, -2.1103769540786743e-05, -1.9719824194908142e-05, -1.833587884902954e-05, -1.695193350315094e-05, -1.556798815727234e-05, -1.4184042811393738e-05, -1.2800097465515137e-05, -1.1416152119636536e-05, -1.0032206773757935e-05, -8.648261427879333e-06, -7.264316082000732e-06, -5.880370736122131e-06, -4.49642539024353e-06, -3.112480044364929e-06, -1.7285346984863281e-06, -3.4458935260772705e-07, 1.039355993270874e-06, 2.423301339149475e-06, 3.807246685028076e-06, 5.191192030906677e-06, 6.575137376785278e-06, 7.95908272266388e-06, 9.34302806854248e-06, 1.0726973414421082e-05, 1.2110918760299683e-05, 1.3494864106178284e-05, 1.4878809452056885e-05, 1.6262754797935486e-05, 1.7646700143814087e-05, 1.9030645489692688e-05, 2.041459083557129e-05, 2.179853618144989e-05, 2.318248152732849e-05, 2.4566426873207092e-05, 2.5950372219085693e-05, 2.7334317564964294e-05, 2.8718262910842896e-05, 3.0102208256721497e-05, 3.14861536026001e-05, 3.28700989484787e-05, 3.42540442943573e-05, 3.56379896402359e-05, 3.70219349861145e-05, 3.84058803319931e-05, 3.9789825677871704e-05, 4.1173771023750305e-05, 4.2557716369628906e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 16.0, 20.0, 35.0, 56.0, 121.0, 168.0, 449.0, 1126.0, 2721.0, 7231.0, 18793.0, 48660.0, 159540.0, 558463.0, 168911.0, 50108.0, 19670.0, 7491.0, 2900.0, 1125.0, 471.0, 205.0, 106.0, 62.0, 33.0, 36.0, 13.0, 7.0, 8.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2333984375, -0.22622108459472656, -0.21904373168945312, -0.2118663787841797, -0.20468902587890625, -0.1975116729736328, -0.19033432006835938, -0.18315696716308594, -0.1759796142578125, -0.16880226135253906, -0.16162490844726562, -0.1544475555419922, -0.14727020263671875, -0.1400928497314453, -0.13291549682617188, -0.12573814392089844, -0.118560791015625, -0.11138343811035156, -0.10420608520507812, -0.09702873229980469, -0.08985137939453125, -0.08267402648925781, -0.07549667358398438, -0.06831932067871094, -0.0611419677734375, -0.05396461486816406, -0.046787261962890625, -0.03960990905761719, -0.03243255615234375, -0.025255203247070312, -0.018077850341796875, -0.010900497436523438, -0.00372314453125, 0.0034542083740234375, 0.010631561279296875, 0.017808914184570312, 0.02498626708984375, 0.03216361999511719, 0.039340972900390625, 0.04651832580566406, 0.0536956787109375, 0.06087303161621094, 0.06805038452148438, 0.07522773742675781, 0.08240509033203125, 0.08958244323730469, 0.09675979614257812, 0.10393714904785156, 0.111114501953125, 0.11829185485839844, 0.12546920776367188, 0.1326465606689453, 0.13982391357421875, 0.1470012664794922, 0.15417861938476562, 0.16135597229003906, 0.1685333251953125, 0.17571067810058594, 0.18288803100585938, 0.1900653839111328, 0.19724273681640625, 0.2044200897216797, 0.21159744262695312, 0.21877479553222656, 0.2259521484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 9.0, 7.0, 7.0, 9.0, 13.0, 17.0, 15.0, 30.0, 35.0, 43.0, 62.0, 94.0, 107.0, 121.0, 94.0, 92.0, 44.0, 34.0, 26.0, 18.0, 15.0, 16.0, 17.0, 11.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.162109375, -0.15708160400390625, -0.1520538330078125, -0.14702606201171875, -0.141998291015625, -0.13697052001953125, -0.1319427490234375, -0.12691497802734375, -0.12188720703125, -0.11685943603515625, -0.1118316650390625, -0.10680389404296875, -0.101776123046875, -0.09674835205078125, -0.0917205810546875, -0.08669281005859375, -0.0816650390625, -0.07663726806640625, -0.0716094970703125, -0.06658172607421875, -0.061553955078125, -0.05652618408203125, -0.0514984130859375, -0.04647064208984375, -0.04144287109375, -0.03641510009765625, -0.0313873291015625, -0.02635955810546875, -0.021331787109375, -0.01630401611328125, -0.0112762451171875, -0.00624847412109375, -0.001220703125, 0.00380706787109375, 0.0088348388671875, 0.01386260986328125, 0.018890380859375, 0.02391815185546875, 0.0289459228515625, 0.03397369384765625, 0.03900146484375, 0.04402923583984375, 0.0490570068359375, 0.05408477783203125, 0.059112548828125, 0.06414031982421875, 0.0691680908203125, 0.07419586181640625, 0.0792236328125, 0.08425140380859375, 0.0892791748046875, 0.09430694580078125, 0.099334716796875, 0.10436248779296875, 0.1093902587890625, 0.11441802978515625, 0.11944580078125, 0.12447357177734375, 0.1295013427734375, 0.13452911376953125, 0.139556884765625, 0.14458465576171875, 0.1496124267578125, 0.15464019775390625, 0.15966796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 27.0, 84.0, 163.0, 282.0, 257.0, 129.0, 49.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1073641777038574, -0.9641190767288208, -0.8208739757537842, -0.6776288747787476, -0.5343837738037109, -0.3911386728286743, -0.2478935718536377, -0.10464847087860107, 0.03859663009643555, 0.18184173107147217, 0.3250868320465088, 0.4683319330215454, 0.611577033996582, 0.7548221349716187, 0.8980672359466553, 1.041312336921692, 1.1845574378967285, 1.3278025388717651, 1.4710476398468018, 1.6142927408218384, 1.757537841796875, 1.9007829427719116, 2.0440280437469482, 2.1872730255126953, 2.3305182456970215, 2.4737634658813477, 2.6170084476470947, 2.760253429412842, 2.903498649597168, 3.046743869781494, 3.189988851547241, 3.3332338333129883, 3.4764795303344727, 3.619724750518799, 3.762969732284546, 3.906214714050293, 4.049459934234619, 4.192705154418945, 4.335949897766113, 4.4791951179504395, 4.622440338134766, 4.765685558319092, 4.908930778503418, 5.052175521850586, 5.195420742034912, 5.338665962219238, 5.481910705566406, 5.625155925750732, 5.768401145935059, 5.911646366119385, 6.054891586303711, 6.198136329650879, 6.341381549835205, 6.484626770019531, 6.627871513366699, 6.771116733551025, 6.914361953735352, 7.057607173919678, 7.200852394104004, 7.344097137451172, 7.487342357635498, 7.630587577819824, 7.773832321166992, 7.917077541351318, 8.060322761535645]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 7.0, 6.0, 11.0, 13.0, 17.0, 21.0, 15.0, 9.0, 24.0, 27.0, 23.0, 21.0, 24.0, 43.0, 46.0, 36.0, 43.0, 28.0, 33.0, 38.0, 28.0, 44.0, 46.0, 40.0, 25.0, 38.0, 26.0, 40.0, 26.0, 20.0, 21.0, 23.0, 22.0, 24.0, 20.0, 6.0, 8.0, 10.0, 6.0, 8.0, 4.0, 7.0, 8.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8121540546417236, -0.783103883266449, -0.7540537118911743, -0.7250035405158997, -0.695953369140625, -0.6669031977653503, -0.6378530263900757, -0.6088029146194458, -0.5797526836395264, -0.5507025122642517, -0.521652340888977, -0.4926021695137024, -0.46355199813842773, -0.4345018267631531, -0.4054516851902008, -0.37640151381492615, -0.3473513722419739, -0.3183012008666992, -0.28925102949142456, -0.2602008581161499, -0.23115070164203644, -0.20210053026676178, -0.17305037379264832, -0.14400020241737366, -0.114950031042099, -0.08589985966682434, -0.05684969574213028, -0.027799531817436218, 0.00125063955783844, 0.030300810933113098, 0.05935096740722656, 0.08840113878250122, 0.11745131015777588, 0.14650148153305054, 0.1755516529083252, 0.20460180938243866, 0.23365198075771332, 0.26270216703414917, 0.29175230860710144, 0.3208024799823761, 0.34985265135765076, 0.3789028227329254, 0.4079529941082001, 0.43700313568115234, 0.466053307056427, 0.49510347843170166, 0.5241536498069763, 0.553203821182251, 0.5822539925575256, 0.6113041639328003, 0.640354335308075, 0.6694045066833496, 0.6984546780586243, 0.7275048494338989, 0.7565549612045288, 0.7856051921844482, 0.8146553039550781, 0.8437054753303528, 0.8727556467056274, 0.9018058180809021, 0.9308559894561768, 0.9599061608314514, 0.9889563322067261, 1.018006443977356, 1.0470566749572754]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 11.0, 14.0, 11.0, 20.0, 38.0, 52.0, 72.0, 84.0, 142.0, 222.0, 319.0, 497.0, 798.0, 1315.0, 2260.0, 4081.0, 8115.0, 16443.0, 35752.0, 85098.0, 228738.0, 840760.0, 2206996.0, 491301.0, 156436.0, 60987.0, 26436.0, 12615.0, 6436.0, 3248.0, 1828.0, 1144.0, 669.0, 434.0, 277.0, 195.0, 119.0, 110.0, 52.0, 37.0, 34.0, 24.0, 15.0, 14.0, 13.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192626953125, -0.18627357482910156, -0.17992019653320312, -0.1735668182373047, -0.16721343994140625, -0.1608600616455078, -0.15450668334960938, -0.14815330505371094, -0.1417999267578125, -0.13544654846191406, -0.12909317016601562, -0.12273979187011719, -0.11638641357421875, -0.11003303527832031, -0.10367965698242188, -0.09732627868652344, -0.090972900390625, -0.08461952209472656, -0.07826614379882812, -0.07191276550292969, -0.06555938720703125, -0.05920600891113281, -0.052852630615234375, -0.04649925231933594, -0.0401458740234375, -0.03379249572753906, -0.027439117431640625, -0.021085739135742188, -0.01473236083984375, -0.008378982543945312, -0.002025604248046875, 0.0043277740478515625, 0.01068115234375, 0.017034530639648438, 0.023387908935546875, 0.029741287231445312, 0.03609466552734375, 0.04244804382324219, 0.048801422119140625, 0.05515480041503906, 0.0615081787109375, 0.06786155700683594, 0.07421493530273438, 0.08056831359863281, 0.08692169189453125, 0.09327507019042969, 0.09962844848632812, 0.10598182678222656, 0.112335205078125, 0.11868858337402344, 0.12504196166992188, 0.1313953399658203, 0.13774871826171875, 0.1441020965576172, 0.15045547485351562, 0.15680885314941406, 0.1631622314453125, 0.16951560974121094, 0.17586898803710938, 0.1822223663330078, 0.18857574462890625, 0.1949291229248047, 0.20128250122070312, 0.20763587951660156, 0.2139892578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 8.0, 11.0, 11.0, 22.0, 26.0, 29.0, 34.0, 37.0, 48.0, 61.0, 61.0, 62.0, 66.0, 53.0, 64.0, 57.0, 59.0, 38.0, 60.0, 37.0, 37.0, 27.0, 23.0, 15.0, 9.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09636116027832031, -0.09140396118164062, -0.08644676208496094, -0.08148956298828125, -0.07653236389160156, -0.07157516479492188, -0.06661796569824219, -0.0616607666015625, -0.05670356750488281, -0.051746368408203125, -0.04678916931152344, -0.04183197021484375, -0.03687477111816406, -0.031917572021484375, -0.026960372924804688, -0.022003173828125, -0.017045974731445312, -0.012088775634765625, -0.0071315765380859375, -0.00217437744140625, 0.0027828216552734375, 0.007740020751953125, 0.012697219848632812, 0.0176544189453125, 0.022611618041992188, 0.027568817138671875, 0.03252601623535156, 0.03748321533203125, 0.04244041442871094, 0.047397613525390625, 0.05235481262207031, 0.05731201171875, 0.06226921081542969, 0.06722640991210938, 0.07218360900878906, 0.07714080810546875, 0.08209800720214844, 0.08705520629882812, 0.09201240539550781, 0.0969696044921875, 0.10192680358886719, 0.10688400268554688, 0.11184120178222656, 0.11679840087890625, 0.12175559997558594, 0.12671279907226562, 0.1316699981689453, 0.136627197265625, 0.1415843963623047, 0.14654159545898438, 0.15149879455566406, 0.15645599365234375, 0.16141319274902344, 0.16637039184570312, 0.1713275909423828, 0.1762847900390625, 0.1812419891357422, 0.18619918823242188, 0.19115638732910156, 0.19611358642578125, 0.20107078552246094, 0.20602798461914062, 0.2109851837158203, 0.2159423828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 14.0, 16.0, 24.0, 32.0, 44.0, 58.0, 81.0, 119.0, 151.0, 254.0, 397.0, 519.0, 816.0, 1334.0, 1961.0, 3466.0, 5898.0, 10932.0, 21002.0, 43153.0, 97026.0, 238522.0, 672722.0, 1842119.0, 779127.0, 267941.0, 107604.0, 48014.0, 22737.0, 11992.0, 6446.0, 3637.0, 2181.0, 1384.0, 849.0, 537.0, 354.0, 259.0, 162.0, 123.0, 74.0, 50.0, 44.0, 34.0, 17.0, 20.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2490234375, -0.240875244140625, -0.23272705078125, -0.224578857421875, -0.2164306640625, -0.208282470703125, -0.20013427734375, -0.191986083984375, -0.183837890625, -0.175689697265625, -0.16754150390625, -0.159393310546875, -0.1512451171875, -0.143096923828125, -0.13494873046875, -0.126800537109375, -0.11865234375, -0.110504150390625, -0.10235595703125, -0.094207763671875, -0.0860595703125, -0.077911376953125, -0.06976318359375, -0.061614990234375, -0.053466796875, -0.045318603515625, -0.03717041015625, -0.029022216796875, -0.0208740234375, -0.012725830078125, -0.00457763671875, 0.003570556640625, 0.01171875, 0.019866943359375, 0.02801513671875, 0.036163330078125, 0.0443115234375, 0.052459716796875, 0.06060791015625, 0.068756103515625, 0.076904296875, 0.085052490234375, 0.09320068359375, 0.101348876953125, 0.1094970703125, 0.117645263671875, 0.12579345703125, 0.133941650390625, 0.14208984375, 0.150238037109375, 0.15838623046875, 0.166534423828125, 0.1746826171875, 0.182830810546875, 0.19097900390625, 0.199127197265625, 0.207275390625, 0.215423583984375, 0.22357177734375, 0.231719970703125, 0.2398681640625, 0.248016357421875, 0.25616455078125, 0.264312744140625, 0.2724609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 5.0, 12.0, 16.0, 10.0, 15.0, 21.0, 31.0, 35.0, 41.0, 70.0, 91.0, 146.0, 177.0, 253.0, 369.0, 527.0, 655.0, 464.0, 317.0, 232.0, 173.0, 104.0, 75.0, 56.0, 48.0, 26.0, 28.0, 15.0, 12.0, 6.0, 12.0, 7.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.281005859375, -0.2732830047607422, -0.2655601501464844, -0.25783729553222656, -0.25011444091796875, -0.24239158630371094, -0.23466873168945312, -0.2269458770751953, -0.2192230224609375, -0.2115001678466797, -0.20377731323242188, -0.19605445861816406, -0.18833160400390625, -0.18060874938964844, -0.17288589477539062, -0.1651630401611328, -0.157440185546875, -0.1497173309326172, -0.14199447631835938, -0.13427162170410156, -0.12654876708984375, -0.11882591247558594, -0.11110305786132812, -0.10338020324707031, -0.0956573486328125, -0.08793449401855469, -0.08021163940429688, -0.07248878479003906, -0.06476593017578125, -0.05704307556152344, -0.049320220947265625, -0.04159736633300781, -0.03387451171875, -0.026151657104492188, -0.018428802490234375, -0.010705947875976562, -0.00298309326171875, 0.0047397613525390625, 0.012462615966796875, 0.020185470581054688, 0.0279083251953125, 0.03563117980957031, 0.043354034423828125, 0.05107688903808594, 0.05879974365234375, 0.06652259826660156, 0.07424545288085938, 0.08196830749511719, 0.089691162109375, 0.09741401672363281, 0.10513687133789062, 0.11285972595214844, 0.12058258056640625, 0.12830543518066406, 0.13602828979492188, 0.1437511444091797, 0.1514739990234375, 0.1591968536376953, 0.16691970825195312, 0.17464256286621094, 0.18236541748046875, 0.19008827209472656, 0.19781112670898438, 0.2055339813232422, 0.2132568359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 6.0, 12.0, 29.0, 34.0, 53.0, 66.0, 79.0, 84.0, 75.0, 92.0, 99.0, 78.0, 70.0, 61.0, 42.0, 31.0, 28.0, 15.0, 11.0, 11.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6479687690734863, -1.604292392730713, -1.5606160163879395, -1.5169397592544556, -1.4732633829116821, -1.4295870065689087, -1.3859106302261353, -1.3422343730926514, -1.298557996749878, -1.2548816204071045, -1.211205244064331, -1.1675289869308472, -1.1238526105880737, -1.0801762342453003, -1.0364998579025269, -0.9928235411643982, -0.9491471648216248, -0.9054707884788513, -0.8617944717407227, -0.8181180953979492, -0.7744417786598206, -0.7307654023170471, -0.6870890855789185, -0.643412709236145, -0.5997363328933716, -0.5560599565505981, -0.5123836398124695, -0.46870726346969604, -0.4250309467315674, -0.38135457038879395, -0.3376782238483429, -0.29400187730789185, -0.2503255605697632, -0.20664921402931213, -0.16297286748886108, -0.11929650604724884, -0.07562015950679779, -0.03194381296634674, 0.011732548475265503, 0.05540889501571655, 0.0990852415561676, 0.14276158809661865, 0.1864379346370697, 0.23011429607868195, 0.2737906575202942, 0.31746697425842285, 0.3611433506011963, 0.40481969714164734, 0.4484960436820984, 0.49217239022254944, 0.5358487367630005, 0.5795251131057739, 0.6232014298439026, 0.666877806186676, 0.7105541229248047, 0.7542304992675781, 0.7979068756103516, 0.841583251953125, 0.8852595686912537, 0.9289359450340271, 0.9726122617721558, 1.0162886381149292, 1.0599650144577026, 1.1036412715911865, 1.14731764793396]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 6.0, 4.0, 9.0, 12.0, 10.0, 20.0, 13.0, 24.0, 18.0, 19.0, 18.0, 31.0, 30.0, 23.0, 31.0, 45.0, 40.0, 30.0, 39.0, 36.0, 44.0, 33.0, 43.0, 47.0, 39.0, 27.0, 40.0, 30.0, 38.0, 34.0, 25.0, 14.0, 21.0, 15.0, 21.0, 22.0, 8.0, 8.0, 10.0, 5.0, 7.0, 3.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7765210270881653, -0.7536066174507141, -0.7306922674179077, -0.7077778577804565, -0.6848634481430054, -0.661949098110199, -0.6390346884727478, -0.6161203384399414, -0.5932059288024902, -0.5702915191650391, -0.5473771691322327, -0.5244627594947815, -0.5015484094619751, -0.4786339998245239, -0.45571959018707275, -0.43280521035194397, -0.4098908305168152, -0.3869764506816864, -0.3640620708465576, -0.34114766120910645, -0.31823328137397766, -0.2953189015388489, -0.2724044919013977, -0.24949011206626892, -0.22657573223114014, -0.20366135239601135, -0.18074695765972137, -0.1578325629234314, -0.1349181830883026, -0.11200379580259323, -0.08908940851688385, -0.06617501378059387, -0.04326069355010986, -0.020346306264400482, 0.002568081021308899, 0.02548246830701828, 0.04839685559272766, 0.07131124287843704, 0.09422563016414642, 0.1171400249004364, 0.14005440473556519, 0.16296878457069397, 0.18588317930698395, 0.20879757404327393, 0.2317119538784027, 0.2546263337135315, 0.27754074335098267, 0.30045512318611145, 0.32336950302124023, 0.346283882856369, 0.3691982626914978, 0.392112672328949, 0.41502705216407776, 0.43794143199920654, 0.4608558416366577, 0.4837702214717865, 0.5066846013069153, 0.5295990109443665, 0.5525133609771729, 0.575427770614624, 0.5983421802520752, 0.6212565302848816, 0.6441709399223328, 0.6670852899551392, 0.6899996995925903]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 8.0, 12.0, 8.0, 21.0, 25.0, 31.0, 77.0, 84.0, 127.0, 199.0, 293.0, 489.0, 720.0, 1196.0, 1932.0, 2936.0, 4544.0, 7317.0, 11663.0, 18671.0, 29895.0, 49802.0, 83304.0, 136979.0, 192500.0, 185137.0, 126209.0, 75451.0, 45138.0, 27466.0, 17256.0, 10505.0, 6872.0, 4277.0, 2734.0, 1666.0, 984.0, 735.0, 435.0, 293.0, 163.0, 142.0, 86.0, 58.0, 45.0, 18.0, 14.0, 15.0, 7.0, 7.0, 1.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.16943359375, -0.16395187377929688, -0.15847015380859375, -0.15298843383789062, -0.1475067138671875, -0.14202499389648438, -0.13654327392578125, -0.13106155395507812, -0.125579833984375, -0.12009811401367188, -0.11461639404296875, -0.10913467407226562, -0.1036529541015625, -0.09817123413085938, -0.09268951416015625, -0.08720779418945312, -0.08172607421875, -0.07624435424804688, -0.07076263427734375, -0.06528091430664062, -0.0597991943359375, -0.054317474365234375, -0.04883575439453125, -0.043354034423828125, -0.037872314453125, -0.032390594482421875, -0.02690887451171875, -0.021427154541015625, -0.0159454345703125, -0.010463714599609375, -0.00498199462890625, 0.000499725341796875, 0.0059814453125, 0.011463165283203125, 0.01694488525390625, 0.022426605224609375, 0.0279083251953125, 0.033390045166015625, 0.03887176513671875, 0.044353485107421875, 0.049835205078125, 0.055316925048828125, 0.06079864501953125, 0.06628036499023438, 0.0717620849609375, 0.07724380493164062, 0.08272552490234375, 0.08820724487304688, 0.09368896484375, 0.09917068481445312, 0.10465240478515625, 0.11013412475585938, 0.1156158447265625, 0.12109756469726562, 0.12657928466796875, 0.13206100463867188, 0.137542724609375, 0.14302444458007812, 0.14850616455078125, 0.15398788452148438, 0.1594696044921875, 0.16495132446289062, 0.17043304443359375, 0.17591476440429688, 0.181396484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 11.0, 10.0, 11.0, 12.0, 26.0, 24.0, 33.0, 30.0, 45.0, 37.0, 47.0, 56.0, 64.0, 55.0, 67.0, 70.0, 62.0, 44.0, 44.0, 43.0, 37.0, 45.0, 26.0, 20.0, 21.0, 19.0, 17.0, 6.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.1123952865600586, -0.10693168640136719, -0.10146808624267578, -0.09600448608398438, -0.09054088592529297, -0.08507728576660156, -0.07961368560791016, -0.07415008544921875, -0.06868648529052734, -0.06322288513183594, -0.05775928497314453, -0.052295684814453125, -0.04683208465576172, -0.04136848449707031, -0.035904884338378906, -0.0304412841796875, -0.024977684020996094, -0.019514083862304688, -0.014050483703613281, -0.008586883544921875, -0.0031232833862304688, 0.0023403167724609375, 0.007803916931152344, 0.01326751708984375, 0.018731117248535156, 0.024194717407226562, 0.02965831756591797, 0.035121917724609375, 0.04058551788330078, 0.04604911804199219, 0.051512718200683594, 0.056976318359375, 0.062439918518066406, 0.06790351867675781, 0.07336711883544922, 0.07883071899414062, 0.08429431915283203, 0.08975791931152344, 0.09522151947021484, 0.10068511962890625, 0.10614871978759766, 0.11161231994628906, 0.11707592010498047, 0.12253952026367188, 0.12800312042236328, 0.1334667205810547, 0.1389303207397461, 0.1443939208984375, 0.1498575210571289, 0.1553211212158203, 0.16078472137451172, 0.16624832153320312, 0.17171192169189453, 0.17717552185058594, 0.18263912200927734, 0.18810272216796875, 0.19356632232666016, 0.19902992248535156, 0.20449352264404297, 0.20995712280273438, 0.21542072296142578, 0.2208843231201172, 0.2263479232788086, 0.2318115234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 12.0, 12.0, 24.0, 28.0, 47.0, 70.0, 122.0, 230.0, 561.0, 1263.0, 3647.0, 10277.0, 30220.0, 99236.0, 350242.0, 386133.0, 114194.0, 34157.0, 11436.0, 3983.0, 1493.0, 565.0, 248.0, 122.0, 58.0, 45.0, 29.0, 11.0, 21.0, 13.0, 9.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.425048828125, -0.4113616943359375, -0.397674560546875, -0.3839874267578125, -0.37030029296875, -0.3566131591796875, -0.342926025390625, -0.3292388916015625, -0.3155517578125, -0.3018646240234375, -0.288177490234375, -0.2744903564453125, -0.26080322265625, -0.2471160888671875, -0.233428955078125, -0.2197418212890625, -0.2060546875, -0.1923675537109375, -0.178680419921875, -0.1649932861328125, -0.15130615234375, -0.1376190185546875, -0.123931884765625, -0.1102447509765625, -0.0965576171875, -0.0828704833984375, -0.069183349609375, -0.0554962158203125, -0.04180908203125, -0.0281219482421875, -0.014434814453125, -0.0007476806640625, 0.012939453125, 0.0266265869140625, 0.040313720703125, 0.0540008544921875, 0.06768798828125, 0.0813751220703125, 0.095062255859375, 0.1087493896484375, 0.1224365234375, 0.1361236572265625, 0.149810791015625, 0.1634979248046875, 0.17718505859375, 0.1908721923828125, 0.204559326171875, 0.2182464599609375, 0.23193359375, 0.2456207275390625, 0.259307861328125, 0.2729949951171875, 0.28668212890625, 0.3003692626953125, 0.314056396484375, 0.3277435302734375, 0.3414306640625, 0.3551177978515625, 0.368804931640625, 0.3824920654296875, 0.39617919921875, 0.4098663330078125, 0.423553466796875, 0.4372406005859375, 0.450927734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 7.0, 8.0, 9.0, 20.0, 19.0, 18.0, 17.0, 27.0, 27.0, 28.0, 41.0, 59.0, 49.0, 36.0, 47.0, 58.0, 39.0, 43.0, 38.0, 48.0, 47.0, 45.0, 37.0, 37.0, 33.0, 36.0, 24.0, 17.0, 13.0, 12.0, 4.0, 6.0, 2.0, 7.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.431396484375, -0.4179801940917969, -0.40456390380859375, -0.3911476135253906, -0.3777313232421875, -0.3643150329589844, -0.35089874267578125, -0.3374824523925781, -0.324066162109375, -0.3106498718261719, -0.29723358154296875, -0.2838172912597656, -0.2704010009765625, -0.2569847106933594, -0.24356842041015625, -0.23015213012695312, -0.21673583984375, -0.20331954956054688, -0.18990325927734375, -0.17648696899414062, -0.1630706787109375, -0.14965438842773438, -0.13623809814453125, -0.12282180786132812, -0.109405517578125, -0.09598922729492188, -0.08257293701171875, -0.06915664672851562, -0.0557403564453125, -0.042324066162109375, -0.02890777587890625, -0.015491485595703125, -0.0020751953125, 0.011341094970703125, 0.02475738525390625, 0.038173675537109375, 0.0515899658203125, 0.06500625610351562, 0.07842254638671875, 0.09183883666992188, 0.105255126953125, 0.11867141723632812, 0.13208770751953125, 0.14550399780273438, 0.1589202880859375, 0.17233657836914062, 0.18575286865234375, 0.19916915893554688, 0.21258544921875, 0.22600173950195312, 0.23941802978515625, 0.2528343200683594, 0.2662506103515625, 0.2796669006347656, 0.29308319091796875, 0.3064994812011719, 0.319915771484375, 0.3333320617675781, 0.34674835205078125, 0.3601646423339844, 0.3735809326171875, 0.3869972229003906, 0.40041351318359375, 0.4138298034667969, 0.42724609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 11.0, 12.0, 19.0, 21.0, 39.0, 44.0, 69.0, 105.0, 146.0, 288.0, 416.0, 788.0, 1425.0, 2600.0, 5169.0, 10262.0, 21629.0, 47171.0, 110137.0, 312352.0, 325625.0, 116226.0, 49385.0, 22500.0, 10638.0, 5262.0, 2646.0, 1529.0, 792.0, 451.0, 279.0, 171.0, 119.0, 65.0, 47.0, 32.0, 27.0, 20.0, 13.0, 4.0, 1.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15883445739746094, -0.15336227416992188, -0.1478900909423828, -0.14241790771484375, -0.1369457244873047, -0.13147354125976562, -0.12600135803222656, -0.1205291748046875, -0.11505699157714844, -0.10958480834960938, -0.10411262512207031, -0.09864044189453125, -0.09316825866699219, -0.08769607543945312, -0.08222389221191406, -0.076751708984375, -0.07127952575683594, -0.06580734252929688, -0.06033515930175781, -0.05486297607421875, -0.04939079284667969, -0.043918609619140625, -0.03844642639160156, -0.0329742431640625, -0.027502059936523438, -0.022029876708984375, -0.016557693481445312, -0.01108551025390625, -0.0056133270263671875, -0.000141143798828125, 0.0053310394287109375, 0.01080322265625, 0.016275405883789062, 0.021747589111328125, 0.027219772338867188, 0.03269195556640625, 0.03816413879394531, 0.043636322021484375, 0.04910850524902344, 0.0545806884765625, 0.06005287170410156, 0.06552505493164062, 0.07099723815917969, 0.07646942138671875, 0.08194160461425781, 0.08741378784179688, 0.09288597106933594, 0.098358154296875, 0.10383033752441406, 0.10930252075195312, 0.11477470397949219, 0.12024688720703125, 0.1257190704345703, 0.13119125366210938, 0.13666343688964844, 0.1421356201171875, 0.14760780334472656, 0.15307998657226562, 0.1585521697998047, 0.16402435302734375, 0.1694965362548828, 0.17496871948242188, 0.18044090270996094, 0.1859130859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 16.0, 15.0, 15.0, 25.0, 38.0, 54.0, 99.0, 145.0, 203.0, 153.0, 64.0, 49.0, 35.0, 33.0, 16.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0187110900878906e-05, -4.820898175239563e-05, -4.6230852603912354e-05, -4.425272345542908e-05, -4.22745943069458e-05, -4.0296465158462524e-05, -3.831833600997925e-05, -3.634020686149597e-05, -3.4362077713012695e-05, -3.238394856452942e-05, -3.0405819416046143e-05, -2.8427690267562866e-05, -2.644956111907959e-05, -2.4471431970596313e-05, -2.2493302822113037e-05, -2.051517367362976e-05, -1.8537044525146484e-05, -1.6558915376663208e-05, -1.4580786228179932e-05, -1.2602657079696655e-05, -1.0624527931213379e-05, -8.646398782730103e-06, -6.668269634246826e-06, -4.69014048576355e-06, -2.7120113372802734e-06, -7.338821887969971e-07, 1.2442469596862793e-06, 3.2223761081695557e-06, 5.200505256652832e-06, 7.178634405136108e-06, 9.156763553619385e-06, 1.1134892702102661e-05, 1.3113021850585938e-05, 1.5091150999069214e-05, 1.706928014755249e-05, 1.9047409296035767e-05, 2.1025538444519043e-05, 2.300366759300232e-05, 2.4981796741485596e-05, 2.6959925889968872e-05, 2.893805503845215e-05, 3.0916184186935425e-05, 3.28943133354187e-05, 3.487244248390198e-05, 3.6850571632385254e-05, 3.882870078086853e-05, 4.080682992935181e-05, 4.278495907783508e-05, 4.476308822631836e-05, 4.6741217374801636e-05, 4.871934652328491e-05, 5.069747567176819e-05, 5.2675604820251465e-05, 5.465373396873474e-05, 5.663186311721802e-05, 5.8609992265701294e-05, 6.058812141418457e-05, 6.256625056266785e-05, 6.454437971115112e-05, 6.65225088596344e-05, 6.850063800811768e-05, 7.047876715660095e-05, 7.245689630508423e-05, 7.44350254535675e-05, 7.641315460205078e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 15.0, 9.0, 28.0, 40.0, 37.0, 73.0, 127.0, 185.0, 310.0, 508.0, 983.0, 1972.0, 4536.0, 11369.0, 31597.0, 93028.0, 375199.0, 380796.0, 95111.0, 32235.0, 11679.0, 4653.0, 1916.0, 920.0, 466.0, 245.0, 166.0, 122.0, 76.0, 39.0, 40.0, 24.0, 13.0, 7.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.287353515625, -0.2795886993408203, -0.2718238830566406, -0.26405906677246094, -0.25629425048828125, -0.24852943420410156, -0.24076461791992188, -0.2329998016357422, -0.2252349853515625, -0.2174701690673828, -0.20970535278320312, -0.20194053649902344, -0.19417572021484375, -0.18641090393066406, -0.17864608764648438, -0.1708812713623047, -0.163116455078125, -0.1553516387939453, -0.14758682250976562, -0.13982200622558594, -0.13205718994140625, -0.12429237365722656, -0.11652755737304688, -0.10876274108886719, -0.1009979248046875, -0.09323310852050781, -0.08546829223632812, -0.07770347595214844, -0.06993865966796875, -0.06217384338378906, -0.054409027099609375, -0.04664421081542969, -0.03887939453125, -0.031114578247070312, -0.023349761962890625, -0.015584945678710938, -0.00782012939453125, -5.53131103515625e-05, 0.007709503173828125, 0.015474319458007812, 0.0232391357421875, 0.031003952026367188, 0.038768768310546875, 0.04653358459472656, 0.05429840087890625, 0.06206321716308594, 0.06982803344726562, 0.07759284973144531, 0.085357666015625, 0.09312248229980469, 0.10088729858398438, 0.10865211486816406, 0.11641693115234375, 0.12418174743652344, 0.13194656372070312, 0.1397113800048828, 0.1474761962890625, 0.1552410125732422, 0.16300582885742188, 0.17077064514160156, 0.17853546142578125, 0.18630027770996094, 0.19406509399414062, 0.2018299102783203, 0.2095947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 10.0, 17.0, 18.0, 25.0, 37.0, 64.0, 126.0, 162.0, 190.0, 109.0, 71.0, 41.0, 28.0, 22.0, 18.0, 19.0, 5.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.23785781860351562, -0.22937774658203125, -0.22089767456054688, -0.2124176025390625, -0.20393753051757812, -0.19545745849609375, -0.18697738647460938, -0.178497314453125, -0.17001724243164062, -0.16153717041015625, -0.15305709838867188, -0.1445770263671875, -0.13609695434570312, -0.12761688232421875, -0.11913681030273438, -0.11065673828125, -0.10217666625976562, -0.09369659423828125, -0.08521652221679688, -0.0767364501953125, -0.06825637817382812, -0.05977630615234375, -0.051296234130859375, -0.042816162109375, -0.034336090087890625, -0.02585601806640625, -0.017375946044921875, -0.0088958740234375, -0.000415802001953125, 0.00806427001953125, 0.016544342041015625, 0.0250244140625, 0.033504486083984375, 0.04198455810546875, 0.050464630126953125, 0.0589447021484375, 0.06742477416992188, 0.07590484619140625, 0.08438491821289062, 0.092864990234375, 0.10134506225585938, 0.10982513427734375, 0.11830520629882812, 0.1267852783203125, 0.13526535034179688, 0.14374542236328125, 0.15222549438476562, 0.16070556640625, 0.16918563842773438, 0.17766571044921875, 0.18614578247070312, 0.1946258544921875, 0.20310592651367188, 0.21158599853515625, 0.22006607055664062, 0.228546142578125, 0.23702621459960938, 0.24550628662109375, 0.2539863586425781, 0.2624664306640625, 0.2709465026855469, 0.27942657470703125, 0.2879066467285156, 0.29638671875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 45.0, 266.0, 482.0, 193.0, 24.0, 2.0, 1.0], "bins": [-16.446990966796875, -16.1691837310791, -15.891377449035645, -15.613570213317871, -15.335763931274414, -15.05795669555664, -14.780150413513184, -14.50234317779541, -14.224536895751953, -13.94672966003418, -13.668923377990723, -13.39111614227295, -13.113309860229492, -12.835502624511719, -12.557696342468262, -12.279889106750488, -12.002082824707031, -11.724275588989258, -11.4464693069458, -11.168662071228027, -10.89085578918457, -10.613048553466797, -10.33524227142334, -10.057435035705566, -9.779627799987793, -9.50182056427002, -9.224014282226562, -8.946207046508789, -8.668400764465332, -8.390593528747559, -8.112787246704102, -7.834980010986328, -7.557173728942871, -7.279366970062256, -7.001560211181641, -6.723753452301025, -6.44594669342041, -6.168139934539795, -5.89033317565918, -5.612525939941406, -5.334719181060791, -5.056912422180176, -4.7791056632995605, -4.501298904418945, -4.22349214553833, -3.945685386657715, -3.6678783893585205, -3.3900716304779053, -3.112265110015869, -2.834458351135254, -2.5566515922546387, -2.2788448333740234, -2.001038074493408, -1.7232311964035034, -1.4454243183135986, -1.1676175594329834, -0.8898106813430786, -0.6120039224624634, -0.33419710397720337, -0.05639028549194336, 0.22141647338867188, 0.4992232322692871, 0.7770301103591919, 1.0548368692398071, 1.3326436281204224]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 14.0, 6.0, 5.0, 9.0, 24.0, 15.0, 28.0, 32.0, 28.0, 34.0, 33.0, 37.0, 38.0, 42.0, 53.0, 63.0, 67.0, 51.0, 44.0, 63.0, 54.0, 43.0, 31.0, 37.0, 29.0, 31.0, 23.0, 17.0, 11.0, 11.0, 10.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.956747829914093, -0.9150879979133606, -0.873428225517273, -0.8317683935165405, -0.7901085615158081, -0.7484487295150757, -0.706788957118988, -0.6651291251182556, -0.623469352722168, -0.5818095207214355, -0.5401497483253479, -0.4984899163246155, -0.45683008432388306, -0.415170282125473, -0.373510479927063, -0.33185064792633057, -0.29019081592559814, -0.24853099882602692, -0.2068711817264557, -0.16521137952804565, -0.12355156242847443, -0.0818917453289032, -0.040231943130493164, 0.0014278888702392578, 0.04308769106864929, 0.08474750816822052, 0.12640732526779175, 0.16806712746620178, 0.209726944565773, 0.25138676166534424, 0.2930465638637543, 0.3347063958644867, 0.3763662576675415, 0.41802605986595154, 0.45968589186668396, 0.501345694065094, 0.5430055260658264, 0.5846652984619141, 0.6263251304626465, 0.6679849624633789, 0.7096447944641113, 0.7513046264648438, 0.7929643988609314, 0.8346242308616638, 0.8762840628623962, 0.9179438352584839, 0.9596036672592163, 1.0012634992599487, 1.0429232120513916, 1.084583044052124, 1.1262428760528564, 1.1679027080535889, 1.2095624208450317, 1.2512222528457642, 1.2928820848464966, 1.334541916847229, 1.3762017488479614, 1.4178615808486938, 1.4595214128494263, 1.5011811256408691, 1.5428409576416016, 1.584500789642334, 1.6261606216430664, 1.6678204536437988, 1.7094802856445312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 3.0, 9.0, 15.0, 14.0, 17.0, 19.0, 40.0, 58.0, 67.0, 113.0, 158.0, 214.0, 345.0, 580.0, 843.0, 1438.0, 2437.0, 4595.0, 9366.0, 19759.0, 46586.0, 122861.0, 399964.0, 1914837.0, 1238912.0, 273725.0, 90886.0, 35022.0, 15005.0, 7262.0, 3700.0, 2082.0, 1229.0, 697.0, 462.0, 294.0, 217.0, 136.0, 109.0, 63.0, 39.0, 26.0, 26.0, 9.0, 12.0, 12.0, 4.0, 4.0, 4.0, 1.0, 2.0, 6.0], "bins": [-0.290283203125, -0.28218650817871094, -0.2740898132324219, -0.2659931182861328, -0.25789642333984375, -0.2497997283935547, -0.24170303344726562, -0.23360633850097656, -0.2255096435546875, -0.21741294860839844, -0.20931625366210938, -0.2012195587158203, -0.19312286376953125, -0.1850261688232422, -0.17692947387695312, -0.16883277893066406, -0.160736083984375, -0.15263938903808594, -0.14454269409179688, -0.1364459991455078, -0.12834930419921875, -0.12025260925292969, -0.11215591430664062, -0.10405921936035156, -0.0959625244140625, -0.08786582946777344, -0.07976913452148438, -0.07167243957519531, -0.06357574462890625, -0.05547904968261719, -0.047382354736328125, -0.03928565979003906, -0.03118896484375, -0.023092269897460938, -0.014995574951171875, -0.0068988800048828125, 0.00119781494140625, 0.009294509887695312, 0.017391204833984375, 0.025487899780273438, 0.0335845947265625, 0.04168128967285156, 0.049777984619140625, 0.05787467956542969, 0.06597137451171875, 0.07406806945800781, 0.08216476440429688, 0.09026145935058594, 0.098358154296875, 0.10645484924316406, 0.11455154418945312, 0.12264823913574219, 0.13074493408203125, 0.1388416290283203, 0.14693832397460938, 0.15503501892089844, 0.1631317138671875, 0.17122840881347656, 0.17932510375976562, 0.1874217987060547, 0.19551849365234375, 0.2036151885986328, 0.21171188354492188, 0.21980857849121094, 0.2279052734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 13.0, 13.0, 14.0, 11.0, 24.0, 29.0, 27.0, 22.0, 44.0, 28.0, 49.0, 38.0, 47.0, 39.0, 38.0, 63.0, 62.0, 57.0, 43.0, 36.0, 44.0, 39.0, 49.0, 28.0, 25.0, 24.0, 17.0, 15.0, 16.0, 9.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10968017578125, -0.10486888885498047, -0.10005760192871094, -0.0952463150024414, -0.09043502807617188, -0.08562374114990234, -0.08081245422363281, -0.07600116729736328, -0.07118988037109375, -0.06637859344482422, -0.06156730651855469, -0.056756019592285156, -0.051944732666015625, -0.047133445739746094, -0.04232215881347656, -0.03751087188720703, -0.0326995849609375, -0.02788829803466797, -0.023077011108398438, -0.018265724182128906, -0.013454437255859375, -0.008643150329589844, -0.0038318634033203125, 0.0009794235229492188, 0.00579071044921875, 0.010601997375488281, 0.015413284301757812, 0.020224571228027344, 0.025035858154296875, 0.029847145080566406, 0.03465843200683594, 0.03946971893310547, 0.044281005859375, 0.04909229278564453, 0.05390357971191406, 0.058714866638183594, 0.06352615356445312, 0.06833744049072266, 0.07314872741699219, 0.07796001434326172, 0.08277130126953125, 0.08758258819580078, 0.09239387512207031, 0.09720516204833984, 0.10201644897460938, 0.1068277359008789, 0.11163902282714844, 0.11645030975341797, 0.1212615966796875, 0.12607288360595703, 0.13088417053222656, 0.1356954574584961, 0.14050674438476562, 0.14531803131103516, 0.1501293182373047, 0.15494060516357422, 0.15975189208984375, 0.16456317901611328, 0.1693744659423828, 0.17418575286865234, 0.17899703979492188, 0.1838083267211914, 0.18861961364746094, 0.19343090057373047, 0.1982421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 13.0, 21.0, 18.0, 34.0, 57.0, 73.0, 103.0, 172.0, 243.0, 379.0, 605.0, 940.0, 1576.0, 2720.0, 4943.0, 8935.0, 18084.0, 39448.0, 95700.0, 261971.0, 904187.0, 1954870.0, 579441.0, 186499.0, 70912.0, 30744.0, 14455.0, 7356.0, 3948.0, 2218.0, 1324.0, 829.0, 522.0, 325.0, 225.0, 150.0, 86.0, 58.0, 35.0, 24.0, 13.0, 9.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.3072547912597656, -0.29712677001953125, -0.2869987487792969, -0.2768707275390625, -0.2667427062988281, -0.25661468505859375, -0.24648666381835938, -0.236358642578125, -0.22623062133789062, -0.21610260009765625, -0.20597457885742188, -0.1958465576171875, -0.18571853637695312, -0.17559051513671875, -0.16546249389648438, -0.15533447265625, -0.14520645141601562, -0.13507843017578125, -0.12495040893554688, -0.1148223876953125, -0.10469436645507812, -0.09456634521484375, -0.08443832397460938, -0.074310302734375, -0.06418228149414062, -0.05405426025390625, -0.043926239013671875, -0.0337982177734375, -0.023670196533203125, -0.01354217529296875, -0.003414154052734375, 0.0067138671875, 0.016841888427734375, 0.02696990966796875, 0.037097930908203125, 0.0472259521484375, 0.057353973388671875, 0.06748199462890625, 0.07761001586914062, 0.087738037109375, 0.09786605834960938, 0.10799407958984375, 0.11812210083007812, 0.1282501220703125, 0.13837814331054688, 0.14850616455078125, 0.15863418579101562, 0.16876220703125, 0.17889022827148438, 0.18901824951171875, 0.19914627075195312, 0.2092742919921875, 0.21940231323242188, 0.22953033447265625, 0.23965835571289062, 0.249786376953125, 0.2599143981933594, 0.27004241943359375, 0.2801704406738281, 0.2902984619140625, 0.3004264831542969, 0.31055450439453125, 0.3206825256347656, 0.330810546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 13.0, 10.0, 8.0, 15.0, 11.0, 22.0, 29.0, 39.0, 60.0, 85.0, 110.0, 166.0, 237.0, 360.0, 563.0, 745.0, 543.0, 330.0, 221.0, 158.0, 99.0, 73.0, 58.0, 35.0, 20.0, 13.0, 10.0, 8.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34033203125, -0.3283576965332031, -0.31638336181640625, -0.3044090270996094, -0.2924346923828125, -0.2804603576660156, -0.26848602294921875, -0.2565116882324219, -0.244537353515625, -0.23256301879882812, -0.22058868408203125, -0.20861434936523438, -0.1966400146484375, -0.18466567993164062, -0.17269134521484375, -0.16071701049804688, -0.14874267578125, -0.13676834106445312, -0.12479400634765625, -0.11281967163085938, -0.1008453369140625, -0.08887100219726562, -0.07689666748046875, -0.06492233276367188, -0.052947998046875, -0.040973663330078125, -0.02899932861328125, -0.017024993896484375, -0.0050506591796875, 0.006923675537109375, 0.01889801025390625, 0.030872344970703125, 0.0428466796875, 0.054821014404296875, 0.06679534912109375, 0.07876968383789062, 0.0907440185546875, 0.10271835327148438, 0.11469268798828125, 0.12666702270507812, 0.138641357421875, 0.15061569213867188, 0.16259002685546875, 0.17456436157226562, 0.1865386962890625, 0.19851303100585938, 0.21048736572265625, 0.22246170043945312, 0.23443603515625, 0.24641036987304688, 0.25838470458984375, 0.2703590393066406, 0.2823333740234375, 0.2943077087402344, 0.30628204345703125, 0.3182563781738281, 0.330230712890625, 0.3422050476074219, 0.35417938232421875, 0.3661537170410156, 0.3781280517578125, 0.3901023864746094, 0.40207672119140625, 0.4140510559082031, 0.426025390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 6.0, 7.0, 10.0, 16.0, 20.0, 38.0, 38.0, 54.0, 62.0, 74.0, 99.0, 99.0, 80.0, 87.0, 71.0, 61.0, 48.0, 29.0, 28.0, 19.0, 18.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4691505432128906, -1.4128050804138184, -1.3564597368240356, -1.3001142740249634, -1.2437689304351807, -1.1874234676361084, -1.1310780048370361, -1.0747326612472534, -1.0183873176574707, -0.9620419144630432, -0.9056965112686157, -0.8493510484695435, -0.7930057048797607, -0.7366602420806885, -0.680314838886261, -0.6239694356918335, -0.5676239728927612, -0.5112785696983337, -0.45493316650390625, -0.39858773350715637, -0.3422423303127289, -0.2858969271183014, -0.2295514941215515, -0.17320609092712402, -0.11686068773269653, -0.060515277087688446, -0.004169866442680359, 0.052175551652908325, 0.10852095484733582, 0.1648663580417633, 0.22121179103851318, 0.2775571942329407, 0.33390259742736816, 0.39024800062179565, 0.44659340381622314, 0.5029388666152954, 0.5592842102050781, 0.6156296730041504, 0.6719750761985779, 0.7283204793930054, 0.7846658825874329, 0.8410112857818604, 0.8973566889762878, 0.9537020921707153, 1.0100475549697876, 1.0663928985595703, 1.1227383613586426, 1.1790838241577148, 1.2354291677474976, 1.2917746305465698, 1.3481199741363525, 1.4044654369354248, 1.4608107805252075, 1.5171562433242798, 1.5735015869140625, 1.6298470497131348, 1.686192512512207, 1.7425379753112793, 1.798883318901062, 1.8552287817001343, 1.911574125289917, 1.9679195880889893, 2.0242650508880615, 2.0806102752685547, 2.136955738067627]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 8.0, 10.0, 15.0, 9.0, 8.0, 13.0, 16.0, 18.0, 13.0, 28.0, 25.0, 23.0, 30.0, 40.0, 46.0, 41.0, 42.0, 41.0, 38.0, 48.0, 29.0, 40.0, 32.0, 39.0, 40.0, 31.0, 30.0, 25.0, 23.0, 37.0, 26.0, 17.0, 14.0, 13.0, 17.0, 12.0, 13.0, 10.0, 9.0, 5.0, 9.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0113821029663086, -0.9774859547615051, -0.9435898661613464, -0.909693717956543, -0.8757976293563843, -0.8419014811515808, -0.8080053329467773, -0.7741092443466187, -0.7402130961418152, -0.7063169479370117, -0.672420859336853, -0.6385247111320496, -0.6046285629272461, -0.5707324743270874, -0.5368363261222839, -0.5029401779174805, -0.4690440893173218, -0.4351479709148407, -0.4012518525123596, -0.36735570430755615, -0.3334595859050751, -0.299563467502594, -0.2656673192977905, -0.23177120089530945, -0.19787508249282837, -0.1639789640903473, -0.13008283078670502, -0.09618670493364334, -0.062290579080581665, -0.028394460678100586, 0.005501672625541687, 0.03939780592918396, 0.07329380512237549, 0.10718993097543716, 0.14108605682849884, 0.1749821901321411, 0.2088783085346222, 0.24277442693710327, 0.27667057514190674, 0.3105666935443878, 0.3444628119468689, 0.37835893034935, 0.41225504875183105, 0.4461511969566345, 0.4800473153591156, 0.5139434337615967, 0.5478395819664001, 0.5817357301712036, 0.6156318187713623, 0.6495279669761658, 0.6834240555763245, 0.7173202037811279, 0.7512162923812866, 0.7851124405860901, 0.8190085887908936, 0.8529046773910522, 0.8868008255958557, 0.9206969738006592, 0.9545930624008179, 0.9884892106056213, 1.0223853588104248, 1.0562814474105835, 1.0901775360107422, 1.1240737438201904, 1.1579698324203491]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 12.0, 17.0, 33.0, 48.0, 74.0, 123.0, 195.0, 342.0, 514.0, 768.0, 1303.0, 2020.0, 3343.0, 5304.0, 8951.0, 14898.0, 24758.0, 42582.0, 74987.0, 134257.0, 224607.0, 216027.0, 124478.0, 69838.0, 39841.0, 23395.0, 13794.0, 8434.0, 5176.0, 3241.0, 2025.0, 1179.0, 725.0, 472.0, 290.0, 178.0, 116.0, 70.0, 43.0, 36.0, 24.0, 11.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2555732727050781, -0.24674224853515625, -0.23791122436523438, -0.2290802001953125, -0.22024917602539062, -0.21141815185546875, -0.20258712768554688, -0.193756103515625, -0.18492507934570312, -0.17609405517578125, -0.16726303100585938, -0.1584320068359375, -0.14960098266601562, -0.14076995849609375, -0.13193893432617188, -0.12310791015625, -0.11427688598632812, -0.10544586181640625, -0.09661483764648438, -0.0877838134765625, -0.07895278930664062, -0.07012176513671875, -0.061290740966796875, -0.052459716796875, -0.043628692626953125, -0.03479766845703125, -0.025966644287109375, -0.0171356201171875, -0.008304595947265625, 0.00052642822265625, 0.009357452392578125, 0.0181884765625, 0.027019500732421875, 0.03585052490234375, 0.044681549072265625, 0.0535125732421875, 0.062343597412109375, 0.07117462158203125, 0.08000564575195312, 0.088836669921875, 0.09766769409179688, 0.10649871826171875, 0.11532974243164062, 0.1241607666015625, 0.13299179077148438, 0.14182281494140625, 0.15065383911132812, 0.15948486328125, 0.16831588745117188, 0.17714691162109375, 0.18597793579101562, 0.1948089599609375, 0.20363998413085938, 0.21247100830078125, 0.22130203247070312, 0.230133056640625, 0.23896408081054688, 0.24779510498046875, 0.2566261291503906, 0.2654571533203125, 0.2742881774902344, 0.28311920166015625, 0.2919502258300781, 0.30078125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 2.0, 10.0, 12.0, 9.0, 20.0, 21.0, 22.0, 30.0, 34.0, 33.0, 30.0, 35.0, 38.0, 36.0, 43.0, 65.0, 58.0, 47.0, 55.0, 55.0, 47.0, 43.0, 35.0, 34.0, 29.0, 45.0, 26.0, 12.0, 19.0, 12.0, 15.0, 10.0, 3.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.13978004455566406, -0.13417434692382812, -0.1285686492919922, -0.12296295166015625, -0.11735725402832031, -0.11175155639648438, -0.10614585876464844, -0.1005401611328125, -0.09493446350097656, -0.08932876586914062, -0.08372306823730469, -0.07811737060546875, -0.07251167297363281, -0.06690597534179688, -0.06130027770996094, -0.055694580078125, -0.05008888244628906, -0.044483184814453125, -0.03887748718261719, -0.03327178955078125, -0.027666091918945312, -0.022060394287109375, -0.016454696655273438, -0.0108489990234375, -0.0052433013916015625, 0.000362396240234375, 0.0059680938720703125, 0.01157379150390625, 0.017179489135742188, 0.022785186767578125, 0.028390884399414062, 0.03399658203125, 0.03960227966308594, 0.045207977294921875, 0.05081367492675781, 0.05641937255859375, 0.06202507019042969, 0.06763076782226562, 0.07323646545410156, 0.0788421630859375, 0.08444786071777344, 0.09005355834960938, 0.09565925598144531, 0.10126495361328125, 0.10687065124511719, 0.11247634887695312, 0.11808204650878906, 0.123687744140625, 0.12929344177246094, 0.13489913940429688, 0.1405048370361328, 0.14611053466796875, 0.1517162322998047, 0.15732192993164062, 0.16292762756347656, 0.1685333251953125, 0.17413902282714844, 0.17974472045898438, 0.1853504180908203, 0.19095611572265625, 0.1965618133544922, 0.20216751098632812, 0.20777320861816406, 0.21337890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 1.0, 2.0, 10.0, 5.0, 9.0, 15.0, 9.0, 26.0, 34.0, 47.0, 61.0, 99.0, 164.0, 291.0, 534.0, 1105.0, 2192.0, 4787.0, 10175.0, 22268.0, 50259.0, 117993.0, 283950.0, 314697.0, 136008.0, 56607.0, 25328.0, 11459.0, 5237.0, 2495.0, 1176.0, 604.0, 336.0, 194.0, 112.0, 81.0, 49.0, 29.0, 20.0, 14.0, 15.0, 13.0, 8.0, 8.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.415771484375, -0.401947021484375, -0.38812255859375, -0.374298095703125, -0.3604736328125, -0.346649169921875, -0.33282470703125, -0.319000244140625, -0.30517578125, -0.291351318359375, -0.27752685546875, -0.263702392578125, -0.2498779296875, -0.236053466796875, -0.22222900390625, -0.208404541015625, -0.194580078125, -0.180755615234375, -0.16693115234375, -0.153106689453125, -0.1392822265625, -0.125457763671875, -0.11163330078125, -0.097808837890625, -0.083984375, -0.070159912109375, -0.05633544921875, -0.042510986328125, -0.0286865234375, -0.014862060546875, -0.00103759765625, 0.012786865234375, 0.026611328125, 0.040435791015625, 0.05426025390625, 0.068084716796875, 0.0819091796875, 0.095733642578125, 0.10955810546875, 0.123382568359375, 0.13720703125, 0.151031494140625, 0.16485595703125, 0.178680419921875, 0.1925048828125, 0.206329345703125, 0.22015380859375, 0.233978271484375, 0.247802734375, 0.261627197265625, 0.27545166015625, 0.289276123046875, 0.3031005859375, 0.316925048828125, 0.33074951171875, 0.344573974609375, 0.3583984375, 0.372222900390625, 0.38604736328125, 0.399871826171875, 0.4136962890625, 0.427520751953125, 0.44134521484375, 0.455169677734375, 0.468994140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 7.0, 9.0, 15.0, 17.0, 21.0, 14.0, 27.0, 26.0, 32.0, 40.0, 32.0, 33.0, 40.0, 39.0, 50.0, 60.0, 55.0, 44.0, 44.0, 38.0, 45.0, 32.0, 29.0, 29.0, 35.0, 29.0, 22.0, 15.0, 23.0, 19.0, 13.0, 12.0, 12.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5439453125, -0.5272445678710938, -0.5105438232421875, -0.49384307861328125, -0.477142333984375, -0.46044158935546875, -0.4437408447265625, -0.42704010009765625, -0.41033935546875, -0.39363861083984375, -0.3769378662109375, -0.36023712158203125, -0.343536376953125, -0.32683563232421875, -0.3101348876953125, -0.29343414306640625, -0.2767333984375, -0.26003265380859375, -0.2433319091796875, -0.22663116455078125, -0.209930419921875, -0.19322967529296875, -0.1765289306640625, -0.15982818603515625, -0.14312744140625, -0.12642669677734375, -0.1097259521484375, -0.09302520751953125, -0.076324462890625, -0.05962371826171875, -0.0429229736328125, -0.02622222900390625, -0.009521484375, 0.00717926025390625, 0.0238800048828125, 0.04058074951171875, 0.057281494140625, 0.07398223876953125, 0.0906829833984375, 0.10738372802734375, 0.12408447265625, 0.14078521728515625, 0.1574859619140625, 0.17418670654296875, 0.190887451171875, 0.20758819580078125, 0.2242889404296875, 0.24098968505859375, 0.2576904296875, 0.27439117431640625, 0.2910919189453125, 0.30779266357421875, 0.324493408203125, 0.34119415283203125, 0.3578948974609375, 0.37459564208984375, 0.39129638671875, 0.40799713134765625, 0.4246978759765625, 0.44139862060546875, 0.458099365234375, 0.47480010986328125, 0.4915008544921875, 0.5082015991210938, 0.52490234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 6.0, 9.0, 10.0, 31.0, 38.0, 66.0, 111.0, 162.0, 229.0, 386.0, 563.0, 1023.0, 1911.0, 3710.0, 7888.0, 17758.0, 41561.0, 107422.0, 307035.0, 349077.0, 123939.0, 47634.0, 19858.0, 8990.0, 4180.0, 2057.0, 1141.0, 659.0, 415.0, 249.0, 147.0, 104.0, 68.0, 41.0, 27.0, 17.0, 7.0, 2.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2432861328125, -0.2357006072998047, -0.22811508178710938, -0.22052955627441406, -0.21294403076171875, -0.20535850524902344, -0.19777297973632812, -0.1901874542236328, -0.1826019287109375, -0.1750164031982422, -0.16743087768554688, -0.15984535217285156, -0.15225982666015625, -0.14467430114746094, -0.13708877563476562, -0.1295032501220703, -0.121917724609375, -0.11433219909667969, -0.10674667358398438, -0.09916114807128906, -0.09157562255859375, -0.08399009704589844, -0.07640457153320312, -0.06881904602050781, -0.0612335205078125, -0.05364799499511719, -0.046062469482421875, -0.03847694396972656, -0.03089141845703125, -0.023305892944335938, -0.015720367431640625, -0.008134841918945312, -0.00054931640625, 0.0070362091064453125, 0.014621734619140625, 0.022207260131835938, 0.02979278564453125, 0.03737831115722656, 0.044963836669921875, 0.05254936218261719, 0.0601348876953125, 0.06772041320800781, 0.07530593872070312, 0.08289146423339844, 0.09047698974609375, 0.09806251525878906, 0.10564804077148438, 0.11323356628417969, 0.120819091796875, 0.1284046173095703, 0.13599014282226562, 0.14357566833496094, 0.15116119384765625, 0.15874671936035156, 0.16633224487304688, 0.1739177703857422, 0.1815032958984375, 0.1890888214111328, 0.19667434692382812, 0.20425987243652344, 0.21184539794921875, 0.21943092346191406, 0.22701644897460938, 0.2346019744873047, 0.2421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 13.0, 8.0, 16.0, 13.0, 17.0, 14.0, 27.0, 20.0, 32.0, 46.0, 57.0, 93.0, 106.0, 97.0, 84.0, 56.0, 47.0, 38.0, 32.0, 21.0, 25.0, 21.0, 13.0, 15.0, 13.0, 7.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.684925079345703e-05, -4.543270915746689e-05, -4.4016167521476746e-05, -4.25996258854866e-05, -4.118308424949646e-05, -3.976654261350632e-05, -3.8350000977516174e-05, -3.693345934152603e-05, -3.551691770553589e-05, -3.4100376069545746e-05, -3.26838344335556e-05, -3.126729279756546e-05, -2.9850751161575317e-05, -2.8434209525585175e-05, -2.7017667889595032e-05, -2.560112625360489e-05, -2.4184584617614746e-05, -2.2768042981624603e-05, -2.135150134563446e-05, -1.9934959709644318e-05, -1.8518418073654175e-05, -1.7101876437664032e-05, -1.568533480167389e-05, -1.4268793165683746e-05, -1.2852251529693604e-05, -1.143570989370346e-05, -1.0019168257713318e-05, -8.602626621723175e-06, -7.186084985733032e-06, -5.769543349742889e-06, -4.353001713752747e-06, -2.9364600777626038e-06, -1.519918441772461e-06, -1.0337680578231812e-07, 1.3131648302078247e-06, 2.7297064661979675e-06, 4.14624810218811e-06, 5.562789738178253e-06, 6.979331374168396e-06, 8.395873010158539e-06, 9.812414646148682e-06, 1.1228956282138824e-05, 1.2645497918128967e-05, 1.406203955411911e-05, 1.5478581190109253e-05, 1.6895122826099396e-05, 1.831166446208954e-05, 1.972820609807968e-05, 2.1144747734069824e-05, 2.2561289370059967e-05, 2.397783100605011e-05, 2.5394372642040253e-05, 2.6810914278030396e-05, 2.822745591402054e-05, 2.964399755001068e-05, 3.1060539186000824e-05, 3.247708082199097e-05, 3.389362245798111e-05, 3.531016409397125e-05, 3.6726705729961395e-05, 3.814324736595154e-05, 3.955978900194168e-05, 4.0976330637931824e-05, 4.2392872273921967e-05, 4.380941390991211e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 5.0, 5.0, 11.0, 12.0, 30.0, 28.0, 57.0, 89.0, 141.0, 251.0, 495.0, 956.0, 2063.0, 4972.0, 13062.0, 35979.0, 106313.0, 329608.0, 366883.0, 121571.0, 41053.0, 14858.0, 5608.0, 2296.0, 1038.0, 475.0, 271.0, 151.0, 103.0, 49.0, 39.0, 35.0, 10.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206298828125, -0.19806671142578125, -0.1898345947265625, -0.18160247802734375, -0.173370361328125, -0.16513824462890625, -0.1569061279296875, -0.14867401123046875, -0.14044189453125, -0.13220977783203125, -0.1239776611328125, -0.11574554443359375, -0.107513427734375, -0.09928131103515625, -0.0910491943359375, -0.08281707763671875, -0.0745849609375, -0.06635284423828125, -0.0581207275390625, -0.04988861083984375, -0.041656494140625, -0.03342437744140625, -0.0251922607421875, -0.01696014404296875, -0.00872802734375, -0.00049591064453125, 0.0077362060546875, 0.01596832275390625, 0.024200439453125, 0.03243255615234375, 0.0406646728515625, 0.04889678955078125, 0.05712890625, 0.06536102294921875, 0.0735931396484375, 0.08182525634765625, 0.090057373046875, 0.09828948974609375, 0.1065216064453125, 0.11475372314453125, 0.12298583984375, 0.13121795654296875, 0.1394500732421875, 0.14768218994140625, 0.155914306640625, 0.16414642333984375, 0.1723785400390625, 0.18061065673828125, 0.1888427734375, 0.19707489013671875, 0.2053070068359375, 0.21353912353515625, 0.221771240234375, 0.23000335693359375, 0.2382354736328125, 0.24646759033203125, 0.25469970703125, 0.26293182373046875, 0.2711639404296875, 0.27939605712890625, 0.287628173828125, 0.29586029052734375, 0.3040924072265625, 0.31232452392578125, 0.320556640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 7.0, 10.0, 22.0, 13.0, 22.0, 26.0, 50.0, 36.0, 55.0, 59.0, 77.0, 86.0, 85.0, 81.0, 57.0, 58.0, 49.0, 23.0, 34.0, 26.0, 27.0, 14.0, 8.0, 10.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.1644916534423828, -0.15820693969726562, -0.15192222595214844, -0.14563751220703125, -0.13935279846191406, -0.13306808471679688, -0.1267833709716797, -0.1204986572265625, -0.11421394348144531, -0.10792922973632812, -0.10164451599121094, -0.09535980224609375, -0.08907508850097656, -0.08279037475585938, -0.07650566101074219, -0.070220947265625, -0.06393623352050781, -0.057651519775390625, -0.05136680603027344, -0.04508209228515625, -0.03879737854003906, -0.032512664794921875, -0.026227951049804688, -0.0199432373046875, -0.013658523559570312, -0.007373809814453125, -0.0010890960693359375, 0.00519561767578125, 0.011480331420898438, 0.017765045166015625, 0.024049758911132812, 0.03033447265625, 0.03661918640136719, 0.042903900146484375, 0.04918861389160156, 0.05547332763671875, 0.06175804138183594, 0.06804275512695312, 0.07432746887207031, 0.0806121826171875, 0.08689689636230469, 0.09318161010742188, 0.09946632385253906, 0.10575103759765625, 0.11203575134277344, 0.11832046508789062, 0.12460517883300781, 0.130889892578125, 0.1371746063232422, 0.14345932006835938, 0.14974403381347656, 0.15602874755859375, 0.16231346130371094, 0.16859817504882812, 0.1748828887939453, 0.1811676025390625, 0.1874523162841797, 0.19373703002929688, 0.20002174377441406, 0.20630645751953125, 0.21259117126464844, 0.21887588500976562, 0.2251605987548828, 0.2314453125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 28.0, 87.0, 186.0, 320.0, 233.0, 110.0, 39.0, 8.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1280171871185303, -1.8813002109527588, -1.6345831155776978, -1.3878660202026367, -1.1411490440368652, -0.8944320678710938, -0.6477149724960327, -0.4009978771209717, -0.1542809009552002, 0.09243613481521606, 0.3391531705856323, 0.5858702063560486, 0.8325872421264648, 1.0793042182922363, 1.3260213136672974, 1.5727384090423584, 1.8194553852081299, 2.0661723613739014, 2.312889575958252, 2.5596065521240234, 2.806323528289795, 3.0530405044555664, 3.299757480621338, 3.5464746952056885, 3.79319167137146, 4.0399088859558105, 4.286625862121582, 4.5333428382873535, 4.780059814453125, 5.0267767906188965, 5.273493766784668, 5.520211219787598, 5.766927719116211, 6.013644695281982, 6.260361671447754, 6.507078647613525, 6.753795623779297, 7.000513076782227, 7.247230052947998, 7.4939470291137695, 7.740664005279541, 7.9873809814453125, 8.234098434448242, 8.480814933776855, 8.727532386779785, 8.974248886108398, 9.220966339111328, 9.467683792114258, 9.714400291442871, 9.9611177444458, 10.207834243774414, 10.454551696777344, 10.701268196105957, 10.947985649108887, 11.1947021484375, 11.44141960144043, 11.68813705444336, 11.934854507446289, 12.181571006774902, 12.428288459777832, 12.675004959106445, 12.921722412109375, 13.168438911437988, 13.415156364440918, 13.661872863769531]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 11.0, 9.0, 18.0, 10.0, 16.0, 15.0, 24.0, 30.0, 22.0, 34.0, 37.0, 34.0, 48.0, 51.0, 36.0, 64.0, 50.0, 49.0, 54.0, 32.0, 37.0, 50.0, 47.0, 44.0, 19.0, 34.0, 16.0, 21.0, 17.0, 17.0, 10.0, 7.0, 8.0, 10.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7428758144378662, -1.6881561279296875, -1.6334364414215088, -1.57871675491333, -1.5239969491958618, -1.469277262687683, -1.4145575761795044, -1.3598378896713257, -1.3051180839538574, -1.2503983974456787, -1.1956787109375, -1.1409590244293213, -1.086239218711853, -1.0315195322036743, -0.9767998456954956, -0.9220801591873169, -0.8673604726791382, -0.8126407861709595, -0.757921040058136, -0.7032013535499573, -0.6484816074371338, -0.5937619209289551, -0.5390422344207764, -0.48432251811027527, -0.42960280179977417, -0.37488308548927307, -0.320163369178772, -0.26544368267059326, -0.21072396636009216, -0.15600425004959106, -0.10128456354141235, -0.046564847230911255, 0.008154749870300293, 0.0628744587302208, 0.1175941675901413, 0.1723138689994812, 0.2270335853099823, 0.2817533016204834, 0.3364729881286621, 0.3911927044391632, 0.4459124207496643, 0.500632107257843, 0.5553518533706665, 0.6100715398788452, 0.6647912263870239, 0.7195109724998474, 0.7742306590080261, 0.8289504051208496, 0.8836700916290283, 0.938389778137207, 0.9931095242500305, 1.0478291511535645, 1.1025489568710327, 1.1572686433792114, 1.2119883298873901, 1.2667080163955688, 1.321427822113037, 1.3761475086212158, 1.4308671951293945, 1.4855868816375732, 1.5403066873550415, 1.5950263738632202, 1.649746060371399, 1.7044657468795776, 1.7591854333877563]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 11.0, 12.0, 15.0, 21.0, 24.0, 42.0, 54.0, 74.0, 107.0, 114.0, 194.0, 285.0, 453.0, 659.0, 1009.0, 1703.0, 2784.0, 4527.0, 7761.0, 13947.0, 24695.0, 47372.0, 95897.0, 212798.0, 588133.0, 1774509.0, 883003.0, 284104.0, 120847.0, 58708.0, 30572.0, 16627.0, 9272.0, 5508.0, 3078.0, 1906.0, 1100.0, 758.0, 519.0, 335.0, 210.0, 168.0, 92.0, 81.0, 61.0, 42.0, 36.0, 15.0, 16.0, 6.0, 12.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.2200927734375, -0.21314048767089844, -0.20618820190429688, -0.1992359161376953, -0.19228363037109375, -0.1853313446044922, -0.17837905883789062, -0.17142677307128906, -0.1644744873046875, -0.15752220153808594, -0.15056991577148438, -0.1436176300048828, -0.13666534423828125, -0.1297130584716797, -0.12276077270507812, -0.11580848693847656, -0.108856201171875, -0.10190391540527344, -0.09495162963867188, -0.08799934387207031, -0.08104705810546875, -0.07409477233886719, -0.06714248657226562, -0.06019020080566406, -0.0532379150390625, -0.04628562927246094, -0.039333343505859375, -0.03238105773925781, -0.02542877197265625, -0.018476486206054688, -0.011524200439453125, -0.0045719146728515625, 0.00238037109375, 0.009332656860351562, 0.016284942626953125, 0.023237228393554688, 0.03018951416015625, 0.03714179992675781, 0.044094085693359375, 0.05104637145996094, 0.0579986572265625, 0.06495094299316406, 0.07190322875976562, 0.07885551452636719, 0.08580780029296875, 0.09276008605957031, 0.09971237182617188, 0.10666465759277344, 0.113616943359375, 0.12056922912597656, 0.12752151489257812, 0.1344738006591797, 0.14142608642578125, 0.1483783721923828, 0.15533065795898438, 0.16228294372558594, 0.1692352294921875, 0.17618751525878906, 0.18313980102539062, 0.1900920867919922, 0.19704437255859375, 0.2039966583251953, 0.21094894409179688, 0.21790122985839844, 0.224853515625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 6.0, 8.0, 18.0, 14.0, 11.0, 14.0, 17.0, 15.0, 30.0, 28.0, 41.0, 36.0, 34.0, 41.0, 38.0, 39.0, 40.0, 43.0, 45.0, 46.0, 40.0, 53.0, 48.0, 51.0, 46.0, 32.0, 28.0, 28.0, 20.0, 22.0, 17.0, 12.0, 11.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.144073486328125, -0.13836669921875, -0.132659912109375, -0.126953125, -0.121246337890625, -0.11553955078125, -0.109832763671875, -0.1041259765625, -0.098419189453125, -0.09271240234375, -0.087005615234375, -0.081298828125, -0.075592041015625, -0.06988525390625, -0.064178466796875, -0.0584716796875, -0.052764892578125, -0.04705810546875, -0.041351318359375, -0.03564453125, -0.029937744140625, -0.02423095703125, -0.018524169921875, -0.0128173828125, -0.007110595703125, -0.00140380859375, 0.004302978515625, 0.010009765625, 0.015716552734375, 0.02142333984375, 0.027130126953125, 0.0328369140625, 0.038543701171875, 0.04425048828125, 0.049957275390625, 0.0556640625, 0.061370849609375, 0.06707763671875, 0.072784423828125, 0.0784912109375, 0.084197998046875, 0.08990478515625, 0.095611572265625, 0.101318359375, 0.107025146484375, 0.11273193359375, 0.118438720703125, 0.1241455078125, 0.129852294921875, 0.13555908203125, 0.141265869140625, 0.14697265625, 0.152679443359375, 0.15838623046875, 0.164093017578125, 0.1697998046875, 0.175506591796875, 0.18121337890625, 0.186920166015625, 0.192626953125, 0.198333740234375, 0.20404052734375, 0.209747314453125, 0.2154541015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 16.0, 28.0, 26.0, 42.0, 89.0, 116.0, 176.0, 276.0, 458.0, 784.0, 1488.0, 2672.0, 5139.0, 10101.0, 21547.0, 48353.0, 113634.0, 294526.0, 951151.0, 1844581.0, 558157.0, 195997.0, 78889.0, 34062.0, 15741.0, 7557.0, 3826.0, 2039.0, 1108.0, 611.0, 388.0, 225.0, 172.0, 109.0, 62.0, 41.0, 35.0, 19.0, 9.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3773460388183594, -0.36528778076171875, -0.3532295227050781, -0.3411712646484375, -0.3291130065917969, -0.31705474853515625, -0.3049964904785156, -0.292938232421875, -0.2808799743652344, -0.26882171630859375, -0.2567634582519531, -0.2447052001953125, -0.23264694213867188, -0.22058868408203125, -0.20853042602539062, -0.19647216796875, -0.18441390991210938, -0.17235565185546875, -0.16029739379882812, -0.1482391357421875, -0.13618087768554688, -0.12412261962890625, -0.11206436157226562, -0.100006103515625, -0.08794784545898438, -0.07588958740234375, -0.06383132934570312, -0.0517730712890625, -0.039714813232421875, -0.02765655517578125, -0.015598297119140625, -0.0035400390625, 0.008518218994140625, 0.02057647705078125, 0.032634735107421875, 0.0446929931640625, 0.056751251220703125, 0.06880950927734375, 0.08086776733398438, 0.092926025390625, 0.10498428344726562, 0.11704254150390625, 0.12910079956054688, 0.1411590576171875, 0.15321731567382812, 0.16527557373046875, 0.17733383178710938, 0.18939208984375, 0.20145034790039062, 0.21350860595703125, 0.22556686401367188, 0.2376251220703125, 0.24968338012695312, 0.26174163818359375, 0.2737998962402344, 0.285858154296875, 0.2979164123535156, 0.30997467041015625, 0.3220329284667969, 0.3340911865234375, 0.3461494445800781, 0.35820770263671875, 0.3702659606933594, 0.38232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 12.0, 11.0, 17.0, 24.0, 34.0, 43.0, 60.0, 102.0, 133.0, 159.0, 233.0, 373.0, 557.0, 734.0, 544.0, 309.0, 216.0, 147.0, 114.0, 71.0, 39.0, 37.0, 26.0, 23.0, 12.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.4130859375, -0.39794921875, -0.3828125, -0.36767578125, -0.3525390625, -0.33740234375, -0.322265625, -0.30712890625, -0.2919921875, -0.27685546875, -0.26171875, -0.24658203125, -0.2314453125, -0.21630859375, -0.201171875, -0.18603515625, -0.1708984375, -0.15576171875, -0.140625, -0.12548828125, -0.1103515625, -0.09521484375, -0.080078125, -0.06494140625, -0.0498046875, -0.03466796875, -0.01953125, -0.00439453125, 0.0107421875, 0.02587890625, 0.041015625, 0.05615234375, 0.0712890625, 0.08642578125, 0.1015625, 0.11669921875, 0.1318359375, 0.14697265625, 0.162109375, 0.17724609375, 0.1923828125, 0.20751953125, 0.22265625, 0.23779296875, 0.2529296875, 0.26806640625, 0.283203125, 0.29833984375, 0.3134765625, 0.32861328125, 0.34375, 0.35888671875, 0.3740234375, 0.38916015625, 0.404296875, 0.41943359375, 0.4345703125, 0.44970703125, 0.46484375, 0.47998046875, 0.4951171875, 0.51025390625, 0.525390625, 0.54052734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 12.0, 15.0, 27.0, 39.0, 52.0, 64.0, 75.0, 84.0, 120.0, 112.0, 91.0, 84.0, 63.0, 64.0, 35.0, 21.0, 15.0, 7.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2121691703796387, -2.129901647567749, -2.0476343631744385, -1.9653668403625488, -1.8830993175506592, -1.800831913948059, -1.718564510345459, -1.6362969875335693, -1.5540295839309692, -1.4717621803283691, -1.3894946575164795, -1.3072272539138794, -1.2249598503112793, -1.1426923274993896, -1.0604249238967896, -0.9781574606895447, -0.8958899974822998, -0.8136225342750549, -0.7313550710678101, -0.64908766746521, -0.5668202042579651, -0.4845527410507202, -0.40228530764579773, -0.32001787424087524, -0.23775041103363037, -0.1554829627275467, -0.07321551442146301, 0.009051933884620667, 0.09131938219070435, 0.17358684539794922, 0.2558542788028717, 0.3381217122077942, 0.42038917541503906, 0.5026566386222839, 0.5849241018295288, 0.6671915054321289, 0.7494589686393738, 0.8317264318466187, 0.9139938354492188, 0.9962612986564636, 1.0785287618637085, 1.1607961654663086, 1.2430636882781982, 1.3253310918807983, 1.4075984954833984, 1.489866018295288, 1.5721334218978882, 1.6544008255004883, 1.736668348312378, 1.818935751914978, 1.9012032747268677, 1.9834706783294678, 2.0657382011413574, 2.148005485534668, 2.2302730083465576, 2.3125405311584473, 2.394807815551758, 2.4770753383636475, 2.559342622756958, 2.6416101455688477, 2.7238776683807373, 2.806145191192627, 2.8884124755859375, 2.970679998397827, 3.052947521209717]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 3.0, 8.0, 7.0, 7.0, 13.0, 12.0, 9.0, 10.0, 23.0, 18.0, 26.0, 19.0, 25.0, 18.0, 33.0, 34.0, 40.0, 50.0, 31.0, 41.0, 34.0, 27.0, 36.0, 39.0, 48.0, 37.0, 41.0, 40.0, 26.0, 30.0, 28.0, 24.0, 27.0, 31.0, 14.0, 14.0, 17.0, 15.0, 6.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1867331266403198, -1.146103024482727, -1.1054729223251343, -1.064842939376831, -1.0242128372192383, -0.9835827350616455, -0.9429526329040527, -0.90232253074646, -0.861692488193512, -0.8210623860359192, -0.7804323434829712, -0.7398022413253784, -0.6991721391677856, -0.6585420966148376, -0.6179119944572449, -0.5772819519042969, -0.5366518497467041, -0.4960217773914337, -0.45539170503616333, -0.41476160287857056, -0.37413153052330017, -0.3335014581680298, -0.292871356010437, -0.2522412836551666, -0.21161121129989624, -0.17098113894462585, -0.13035105168819427, -0.08972097188234329, -0.04909089207649231, -0.008460819721221924, 0.032169267535209656, 0.07279935479164124, 0.11342930793762207, 0.15405938029289246, 0.19468946754932404, 0.23531955480575562, 0.275949627161026, 0.3165796995162964, 0.35720980167388916, 0.39783987402915955, 0.43846994638442993, 0.4791000187397003, 0.5197300910949707, 0.5603601932525635, 0.6009902954101562, 0.6416203379631042, 0.682250440120697, 0.722880482673645, 0.7635105848312378, 0.8041406869888306, 0.8447707295417786, 0.8854008316993713, 0.9260308742523193, 0.9666609764099121, 1.0072910785675049, 1.0479211807250977, 1.0885512828826904, 1.1291813850402832, 1.169811487197876, 1.2104414701461792, 1.251071572303772, 1.2917016744613647, 1.3323317766189575, 1.3729618787765503, 1.4135918617248535]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 15.0, 16.0, 21.0, 18.0, 50.0, 58.0, 80.0, 134.0, 192.0, 296.0, 441.0, 536.0, 816.0, 1233.0, 1838.0, 2790.0, 4187.0, 6414.0, 10138.0, 16107.0, 27638.0, 50192.0, 103849.0, 235368.0, 288095.0, 144463.0, 65076.0, 34205.0, 19815.0, 12064.0, 7454.0, 4846.0, 3327.0, 2103.0, 1448.0, 997.0, 711.0, 489.0, 336.0, 218.0, 156.0, 102.0, 66.0, 51.0, 34.0, 22.0, 19.0, 11.0, 10.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.304443359375, -0.2949867248535156, -0.28553009033203125, -0.2760734558105469, -0.2666168212890625, -0.2571601867675781, -0.24770355224609375, -0.23824691772460938, -0.228790283203125, -0.21933364868164062, -0.20987701416015625, -0.20042037963867188, -0.1909637451171875, -0.18150711059570312, -0.17205047607421875, -0.16259384155273438, -0.15313720703125, -0.14368057250976562, -0.13422393798828125, -0.12476730346679688, -0.1153106689453125, -0.10585403442382812, -0.09639739990234375, -0.08694076538085938, -0.077484130859375, -0.06802749633789062, -0.05857086181640625, -0.049114227294921875, -0.0396575927734375, -0.030200958251953125, -0.02074432373046875, -0.011287689208984375, -0.0018310546875, 0.007625579833984375, 0.01708221435546875, 0.026538848876953125, 0.0359954833984375, 0.045452117919921875, 0.05490875244140625, 0.06436538696289062, 0.073822021484375, 0.08327865600585938, 0.09273529052734375, 0.10219192504882812, 0.1116485595703125, 0.12110519409179688, 0.13056182861328125, 0.14001846313476562, 0.14947509765625, 0.15893173217773438, 0.16838836669921875, 0.17784500122070312, 0.1873016357421875, 0.19675827026367188, 0.20621490478515625, 0.21567153930664062, 0.225128173828125, 0.23458480834960938, 0.24404144287109375, 0.2534980773925781, 0.2629547119140625, 0.2724113464355469, 0.28186798095703125, 0.2913246154785156, 0.30078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 6.0, 1.0, 2.0, 7.0, 2.0, 13.0, 9.0, 6.0, 12.0, 13.0, 21.0, 19.0, 20.0, 30.0, 19.0, 30.0, 37.0, 34.0, 44.0, 28.0, 32.0, 40.0, 39.0, 40.0, 40.0, 35.0, 51.0, 36.0, 43.0, 33.0, 28.0, 30.0, 22.0, 33.0, 26.0, 25.0, 20.0, 13.0, 21.0, 18.0, 8.0, 4.0, 6.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.162353515625, -0.15653228759765625, -0.1507110595703125, -0.14488983154296875, -0.139068603515625, -0.13324737548828125, -0.1274261474609375, -0.12160491943359375, -0.11578369140625, -0.10996246337890625, -0.1041412353515625, -0.09832000732421875, -0.092498779296875, -0.08667755126953125, -0.0808563232421875, -0.07503509521484375, -0.0692138671875, -0.06339263916015625, -0.0575714111328125, -0.05175018310546875, -0.045928955078125, -0.04010772705078125, -0.0342864990234375, -0.02846527099609375, -0.02264404296875, -0.01682281494140625, -0.0110015869140625, -0.00518035888671875, 0.000640869140625, 0.00646209716796875, 0.0122833251953125, 0.01810455322265625, 0.02392578125, 0.02974700927734375, 0.0355682373046875, 0.04138946533203125, 0.047210693359375, 0.05303192138671875, 0.0588531494140625, 0.06467437744140625, 0.07049560546875, 0.07631683349609375, 0.0821380615234375, 0.08795928955078125, 0.093780517578125, 0.09960174560546875, 0.1054229736328125, 0.11124420166015625, 0.1170654296875, 0.12288665771484375, 0.1287078857421875, 0.13452911376953125, 0.140350341796875, 0.14617156982421875, 0.1519927978515625, 0.15781402587890625, 0.16363525390625, 0.16945648193359375, 0.1752777099609375, 0.18109893798828125, 0.186920166015625, 0.19274139404296875, 0.1985626220703125, 0.20438385009765625, 0.210205078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 4.0, 17.0, 27.0, 32.0, 77.0, 117.0, 310.0, 575.0, 1106.0, 2540.0, 5614.0, 12924.0, 29043.0, 75276.0, 282311.0, 438623.0, 125656.0, 41711.0, 17912.0, 7827.0, 3683.0, 1676.0, 720.0, 360.0, 198.0, 87.0, 51.0, 24.0, 20.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65380859375, -0.6371345520019531, -0.6204605102539062, -0.6037864685058594, -0.5871124267578125, -0.5704383850097656, -0.5537643432617188, -0.5370903015136719, -0.520416259765625, -0.5037422180175781, -0.48706817626953125, -0.4703941345214844, -0.4537200927734375, -0.4370460510253906, -0.42037200927734375, -0.4036979675292969, -0.38702392578125, -0.3703498840332031, -0.35367584228515625, -0.3370018005371094, -0.3203277587890625, -0.3036537170410156, -0.28697967529296875, -0.2703056335449219, -0.253631591796875, -0.23695755004882812, -0.22028350830078125, -0.20360946655273438, -0.1869354248046875, -0.17026138305664062, -0.15358734130859375, -0.13691329956054688, -0.1202392578125, -0.10356521606445312, -0.08689117431640625, -0.07021713256835938, -0.0535430908203125, -0.036869049072265625, -0.02019500732421875, -0.003520965576171875, 0.013153076171875, 0.029827117919921875, 0.04650115966796875, 0.06317520141601562, 0.0798492431640625, 0.09652328491210938, 0.11319732666015625, 0.12987136840820312, 0.14654541015625, 0.16321945190429688, 0.17989349365234375, 0.19656753540039062, 0.2132415771484375, 0.22991561889648438, 0.24658966064453125, 0.2632637023925781, 0.279937744140625, 0.2966117858886719, 0.31328582763671875, 0.3299598693847656, 0.3466339111328125, 0.3633079528808594, 0.37998199462890625, 0.3966560363769531, 0.413330078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 6.0, 7.0, 6.0, 9.0, 1.0, 8.0, 18.0, 9.0, 13.0, 20.0, 25.0, 21.0, 27.0, 26.0, 30.0, 42.0, 38.0, 52.0, 38.0, 42.0, 46.0, 34.0, 39.0, 33.0, 38.0, 37.0, 48.0, 36.0, 32.0, 24.0, 26.0, 23.0, 16.0, 18.0, 13.0, 14.0, 12.0, 13.0, 11.0, 12.0, 5.0, 2.0, 7.0, 7.0, 8.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5598907470703125, -0.542633056640625, -0.5253753662109375, -0.50811767578125, -0.4908599853515625, -0.473602294921875, -0.4563446044921875, -0.4390869140625, -0.4218292236328125, -0.404571533203125, -0.3873138427734375, -0.37005615234375, -0.3527984619140625, -0.335540771484375, -0.3182830810546875, -0.301025390625, -0.2837677001953125, -0.266510009765625, -0.2492523193359375, -0.23199462890625, -0.2147369384765625, -0.197479248046875, -0.1802215576171875, -0.1629638671875, -0.1457061767578125, -0.128448486328125, -0.1111907958984375, -0.09393310546875, -0.0766754150390625, -0.059417724609375, -0.0421600341796875, -0.02490234375, -0.0076446533203125, 0.009613037109375, 0.0268707275390625, 0.04412841796875, 0.0613861083984375, 0.078643798828125, 0.0959014892578125, 0.1131591796875, 0.1304168701171875, 0.147674560546875, 0.1649322509765625, 0.18218994140625, 0.1994476318359375, 0.216705322265625, 0.2339630126953125, 0.251220703125, 0.2684783935546875, 0.285736083984375, 0.3029937744140625, 0.32025146484375, 0.3375091552734375, 0.354766845703125, 0.3720245361328125, 0.3892822265625, 0.4065399169921875, 0.423797607421875, 0.4410552978515625, 0.45831298828125, 0.4755706787109375, 0.492828369140625, 0.5100860595703125, 0.52734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 17.0, 19.0, 17.0, 47.0, 67.0, 124.0, 181.0, 296.0, 553.0, 883.0, 1583.0, 2764.0, 4783.0, 8484.0, 14869.0, 26375.0, 47069.0, 89651.0, 210704.0, 324708.0, 154211.0, 71467.0, 39116.0, 21691.0, 12259.0, 7169.0, 3953.0, 2289.0, 1329.0, 764.0, 451.0, 251.0, 133.0, 91.0, 58.0, 48.0, 26.0, 21.0, 7.0, 11.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11358642578125, -0.10927295684814453, -0.10495948791503906, -0.1006460189819336, -0.09633255004882812, -0.09201908111572266, -0.08770561218261719, -0.08339214324951172, -0.07907867431640625, -0.07476520538330078, -0.07045173645019531, -0.06613826751708984, -0.061824798583984375, -0.057511329650878906, -0.05319786071777344, -0.04888439178466797, -0.0445709228515625, -0.04025745391845703, -0.03594398498535156, -0.031630516052246094, -0.027317047119140625, -0.023003578186035156, -0.018690109252929688, -0.014376640319824219, -0.01006317138671875, -0.005749702453613281, -0.0014362335205078125, 0.0028772354125976562, 0.007190704345703125, 0.011504173278808594, 0.015817642211914062, 0.02013111114501953, 0.024444580078125, 0.02875804901123047, 0.03307151794433594, 0.037384986877441406, 0.041698455810546875, 0.046011924743652344, 0.05032539367675781, 0.05463886260986328, 0.05895233154296875, 0.06326580047607422, 0.06757926940917969, 0.07189273834228516, 0.07620620727539062, 0.0805196762084961, 0.08483314514160156, 0.08914661407470703, 0.0934600830078125, 0.09777355194091797, 0.10208702087402344, 0.1064004898071289, 0.11071395874023438, 0.11502742767333984, 0.11934089660644531, 0.12365436553955078, 0.12796783447265625, 0.13228130340576172, 0.1365947723388672, 0.14090824127197266, 0.14522171020507812, 0.1495351791381836, 0.15384864807128906, 0.15816211700439453, 0.1624755859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 8.0, 3.0, 10.0, 4.0, 7.0, 9.0, 9.0, 11.0, 9.0, 26.0, 31.0, 40.0, 57.0, 106.0, 167.0, 149.0, 126.0, 62.0, 47.0, 39.0, 15.0, 11.0, 14.0, 9.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.435943603515625e-05, -5.260482430458069e-05, -5.085021257400513e-05, -4.9095600843429565e-05, -4.7340989112854004e-05, -4.558637738227844e-05, -4.383176565170288e-05, -4.207715392112732e-05, -4.032254219055176e-05, -3.8567930459976196e-05, -3.6813318729400635e-05, -3.505870699882507e-05, -3.330409526824951e-05, -3.154948353767395e-05, -2.979487180709839e-05, -2.8040260076522827e-05, -2.6285648345947266e-05, -2.4531036615371704e-05, -2.2776424884796143e-05, -2.102181315422058e-05, -1.926720142364502e-05, -1.7512589693069458e-05, -1.5757977962493896e-05, -1.4003366231918335e-05, -1.2248754501342773e-05, -1.0494142770767212e-05, -8.73953104019165e-06, -6.984919309616089e-06, -5.230307579040527e-06, -3.475695848464966e-06, -1.7210841178894043e-06, 3.3527612686157227e-08, 1.7881393432617188e-06, 3.5427510738372803e-06, 5.297362804412842e-06, 7.051974534988403e-06, 8.806586265563965e-06, 1.0561197996139526e-05, 1.2315809726715088e-05, 1.407042145729065e-05, 1.582503318786621e-05, 1.7579644918441772e-05, 1.9334256649017334e-05, 2.1088868379592896e-05, 2.2843480110168457e-05, 2.459809184074402e-05, 2.635270357131958e-05, 2.810731530189514e-05, 2.9861927032470703e-05, 3.1616538763046265e-05, 3.3371150493621826e-05, 3.512576222419739e-05, 3.688037395477295e-05, 3.863498568534851e-05, 4.038959741592407e-05, 4.2144209146499634e-05, 4.3898820877075195e-05, 4.565343260765076e-05, 4.740804433822632e-05, 4.916265606880188e-05, 5.091726779937744e-05, 5.2671879529953e-05, 5.4426491260528564e-05, 5.6181102991104126e-05, 5.793571472167969e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 16.0, 28.0, 46.0, 75.0, 107.0, 189.0, 416.0, 781.0, 1590.0, 3659.0, 7730.0, 17536.0, 40967.0, 103022.0, 319666.0, 355804.0, 115994.0, 45632.0, 19222.0, 8565.0, 3900.0, 1837.0, 844.0, 441.0, 205.0, 109.0, 67.0, 47.0, 27.0, 17.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2052001953125, -0.1991748809814453, -0.19314956665039062, -0.18712425231933594, -0.18109893798828125, -0.17507362365722656, -0.16904830932617188, -0.1630229949951172, -0.1569976806640625, -0.1509723663330078, -0.14494705200195312, -0.13892173767089844, -0.13289642333984375, -0.12687110900878906, -0.12084579467773438, -0.11482048034667969, -0.108795166015625, -0.10276985168457031, -0.09674453735351562, -0.09071922302246094, -0.08469390869140625, -0.07866859436035156, -0.07264328002929688, -0.06661796569824219, -0.0605926513671875, -0.05456733703613281, -0.048542022705078125, -0.04251670837402344, -0.03649139404296875, -0.030466079711914062, -0.024440765380859375, -0.018415451049804688, -0.01239013671875, -0.0063648223876953125, -0.000339508056640625, 0.0056858062744140625, 0.01171112060546875, 0.017736434936523438, 0.023761749267578125, 0.029787063598632812, 0.0358123779296875, 0.04183769226074219, 0.047863006591796875, 0.05388832092285156, 0.05991363525390625, 0.06593894958496094, 0.07196426391601562, 0.07798957824707031, 0.084014892578125, 0.09004020690917969, 0.09606552124023438, 0.10209083557128906, 0.10811614990234375, 0.11414146423339844, 0.12016677856445312, 0.1261920928955078, 0.1322174072265625, 0.1382427215576172, 0.14426803588867188, 0.15029335021972656, 0.15631866455078125, 0.16234397888183594, 0.16836929321289062, 0.1743946075439453, 0.180419921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 15.0, 6.0, 19.0, 17.0, 21.0, 25.0, 35.0, 42.0, 46.0, 81.0, 75.0, 103.0, 101.0, 88.0, 61.0, 50.0, 36.0, 35.0, 18.0, 21.0, 20.0, 7.0, 8.0, 13.0, 6.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1878662109375, -0.18215179443359375, -0.1764373779296875, -0.17072296142578125, -0.165008544921875, -0.15929412841796875, -0.1535797119140625, -0.14786529541015625, -0.14215087890625, -0.13643646240234375, -0.1307220458984375, -0.12500762939453125, -0.119293212890625, -0.11357879638671875, -0.1078643798828125, -0.10214996337890625, -0.096435546875, -0.09072113037109375, -0.0850067138671875, -0.07929229736328125, -0.073577880859375, -0.06786346435546875, -0.0621490478515625, -0.05643463134765625, -0.05072021484375, -0.04500579833984375, -0.0392913818359375, -0.03357696533203125, -0.027862548828125, -0.02214813232421875, -0.0164337158203125, -0.01071929931640625, -0.0050048828125, 0.00070953369140625, 0.0064239501953125, 0.01213836669921875, 0.017852783203125, 0.02356719970703125, 0.0292816162109375, 0.03499603271484375, 0.04071044921875, 0.04642486572265625, 0.0521392822265625, 0.05785369873046875, 0.063568115234375, 0.06928253173828125, 0.0749969482421875, 0.08071136474609375, 0.08642578125, 0.09214019775390625, 0.0978546142578125, 0.10356903076171875, 0.109283447265625, 0.11499786376953125, 0.1207122802734375, 0.12642669677734375, 0.13214111328125, 0.13785552978515625, 0.1435699462890625, 0.14928436279296875, 0.154998779296875, 0.16071319580078125, 0.1664276123046875, 0.17214202880859375, 0.1778564453125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 11.0, 11.0, 22.0, 29.0, 29.0, 74.0, 78.0, 102.0, 120.0, 125.0, 107.0, 87.0, 67.0, 45.0, 33.0, 26.0, 9.0, 16.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5914758443832397, -1.517104148864746, -1.442732334136963, -1.3683606386184692, -1.2939889430999756, -1.2196171283721924, -1.1452454328536987, -1.070873737335205, -0.9965019822120667, -0.9221302270889282, -0.8477585315704346, -0.7733867764472961, -0.6990150213241577, -0.6246433258056641, -0.5502715706825256, -0.475899875164032, -0.40152812004089355, -0.3271563947200775, -0.2527846693992615, -0.17841291427612305, -0.104041188955307, -0.029669463634490967, 0.04470229148864746, 0.11907398700714111, 0.19344574213027954, 0.2678174674510956, 0.3421891927719116, 0.41656094789505005, 0.4909326732158661, 0.5653043985366821, 0.6396761536598206, 0.7140478491783142, 0.7884194850921631, 0.8627912402153015, 0.9371629357337952, 1.0115346908569336, 1.0859063863754272, 1.160278081893921, 1.234649896621704, 1.3090215921401978, 1.3833932876586914, 1.457764983177185, 1.5321367979049683, 1.606508493423462, 1.6808801889419556, 1.7552518844604492, 1.8296236991882324, 1.903995394706726, 1.9783672094345093, 2.052738904953003, 2.127110719680786, 2.2014822959899902, 2.2758541107177734, 2.3502259254455566, 2.42459774017334, 2.498969316482544, 2.573341131210327, 2.6477129459381104, 2.7220845222473145, 2.7964563369750977, 2.870828151702881, 2.945199728012085, 3.019571542739868, 3.0939431190490723, 3.1683149337768555]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 2.0, 2.0, 4.0, 10.0, 7.0, 5.0, 15.0, 11.0, 18.0, 15.0, 27.0, 30.0, 30.0, 30.0, 30.0, 30.0, 33.0, 33.0, 40.0, 46.0, 40.0, 39.0, 42.0, 33.0, 39.0, 48.0, 37.0, 37.0, 36.0, 30.0, 31.0, 29.0, 28.0, 14.0, 18.0, 17.0, 18.0, 19.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5477862358093262, -1.5011661052703857, -1.4545459747314453, -1.4079258441925049, -1.361305832862854, -1.3146857023239136, -1.2680655717849731, -1.2214454412460327, -1.1748254299163818, -1.1282052993774414, -1.081585168838501, -1.0349650382995605, -0.9883450269699097, -0.9417248964309692, -0.8951047658920288, -0.8484846353530884, -0.801864504814148, -0.7552443742752075, -0.7086243033409119, -0.6620041728019714, -0.6153841018676758, -0.5687639713287354, -0.5221438407897949, -0.4755237400531769, -0.42890363931655884, -0.3822835385799408, -0.33566343784332275, -0.2890433073043823, -0.24242320656776428, -0.19580310583114624, -0.1491829752922058, -0.10256287455558777, -0.05594289302825928, -0.009322784841060638, 0.037297323346138, 0.08391743898391724, 0.13053753972053528, 0.17715764045715332, 0.22377777099609375, 0.2703978717327118, 0.31701797246932983, 0.3636380732059479, 0.4102581739425659, 0.45687830448150635, 0.5034984350204468, 0.5501185059547424, 0.5967386364936829, 0.6433587074279785, 0.689978837966919, 0.7365989685058594, 0.783219039440155, 0.8298391699790955, 0.8764592409133911, 0.9230793714523315, 0.969699501991272, 1.0163196325302124, 1.0629396438598633, 1.1095597743988037, 1.1561799049377441, 1.2028000354766846, 1.2494200468063354, 1.2960401773452759, 1.3426603078842163, 1.3892804384231567, 1.4359005689620972]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 8.0, 5.0, 11.0, 21.0, 23.0, 27.0, 50.0, 71.0, 120.0, 189.0, 296.0, 476.0, 798.0, 1389.0, 2221.0, 4104.0, 7431.0, 13439.0, 26063.0, 52191.0, 112308.0, 284336.0, 1165929.0, 1848822.0, 398302.0, 142822.0, 64174.0, 31483.0, 16368.0, 8935.0, 4931.0, 2848.0, 1594.0, 1015.0, 576.0, 304.0, 221.0, 142.0, 89.0, 59.0, 27.0, 23.0, 15.0, 15.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.23386383056640625, -0.2245635986328125, -0.21526336669921875, -0.205963134765625, -0.19666290283203125, -0.1873626708984375, -0.17806243896484375, -0.16876220703125, -0.15946197509765625, -0.1501617431640625, -0.14086151123046875, -0.131561279296875, -0.12226104736328125, -0.1129608154296875, -0.10366058349609375, -0.0943603515625, -0.08506011962890625, -0.0757598876953125, -0.06645965576171875, -0.057159423828125, -0.04785919189453125, -0.0385589599609375, -0.02925872802734375, -0.01995849609375, -0.01065826416015625, -0.0013580322265625, 0.00794219970703125, 0.017242431640625, 0.02654266357421875, 0.0358428955078125, 0.04514312744140625, 0.054443359375, 0.06374359130859375, 0.0730438232421875, 0.08234405517578125, 0.091644287109375, 0.10094451904296875, 0.1102447509765625, 0.11954498291015625, 0.12884521484375, 0.13814544677734375, 0.1474456787109375, 0.15674591064453125, 0.166046142578125, 0.17534637451171875, 0.1846466064453125, 0.19394683837890625, 0.2032470703125, 0.21254730224609375, 0.2218475341796875, 0.23114776611328125, 0.240447998046875, 0.24974822998046875, 0.2590484619140625, 0.26834869384765625, 0.27764892578125, 0.28694915771484375, 0.2962493896484375, 0.30554962158203125, 0.314849853515625, 0.32415008544921875, 0.3334503173828125, 0.34275054931640625, 0.35205078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 7.0, 4.0, 15.0, 5.0, 15.0, 15.0, 10.0, 8.0, 8.0, 19.0, 23.0, 28.0, 25.0, 30.0, 25.0, 46.0, 45.0, 42.0, 36.0, 42.0, 37.0, 38.0, 49.0, 26.0, 26.0, 39.0, 40.0, 29.0, 38.0, 34.0, 36.0, 18.0, 23.0, 20.0, 17.0, 23.0, 13.0, 14.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15688133239746094, -0.15116500854492188, -0.1454486846923828, -0.13973236083984375, -0.1340160369873047, -0.12829971313476562, -0.12258338928222656, -0.1168670654296875, -0.11115074157714844, -0.10543441772460938, -0.09971809387207031, -0.09400177001953125, -0.08828544616699219, -0.08256912231445312, -0.07685279846191406, -0.071136474609375, -0.06542015075683594, -0.059703826904296875, -0.05398750305175781, -0.04827117919921875, -0.04255485534667969, -0.036838531494140625, -0.031122207641601562, -0.0254058837890625, -0.019689559936523438, -0.013973236083984375, -0.008256912231445312, -0.00254058837890625, 0.0031757354736328125, 0.008892059326171875, 0.014608383178710938, 0.02032470703125, 0.026041030883789062, 0.031757354736328125, 0.03747367858886719, 0.04319000244140625, 0.04890632629394531, 0.054622650146484375, 0.06033897399902344, 0.0660552978515625, 0.07177162170410156, 0.07748794555664062, 0.08320426940917969, 0.08892059326171875, 0.09463691711425781, 0.10035324096679688, 0.10606956481933594, 0.111785888671875, 0.11750221252441406, 0.12321853637695312, 0.1289348602294922, 0.13465118408203125, 0.1403675079345703, 0.14608383178710938, 0.15180015563964844, 0.1575164794921875, 0.16323280334472656, 0.16894912719726562, 0.1746654510498047, 0.18038177490234375, 0.1860980987548828, 0.19181442260742188, 0.19753074645996094, 0.2032470703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 11.0, 17.0, 21.0, 22.0, 49.0, 71.0, 134.0, 206.0, 377.0, 522.0, 921.0, 1622.0, 2781.0, 4959.0, 9256.0, 17475.0, 34203.0, 69954.0, 150748.0, 368608.0, 1351184.0, 1479493.0, 393931.0, 159926.0, 72549.0, 35599.0, 18001.0, 9597.0, 5184.0, 2900.0, 1613.0, 949.0, 565.0, 335.0, 179.0, 117.0, 67.0, 50.0, 45.0, 10.0, 11.0, 10.0, 6.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3676719665527344, -0.35619354248046875, -0.3447151184082031, -0.3332366943359375, -0.3217582702636719, -0.31027984619140625, -0.2988014221191406, -0.287322998046875, -0.2758445739746094, -0.26436614990234375, -0.2528877258300781, -0.2414093017578125, -0.22993087768554688, -0.21845245361328125, -0.20697402954101562, -0.19549560546875, -0.18401718139648438, -0.17253875732421875, -0.16106033325195312, -0.1495819091796875, -0.13810348510742188, -0.12662506103515625, -0.11514663696289062, -0.103668212890625, -0.09218978881835938, -0.08071136474609375, -0.06923294067382812, -0.0577545166015625, -0.046276092529296875, -0.03479766845703125, -0.023319244384765625, -0.0118408203125, -0.000362396240234375, 0.01111602783203125, 0.022594451904296875, 0.0340728759765625, 0.045551300048828125, 0.05702972412109375, 0.06850814819335938, 0.079986572265625, 0.09146499633789062, 0.10294342041015625, 0.11442184448242188, 0.1259002685546875, 0.13737869262695312, 0.14885711669921875, 0.16033554077148438, 0.17181396484375, 0.18329238891601562, 0.19477081298828125, 0.20624923706054688, 0.2177276611328125, 0.22920608520507812, 0.24068450927734375, 0.2521629333496094, 0.263641357421875, 0.2751197814941406, 0.28659820556640625, 0.2980766296386719, 0.3095550537109375, 0.3210334777832031, 0.33251190185546875, 0.3439903259277344, 0.35546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 3.0, 10.0, 19.0, 19.0, 24.0, 32.0, 32.0, 43.0, 58.0, 94.0, 114.0, 190.0, 228.0, 379.0, 683.0, 757.0, 458.0, 283.0, 164.0, 138.0, 101.0, 62.0, 42.0, 29.0, 22.0, 25.0, 24.0, 13.0, 9.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416015625, -0.40006256103515625, -0.3841094970703125, -0.36815643310546875, -0.352203369140625, -0.33625030517578125, -0.3202972412109375, -0.30434417724609375, -0.28839111328125, -0.27243804931640625, -0.2564849853515625, -0.24053192138671875, -0.224578857421875, -0.20862579345703125, -0.1926727294921875, -0.17671966552734375, -0.1607666015625, -0.14481353759765625, -0.1288604736328125, -0.11290740966796875, -0.096954345703125, -0.08100128173828125, -0.0650482177734375, -0.04909515380859375, -0.03314208984375, -0.01718902587890625, -0.0012359619140625, 0.01471710205078125, 0.030670166015625, 0.04662322998046875, 0.0625762939453125, 0.07852935791015625, 0.094482421875, 0.11043548583984375, 0.1263885498046875, 0.14234161376953125, 0.158294677734375, 0.17424774169921875, 0.1902008056640625, 0.20615386962890625, 0.22210693359375, 0.23805999755859375, 0.2540130615234375, 0.26996612548828125, 0.285919189453125, 0.30187225341796875, 0.3178253173828125, 0.33377838134765625, 0.3497314453125, 0.36568450927734375, 0.3816375732421875, 0.39759063720703125, 0.413543701171875, 0.42949676513671875, 0.4454498291015625, 0.46140289306640625, 0.47735595703125, 0.49330902099609375, 0.5092620849609375, 0.5252151489257812, 0.541168212890625, 0.5571212768554688, 0.5730743408203125, 0.5890274047851562, 0.60498046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 15.0, 17.0, 43.0, 45.0, 75.0, 100.0, 126.0, 139.0, 112.0, 119.0, 68.0, 56.0, 37.0, 27.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9155347347259521, -1.808927297592163, -1.702319860458374, -1.595712423324585, -1.489104986190796, -1.3824975490570068, -1.2758902311325073, -1.1692827939987183, -1.0626753568649292, -0.9560679197311401, -0.8494604825973511, -0.7428531050682068, -0.6362456679344177, -0.5296382308006287, -0.4230308532714844, -0.3164234161376953, -0.20981597900390625, -0.10320855677127838, 0.0033988654613494873, 0.11000627279281616, 0.21661370992660522, 0.3232211470603943, 0.4298285245895386, 0.5364359617233276, 0.6430433988571167, 0.7496508359909058, 0.8562582731246948, 0.9628656506538391, 1.0694730281829834, 1.1760804653167725, 1.2826879024505615, 1.3892953395843506, 1.4959025382995605, 1.6025099754333496, 1.7091174125671387, 1.8157248497009277, 1.9223322868347168, 2.028939723968506, 2.135547161102295, 2.242154598236084, 2.348762035369873, 2.455369472503662, 2.561976909637451, 2.6685843467712402, 2.7751917839050293, 2.8817992210388184, 2.9884066581726074, 3.0950140953063965, 3.2016212940216064, 3.3082287311553955, 3.4148361682891846, 3.5214436054229736, 3.6280510425567627, 3.7346584796905518, 3.8412656784057617, 3.947873115539551, 4.05448055267334, 4.161087989807129, 4.267695426940918, 4.374302864074707, 4.480910301208496, 4.587517738342285, 4.694125175476074, 4.800732612609863, 4.907340049743652]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 11.0, 3.0, 9.0, 7.0, 11.0, 20.0, 20.0, 21.0, 27.0, 35.0, 24.0, 24.0, 37.0, 40.0, 39.0, 50.0, 48.0, 37.0, 45.0, 44.0, 52.0, 49.0, 50.0, 21.0, 33.0, 28.0, 27.0, 35.0, 23.0, 19.0, 22.0, 14.0, 12.0, 6.0, 9.0, 10.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.650313377380371, -1.6048355102539062, -1.5593576431274414, -1.5138797760009766, -1.4684019088745117, -1.4229241609573364, -1.3774462938308716, -1.3319684267044067, -1.286490559577942, -1.241012692451477, -1.1955348253250122, -1.1500569581985474, -1.104579210281372, -1.0591013431549072, -1.0136234760284424, -0.9681456089019775, -0.9226677417755127, -0.8771898746490479, -0.831712007522583, -0.7862342000007629, -0.7407563328742981, -0.6952784657478333, -0.6498006582260132, -0.6043227910995483, -0.5588449239730835, -0.5133670568466187, -0.4678892195224762, -0.42241138219833374, -0.3769335150718689, -0.33145564794540405, -0.2859778106212616, -0.24049997329711914, -0.19502222537994385, -0.1495443731546402, -0.10406652092933655, -0.0585886687040329, -0.013110816478729248, 0.0323670357465744, 0.07784488797187805, 0.12332272529602051, 0.16880059242248535, 0.214278444647789, 0.25975629687309265, 0.3052341341972351, 0.35071200132369995, 0.3961898684501648, 0.44166770577430725, 0.4871455430984497, 0.5326234102249146, 0.5781012773513794, 0.6235791444778442, 0.6690569519996643, 0.7145348191261292, 0.760012686252594, 0.8054904937744141, 0.8509683609008789, 0.8964462280273438, 0.9419240951538086, 0.9874019622802734, 1.0328798294067383, 1.0783576965332031, 1.1238354444503784, 1.1693133115768433, 1.214791178703308, 1.260269045829773]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 10.0, 4.0, 5.0, 19.0, 32.0, 39.0, 56.0, 117.0, 137.0, 219.0, 352.0, 550.0, 852.0, 1275.0, 2068.0, 3244.0, 5019.0, 8698.0, 14597.0, 26270.0, 53375.0, 117249.0, 235056.0, 272600.0, 156582.0, 71105.0, 33901.0, 18064.0, 10396.0, 6055.0, 3887.0, 2373.0, 1589.0, 961.0, 639.0, 407.0, 261.0, 184.0, 116.0, 63.0, 40.0, 24.0, 22.0, 18.0, 9.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3246307373046875, -0.314544677734375, -0.3044586181640625, -0.29437255859375, -0.2842864990234375, -0.274200439453125, -0.2641143798828125, -0.2540283203125, -0.2439422607421875, -0.233856201171875, -0.2237701416015625, -0.21368408203125, -0.2035980224609375, -0.193511962890625, -0.1834259033203125, -0.17333984375, -0.1632537841796875, -0.153167724609375, -0.1430816650390625, -0.13299560546875, -0.1229095458984375, -0.112823486328125, -0.1027374267578125, -0.0926513671875, -0.0825653076171875, -0.072479248046875, -0.0623931884765625, -0.05230712890625, -0.0422210693359375, -0.032135009765625, -0.0220489501953125, -0.011962890625, -0.0018768310546875, 0.008209228515625, 0.0182952880859375, 0.02838134765625, 0.0384674072265625, 0.048553466796875, 0.0586395263671875, 0.0687255859375, 0.0788116455078125, 0.088897705078125, 0.0989837646484375, 0.10906982421875, 0.1191558837890625, 0.129241943359375, 0.1393280029296875, 0.1494140625, 0.1595001220703125, 0.169586181640625, 0.1796722412109375, 0.18975830078125, 0.1998443603515625, 0.209930419921875, 0.2200164794921875, 0.2301025390625, 0.2401885986328125, 0.250274658203125, 0.2603607177734375, 0.27044677734375, 0.2805328369140625, 0.290618896484375, 0.3007049560546875, 0.310791015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 2.0, 11.0, 14.0, 13.0, 12.0, 18.0, 20.0, 16.0, 23.0, 32.0, 31.0, 37.0, 28.0, 38.0, 39.0, 41.0, 42.0, 41.0, 50.0, 40.0, 42.0, 40.0, 54.0, 41.0, 25.0, 31.0, 36.0, 25.0, 27.0, 28.0, 15.0, 15.0, 12.0, 9.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.2099609375, -0.20343589782714844, -0.19691085815429688, -0.1903858184814453, -0.18386077880859375, -0.1773357391357422, -0.17081069946289062, -0.16428565979003906, -0.1577606201171875, -0.15123558044433594, -0.14471054077148438, -0.1381855010986328, -0.13166046142578125, -0.1251354217529297, -0.11861038208007812, -0.11208534240722656, -0.105560302734375, -0.09903526306152344, -0.09251022338867188, -0.08598518371582031, -0.07946014404296875, -0.07293510437011719, -0.06641006469726562, -0.05988502502441406, -0.0533599853515625, -0.04683494567871094, -0.040309906005859375, -0.03378486633300781, -0.02725982666015625, -0.020734786987304688, -0.014209747314453125, -0.0076847076416015625, -0.00115966796875, 0.0053653717041015625, 0.011890411376953125, 0.018415451049804688, 0.02494049072265625, 0.03146553039550781, 0.037990570068359375, 0.04451560974121094, 0.0510406494140625, 0.05756568908691406, 0.06409072875976562, 0.07061576843261719, 0.07714080810546875, 0.08366584777832031, 0.09019088745117188, 0.09671592712402344, 0.103240966796875, 0.10976600646972656, 0.11629104614257812, 0.12281608581542969, 0.12934112548828125, 0.1358661651611328, 0.14239120483398438, 0.14891624450683594, 0.1554412841796875, 0.16196632385253906, 0.16849136352539062, 0.1750164031982422, 0.18154144287109375, 0.1880664825439453, 0.19459152221679688, 0.20111656188964844, 0.2076416015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 14.0, 28.0, 30.0, 60.0, 105.0, 167.0, 402.0, 879.0, 2149.0, 5420.0, 13867.0, 39467.0, 137298.0, 435619.0, 295228.0, 77170.0, 24939.0, 9244.0, 3672.0, 1508.0, 616.0, 290.0, 121.0, 88.0, 53.0, 40.0, 19.0, 13.0, 13.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6494140625, -0.6317596435546875, -0.614105224609375, -0.5964508056640625, -0.57879638671875, -0.5611419677734375, -0.543487548828125, -0.5258331298828125, -0.5081787109375, -0.4905242919921875, -0.472869873046875, -0.4552154541015625, -0.43756103515625, -0.4199066162109375, -0.402252197265625, -0.3845977783203125, -0.366943359375, -0.3492889404296875, -0.331634521484375, -0.3139801025390625, -0.29632568359375, -0.2786712646484375, -0.261016845703125, -0.2433624267578125, -0.2257080078125, -0.2080535888671875, -0.190399169921875, -0.1727447509765625, -0.15509033203125, -0.1374359130859375, -0.119781494140625, -0.1021270751953125, -0.08447265625, -0.0668182373046875, -0.049163818359375, -0.0315093994140625, -0.01385498046875, 0.0037994384765625, 0.021453857421875, 0.0391082763671875, 0.0567626953125, 0.0744171142578125, 0.092071533203125, 0.1097259521484375, 0.12738037109375, 0.1450347900390625, 0.162689208984375, 0.1803436279296875, 0.197998046875, 0.2156524658203125, 0.233306884765625, 0.2509613037109375, 0.26861572265625, 0.2862701416015625, 0.303924560546875, 0.3215789794921875, 0.3392333984375, 0.3568878173828125, 0.374542236328125, 0.3921966552734375, 0.40985107421875, 0.4275054931640625, 0.445159912109375, 0.4628143310546875, 0.48046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 9.0, 9.0, 5.0, 9.0, 13.0, 16.0, 19.0, 16.0, 26.0, 23.0, 25.0, 37.0, 35.0, 46.0, 40.0, 38.0, 44.0, 46.0, 52.0, 41.0, 43.0, 48.0, 37.0, 40.0, 34.0, 41.0, 39.0, 26.0, 24.0, 22.0, 15.0, 14.0, 18.0, 10.0, 8.0, 8.0, 10.0, 5.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.67822265625, -0.6588134765625, -0.639404296875, -0.6199951171875, -0.6005859375, -0.5811767578125, -0.561767578125, -0.5423583984375, -0.52294921875, -0.5035400390625, -0.484130859375, -0.4647216796875, -0.4453125, -0.4259033203125, -0.406494140625, -0.3870849609375, -0.36767578125, -0.3482666015625, -0.328857421875, -0.3094482421875, -0.2900390625, -0.2706298828125, -0.251220703125, -0.2318115234375, -0.21240234375, -0.1929931640625, -0.173583984375, -0.1541748046875, -0.134765625, -0.1153564453125, -0.095947265625, -0.0765380859375, -0.05712890625, -0.0377197265625, -0.018310546875, 0.0010986328125, 0.0205078125, 0.0399169921875, 0.059326171875, 0.0787353515625, 0.09814453125, 0.1175537109375, 0.136962890625, 0.1563720703125, 0.17578125, 0.1951904296875, 0.214599609375, 0.2340087890625, 0.25341796875, 0.2728271484375, 0.292236328125, 0.3116455078125, 0.3310546875, 0.3504638671875, 0.369873046875, 0.3892822265625, 0.40869140625, 0.4281005859375, 0.447509765625, 0.4669189453125, 0.486328125, 0.5057373046875, 0.525146484375, 0.5445556640625, 0.56396484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 15.0, 21.0, 35.0, 48.0, 70.0, 119.0, 169.0, 306.0, 506.0, 971.0, 1844.0, 3608.0, 7151.0, 15089.0, 32620.0, 71192.0, 164916.0, 310309.0, 240949.0, 108055.0, 47624.0, 22055.0, 10332.0, 5025.0, 2486.0, 1335.0, 665.0, 372.0, 223.0, 140.0, 109.0, 52.0, 36.0, 36.0, 15.0, 12.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.17333984375, -0.16820335388183594, -0.16306686401367188, -0.1579303741455078, -0.15279388427734375, -0.1476573944091797, -0.14252090454101562, -0.13738441467285156, -0.1322479248046875, -0.12711143493652344, -0.12197494506835938, -0.11683845520019531, -0.11170196533203125, -0.10656547546386719, -0.10142898559570312, -0.09629249572753906, -0.091156005859375, -0.08601951599121094, -0.08088302612304688, -0.07574653625488281, -0.07061004638671875, -0.06547355651855469, -0.060337066650390625, -0.05520057678222656, -0.0500640869140625, -0.04492759704589844, -0.039791107177734375, -0.03465461730957031, -0.02951812744140625, -0.024381637573242188, -0.019245147705078125, -0.014108657836914062, -0.00897216796875, -0.0038356781005859375, 0.001300811767578125, 0.0064373016357421875, 0.01157379150390625, 0.016710281372070312, 0.021846771240234375, 0.026983261108398438, 0.0321197509765625, 0.03725624084472656, 0.042392730712890625, 0.04752922058105469, 0.05266571044921875, 0.05780220031738281, 0.06293869018554688, 0.06807518005371094, 0.073211669921875, 0.07834815979003906, 0.08348464965820312, 0.08862113952636719, 0.09375762939453125, 0.09889411926269531, 0.10403060913085938, 0.10916709899902344, 0.1143035888671875, 0.11944007873535156, 0.12457656860351562, 0.1297130584716797, 0.13484954833984375, 0.1399860382080078, 0.14512252807617188, 0.15025901794433594, 0.1553955078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 7.0, 8.0, 12.0, 13.0, 12.0, 26.0, 24.0, 68.0, 76.0, 109.0, 140.0, 146.0, 121.0, 58.0, 40.0, 34.0, 34.0, 13.0, 8.0, 8.0, 4.0, 3.0, 11.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7637691497802734e-05, -5.577504634857178e-05, -5.391240119934082e-05, -5.204975605010986e-05, -5.0187110900878906e-05, -4.832446575164795e-05, -4.646182060241699e-05, -4.4599175453186035e-05, -4.273653030395508e-05, -4.087388515472412e-05, -3.9011240005493164e-05, -3.714859485626221e-05, -3.528594970703125e-05, -3.342330455780029e-05, -3.1560659408569336e-05, -2.969801425933838e-05, -2.7835369110107422e-05, -2.5972723960876465e-05, -2.4110078811645508e-05, -2.224743366241455e-05, -2.0384788513183594e-05, -1.8522143363952637e-05, -1.665949821472168e-05, -1.4796853065490723e-05, -1.2934207916259766e-05, -1.1071562767028809e-05, -9.208917617797852e-06, -7.3462724685668945e-06, -5.4836273193359375e-06, -3.6209821701049805e-06, -1.7583370208740234e-06, 1.043081283569336e-07, 1.9669532775878906e-06, 3.829598426818848e-06, 5.692243576049805e-06, 7.554888725280762e-06, 9.417533874511719e-06, 1.1280179023742676e-05, 1.3142824172973633e-05, 1.500546932220459e-05, 1.6868114471435547e-05, 1.8730759620666504e-05, 2.059340476989746e-05, 2.2456049919128418e-05, 2.4318695068359375e-05, 2.6181340217590332e-05, 2.804398536682129e-05, 2.9906630516052246e-05, 3.17692756652832e-05, 3.363192081451416e-05, 3.549456596374512e-05, 3.7357211112976074e-05, 3.921985626220703e-05, 4.108250141143799e-05, 4.2945146560668945e-05, 4.48077917098999e-05, 4.667043685913086e-05, 4.8533082008361816e-05, 5.0395727157592773e-05, 5.225837230682373e-05, 5.412101745605469e-05, 5.5983662605285645e-05, 5.78463077545166e-05, 5.970895290374756e-05, 6.157159805297852e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 5.0, 9.0, 16.0, 24.0, 45.0, 71.0, 106.0, 164.0, 321.0, 602.0, 1084.0, 2124.0, 4580.0, 10466.0, 26325.0, 69021.0, 188991.0, 360267.0, 237548.0, 89252.0, 33358.0, 13131.0, 5726.0, 2605.0, 1170.0, 640.0, 367.0, 193.0, 135.0, 79.0, 43.0, 30.0, 21.0, 12.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.1690654754638672, -0.16271591186523438, -0.15636634826660156, -0.15001678466796875, -0.14366722106933594, -0.13731765747070312, -0.1309680938720703, -0.1246185302734375, -0.11826896667480469, -0.11191940307617188, -0.10556983947753906, -0.09922027587890625, -0.09287071228027344, -0.08652114868164062, -0.08017158508300781, -0.073822021484375, -0.06747245788574219, -0.061122894287109375, -0.05477333068847656, -0.04842376708984375, -0.04207420349121094, -0.035724639892578125, -0.029375076293945312, -0.0230255126953125, -0.016675949096679688, -0.010326385498046875, -0.0039768218994140625, 0.00237274169921875, 0.008722305297851562, 0.015071868896484375, 0.021421432495117188, 0.02777099609375, 0.03412055969238281, 0.040470123291015625, 0.04681968688964844, 0.05316925048828125, 0.05951881408691406, 0.06586837768554688, 0.07221794128417969, 0.0785675048828125, 0.08491706848144531, 0.09126663208007812, 0.09761619567871094, 0.10396575927734375, 0.11031532287597656, 0.11666488647460938, 0.12301445007324219, 0.129364013671875, 0.1357135772705078, 0.14206314086914062, 0.14841270446777344, 0.15476226806640625, 0.16111183166503906, 0.16746139526367188, 0.1738109588623047, 0.1801605224609375, 0.1865100860595703, 0.19285964965820312, 0.19920921325683594, 0.20555877685546875, 0.21190834045410156, 0.21825790405273438, 0.2246074676513672, 0.23095703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 14.0, 11.0, 21.0, 23.0, 31.0, 40.0, 52.0, 48.0, 70.0, 96.0, 100.0, 74.0, 79.0, 59.0, 38.0, 55.0, 36.0, 33.0, 26.0, 13.0, 16.0, 17.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2095947265625, -0.20334815979003906, -0.19710159301757812, -0.1908550262451172, -0.18460845947265625, -0.1783618927001953, -0.17211532592773438, -0.16586875915527344, -0.1596221923828125, -0.15337562561035156, -0.14712905883789062, -0.1408824920654297, -0.13463592529296875, -0.1283893585205078, -0.12214279174804688, -0.11589622497558594, -0.109649658203125, -0.10340309143066406, -0.09715652465820312, -0.09090995788574219, -0.08466339111328125, -0.07841682434082031, -0.07217025756835938, -0.06592369079589844, -0.0596771240234375, -0.05343055725097656, -0.047183990478515625, -0.04093742370605469, -0.03469085693359375, -0.028444290161132812, -0.022197723388671875, -0.015951156616210938, -0.00970458984375, -0.0034580230712890625, 0.002788543701171875, 0.009035110473632812, 0.01528167724609375, 0.021528244018554688, 0.027774810791015625, 0.03402137756347656, 0.0402679443359375, 0.04651451110839844, 0.052761077880859375, 0.05900764465332031, 0.06525421142578125, 0.07150077819824219, 0.07774734497070312, 0.08399391174316406, 0.090240478515625, 0.09648704528808594, 0.10273361206054688, 0.10898017883300781, 0.11522674560546875, 0.12147331237792969, 0.12771987915039062, 0.13396644592285156, 0.1402130126953125, 0.14645957946777344, 0.15270614624023438, 0.1589527130126953, 0.16519927978515625, 0.1714458465576172, 0.17769241333007812, 0.18393898010253906, 0.190185546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 11.0, 21.0, 31.0, 43.0, 71.0, 102.0, 134.0, 145.0, 135.0, 113.0, 85.0, 47.0, 20.0, 23.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9292144775390625, -2.8419816493988037, -2.754748821258545, -2.667515993118286, -2.5802831649780273, -2.4930505752563477, -2.405817747116089, -2.31858491897583, -2.2313520908355713, -2.1441192626953125, -2.0568864345550537, -1.9696537256240845, -1.8824208974838257, -1.795188069343567, -1.7079553604125977, -1.6207225322723389, -1.53348970413208, -1.4462568759918213, -1.3590240478515625, -1.2717913389205933, -1.1845585107803345, -1.0973256826400757, -1.0100929737091064, -0.9228601455688477, -0.8356273174285889, -0.7483944892883301, -0.6611617207527161, -0.573928952217102, -0.48669612407684326, -0.39946332573890686, -0.31223052740097046, -0.22499775886535645, -0.13776516914367676, -0.050532370805740356, 0.036700427532196045, 0.12393322587013245, 0.21116602420806885, 0.29839882254600525, 0.38563162088394165, 0.47286438941955566, 0.5600972175598145, 0.6473300457000732, 0.7345628142356873, 0.8217955827713013, 0.9090284109115601, 0.9962612390518188, 1.083493947982788, 1.1707267761230469, 1.2579596042633057, 1.3451924324035645, 1.4324252605438232, 1.5196579694747925, 1.6068907976150513, 1.69412362575531, 1.7813563346862793, 1.868589162826538, 1.9558219909667969, 2.0430548191070557, 2.1302876472473145, 2.2175204753875732, 2.304753303527832, 2.3919858932495117, 2.4792187213897705, 2.5664515495300293, 2.653684377670288]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 6.0, 5.0, 3.0, 12.0, 14.0, 10.0, 11.0, 15.0, 19.0, 26.0, 15.0, 24.0, 29.0, 21.0, 40.0, 37.0, 30.0, 35.0, 50.0, 44.0, 29.0, 33.0, 41.0, 39.0, 48.0, 50.0, 36.0, 33.0, 39.0, 33.0, 33.0, 17.0, 19.0, 18.0, 17.0, 8.0, 11.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4986697435379028, -1.4501937627792358, -1.4017176628112793, -1.3532416820526123, -1.3047655820846558, -1.2562896013259888, -1.2078135013580322, -1.1593375205993652, -1.1108615398406982, -1.0623855590820312, -1.0139094591140747, -0.9654334783554077, -0.9169573783874512, -0.8684813976287842, -0.8200053572654724, -0.7715293169021606, -0.7230532169342041, -0.6745771765708923, -0.6261011362075806, -0.5776251554489136, -0.529149055480957, -0.48067304491996765, -0.43219703435897827, -0.3837209939956665, -0.33524495363235474, -0.28676891326904297, -0.2382928878068924, -0.18981686234474182, -0.14134082198143005, -0.09286478161811829, -0.044388771057128906, 0.004087269306182861, 0.05256319046020508, 0.10103922337293625, 0.14951525628566742, 0.197991281747818, 0.24646732211112976, 0.29494336247444153, 0.3434193730354309, 0.3918954133987427, 0.44037145376205444, 0.4888474941253662, 0.537323534488678, 0.5857995748519897, 0.6342755556106567, 0.6827516555786133, 0.7312276363372803, 0.779703676700592, 0.8281797170639038, 0.8766557574272156, 0.9251317977905273, 0.9736077785491943, 1.0220838785171509, 1.0705598592758179, 1.1190359592437744, 1.1675119400024414, 1.2159879207611084, 1.2644639015197754, 1.312940001487732, 1.361415982246399, 1.4098920822143555, 1.4583680629730225, 1.5068440437316895, 1.555320143699646, 1.6037962436676025]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 7.0, 4.0, 13.0, 14.0, 37.0, 46.0, 86.0, 152.0, 280.0, 557.0, 1205.0, 2498.0, 5504.0, 13562.0, 34655.0, 98162.0, 333721.0, 1727240.0, 1531983.0, 299338.0, 90327.0, 32559.0, 12626.0, 5258.0, 2314.0, 1085.0, 499.0, 253.0, 144.0, 70.0, 43.0, 17.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302978515625, -0.2885246276855469, -0.27407073974609375, -0.2596168518066406, -0.2451629638671875, -0.23070907592773438, -0.21625518798828125, -0.20180130004882812, -0.187347412109375, -0.17289352416992188, -0.15843963623046875, -0.14398574829101562, -0.1295318603515625, -0.11507797241210938, -0.10062408447265625, -0.08617019653320312, -0.07171630859375, -0.057262420654296875, -0.04280853271484375, -0.028354644775390625, -0.0139007568359375, 0.000553131103515625, 0.01500701904296875, 0.029460906982421875, 0.043914794921875, 0.058368682861328125, 0.07282257080078125, 0.08727645874023438, 0.1017303466796875, 0.11618423461914062, 0.13063812255859375, 0.14509201049804688, 0.1595458984375, 0.17399978637695312, 0.18845367431640625, 0.20290756225585938, 0.2173614501953125, 0.23181533813476562, 0.24626922607421875, 0.2607231140136719, 0.275177001953125, 0.2896308898925781, 0.30408477783203125, 0.3185386657714844, 0.3329925537109375, 0.3474464416503906, 0.36190032958984375, 0.3763542175292969, 0.39080810546875, 0.4052619934082031, 0.41971588134765625, 0.4341697692871094, 0.4486236572265625, 0.4630775451660156, 0.47753143310546875, 0.4919853210449219, 0.506439208984375, 0.5208930969238281, 0.5353469848632812, 0.5498008728027344, 0.5642547607421875, 0.5787086486816406, 0.5931625366210938, 0.6076164245605469, 0.6220703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 14.0, 6.0, 8.0, 19.0, 20.0, 23.0, 32.0, 22.0, 22.0, 29.0, 28.0, 38.0, 35.0, 45.0, 52.0, 41.0, 43.0, 40.0, 37.0, 43.0, 48.0, 36.0, 33.0, 33.0, 48.0, 28.0, 23.0, 16.0, 16.0, 21.0, 17.0, 12.0, 14.0, 12.0, 9.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2109375, -0.20439720153808594, -0.19785690307617188, -0.1913166046142578, -0.18477630615234375, -0.1782360076904297, -0.17169570922851562, -0.16515541076660156, -0.1586151123046875, -0.15207481384277344, -0.14553451538085938, -0.1389942169189453, -0.13245391845703125, -0.1259136199951172, -0.11937332153320312, -0.11283302307128906, -0.106292724609375, -0.09975242614746094, -0.09321212768554688, -0.08667182922363281, -0.08013153076171875, -0.07359123229980469, -0.06705093383789062, -0.06051063537597656, -0.0539703369140625, -0.04743003845214844, -0.040889739990234375, -0.03434944152832031, -0.02780914306640625, -0.021268844604492188, -0.014728546142578125, -0.008188247680664062, -0.00164794921875, 0.0048923492431640625, 0.011432647705078125, 0.017972946166992188, 0.02451324462890625, 0.031053543090820312, 0.037593841552734375, 0.04413414001464844, 0.0506744384765625, 0.05721473693847656, 0.06375503540039062, 0.07029533386230469, 0.07683563232421875, 0.08337593078613281, 0.08991622924804688, 0.09645652770996094, 0.102996826171875, 0.10953712463378906, 0.11607742309570312, 0.12261772155761719, 0.12915802001953125, 0.1356983184814453, 0.14223861694335938, 0.14877891540527344, 0.1553192138671875, 0.16185951232910156, 0.16839981079101562, 0.1749401092529297, 0.18148040771484375, 0.1880207061767578, 0.19456100463867188, 0.20110130310058594, 0.2076416015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 12.0, 18.0, 18.0, 29.0, 39.0, 70.0, 105.0, 180.0, 260.0, 390.0, 626.0, 971.0, 1671.0, 2777.0, 4819.0, 8580.0, 15861.0, 29616.0, 58013.0, 117262.0, 255245.0, 644477.0, 1653106.0, 817601.0, 303061.0, 137127.0, 66672.0, 34300.0, 17972.0, 9854.0, 5457.0, 3173.0, 1907.0, 1157.0, 678.0, 399.0, 277.0, 176.0, 114.0, 69.0, 50.0, 28.0, 23.0, 15.0, 10.0, 9.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.309326171875, -0.2998390197753906, -0.29035186767578125, -0.2808647155761719, -0.2713775634765625, -0.2618904113769531, -0.25240325927734375, -0.24291610717773438, -0.233428955078125, -0.22394180297851562, -0.21445465087890625, -0.20496749877929688, -0.1954803466796875, -0.18599319458007812, -0.17650604248046875, -0.16701889038085938, -0.15753173828125, -0.14804458618164062, -0.13855743408203125, -0.12907028198242188, -0.1195831298828125, -0.11009597778320312, -0.10060882568359375, -0.09112167358398438, -0.081634521484375, -0.07214736938476562, -0.06266021728515625, -0.053173065185546875, -0.0436859130859375, -0.034198760986328125, -0.02471160888671875, -0.015224456787109375, -0.0057373046875, 0.003749847412109375, 0.01323699951171875, 0.022724151611328125, 0.0322113037109375, 0.041698455810546875, 0.05118560791015625, 0.060672760009765625, 0.070159912109375, 0.07964706420898438, 0.08913421630859375, 0.09862136840820312, 0.1081085205078125, 0.11759567260742188, 0.12708282470703125, 0.13656997680664062, 0.14605712890625, 0.15554428100585938, 0.16503143310546875, 0.17451858520507812, 0.1840057373046875, 0.19349288940429688, 0.20298004150390625, 0.21246719360351562, 0.221954345703125, 0.23144149780273438, 0.24092864990234375, 0.2504158020019531, 0.2599029541015625, 0.2693901062011719, 0.27887725830078125, 0.2883644104003906, 0.2978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 9.0, 4.0, 11.0, 16.0, 19.0, 14.0, 18.0, 30.0, 32.0, 44.0, 49.0, 77.0, 71.0, 124.0, 164.0, 199.0, 270.0, 383.0, 506.0, 513.0, 405.0, 242.0, 189.0, 171.0, 94.0, 106.0, 60.0, 56.0, 48.0, 24.0, 37.0, 17.0, 14.0, 11.0, 7.0, 8.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.413330078125, -0.4004058837890625, -0.387481689453125, -0.3745574951171875, -0.36163330078125, -0.3487091064453125, -0.335784912109375, -0.3228607177734375, -0.3099365234375, -0.2970123291015625, -0.284088134765625, -0.2711639404296875, -0.25823974609375, -0.2453155517578125, -0.232391357421875, -0.2194671630859375, -0.20654296875, -0.1936187744140625, -0.180694580078125, -0.1677703857421875, -0.15484619140625, -0.1419219970703125, -0.128997802734375, -0.1160736083984375, -0.1031494140625, -0.0902252197265625, -0.077301025390625, -0.0643768310546875, -0.05145263671875, -0.0385284423828125, -0.025604248046875, -0.0126800537109375, 0.000244140625, 0.0131683349609375, 0.026092529296875, 0.0390167236328125, 0.05194091796875, 0.0648651123046875, 0.077789306640625, 0.0907135009765625, 0.1036376953125, 0.1165618896484375, 0.129486083984375, 0.1424102783203125, 0.15533447265625, 0.1682586669921875, 0.181182861328125, 0.1941070556640625, 0.20703125, 0.2199554443359375, 0.232879638671875, 0.2458038330078125, 0.25872802734375, 0.2716522216796875, 0.284576416015625, 0.2975006103515625, 0.3104248046875, 0.3233489990234375, 0.336273193359375, 0.3491973876953125, 0.36212158203125, 0.3750457763671875, 0.387969970703125, 0.4008941650390625, 0.413818359375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 10.0, 19.0, 28.0, 45.0, 52.0, 71.0, 86.0, 104.0, 111.0, 108.0, 91.0, 86.0, 46.0, 41.0, 37.0, 19.0, 9.0, 13.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.197746515274048, -2.1109507083892822, -2.0241551399230957, -1.93735933303833, -1.8505635261535645, -1.7637677192687988, -1.6769720315933228, -1.5901763439178467, -1.503380537033081, -1.4165847301483154, -1.3297890424728394, -1.2429933547973633, -1.1561975479125977, -1.069401741027832, -0.982606053352356, -0.8958103060722351, -0.8090145587921143, -0.7222188115119934, -0.6354230642318726, -0.5486273169517517, -0.46183156967163086, -0.37503582239151, -0.28824007511138916, -0.2014443278312683, -0.11464858055114746, -0.02785283327102661, 0.05894291400909424, 0.1457386612892151, 0.23253440856933594, 0.3193301558494568, 0.40612590312957764, 0.4929216504096985, 0.5797173976898193, 0.6665131449699402, 0.753308892250061, 0.8401046395301819, 0.9269003868103027, 1.0136961936950684, 1.1004918813705444, 1.1872875690460205, 1.2740833759307861, 1.3608791828155518, 1.4476748704910278, 1.534470558166504, 1.6212663650512695, 1.7080621719360352, 1.7948578596115112, 1.8816535472869873, 1.968449354171753, 2.0552451610565186, 2.142040729522705, 2.2288365364074707, 2.3156323432922363, 2.402428150177002, 2.4892239570617676, 2.576019525527954, 2.6628153324127197, 2.7496111392974854, 2.836406707763672, 2.9232025146484375, 3.009998321533203, 3.0967941284179688, 3.1835899353027344, 3.270385503768921, 3.3571813106536865]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 5.0, 5.0, 11.0, 8.0, 11.0, 8.0, 13.0, 12.0, 23.0, 18.0, 18.0, 22.0, 23.0, 23.0, 38.0, 32.0, 45.0, 32.0, 36.0, 35.0, 48.0, 42.0, 39.0, 29.0, 45.0, 38.0, 30.0, 44.0, 31.0, 23.0, 30.0, 35.0, 32.0, 16.0, 10.0, 14.0, 16.0, 12.0, 8.0, 13.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4809997081756592, -1.435689091682434, -1.3903785943984985, -1.3450679779052734, -1.299757480621338, -1.2544468641281128, -1.2091363668441772, -1.1638257503509521, -1.1185152530670166, -1.0732046365737915, -1.027894139289856, -0.9825835824012756, -0.9372730255126953, -0.891962468624115, -0.8466519117355347, -0.8013412952423096, -0.7560307383537292, -0.7107201814651489, -0.6654096245765686, -0.6200990676879883, -0.574788510799408, -0.5294779539108276, -0.4841673672199249, -0.4388568103313446, -0.3935462534427643, -0.34823569655418396, -0.30292513966560364, -0.2576145529747009, -0.2123040109872818, -0.16699345409870148, -0.12168288230895996, -0.07637232542037964, -0.031061768531799316, 0.014248792082071304, 0.059559352695941925, 0.10486991703510284, 0.15018047392368317, 0.1954910308122635, 0.240801602602005, 0.2861121594905853, 0.33142271637916565, 0.37673327326774597, 0.4220438301563263, 0.467354416847229, 0.5126649737358093, 0.5579755306243896, 0.60328608751297, 0.6485966444015503, 0.6939072012901306, 0.7392177581787109, 0.7845283150672913, 0.8298388719558716, 0.8751494288444519, 0.9204599857330322, 0.9657706022262573, 1.0110810995101929, 1.056391716003418, 1.101702332496643, 1.1470128297805786, 1.1923234462738037, 1.2376339435577393, 1.2829445600509644, 1.3282550573349, 1.373565673828125, 1.4188761711120605]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 17.0, 16.0, 27.0, 35.0, 102.0, 126.0, 160.0, 256.0, 453.0, 599.0, 839.0, 1257.0, 1839.0, 2667.0, 3816.0, 5422.0, 8403.0, 13210.0, 22587.0, 44179.0, 105154.0, 257661.0, 306881.0, 143294.0, 57211.0, 27384.0, 15533.0, 9405.0, 6205.0, 4301.0, 3001.0, 2065.0, 1484.0, 967.0, 654.0, 496.0, 284.0, 195.0, 130.0, 77.0, 53.0, 46.0, 28.0, 9.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0], "bins": [-0.44775390625, -0.43537139892578125, -0.4229888916015625, -0.41060638427734375, -0.398223876953125, -0.38584136962890625, -0.3734588623046875, -0.36107635498046875, -0.34869384765625, -0.33631134033203125, -0.3239288330078125, -0.31154632568359375, -0.299163818359375, -0.28678131103515625, -0.2743988037109375, -0.26201629638671875, -0.2496337890625, -0.23725128173828125, -0.2248687744140625, -0.21248626708984375, -0.200103759765625, -0.18772125244140625, -0.1753387451171875, -0.16295623779296875, -0.15057373046875, -0.13819122314453125, -0.1258087158203125, -0.11342620849609375, -0.101043701171875, -0.08866119384765625, -0.0762786865234375, -0.06389617919921875, -0.051513671875, -0.03913116455078125, -0.0267486572265625, -0.01436614990234375, -0.001983642578125, 0.01039886474609375, 0.0227813720703125, 0.03516387939453125, 0.04754638671875, 0.05992889404296875, 0.0723114013671875, 0.08469390869140625, 0.097076416015625, 0.10945892333984375, 0.1218414306640625, 0.13422393798828125, 0.1466064453125, 0.15898895263671875, 0.1713714599609375, 0.18375396728515625, 0.196136474609375, 0.20851898193359375, 0.2209014892578125, 0.23328399658203125, 0.24566650390625, 0.25804901123046875, 0.2704315185546875, 0.28281402587890625, 0.295196533203125, 0.30757904052734375, 0.3199615478515625, 0.33234405517578125, 0.3447265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 12.0, 7.0, 8.0, 10.0, 8.0, 18.0, 18.0, 18.0, 22.0, 19.0, 24.0, 38.0, 35.0, 33.0, 38.0, 37.0, 35.0, 42.0, 35.0, 30.0, 39.0, 42.0, 40.0, 39.0, 49.0, 35.0, 37.0, 36.0, 28.0, 20.0, 26.0, 27.0, 18.0, 15.0, 17.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19839096069335938, -0.19194793701171875, -0.18550491333007812, -0.1790618896484375, -0.17261886596679688, -0.16617584228515625, -0.15973281860351562, -0.153289794921875, -0.14684677124023438, -0.14040374755859375, -0.13396072387695312, -0.1275177001953125, -0.12107467651367188, -0.11463165283203125, -0.10818862915039062, -0.10174560546875, -0.09530258178710938, -0.08885955810546875, -0.08241653442382812, -0.0759735107421875, -0.06953048706054688, -0.06308746337890625, -0.056644439697265625, -0.050201416015625, -0.043758392333984375, -0.03731536865234375, -0.030872344970703125, -0.0244293212890625, -0.017986297607421875, -0.01154327392578125, -0.005100250244140625, 0.0013427734375, 0.007785797119140625, 0.01422882080078125, 0.020671844482421875, 0.0271148681640625, 0.033557891845703125, 0.04000091552734375, 0.046443939208984375, 0.052886962890625, 0.059329986572265625, 0.06577301025390625, 0.07221603393554688, 0.0786590576171875, 0.08510208129882812, 0.09154510498046875, 0.09798812866210938, 0.10443115234375, 0.11087417602539062, 0.11731719970703125, 0.12376022338867188, 0.1302032470703125, 0.13664627075195312, 0.14308929443359375, 0.14953231811523438, 0.155975341796875, 0.16241836547851562, 0.16886138916015625, 0.17530441284179688, 0.1817474365234375, 0.18819046020507812, 0.19463348388671875, 0.20107650756835938, 0.20751953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 13.0, 17.0, 17.0, 38.0, 58.0, 81.0, 109.0, 182.0, 262.0, 545.0, 1092.0, 2226.0, 4922.0, 11396.0, 25914.0, 68499.0, 267720.0, 464745.0, 128306.0, 41023.0, 17099.0, 7417.0, 3465.0, 1575.0, 760.0, 390.0, 200.0, 141.0, 88.0, 64.0, 52.0, 27.0, 25.0, 14.0, 21.0, 7.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6865005493164062, -0.6664581298828125, -0.6464157104492188, -0.626373291015625, -0.6063308715820312, -0.5862884521484375, -0.5662460327148438, -0.54620361328125, -0.5261611938476562, -0.5061187744140625, -0.48607635498046875, -0.466033935546875, -0.44599151611328125, -0.4259490966796875, -0.40590667724609375, -0.3858642578125, -0.36582183837890625, -0.3457794189453125, -0.32573699951171875, -0.305694580078125, -0.28565216064453125, -0.2656097412109375, -0.24556732177734375, -0.22552490234375, -0.20548248291015625, -0.1854400634765625, -0.16539764404296875, -0.145355224609375, -0.12531280517578125, -0.1052703857421875, -0.08522796630859375, -0.065185546875, -0.04514312744140625, -0.0251007080078125, -0.00505828857421875, 0.014984130859375, 0.03502655029296875, 0.0550689697265625, 0.07511138916015625, 0.09515380859375, 0.11519622802734375, 0.1352386474609375, 0.15528106689453125, 0.175323486328125, 0.19536590576171875, 0.2154083251953125, 0.23545074462890625, 0.2554931640625, 0.27553558349609375, 0.2955780029296875, 0.31562042236328125, 0.335662841796875, 0.35570526123046875, 0.3757476806640625, 0.39579010009765625, 0.41583251953125, 0.43587493896484375, 0.4559173583984375, 0.47595977783203125, 0.496002197265625, 0.5160446166992188, 0.5360870361328125, 0.5561294555664062, 0.576171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 7.0, 6.0, 6.0, 9.0, 9.0, 12.0, 10.0, 17.0, 25.0, 35.0, 27.0, 40.0, 28.0, 32.0, 34.0, 31.0, 56.0, 42.0, 46.0, 32.0, 44.0, 42.0, 38.0, 42.0, 47.0, 28.0, 35.0, 34.0, 36.0, 16.0, 23.0, 16.0, 19.0, 12.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 2.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.5565032958984375, -0.537322998046875, -0.5181427001953125, -0.49896240234375, -0.4797821044921875, -0.460601806640625, -0.4414215087890625, -0.4222412109375, -0.4030609130859375, -0.383880615234375, -0.3647003173828125, -0.34552001953125, -0.3263397216796875, -0.307159423828125, -0.2879791259765625, -0.268798828125, -0.2496185302734375, -0.230438232421875, -0.2112579345703125, -0.19207763671875, -0.1728973388671875, -0.153717041015625, -0.1345367431640625, -0.1153564453125, -0.0961761474609375, -0.076995849609375, -0.0578155517578125, -0.03863525390625, -0.0194549560546875, -0.000274658203125, 0.0189056396484375, 0.0380859375, 0.0572662353515625, 0.076446533203125, 0.0956268310546875, 0.11480712890625, 0.1339874267578125, 0.153167724609375, 0.1723480224609375, 0.1915283203125, 0.2107086181640625, 0.229888916015625, 0.2490692138671875, 0.26824951171875, 0.2874298095703125, 0.306610107421875, 0.3257904052734375, 0.344970703125, 0.3641510009765625, 0.383331298828125, 0.4025115966796875, 0.42169189453125, 0.4408721923828125, 0.460052490234375, 0.4792327880859375, 0.4984130859375, 0.5175933837890625, 0.536773681640625, 0.5559539794921875, 0.57513427734375, 0.5943145751953125, 0.613494873046875, 0.6326751708984375, 0.65185546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 4.0, 16.0, 20.0, 29.0, 27.0, 45.0, 82.0, 121.0, 195.0, 310.0, 516.0, 858.0, 1359.0, 2040.0, 3258.0, 5313.0, 9259.0, 17039.0, 36104.0, 83861.0, 212199.0, 337122.0, 191449.0, 76356.0, 33076.0, 15713.0, 8600.0, 5079.0, 3124.0, 2031.0, 1239.0, 742.0, 506.0, 293.0, 187.0, 126.0, 87.0, 57.0, 29.0, 21.0, 13.0, 14.0, 3.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.144775390625, -0.14017105102539062, -0.13556671142578125, -0.13096237182617188, -0.1263580322265625, -0.12175369262695312, -0.11714935302734375, -0.11254501342773438, -0.107940673828125, -0.10333633422851562, -0.09873199462890625, -0.09412765502929688, -0.0895233154296875, -0.08491897583007812, -0.08031463623046875, -0.07571029663085938, -0.07110595703125, -0.06650161743164062, -0.06189727783203125, -0.057292938232421875, -0.0526885986328125, -0.048084259033203125, -0.04347991943359375, -0.038875579833984375, -0.034271240234375, -0.029666900634765625, -0.02506256103515625, -0.020458221435546875, -0.0158538818359375, -0.011249542236328125, -0.00664520263671875, -0.002040863037109375, 0.0025634765625, 0.007167816162109375, 0.01177215576171875, 0.016376495361328125, 0.0209808349609375, 0.025585174560546875, 0.03018951416015625, 0.034793853759765625, 0.039398193359375, 0.044002532958984375, 0.04860687255859375, 0.053211212158203125, 0.0578155517578125, 0.062419891357421875, 0.06702423095703125, 0.07162857055664062, 0.07623291015625, 0.08083724975585938, 0.08544158935546875, 0.09004592895507812, 0.0946502685546875, 0.09925460815429688, 0.10385894775390625, 0.10846328735351562, 0.113067626953125, 0.11767196655273438, 0.12227630615234375, 0.12688064575195312, 0.1314849853515625, 0.13608932495117188, 0.14069366455078125, 0.14529800415039062, 0.14990234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 30.0, 21.0, 42.0, 70.0, 155.0, 250.0, 184.0, 83.0, 39.0, 31.0, 9.0, 11.0, 10.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.202957153320312e-05, -8.91275703907013e-05, -8.622556924819946e-05, -8.332356810569763e-05, -8.04215669631958e-05, -7.751956582069397e-05, -7.461756467819214e-05, -7.171556353569031e-05, -6.881356239318848e-05, -6.591156125068665e-05, -6.300956010818481e-05, -6.0107558965682983e-05, -5.720555782318115e-05, -5.430355668067932e-05, -5.140155553817749e-05, -4.849955439567566e-05, -4.559755325317383e-05, -4.2695552110672e-05, -3.9793550968170166e-05, -3.6891549825668335e-05, -3.3989548683166504e-05, -3.108754754066467e-05, -2.8185546398162842e-05, -2.528354525566101e-05, -2.238154411315918e-05, -1.947954297065735e-05, -1.6577541828155518e-05, -1.3675540685653687e-05, -1.0773539543151855e-05, -7.871538400650024e-06, -4.969537258148193e-06, -2.0675361156463623e-06, 8.344650268554688e-07, 3.7364661693573e-06, 6.638467311859131e-06, 9.540468454360962e-06, 1.2442469596862793e-05, 1.5344470739364624e-05, 1.8246471881866455e-05, 2.1148473024368286e-05, 2.4050474166870117e-05, 2.6952475309371948e-05, 2.985447645187378e-05, 3.275647759437561e-05, 3.565847873687744e-05, 3.856047987937927e-05, 4.1462481021881104e-05, 4.4364482164382935e-05, 4.7266483306884766e-05, 5.01684844493866e-05, 5.307048559188843e-05, 5.597248673439026e-05, 5.887448787689209e-05, 6.177648901939392e-05, 6.467849016189575e-05, 6.758049130439758e-05, 7.048249244689941e-05, 7.338449358940125e-05, 7.628649473190308e-05, 7.918849587440491e-05, 8.209049701690674e-05, 8.499249815940857e-05, 8.78944993019104e-05, 9.079650044441223e-05, 9.369850158691406e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 1.0, 5.0, 9.0, 10.0, 15.0, 10.0, 16.0, 23.0, 28.0, 45.0, 59.0, 73.0, 121.0, 222.0, 339.0, 531.0, 980.0, 1841.0, 3415.0, 6898.0, 13962.0, 31131.0, 75787.0, 187912.0, 323670.0, 230435.0, 97139.0, 39221.0, 17121.0, 8376.0, 4085.0, 2181.0, 1113.0, 680.0, 394.0, 243.0, 144.0, 90.0, 72.0, 40.0, 38.0, 22.0, 21.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1424560546875, -0.13780593872070312, -0.13315582275390625, -0.12850570678710938, -0.1238555908203125, -0.11920547485351562, -0.11455535888671875, -0.10990524291992188, -0.105255126953125, -0.10060501098632812, -0.09595489501953125, -0.09130477905273438, -0.0866546630859375, -0.08200454711914062, -0.07735443115234375, -0.07270431518554688, -0.06805419921875, -0.06340408325195312, -0.05875396728515625, -0.054103851318359375, -0.0494537353515625, -0.044803619384765625, -0.04015350341796875, -0.035503387451171875, -0.030853271484375, -0.026203155517578125, -0.02155303955078125, -0.016902923583984375, -0.0122528076171875, -0.007602691650390625, -0.00295257568359375, 0.001697540283203125, 0.00634765625, 0.010997772216796875, 0.01564788818359375, 0.020298004150390625, 0.0249481201171875, 0.029598236083984375, 0.03424835205078125, 0.038898468017578125, 0.043548583984375, 0.048198699951171875, 0.05284881591796875, 0.057498931884765625, 0.0621490478515625, 0.06679916381835938, 0.07144927978515625, 0.07609939575195312, 0.08074951171875, 0.08539962768554688, 0.09004974365234375, 0.09469985961914062, 0.0993499755859375, 0.10400009155273438, 0.10865020751953125, 0.11330032348632812, 0.117950439453125, 0.12260055541992188, 0.12725067138671875, 0.13190078735351562, 0.1365509033203125, 0.14120101928710938, 0.14585113525390625, 0.15050125122070312, 0.1551513671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 10.0, 15.0, 14.0, 11.0, 23.0, 35.0, 36.0, 48.0, 77.0, 83.0, 107.0, 107.0, 93.0, 84.0, 61.0, 53.0, 37.0, 24.0, 14.0, 22.0, 9.0, 9.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.20372772216796875, -0.1971282958984375, -0.19052886962890625, -0.183929443359375, -0.17733001708984375, -0.1707305908203125, -0.16413116455078125, -0.15753173828125, -0.15093231201171875, -0.1443328857421875, -0.13773345947265625, -0.131134033203125, -0.12453460693359375, -0.1179351806640625, -0.11133575439453125, -0.104736328125, -0.09813690185546875, -0.0915374755859375, -0.08493804931640625, -0.078338623046875, -0.07173919677734375, -0.0651397705078125, -0.05854034423828125, -0.05194091796875, -0.04534149169921875, -0.0387420654296875, -0.03214263916015625, -0.025543212890625, -0.01894378662109375, -0.0123443603515625, -0.00574493408203125, 0.0008544921875, 0.00745391845703125, 0.0140533447265625, 0.02065277099609375, 0.027252197265625, 0.03385162353515625, 0.0404510498046875, 0.04705047607421875, 0.05364990234375, 0.06024932861328125, 0.0668487548828125, 0.07344818115234375, 0.080047607421875, 0.08664703369140625, 0.0932464599609375, 0.09984588623046875, 0.1064453125, 0.11304473876953125, 0.1196441650390625, 0.12624359130859375, 0.132843017578125, 0.13944244384765625, 0.1460418701171875, 0.15264129638671875, 0.15924072265625, 0.16584014892578125, 0.1724395751953125, 0.17903900146484375, 0.185638427734375, 0.19223785400390625, 0.1988372802734375, 0.20543670654296875, 0.2120361328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 17.0, 21.0, 33.0, 51.0, 68.0, 88.0, 70.0, 81.0, 103.0, 79.0, 90.0, 81.0, 56.0, 42.0, 36.0, 25.0, 11.0, 12.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.058450222015381, -1.9919641017913818, -1.9254779815673828, -1.8589919805526733, -1.7925058603286743, -1.7260197401046753, -1.6595337390899658, -1.5930476188659668, -1.5265614986419678, -1.4600753784179688, -1.3935892581939697, -1.3271032571792603, -1.2606171369552612, -1.1941310167312622, -1.1276450157165527, -1.0611588954925537, -0.9946727752685547, -0.9281866550445557, -0.8617005944252014, -0.7952145338058472, -0.7287284135818481, -0.6622422933578491, -0.5957562327384949, -0.5292701721191406, -0.4627840518951416, -0.39629796147346497, -0.32981187105178833, -0.2633257806301117, -0.19683969020843506, -0.13035359978675842, -0.06386750936508179, 0.0026185810565948486, 0.06910467147827148, 0.13559076189994812, 0.20207685232162476, 0.2685629427433014, 0.335049033164978, 0.40153512358665466, 0.4680212140083313, 0.5345072746276855, 0.6009933948516846, 0.6674795150756836, 0.7339655756950378, 0.8004516363143921, 0.8669377565383911, 0.9334238767623901, 0.9999099373817444, 1.0663959980010986, 1.1328821182250977, 1.1993682384490967, 1.2658543586730957, 1.3323403596878052, 1.3988264799118042, 1.4653126001358032, 1.5317986011505127, 1.5982847213745117, 1.6647708415985107, 1.7312569618225098, 1.7977430820465088, 1.8642290830612183, 1.9307152032852173, 1.9972013235092163, 2.063687324523926, 2.130173444747925, 2.196659564971924]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 8.0, 5.0, 11.0, 12.0, 7.0, 16.0, 19.0, 16.0, 17.0, 17.0, 19.0, 25.0, 37.0, 28.0, 30.0, 45.0, 31.0, 40.0, 43.0, 38.0, 60.0, 50.0, 38.0, 35.0, 35.0, 43.0, 35.0, 33.0, 24.0, 28.0, 29.0, 20.0, 16.0, 18.0, 12.0, 7.0, 9.0, 7.0, 6.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4276683330535889, -1.3805620670318604, -1.3334559202194214, -1.2863496541976929, -1.2392433881759644, -1.1921372413635254, -1.1450309753417969, -1.0979247093200684, -1.0508184432983398, -1.0037121772766113, -0.9566059708595276, -0.9094997644424438, -0.8623934984207153, -0.8152872920036316, -0.7681810855865479, -0.7210748195648193, -0.6739686727523804, -0.6268624663352966, -0.5797562003135681, -0.5326499938964844, -0.48554375767707825, -0.4384375214576721, -0.3913313150405884, -0.34422507882118225, -0.2971188426017761, -0.25001260638237, -0.20290638506412506, -0.15580016374588013, -0.108693927526474, -0.06158769130706787, -0.01448148488998413, 0.032624751329422, 0.07973098754882812, 0.12683722376823425, 0.1739434450864792, 0.22104966640472412, 0.26815590262413025, 0.3152621388435364, 0.3623683452606201, 0.40947458148002625, 0.4565808176994324, 0.5036870241165161, 0.5507932901382446, 0.5978994965553284, 0.6450057029724121, 0.6921119689941406, 0.7392181754112244, 0.7863243818283081, 0.8334306478500366, 0.8805368542671204, 0.9276431202888489, 0.9747493267059326, 1.0218555927276611, 1.0689618587493896, 1.1160680055618286, 1.1631742715835571, 1.210280418395996, 1.2573866844177246, 1.3044928312301636, 1.351599097251892, 1.3987053632736206, 1.4458115100860596, 1.492917776107788, 1.5400240421295166, 1.5871303081512451]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 20.0, 37.0, 54.0, 78.0, 154.0, 236.0, 414.0, 867.0, 1632.0, 3209.0, 7231.0, 16718.0, 40968.0, 108778.0, 354673.0, 1707446.0, 1481594.0, 307568.0, 97087.0, 37012.0, 15480.0, 6618.0, 3043.0, 1526.0, 821.0, 437.0, 217.0, 124.0, 79.0, 55.0, 40.0, 25.0, 6.0, 11.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.266845703125, -0.2546882629394531, -0.24253082275390625, -0.23037338256835938, -0.2182159423828125, -0.20605850219726562, -0.19390106201171875, -0.18174362182617188, -0.169586181640625, -0.15742874145507812, -0.14527130126953125, -0.13311386108398438, -0.1209564208984375, -0.10879898071289062, -0.09664154052734375, -0.08448410034179688, -0.07232666015625, -0.060169219970703125, -0.04801177978515625, -0.035854339599609375, -0.0236968994140625, -0.011539459228515625, 0.00061798095703125, 0.012775421142578125, 0.024932861328125, 0.037090301513671875, 0.04924774169921875, 0.061405181884765625, 0.0735626220703125, 0.08572006225585938, 0.09787750244140625, 0.11003494262695312, 0.1221923828125, 0.13434982299804688, 0.14650726318359375, 0.15866470336914062, 0.1708221435546875, 0.18297958374023438, 0.19513702392578125, 0.20729446411132812, 0.219451904296875, 0.23160934448242188, 0.24376678466796875, 0.2559242248535156, 0.2680816650390625, 0.2802391052246094, 0.29239654541015625, 0.3045539855957031, 0.31671142578125, 0.3288688659667969, 0.34102630615234375, 0.3531837463378906, 0.3653411865234375, 0.3774986267089844, 0.38965606689453125, 0.4018135070800781, 0.413970947265625, 0.4261283874511719, 0.43828582763671875, 0.4504432678222656, 0.4626007080078125, 0.4747581481933594, 0.48691558837890625, 0.4990730285644531, 0.51123046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 4.0, 11.0, 7.0, 13.0, 11.0, 15.0, 11.0, 17.0, 15.0, 22.0, 23.0, 22.0, 19.0, 34.0, 36.0, 39.0, 41.0, 29.0, 45.0, 41.0, 38.0, 32.0, 44.0, 39.0, 48.0, 34.0, 34.0, 33.0, 20.0, 24.0, 20.0, 23.0, 28.0, 16.0, 12.0, 17.0, 19.0, 6.0, 11.0, 12.0, 7.0, 6.0, 4.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.16796875, -0.16219329833984375, -0.1564178466796875, -0.15064239501953125, -0.144866943359375, -0.13909149169921875, -0.1333160400390625, -0.12754058837890625, -0.12176513671875, -0.11598968505859375, -0.1102142333984375, -0.10443878173828125, -0.098663330078125, -0.09288787841796875, -0.0871124267578125, -0.08133697509765625, -0.0755615234375, -0.06978607177734375, -0.0640106201171875, -0.05823516845703125, -0.052459716796875, -0.04668426513671875, -0.0409088134765625, -0.03513336181640625, -0.02935791015625, -0.02358245849609375, -0.0178070068359375, -0.01203155517578125, -0.006256103515625, -0.00048065185546875, 0.0052947998046875, 0.01107025146484375, 0.016845703125, 0.02262115478515625, 0.0283966064453125, 0.03417205810546875, 0.039947509765625, 0.04572296142578125, 0.0514984130859375, 0.05727386474609375, 0.06304931640625, 0.06882476806640625, 0.0746002197265625, 0.08037567138671875, 0.086151123046875, 0.09192657470703125, 0.0977020263671875, 0.10347747802734375, 0.1092529296875, 0.11502838134765625, 0.1208038330078125, 0.12657928466796875, 0.132354736328125, 0.13813018798828125, 0.1439056396484375, 0.14968109130859375, 0.15545654296875, 0.16123199462890625, 0.1670074462890625, 0.17278289794921875, 0.178558349609375, 0.18433380126953125, 0.1901092529296875, 0.19588470458984375, 0.20166015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 17.0, 24.0, 35.0, 54.0, 105.0, 127.0, 229.0, 355.0, 601.0, 1220.0, 2417.0, 5924.0, 15520.0, 46205.0, 153358.0, 692175.0, 2538330.0, 544356.0, 129757.0, 39734.0, 13636.0, 5265.0, 2297.0, 1114.0, 562.0, 328.0, 205.0, 114.0, 89.0, 37.0, 28.0, 24.0, 6.0, 6.0, 4.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.56982421875, -0.5527801513671875, -0.535736083984375, -0.5186920166015625, -0.50164794921875, -0.4846038818359375, -0.467559814453125, -0.4505157470703125, -0.4334716796875, -0.4164276123046875, -0.399383544921875, -0.3823394775390625, -0.36529541015625, -0.3482513427734375, -0.331207275390625, -0.3141632080078125, -0.297119140625, -0.2800750732421875, -0.263031005859375, -0.2459869384765625, -0.22894287109375, -0.2118988037109375, -0.194854736328125, -0.1778106689453125, -0.1607666015625, -0.1437225341796875, -0.126678466796875, -0.1096343994140625, -0.09259033203125, -0.0755462646484375, -0.058502197265625, -0.0414581298828125, -0.0244140625, -0.0073699951171875, 0.009674072265625, 0.0267181396484375, 0.04376220703125, 0.0608062744140625, 0.077850341796875, 0.0948944091796875, 0.1119384765625, 0.1289825439453125, 0.146026611328125, 0.1630706787109375, 0.18011474609375, 0.1971588134765625, 0.214202880859375, 0.2312469482421875, 0.248291015625, 0.2653350830078125, 0.282379150390625, 0.2994232177734375, 0.31646728515625, 0.3335113525390625, 0.350555419921875, 0.3675994873046875, 0.3846435546875, 0.4016876220703125, 0.418731689453125, 0.4357757568359375, 0.45281982421875, 0.4698638916015625, 0.486907958984375, 0.5039520263671875, 0.52099609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 6.0, 13.0, 13.0, 19.0, 24.0, 34.0, 49.0, 61.0, 64.0, 88.0, 148.0, 188.0, 308.0, 465.0, 628.0, 626.0, 378.0, 262.0, 156.0, 126.0, 100.0, 77.0, 56.0, 31.0, 31.0, 26.0, 16.0, 13.0, 13.0, 12.0, 6.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.552734375, -0.536865234375, -0.52099609375, -0.505126953125, -0.4892578125, -0.473388671875, -0.45751953125, -0.441650390625, -0.42578125, -0.409912109375, -0.39404296875, -0.378173828125, -0.3623046875, -0.346435546875, -0.33056640625, -0.314697265625, -0.298828125, -0.282958984375, -0.26708984375, -0.251220703125, -0.2353515625, -0.219482421875, -0.20361328125, -0.187744140625, -0.171875, -0.156005859375, -0.14013671875, -0.124267578125, -0.1083984375, -0.092529296875, -0.07666015625, -0.060791015625, -0.044921875, -0.029052734375, -0.01318359375, 0.002685546875, 0.0185546875, 0.034423828125, 0.05029296875, 0.066162109375, 0.08203125, 0.097900390625, 0.11376953125, 0.129638671875, 0.1455078125, 0.161376953125, 0.17724609375, 0.193115234375, 0.208984375, 0.224853515625, 0.24072265625, 0.256591796875, 0.2724609375, 0.288330078125, 0.30419921875, 0.320068359375, 0.3359375, 0.351806640625, 0.36767578125, 0.383544921875, 0.3994140625, 0.415283203125, 0.43115234375, 0.447021484375, 0.462890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 18.0, 30.0, 64.0, 92.0, 136.0, 153.0, 153.0, 141.0, 89.0, 50.0, 33.0, 19.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.621156692504883, -5.490445613861084, -5.359734535217285, -5.229023456573486, -5.0983123779296875, -4.967601776123047, -4.83689022064209, -4.706179618835449, -4.57546854019165, -4.444757461547852, -4.314046382904053, -4.183335304260254, -4.052624225616455, -3.9219133853912354, -3.7912023067474365, -3.6604912281036377, -3.529780149459839, -3.39906907081604, -3.268357992172241, -3.1376471519470215, -3.0069360733032227, -2.876224994659424, -2.745513916015625, -2.614802837371826, -2.4840917587280273, -2.3533806800842285, -2.2226696014404297, -2.091958522796631, -1.9612476825714111, -1.8305366039276123, -1.6998255252838135, -1.5691144466400146, -1.4384033679962158, -1.307692289352417, -1.1769813299179077, -1.0462702512741089, -0.9155592322349548, -0.7848482131958008, -0.654137134552002, -0.5234261155128479, -0.39271509647369385, -0.2620040774345398, -0.13129302859306335, -0.0005819797515869141, 0.13012903928756714, 0.2608400583267212, 0.39155113697052, 0.5222621560096741, 0.6529731750488281, 0.7836841940879822, 0.9143952131271362, 1.045106291770935, 1.1758172512054443, 1.3065283298492432, 1.437239408493042, 1.5679504871368408, 1.69866144657135, 1.829372525215149, 1.9600834846496582, 2.090794563293457, 2.221505641937256, 2.3522167205810547, 2.4829277992248535, 2.6136386394500732, 2.744349718093872]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 9.0, 7.0, 7.0, 11.0, 7.0, 12.0, 14.0, 18.0, 19.0, 31.0, 28.0, 28.0, 28.0, 27.0, 43.0, 46.0, 43.0, 45.0, 51.0, 35.0, 29.0, 42.0, 42.0, 53.0, 34.0, 43.0, 39.0, 32.0, 33.0, 14.0, 21.0, 14.0, 12.0, 15.0, 6.0, 19.0, 9.0, 8.0, 11.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5673120021820068, -1.5174849033355713, -1.4676578044891357, -1.4178305864334106, -1.368003487586975, -1.3181763887405396, -1.2683491706848145, -1.218522071838379, -1.1686949729919434, -1.1188678741455078, -1.0690407752990723, -1.0192135572433472, -0.9693864583969116, -0.9195593595504761, -0.8697322010993958, -0.8199050426483154, -0.7700779438018799, -0.7202508449554443, -0.670423686504364, -0.6205965280532837, -0.5707694292068481, -0.5209423303604126, -0.4711151719093323, -0.42128804326057434, -0.3714609146118164, -0.32163378596305847, -0.27180665731430054, -0.2219795286655426, -0.17215240001678467, -0.12232527136802673, -0.0724981427192688, -0.022671014070510864, 0.02715611457824707, 0.076983243227005, 0.12681037187576294, 0.17663750052452087, 0.2264646291732788, 0.27629175782203674, 0.3261188864707947, 0.3759460151195526, 0.42577314376831055, 0.4756002724170685, 0.5254274010658264, 0.5752545595169067, 0.6250816583633423, 0.6749087572097778, 0.7247359156608582, 0.7745630741119385, 0.824390172958374, 0.8742172718048096, 0.9240444302558899, 0.9738715887069702, 1.0236986875534058, 1.0735257863998413, 1.1233530044555664, 1.173180103302002, 1.2230072021484375, 1.272834300994873, 1.3226613998413086, 1.3724886178970337, 1.4223157167434692, 1.4721428155899048, 1.5219700336456299, 1.5717971324920654, 1.621624231338501]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 9.0, 11.0, 20.0, 34.0, 46.0, 87.0, 126.0, 215.0, 285.0, 535.0, 816.0, 1253.0, 2042.0, 2976.0, 4698.0, 7168.0, 11502.0, 18714.0, 33136.0, 68169.0, 162104.0, 296028.0, 230345.0, 100438.0, 45011.0, 23682.0, 14027.0, 9014.0, 5738.0, 3733.0, 2395.0, 1554.0, 947.0, 608.0, 437.0, 244.0, 166.0, 96.0, 66.0, 29.0, 11.0, 17.0, 9.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34375, -0.3317832946777344, -0.31981658935546875, -0.3078498840332031, -0.2958831787109375, -0.2839164733886719, -0.27194976806640625, -0.2599830627441406, -0.248016357421875, -0.23604965209960938, -0.22408294677734375, -0.21211624145507812, -0.2001495361328125, -0.18818283081054688, -0.17621612548828125, -0.16424942016601562, -0.15228271484375, -0.14031600952148438, -0.12834930419921875, -0.11638259887695312, -0.1044158935546875, -0.09244918823242188, -0.08048248291015625, -0.06851577758789062, -0.056549072265625, -0.044582366943359375, -0.03261566162109375, -0.020648956298828125, -0.0086822509765625, 0.003284454345703125, 0.01525115966796875, 0.027217864990234375, 0.0391845703125, 0.051151275634765625, 0.06311798095703125, 0.07508468627929688, 0.0870513916015625, 0.09901809692382812, 0.11098480224609375, 0.12295150756835938, 0.134918212890625, 0.14688491821289062, 0.15885162353515625, 0.17081832885742188, 0.1827850341796875, 0.19475173950195312, 0.20671844482421875, 0.21868515014648438, 0.23065185546875, 0.24261856079101562, 0.25458526611328125, 0.2665519714355469, 0.2785186767578125, 0.2904853820800781, 0.30245208740234375, 0.3144187927246094, 0.326385498046875, 0.3383522033691406, 0.35031890869140625, 0.3622856140136719, 0.3742523193359375, 0.3862190246582031, 0.39818572998046875, 0.4101524353027344, 0.422119140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 11.0, 16.0, 14.0, 18.0, 16.0, 21.0, 21.0, 26.0, 26.0, 33.0, 33.0, 37.0, 42.0, 42.0, 33.0, 43.0, 36.0, 45.0, 42.0, 41.0, 39.0, 44.0, 36.0, 35.0, 30.0, 27.0, 25.0, 27.0, 17.0, 16.0, 16.0, 16.0, 16.0, 8.0, 6.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2113037109375, -0.2046833038330078, -0.19806289672851562, -0.19144248962402344, -0.18482208251953125, -0.17820167541503906, -0.17158126831054688, -0.1649608612060547, -0.1583404541015625, -0.1517200469970703, -0.14509963989257812, -0.13847923278808594, -0.13185882568359375, -0.12523841857910156, -0.11861801147460938, -0.11199760437011719, -0.105377197265625, -0.09875679016113281, -0.09213638305664062, -0.08551597595214844, -0.07889556884765625, -0.07227516174316406, -0.06565475463867188, -0.05903434753417969, -0.0524139404296875, -0.04579353332519531, -0.039173126220703125, -0.03255271911621094, -0.02593231201171875, -0.019311904907226562, -0.012691497802734375, -0.0060710906982421875, 0.00054931640625, 0.0071697235107421875, 0.013790130615234375, 0.020410537719726562, 0.02703094482421875, 0.03365135192871094, 0.040271759033203125, 0.04689216613769531, 0.0535125732421875, 0.06013298034667969, 0.06675338745117188, 0.07337379455566406, 0.07999420166015625, 0.08661460876464844, 0.09323501586914062, 0.09985542297363281, 0.106475830078125, 0.11309623718261719, 0.11971664428710938, 0.12633705139160156, 0.13295745849609375, 0.13957786560058594, 0.14619827270507812, 0.1528186798095703, 0.1594390869140625, 0.1660594940185547, 0.17267990112304688, 0.17930030822753906, 0.18592071533203125, 0.19254112243652344, 0.19916152954101562, 0.2057819366455078, 0.21240234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 7.0, 7.0, 8.0, 11.0, 10.0, 18.0, 37.0, 25.0, 50.0, 63.0, 90.0, 128.0, 208.0, 345.0, 627.0, 1252.0, 2535.0, 5695.0, 13849.0, 36563.0, 121051.0, 476892.0, 281936.0, 66568.0, 23310.0, 9378.0, 3973.0, 1796.0, 877.0, 463.0, 259.0, 166.0, 102.0, 66.0, 49.0, 38.0, 28.0, 25.0, 13.0, 19.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.8447265625, -0.8217544555664062, -0.7987823486328125, -0.7758102416992188, -0.752838134765625, -0.7298660278320312, -0.7068939208984375, -0.6839218139648438, -0.66094970703125, -0.6379776000976562, -0.6150054931640625, -0.5920333862304688, -0.569061279296875, -0.5460891723632812, -0.5231170654296875, -0.5001449584960938, -0.4771728515625, -0.45420074462890625, -0.4312286376953125, -0.40825653076171875, -0.385284423828125, -0.36231231689453125, -0.3393402099609375, -0.31636810302734375, -0.29339599609375, -0.27042388916015625, -0.2474517822265625, -0.22447967529296875, -0.201507568359375, -0.17853546142578125, -0.1555633544921875, -0.13259124755859375, -0.109619140625, -0.08664703369140625, -0.0636749267578125, -0.04070281982421875, -0.017730712890625, 0.00524139404296875, 0.0282135009765625, 0.05118560791015625, 0.07415771484375, 0.09712982177734375, 0.1201019287109375, 0.14307403564453125, 0.166046142578125, 0.18901824951171875, 0.2119903564453125, 0.23496246337890625, 0.2579345703125, 0.28090667724609375, 0.3038787841796875, 0.32685089111328125, 0.349822998046875, 0.37279510498046875, 0.3957672119140625, 0.41873931884765625, 0.44171142578125, 0.46468353271484375, 0.4876556396484375, 0.5106277465820312, 0.533599853515625, 0.5565719604492188, 0.5795440673828125, 0.6025161743164062, 0.62548828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 9.0, 17.0, 12.0, 23.0, 29.0, 31.0, 43.0, 40.0, 54.0, 51.0, 60.0, 67.0, 68.0, 62.0, 63.0, 53.0, 59.0, 52.0, 33.0, 33.0, 31.0, 20.0, 26.0, 15.0, 13.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.224609375, -1.1919937133789062, -1.1593780517578125, -1.1267623901367188, -1.094146728515625, -1.0615310668945312, -1.0289154052734375, -0.9962997436523438, -0.96368408203125, -0.9310684204101562, -0.8984527587890625, -0.8658370971679688, -0.833221435546875, -0.8006057739257812, -0.7679901123046875, -0.7353744506835938, -0.7027587890625, -0.6701431274414062, -0.6375274658203125, -0.6049118041992188, -0.572296142578125, -0.5396804809570312, -0.5070648193359375, -0.47444915771484375, -0.44183349609375, -0.40921783447265625, -0.3766021728515625, -0.34398651123046875, -0.311370849609375, -0.27875518798828125, -0.2461395263671875, -0.21352386474609375, -0.180908203125, -0.14829254150390625, -0.1156768798828125, -0.08306121826171875, -0.050445556640625, -0.01782989501953125, 0.0147857666015625, 0.04740142822265625, 0.08001708984375, 0.11263275146484375, 0.1452484130859375, 0.17786407470703125, 0.210479736328125, 0.24309539794921875, 0.2757110595703125, 0.30832672119140625, 0.3409423828125, 0.37355804443359375, 0.4061737060546875, 0.43878936767578125, 0.471405029296875, 0.5040206909179688, 0.5366363525390625, 0.5692520141601562, 0.60186767578125, 0.6344833374023438, 0.6670989990234375, 0.6997146606445312, 0.732330322265625, 0.7649459838867188, 0.7975616455078125, 0.8301773071289062, 0.86279296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 8.0, 2.0, 8.0, 6.0, 7.0, 7.0, 29.0, 17.0, 39.0, 57.0, 92.0, 165.0, 247.0, 427.0, 708.0, 1307.0, 2413.0, 4724.0, 9615.0, 19942.0, 44618.0, 114098.0, 342489.0, 321636.0, 105531.0, 42368.0, 19090.0, 9163.0, 4408.0, 2359.0, 1236.0, 713.0, 365.0, 243.0, 133.0, 85.0, 56.0, 34.0, 26.0, 21.0, 17.0, 14.0, 6.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.20068359375, -0.1945953369140625, -0.188507080078125, -0.1824188232421875, -0.17633056640625, -0.1702423095703125, -0.164154052734375, -0.1580657958984375, -0.1519775390625, -0.1458892822265625, -0.139801025390625, -0.1337127685546875, -0.12762451171875, -0.1215362548828125, -0.115447998046875, -0.1093597412109375, -0.103271484375, -0.0971832275390625, -0.091094970703125, -0.0850067138671875, -0.07891845703125, -0.0728302001953125, -0.066741943359375, -0.0606536865234375, -0.0545654296875, -0.0484771728515625, -0.042388916015625, -0.0363006591796875, -0.03021240234375, -0.0241241455078125, -0.018035888671875, -0.0119476318359375, -0.005859375, 0.0002288818359375, 0.006317138671875, 0.0124053955078125, 0.01849365234375, 0.0245819091796875, 0.030670166015625, 0.0367584228515625, 0.0428466796875, 0.0489349365234375, 0.055023193359375, 0.0611114501953125, 0.06719970703125, 0.0732879638671875, 0.079376220703125, 0.0854644775390625, 0.091552734375, 0.0976409912109375, 0.103729248046875, 0.1098175048828125, 0.11590576171875, 0.1219940185546875, 0.128082275390625, 0.1341705322265625, 0.1402587890625, 0.1463470458984375, 0.152435302734375, 0.1585235595703125, 0.16461181640625, 0.1707000732421875, 0.176788330078125, 0.1828765869140625, 0.18896484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 9.0, 2.0, 16.0, 10.0, 22.0, 26.0, 38.0, 80.0, 139.0, 186.0, 178.0, 104.0, 54.0, 27.0, 13.0, 19.0, 16.0, 9.0, 11.0, 10.0, 0.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00010943412780761719, -0.00010660570114850998, -0.00010377727448940277, -0.00010094884783029556, -9.812042117118835e-05, -9.529199451208115e-05, -9.246356785297394e-05, -8.963514119386673e-05, -8.680671453475952e-05, -8.397828787565231e-05, -8.11498612165451e-05, -7.83214345574379e-05, -7.549300789833069e-05, -7.266458123922348e-05, -6.983615458011627e-05, -6.700772792100906e-05, -6.417930126190186e-05, -6.135087460279465e-05, -5.852244794368744e-05, -5.569402128458023e-05, -5.286559462547302e-05, -5.0037167966365814e-05, -4.7208741307258606e-05, -4.43803146481514e-05, -4.155188798904419e-05, -3.872346132993698e-05, -3.589503467082977e-05, -3.3066608011722565e-05, -3.0238181352615356e-05, -2.7409754693508148e-05, -2.458132803440094e-05, -2.175290137529373e-05, -1.8924474716186523e-05, -1.6096048057079315e-05, -1.3267621397972107e-05, -1.0439194738864899e-05, -7.6107680797576904e-06, -4.782341420650482e-06, -1.953914761543274e-06, 8.745118975639343e-07, 3.7029385566711426e-06, 6.531365215778351e-06, 9.359791874885559e-06, 1.2188218533992767e-05, 1.5016645193099976e-05, 1.7845071852207184e-05, 2.0673498511314392e-05, 2.35019251704216e-05, 2.633035182952881e-05, 2.9158778488636017e-05, 3.1987205147743225e-05, 3.481563180685043e-05, 3.764405846595764e-05, 4.047248512506485e-05, 4.330091178417206e-05, 4.6129338443279266e-05, 4.8957765102386475e-05, 5.178619176149368e-05, 5.461461842060089e-05, 5.74430450797081e-05, 6.027147173881531e-05, 6.309989839792252e-05, 6.592832505702972e-05, 6.875675171613693e-05, 7.158517837524414e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 6.0, 9.0, 13.0, 16.0, 21.0, 24.0, 33.0, 50.0, 65.0, 92.0, 142.0, 198.0, 320.0, 465.0, 893.0, 1681.0, 3525.0, 7903.0, 18641.0, 45373.0, 116221.0, 321300.0, 329039.0, 120657.0, 46512.0, 19540.0, 8040.0, 3732.0, 1700.0, 883.0, 490.0, 292.0, 206.0, 138.0, 84.0, 62.0, 62.0, 41.0, 28.0, 23.0, 13.0, 11.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20263671875, -0.19684982299804688, -0.19106292724609375, -0.18527603149414062, -0.1794891357421875, -0.17370223999023438, -0.16791534423828125, -0.16212844848632812, -0.156341552734375, -0.15055465698242188, -0.14476776123046875, -0.13898086547851562, -0.1331939697265625, -0.12740707397460938, -0.12162017822265625, -0.11583328247070312, -0.11004638671875, -0.10425949096679688, -0.09847259521484375, -0.09268569946289062, -0.0868988037109375, -0.08111190795898438, -0.07532501220703125, -0.06953811645507812, -0.063751220703125, -0.057964324951171875, -0.05217742919921875, -0.046390533447265625, -0.0406036376953125, -0.034816741943359375, -0.02902984619140625, -0.023242950439453125, -0.0174560546875, -0.011669158935546875, -0.00588226318359375, -9.5367431640625e-05, 0.0056915283203125, 0.011478424072265625, 0.01726531982421875, 0.023052215576171875, 0.028839111328125, 0.034626007080078125, 0.04041290283203125, 0.046199798583984375, 0.0519866943359375, 0.057773590087890625, 0.06356048583984375, 0.06934738159179688, 0.07513427734375, 0.08092117309570312, 0.08670806884765625, 0.09249496459960938, 0.0982818603515625, 0.10406875610351562, 0.10985565185546875, 0.11564254760742188, 0.121429443359375, 0.12721633911132812, 0.13300323486328125, 0.13879013061523438, 0.1445770263671875, 0.15036392211914062, 0.15615081787109375, 0.16193771362304688, 0.167724609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 10.0, 7.0, 12.0, 14.0, 22.0, 25.0, 25.0, 28.0, 38.0, 41.0, 55.0, 62.0, 75.0, 78.0, 86.0, 73.0, 53.0, 49.0, 34.0, 34.0, 32.0, 14.0, 20.0, 15.0, 13.0, 11.0, 15.0, 7.0, 8.0, 5.0, 5.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.1500244140625, -0.14404296875, -0.1380615234375, -0.132080078125, -0.1260986328125, -0.1201171875, -0.1141357421875, -0.108154296875, -0.1021728515625, -0.09619140625, -0.0902099609375, -0.084228515625, -0.0782470703125, -0.072265625, -0.0662841796875, -0.060302734375, -0.0543212890625, -0.04833984375, -0.0423583984375, -0.036376953125, -0.0303955078125, -0.0244140625, -0.0184326171875, -0.012451171875, -0.0064697265625, -0.00048828125, 0.0054931640625, 0.011474609375, 0.0174560546875, 0.0234375, 0.0294189453125, 0.035400390625, 0.0413818359375, 0.04736328125, 0.0533447265625, 0.059326171875, 0.0653076171875, 0.0712890625, 0.0772705078125, 0.083251953125, 0.0892333984375, 0.09521484375, 0.1011962890625, 0.107177734375, 0.1131591796875, 0.119140625, 0.1251220703125, 0.131103515625, 0.1370849609375, 0.14306640625, 0.1490478515625, 0.155029296875, 0.1610107421875, 0.1669921875, 0.1729736328125, 0.178955078125, 0.1849365234375, 0.19091796875, 0.1968994140625, 0.202880859375, 0.2088623046875, 0.21484375, 0.2208251953125, 0.226806640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 14.0, 19.0, 62.0, 146.0, 217.0, 230.0, 159.0, 91.0, 34.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.352656841278076, -6.17669153213501, -6.000726222991943, -5.824760913848877, -5.6487956047058105, -5.472830295562744, -5.2968645095825195, -5.120899200439453, -4.944933891296387, -4.76896858215332, -4.593003273010254, -4.4170379638671875, -4.241072654724121, -4.065107345581055, -3.889141798019409, -3.7131764888763428, -3.5372114181518555, -3.361246109008789, -3.1852807998657227, -3.0093154907226562, -2.83335018157959, -2.6573848724365234, -2.481419324874878, -2.3054540157318115, -2.129488706588745, -1.9535233974456787, -1.7775580883026123, -1.6015926599502563, -1.42562735080719, -1.2496620416641235, -1.0736966133117676, -0.8977313041687012, -0.7217655181884766, -0.5458002090454102, -0.369834840297699, -0.1938694715499878, -0.017904162406921387, 0.15806114673614502, 0.334026575088501, 0.5099918842315674, 0.6859571933746338, 0.8619225025177002, 1.0378878116607666, 1.2138532400131226, 1.389818549156189, 1.5657838582992554, 1.7417492866516113, 1.9177145957946777, 2.093679904937744, 2.2696452140808105, 2.445610523223877, 2.6215758323669434, 2.7975411415100098, 2.973506450653076, 3.1494719982147217, 3.325437307357788, 3.5014026165008545, 3.677367925643921, 3.8533332347869873, 4.029298782348633, 4.205264091491699, 4.381229400634766, 4.557194709777832, 4.733160018920898, 4.909125328063965]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 4.0, 5.0, 5.0, 13.0, 10.0, 10.0, 13.0, 17.0, 9.0, 25.0, 19.0, 22.0, 34.0, 14.0, 37.0, 25.0, 25.0, 42.0, 39.0, 49.0, 35.0, 31.0, 32.0, 51.0, 34.0, 42.0, 37.0, 36.0, 40.0, 25.0, 29.0, 19.0, 27.0, 19.0, 27.0, 20.0, 16.0, 16.0, 12.0, 11.0, 9.0, 1.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7826440334320068, -1.7286403179168701, -1.674636721611023, -1.6206330060958862, -1.5666292905807495, -1.5126256942749023, -1.4586219787597656, -1.404618263244629, -1.3506145477294922, -1.2966108322143555, -1.2426072359085083, -1.1886035203933716, -1.1345998048782349, -1.0805962085723877, -1.026592493057251, -0.9725887775421143, -0.9185851812362671, -0.8645815253257751, -0.8105778098106384, -0.7565741539001465, -0.7025704383850098, -0.6485667824745178, -0.5945631265640259, -0.5405594110488892, -0.4865557551383972, -0.4325520694255829, -0.37854838371276855, -0.3245447278022766, -0.2705410420894623, -0.21653735637664795, -0.162533700466156, -0.10853001475334167, -0.054526329040527344, -0.0005226507782936096, 0.053481027483940125, 0.10748469829559326, 0.1614883840084076, 0.21549206972122192, 0.26949572563171387, 0.3234994113445282, 0.37750309705734253, 0.43150678277015686, 0.4855104684829712, 0.5395141243934631, 0.5935177803039551, 0.6475214958190918, 0.7015251517295837, 0.7555288076400757, 0.8095325231552124, 0.8635361790657043, 0.9175398945808411, 0.971543550491333, 1.0255472660064697, 1.0795509815216064, 1.1335545778274536, 1.1875582933425903, 1.2415618896484375, 1.2955656051635742, 1.3495692014694214, 1.403572916984558, 1.4575766324996948, 1.511580228805542, 1.5655839443206787, 1.6195876598358154, 1.6735913753509521]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 6.0, 8.0, 13.0, 20.0, 27.0, 29.0, 52.0, 88.0, 138.0, 202.0, 311.0, 493.0, 850.0, 1440.0, 2452.0, 4335.0, 8095.0, 15054.0, 29420.0, 59536.0, 131706.0, 329281.0, 942850.0, 1533463.0, 684014.0, 246965.0, 103852.0, 48384.0, 23998.0, 12197.0, 6481.0, 3484.0, 2015.0, 1200.0, 724.0, 377.0, 259.0, 161.0, 114.0, 65.0, 45.0, 31.0, 25.0, 8.0, 5.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2435302734375, -0.2355060577392578, -0.22748184204101562, -0.21945762634277344, -0.21143341064453125, -0.20340919494628906, -0.19538497924804688, -0.1873607635498047, -0.1793365478515625, -0.1713123321533203, -0.16328811645507812, -0.15526390075683594, -0.14723968505859375, -0.13921546936035156, -0.13119125366210938, -0.12316703796386719, -0.115142822265625, -0.10711860656738281, -0.09909439086914062, -0.09107017517089844, -0.08304595947265625, -0.07502174377441406, -0.06699752807617188, -0.05897331237792969, -0.0509490966796875, -0.04292488098144531, -0.034900665283203125, -0.026876449584960938, -0.01885223388671875, -0.010828018188476562, -0.002803802490234375, 0.0052204132080078125, 0.01324462890625, 0.021268844604492188, 0.029293060302734375, 0.03731727600097656, 0.04534149169921875, 0.05336570739746094, 0.061389923095703125, 0.06941413879394531, 0.0774383544921875, 0.08546257019042969, 0.09348678588867188, 0.10151100158691406, 0.10953521728515625, 0.11755943298339844, 0.12558364868164062, 0.1336078643798828, 0.141632080078125, 0.1496562957763672, 0.15768051147460938, 0.16570472717285156, 0.17372894287109375, 0.18175315856933594, 0.18977737426757812, 0.1978015899658203, 0.2058258056640625, 0.2138500213623047, 0.22187423706054688, 0.22989845275878906, 0.23792266845703125, 0.24594688415527344, 0.2539710998535156, 0.2619953155517578, 0.27001953125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 1.0, 5.0, 2.0, 6.0, 3.0, 8.0, 6.0, 9.0, 6.0, 12.0, 12.0, 11.0, 17.0, 16.0, 20.0, 27.0, 33.0, 26.0, 37.0, 32.0, 27.0, 28.0, 32.0, 31.0, 43.0, 49.0, 51.0, 47.0, 42.0, 30.0, 45.0, 28.0, 31.0, 25.0, 30.0, 21.0, 23.0, 17.0, 20.0, 16.0, 18.0, 12.0, 10.0, 6.0, 6.0, 5.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.17143630981445312, -0.16526031494140625, -0.15908432006835938, -0.1529083251953125, -0.14673233032226562, -0.14055633544921875, -0.13438034057617188, -0.128204345703125, -0.12202835083007812, -0.11585235595703125, -0.10967636108398438, -0.1035003662109375, -0.09732437133789062, -0.09114837646484375, -0.08497238159179688, -0.07879638671875, -0.07262039184570312, -0.06644439697265625, -0.060268402099609375, -0.0540924072265625, -0.047916412353515625, -0.04174041748046875, -0.035564422607421875, -0.029388427734375, -0.023212432861328125, -0.01703643798828125, -0.010860443115234375, -0.0046844482421875, 0.001491546630859375, 0.00766754150390625, 0.013843536376953125, 0.02001953125, 0.026195526123046875, 0.03237152099609375, 0.038547515869140625, 0.0447235107421875, 0.050899505615234375, 0.05707550048828125, 0.06325149536132812, 0.069427490234375, 0.07560348510742188, 0.08177947998046875, 0.08795547485351562, 0.0941314697265625, 0.10030746459960938, 0.10648345947265625, 0.11265945434570312, 0.11883544921875, 0.12501144409179688, 0.13118743896484375, 0.13736343383789062, 0.1435394287109375, 0.14971542358398438, 0.15589141845703125, 0.16206741333007812, 0.168243408203125, 0.17441940307617188, 0.18059539794921875, 0.18677139282226562, 0.1929473876953125, 0.19912338256835938, 0.20529937744140625, 0.21147537231445312, 0.2176513671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 8.0, 14.0, 31.0, 30.0, 46.0, 87.0, 127.0, 193.0, 250.0, 457.0, 791.0, 1408.0, 2954.0, 6689.0, 16404.0, 46557.0, 141669.0, 493585.0, 2103897.0, 1012044.0, 245004.0, 76432.0, 26308.0, 10120.0, 4304.0, 2005.0, 1121.0, 625.0, 352.0, 254.0, 169.0, 107.0, 56.0, 38.0, 32.0, 21.0, 15.0, 21.0, 12.0, 8.0, 6.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.43994140625, -0.42462921142578125, -0.4093170166015625, -0.39400482177734375, -0.378692626953125, -0.36338043212890625, -0.3480682373046875, -0.33275604248046875, -0.31744384765625, -0.30213165283203125, -0.2868194580078125, -0.27150726318359375, -0.256195068359375, -0.24088287353515625, -0.2255706787109375, -0.21025848388671875, -0.1949462890625, -0.17963409423828125, -0.1643218994140625, -0.14900970458984375, -0.133697509765625, -0.11838531494140625, -0.1030731201171875, -0.08776092529296875, -0.07244873046875, -0.05713653564453125, -0.0418243408203125, -0.02651214599609375, -0.011199951171875, 0.00411224365234375, 0.0194244384765625, 0.03473663330078125, 0.050048828125, 0.06536102294921875, 0.0806732177734375, 0.09598541259765625, 0.111297607421875, 0.12660980224609375, 0.1419219970703125, 0.15723419189453125, 0.17254638671875, 0.18785858154296875, 0.2031707763671875, 0.21848297119140625, 0.233795166015625, 0.24910736083984375, 0.2644195556640625, 0.27973175048828125, 0.2950439453125, 0.31035614013671875, 0.3256683349609375, 0.34098052978515625, 0.356292724609375, 0.37160491943359375, 0.3869171142578125, 0.40222930908203125, 0.41754150390625, 0.43285369873046875, 0.4481658935546875, 0.46347808837890625, 0.478790283203125, 0.49410247802734375, 0.5094146728515625, 0.5247268676757812, 0.5400390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 13.0, 19.0, 28.0, 46.0, 66.0, 90.0, 122.0, 156.0, 237.0, 348.0, 527.0, 693.0, 588.0, 341.0, 225.0, 147.0, 102.0, 81.0, 60.0, 54.0, 35.0, 23.0, 18.0, 9.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5140228271484375, -0.493865966796875, -0.4737091064453125, -0.45355224609375, -0.4333953857421875, -0.413238525390625, -0.3930816650390625, -0.3729248046875, -0.3527679443359375, -0.332611083984375, -0.3124542236328125, -0.29229736328125, -0.2721405029296875, -0.251983642578125, -0.2318267822265625, -0.211669921875, -0.1915130615234375, -0.171356201171875, -0.1511993408203125, -0.13104248046875, -0.1108856201171875, -0.090728759765625, -0.0705718994140625, -0.0504150390625, -0.0302581787109375, -0.010101318359375, 0.0100555419921875, 0.03021240234375, 0.0503692626953125, 0.070526123046875, 0.0906829833984375, 0.11083984375, 0.1309967041015625, 0.151153564453125, 0.1713104248046875, 0.19146728515625, 0.2116241455078125, 0.231781005859375, 0.2519378662109375, 0.2720947265625, 0.2922515869140625, 0.312408447265625, 0.3325653076171875, 0.35272216796875, 0.3728790283203125, 0.393035888671875, 0.4131927490234375, 0.433349609375, 0.4535064697265625, 0.473663330078125, 0.4938201904296875, 0.51397705078125, 0.5341339111328125, 0.554290771484375, 0.5744476318359375, 0.5946044921875, 0.6147613525390625, 0.634918212890625, 0.6550750732421875, 0.67523193359375, 0.6953887939453125, 0.715545654296875, 0.7357025146484375, 0.755859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 13.0, 23.0, 63.0, 74.0, 121.0, 129.0, 145.0, 138.0, 104.0, 83.0, 39.0, 25.0, 15.0, 5.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9223976135253906, -3.7934978008270264, -3.664597988128662, -3.535698413848877, -3.4067986011505127, -3.2778987884521484, -3.1489992141723633, -3.020099401473999, -2.8911995887756348, -2.7622997760772705, -2.6333999633789062, -2.504500389099121, -2.375600576400757, -2.2467007637023926, -2.1178011894226074, -1.9889013767242432, -1.860001564025879, -1.7311017513275146, -1.60220205783844, -1.4733023643493652, -1.344402551651001, -1.2155027389526367, -1.086603045463562, -0.9577032923698425, -0.828803539276123, -0.6999037861824036, -0.5710040330886841, -0.4421042799949646, -0.3132045269012451, -0.18430477380752563, -0.05540502071380615, 0.07349473237991333, 0.2023940086364746, 0.3312937617301941, 0.4601935148239136, 0.5890932679176331, 0.7179930210113525, 0.846892774105072, 0.9757925271987915, 1.1046922206878662, 1.2335920333862305, 1.3624918460845947, 1.4913915395736694, 1.6202912330627441, 1.7491910457611084, 1.8780908584594727, 2.006990432739258, 2.135890245437622, 2.2647900581359863, 2.3936898708343506, 2.522589683532715, 2.6514892578125, 2.7803890705108643, 2.9092888832092285, 3.0381884574890137, 3.167088270187378, 3.295988082885742, 3.4248878955841064, 3.5537877082824707, 3.682687282562256, 3.81158709526062, 3.9404869079589844, 4.0693864822387695, 4.198286533355713, 4.327186107635498]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 9.0, 8.0, 14.0, 12.0, 14.0, 13.0, 19.0, 19.0, 20.0, 35.0, 38.0, 23.0, 32.0, 35.0, 45.0, 40.0, 45.0, 47.0, 46.0, 39.0, 46.0, 51.0, 32.0, 39.0, 30.0, 29.0, 29.0, 25.0, 35.0, 19.0, 17.0, 17.0, 11.0, 13.0, 8.0, 9.0, 13.0, 8.0, 1.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.1739280223846436, -2.1132686138153076, -2.0526092052459717, -1.9919497966766357, -1.9312903881072998, -1.8706309795379639, -1.809971570968628, -1.7493120431900024, -1.6886526346206665, -1.6279932260513306, -1.5673338174819946, -1.5066744089126587, -1.4460150003433228, -1.3853554725646973, -1.3246960639953613, -1.2640366554260254, -1.2033772468566895, -1.1427178382873535, -1.0820584297180176, -1.0213990211486816, -0.9607395529747009, -0.900080144405365, -0.839420735836029, -0.7787612676620483, -0.718101978302002, -0.657442569732666, -0.5967831611633301, -0.5361237525939941, -0.4754642844200134, -0.4148048758506775, -0.35414546728134155, -0.2934860289096832, -0.2328265905380249, -0.17216716706752777, -0.11150775104761124, -0.0508483350276947, 0.00981108844280243, 0.07047051191329956, 0.1311299204826355, 0.19178935885429382, 0.25244876742362976, 0.3131081759929657, 0.373767614364624, 0.43442702293395996, 0.4950864315032959, 0.5557458400726318, 0.6164052486419678, 0.6770647168159485, 0.7377241253852844, 0.7983835339546204, 0.8590429425239563, 0.919702410697937, 0.980361819267273, 1.0410212278366089, 1.1016806364059448, 1.1623400449752808, 1.2229994535446167, 1.2836588621139526, 1.3443182706832886, 1.4049776792526245, 1.4656370878219604, 1.526296615600586, 1.5869560241699219, 1.6476154327392578, 1.7082748413085938]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 8.0, 3.0, 7.0, 14.0, 12.0, 13.0, 18.0, 40.0, 57.0, 72.0, 107.0, 172.0, 254.0, 384.0, 501.0, 826.0, 1262.0, 1891.0, 2827.0, 4252.0, 6505.0, 10039.0, 15177.0, 23480.0, 37822.0, 65282.0, 119097.0, 198675.0, 216936.0, 142443.0, 77853.0, 44726.0, 27253.0, 17297.0, 11388.0, 7449.0, 4933.0, 3221.0, 2087.0, 1447.0, 912.0, 626.0, 392.0, 267.0, 187.0, 108.0, 90.0, 50.0, 38.0, 26.0, 13.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.287841796875, -0.27860260009765625, -0.2693634033203125, -0.26012420654296875, -0.250885009765625, -0.24164581298828125, -0.2324066162109375, -0.22316741943359375, -0.21392822265625, -0.20468902587890625, -0.1954498291015625, -0.18621063232421875, -0.176971435546875, -0.16773223876953125, -0.1584930419921875, -0.14925384521484375, -0.1400146484375, -0.13077545166015625, -0.1215362548828125, -0.11229705810546875, -0.103057861328125, -0.09381866455078125, -0.0845794677734375, -0.07534027099609375, -0.06610107421875, -0.05686187744140625, -0.0476226806640625, -0.03838348388671875, -0.029144287109375, -0.01990509033203125, -0.0106658935546875, -0.00142669677734375, 0.0078125, 0.01705169677734375, 0.0262908935546875, 0.03553009033203125, 0.044769287109375, 0.05400848388671875, 0.0632476806640625, 0.07248687744140625, 0.08172607421875, 0.09096527099609375, 0.1002044677734375, 0.10944366455078125, 0.118682861328125, 0.12792205810546875, 0.1371612548828125, 0.14640045166015625, 0.1556396484375, 0.16487884521484375, 0.1741180419921875, 0.18335723876953125, 0.192596435546875, 0.20183563232421875, 0.2110748291015625, 0.22031402587890625, 0.22955322265625, 0.23879241943359375, 0.2480316162109375, 0.25727081298828125, 0.266510009765625, 0.27574920654296875, 0.2849884033203125, 0.29422760009765625, 0.303466796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 10.0, 15.0, 18.0, 17.0, 20.0, 20.0, 32.0, 25.0, 38.0, 47.0, 34.0, 34.0, 43.0, 45.0, 42.0, 46.0, 43.0, 40.0, 43.0, 44.0, 45.0, 25.0, 31.0, 22.0, 30.0, 27.0, 13.0, 19.0, 23.0, 18.0, 17.0, 18.0, 4.0, 7.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2196044921875, -0.21258544921875, -0.20556640625, -0.19854736328125, -0.1915283203125, -0.18450927734375, -0.177490234375, -0.17047119140625, -0.1634521484375, -0.15643310546875, -0.1494140625, -0.14239501953125, -0.1353759765625, -0.12835693359375, -0.121337890625, -0.11431884765625, -0.1072998046875, -0.10028076171875, -0.09326171875, -0.08624267578125, -0.0792236328125, -0.07220458984375, -0.065185546875, -0.05816650390625, -0.0511474609375, -0.04412841796875, -0.037109375, -0.03009033203125, -0.0230712890625, -0.01605224609375, -0.009033203125, -0.00201416015625, 0.0050048828125, 0.01202392578125, 0.01904296875, 0.02606201171875, 0.0330810546875, 0.04010009765625, 0.047119140625, 0.05413818359375, 0.0611572265625, 0.06817626953125, 0.0751953125, 0.08221435546875, 0.0892333984375, 0.09625244140625, 0.103271484375, 0.11029052734375, 0.1173095703125, 0.12432861328125, 0.13134765625, 0.13836669921875, 0.1453857421875, 0.15240478515625, 0.159423828125, 0.16644287109375, 0.1734619140625, 0.18048095703125, 0.1875, 0.19451904296875, 0.2015380859375, 0.20855712890625, 0.215576171875, 0.22259521484375, 0.2296142578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 16.0, 19.0, 28.0, 40.0, 77.0, 122.0, 250.0, 488.0, 1004.0, 2812.0, 9748.0, 39841.0, 212664.0, 603277.0, 138179.0, 28794.0, 7348.0, 2165.0, 809.0, 359.0, 213.0, 96.0, 73.0, 42.0, 24.0, 21.0, 11.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7314834594726562, -0.6988067626953125, -0.6661300659179688, -0.633453369140625, -0.6007766723632812, -0.5680999755859375, -0.5354232788085938, -0.50274658203125, -0.47006988525390625, -0.4373931884765625, -0.40471649169921875, -0.372039794921875, -0.33936309814453125, -0.3066864013671875, -0.27400970458984375, -0.2413330078125, -0.20865631103515625, -0.1759796142578125, -0.14330291748046875, -0.110626220703125, -0.07794952392578125, -0.0452728271484375, -0.01259613037109375, 0.02008056640625, 0.05275726318359375, 0.0854339599609375, 0.11811065673828125, 0.150787353515625, 0.18346405029296875, 0.2161407470703125, 0.24881744384765625, 0.281494140625, 0.31417083740234375, 0.3468475341796875, 0.37952423095703125, 0.412200927734375, 0.44487762451171875, 0.4775543212890625, 0.5102310180664062, 0.54290771484375, 0.5755844116210938, 0.6082611083984375, 0.6409378051757812, 0.673614501953125, 0.7062911987304688, 0.7389678955078125, 0.7716445922851562, 0.8043212890625, 0.8369979858398438, 0.8696746826171875, 0.9023513793945312, 0.935028076171875, 0.9677047729492188, 1.0003814697265625, 1.0330581665039062, 1.06573486328125, 1.0984115600585938, 1.1310882568359375, 1.1637649536132812, 1.196441650390625, 1.2291183471679688, 1.2617950439453125, 1.2944717407226562, 1.3271484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 1.0, 2.0, 8.0, 4.0, 8.0, 10.0, 7.0, 15.0, 18.0, 22.0, 26.0, 35.0, 26.0, 33.0, 43.0, 29.0, 45.0, 42.0, 59.0, 53.0, 39.0, 47.0, 58.0, 47.0, 34.0, 43.0, 29.0, 19.0, 29.0, 39.0, 15.0, 20.0, 18.0, 10.0, 17.0, 11.0, 11.0, 5.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6632537841796875, -0.640472412109375, -0.6176910400390625, -0.59490966796875, -0.5721282958984375, -0.549346923828125, -0.5265655517578125, -0.5037841796875, -0.4810028076171875, -0.458221435546875, -0.4354400634765625, -0.41265869140625, -0.3898773193359375, -0.367095947265625, -0.3443145751953125, -0.321533203125, -0.2987518310546875, -0.275970458984375, -0.2531890869140625, -0.23040771484375, -0.2076263427734375, -0.184844970703125, -0.1620635986328125, -0.1392822265625, -0.1165008544921875, -0.093719482421875, -0.0709381103515625, -0.04815673828125, -0.0253753662109375, -0.002593994140625, 0.0201873779296875, 0.04296875, 0.0657501220703125, 0.088531494140625, 0.1113128662109375, 0.13409423828125, 0.1568756103515625, 0.179656982421875, 0.2024383544921875, 0.2252197265625, 0.2480010986328125, 0.270782470703125, 0.2935638427734375, 0.31634521484375, 0.3391265869140625, 0.361907958984375, 0.3846893310546875, 0.407470703125, 0.4302520751953125, 0.453033447265625, 0.4758148193359375, 0.49859619140625, 0.5213775634765625, 0.544158935546875, 0.5669403076171875, 0.5897216796875, 0.6125030517578125, 0.635284423828125, 0.6580657958984375, 0.68084716796875, 0.7036285400390625, 0.726409912109375, 0.7491912841796875, 0.77197265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 14.0, 27.0, 36.0, 75.0, 151.0, 279.0, 553.0, 1208.0, 3169.0, 8109.0, 22953.0, 79410.0, 340087.0, 436739.0, 109034.0, 29835.0, 10205.0, 3822.0, 1438.0, 679.0, 327.0, 157.0, 92.0, 50.0, 39.0, 23.0, 12.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2936267852783203, -0.2854957580566406, -0.27736473083496094, -0.26923370361328125, -0.26110267639160156, -0.2529716491699219, -0.2448406219482422, -0.2367095947265625, -0.2285785675048828, -0.22044754028320312, -0.21231651306152344, -0.20418548583984375, -0.19605445861816406, -0.18792343139648438, -0.1797924041748047, -0.171661376953125, -0.1635303497314453, -0.15539932250976562, -0.14726829528808594, -0.13913726806640625, -0.13100624084472656, -0.12287521362304688, -0.11474418640136719, -0.1066131591796875, -0.09848213195800781, -0.09035110473632812, -0.08222007751464844, -0.07408905029296875, -0.06595802307128906, -0.057826995849609375, -0.04969596862792969, -0.04156494140625, -0.03343391418457031, -0.025302886962890625, -0.017171859741210938, -0.00904083251953125, -0.0009098052978515625, 0.007221221923828125, 0.015352249145507812, 0.0234832763671875, 0.03161430358886719, 0.039745330810546875, 0.04787635803222656, 0.05600738525390625, 0.06413841247558594, 0.07226943969726562, 0.08040046691894531, 0.088531494140625, 0.09666252136230469, 0.10479354858398438, 0.11292457580566406, 0.12105560302734375, 0.12918663024902344, 0.13731765747070312, 0.1454486846923828, 0.1535797119140625, 0.1617107391357422, 0.16984176635742188, 0.17797279357910156, 0.18610382080078125, 0.19423484802246094, 0.20236587524414062, 0.2104969024658203, 0.2186279296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 4.0, 14.0, 11.0, 18.0, 32.0, 34.0, 70.0, 99.0, 134.0, 170.0, 124.0, 85.0, 53.0, 34.0, 22.0, 15.0, 17.0, 9.0, 4.0, 5.0, 7.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.07046890258789e-05, -7.820315659046173e-05, -7.570162415504456e-05, -7.320009171962738e-05, -7.06985592842102e-05, -6.819702684879303e-05, -6.569549441337585e-05, -6.319396197795868e-05, -6.0692429542541504e-05, -5.819089710712433e-05, -5.568936467170715e-05, -5.318783223628998e-05, -5.06862998008728e-05, -4.818476736545563e-05, -4.568323493003845e-05, -4.318170249462128e-05, -4.06801700592041e-05, -3.8178637623786926e-05, -3.567710518836975e-05, -3.3175572752952576e-05, -3.06740403175354e-05, -2.8172507882118225e-05, -2.567097544670105e-05, -2.3169443011283875e-05, -2.06679105758667e-05, -1.8166378140449524e-05, -1.566484570503235e-05, -1.3163313269615173e-05, -1.0661780834197998e-05, -8.160248398780823e-06, -5.6587159633636475e-06, -3.157183527946472e-06, -6.556510925292969e-07, 1.8458813428878784e-06, 4.347413778305054e-06, 6.848946213722229e-06, 9.350478649139404e-06, 1.185201108455658e-05, 1.4353543519973755e-05, 1.685507595539093e-05, 1.9356608390808105e-05, 2.185814082622528e-05, 2.4359673261642456e-05, 2.686120569705963e-05, 2.9362738132476807e-05, 3.186427056789398e-05, 3.436580300331116e-05, 3.686733543872833e-05, 3.936886787414551e-05, 4.187040030956268e-05, 4.437193274497986e-05, 4.6873465180397034e-05, 4.937499761581421e-05, 5.1876530051231384e-05, 5.437806248664856e-05, 5.6879594922065735e-05, 5.938112735748291e-05, 6.188265979290009e-05, 6.438419222831726e-05, 6.688572466373444e-05, 6.938725709915161e-05, 7.188878953456879e-05, 7.439032196998596e-05, 7.689185440540314e-05, 7.939338684082031e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 7.0, 6.0, 7.0, 5.0, 12.0, 21.0, 28.0, 35.0, 63.0, 76.0, 150.0, 182.0, 299.0, 511.0, 806.0, 1686.0, 3543.0, 8016.0, 19666.0, 53594.0, 146844.0, 343560.0, 289629.0, 111796.0, 40333.0, 15307.0, 6198.0, 2857.0, 1378.0, 728.0, 438.0, 253.0, 160.0, 105.0, 62.0, 59.0, 38.0, 29.0, 18.0, 12.0, 14.0, 5.0, 6.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.170654296875, -0.1652984619140625, -0.159942626953125, -0.1545867919921875, -0.14923095703125, -0.1438751220703125, -0.138519287109375, -0.1331634521484375, -0.1278076171875, -0.1224517822265625, -0.117095947265625, -0.1117401123046875, -0.10638427734375, -0.1010284423828125, -0.095672607421875, -0.0903167724609375, -0.0849609375, -0.0796051025390625, -0.074249267578125, -0.0688934326171875, -0.06353759765625, -0.0581817626953125, -0.052825927734375, -0.0474700927734375, -0.0421142578125, -0.0367584228515625, -0.031402587890625, -0.0260467529296875, -0.02069091796875, -0.0153350830078125, -0.009979248046875, -0.0046234130859375, 0.000732421875, 0.0060882568359375, 0.011444091796875, 0.0167999267578125, 0.02215576171875, 0.0275115966796875, 0.032867431640625, 0.0382232666015625, 0.0435791015625, 0.0489349365234375, 0.054290771484375, 0.0596466064453125, 0.06500244140625, 0.0703582763671875, 0.075714111328125, 0.0810699462890625, 0.08642578125, 0.0917816162109375, 0.097137451171875, 0.1024932861328125, 0.10784912109375, 0.1132049560546875, 0.118560791015625, 0.1239166259765625, 0.1292724609375, 0.1346282958984375, 0.139984130859375, 0.1453399658203125, 0.15069580078125, 0.1560516357421875, 0.161407470703125, 0.1667633056640625, 0.172119140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 13.0, 15.0, 19.0, 31.0, 38.0, 55.0, 61.0, 85.0, 72.0, 110.0, 94.0, 91.0, 66.0, 36.0, 42.0, 34.0, 35.0, 14.0, 18.0, 12.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21875, -0.21225357055664062, -0.20575714111328125, -0.19926071166992188, -0.1927642822265625, -0.18626785278320312, -0.17977142333984375, -0.17327499389648438, -0.166778564453125, -0.16028213500976562, -0.15378570556640625, -0.14728927612304688, -0.1407928466796875, -0.13429641723632812, -0.12779998779296875, -0.12130355834960938, -0.11480712890625, -0.10831069946289062, -0.10181427001953125, -0.09531784057617188, -0.0888214111328125, -0.08232498168945312, -0.07582855224609375, -0.06933212280273438, -0.062835693359375, -0.056339263916015625, -0.04984283447265625, -0.043346405029296875, -0.0368499755859375, -0.030353546142578125, -0.02385711669921875, -0.017360687255859375, -0.0108642578125, -0.004367828369140625, 0.00212860107421875, 0.008625030517578125, 0.0151214599609375, 0.021617889404296875, 0.02811431884765625, 0.034610748291015625, 0.041107177734375, 0.047603607177734375, 0.05410003662109375, 0.060596466064453125, 0.0670928955078125, 0.07358932495117188, 0.08008575439453125, 0.08658218383789062, 0.09307861328125, 0.09957504272460938, 0.10607147216796875, 0.11256790161132812, 0.1190643310546875, 0.12556076049804688, 0.13205718994140625, 0.13855361938476562, 0.145050048828125, 0.15154647827148438, 0.15804290771484375, 0.16453933715820312, 0.1710357666015625, 0.17753219604492188, 0.18402862548828125, 0.19052505493164062, 0.197021484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 10.0, 25.0, 35.0, 49.0, 71.0, 138.0, 137.0, 156.0, 123.0, 79.0, 69.0, 40.0, 17.0, 12.0, 10.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.483091354370117, -3.380591630935669, -3.2780919075012207, -3.1755921840667725, -3.073092460632324, -2.970592975616455, -2.868093252182007, -2.7655935287475586, -2.6630938053131104, -2.560594081878662, -2.458094358444214, -2.3555946350097656, -2.2530951499938965, -2.150595188140869, -2.048095703125, -1.9455959796905518, -1.8430962562561035, -1.7405965328216553, -1.638096809387207, -1.5355972051620483, -1.4330974817276, -1.3305977582931519, -1.2280981540679932, -1.125598430633545, -1.0230987071990967, -0.9205989837646484, -0.818099319934845, -0.7155996561050415, -0.6130999326705933, -0.510600209236145, -0.40810054540634155, -0.3056008815765381, -0.20310115814208984, -0.10060146450996399, 0.0018982291221618652, 0.10439792275428772, 0.20689761638641357, 0.3093973398208618, 0.4118970036506653, 0.5143966674804688, 0.616896390914917, 0.7193961143493652, 0.8218957781791687, 0.9243954420089722, 1.0268951654434204, 1.1293948888778687, 1.2318944931030273, 1.3343942165374756, 1.4368939399719238, 1.539393663406372, 1.6418933868408203, 1.744392991065979, 1.8468927145004272, 1.9493924379348755, 2.051892042160034, 2.1543917655944824, 2.2568914890289307, 2.359391212463379, 2.461890935897827, 2.5643906593322754, 2.6668901443481445, 2.769390106201172, 2.871889591217041, 2.9743893146514893, 3.0768890380859375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 8.0, 5.0, 6.0, 6.0, 10.0, 10.0, 14.0, 23.0, 17.0, 15.0, 30.0, 14.0, 21.0, 32.0, 41.0, 28.0, 34.0, 46.0, 31.0, 38.0, 42.0, 43.0, 35.0, 34.0, 44.0, 36.0, 33.0, 34.0, 32.0, 32.0, 28.0, 20.0, 34.0, 20.0, 22.0, 19.0, 15.0, 8.0, 7.0, 11.0, 4.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5926952362060547, -1.5439839363098145, -1.4952726364135742, -1.446561336517334, -1.3978500366210938, -1.3491387367248535, -1.3004274368286133, -1.251716136932373, -1.2030048370361328, -1.1542935371398926, -1.1055822372436523, -1.056870937347412, -1.0081596374511719, -0.9594483375549316, -0.9107370972633362, -0.862025797367096, -0.8133145570755005, -0.7646032571792603, -0.71589195728302, -0.6671806573867798, -0.6184693574905396, -0.5697580575942993, -0.5210468173027039, -0.4723355174064636, -0.4236242175102234, -0.37491291761398315, -0.3262016177177429, -0.2774903476238251, -0.22877904772758484, -0.1800677478313446, -0.13135647773742676, -0.08264517784118652, -0.03393387794494629, 0.014777414500713348, 0.06348870694637299, 0.11219999194145203, 0.16091129183769226, 0.2096225917339325, 0.25833386182785034, 0.3070451617240906, 0.3557564616203308, 0.40446776151657104, 0.4531790614128113, 0.5018903017044067, 0.550601601600647, 0.5993129014968872, 0.6480242013931274, 0.6967355012893677, 0.7454468011856079, 0.7941581010818481, 0.8428694009780884, 0.8915807008743286, 0.9402920007705688, 0.9890033006668091, 1.0377144813537598, 1.08642578125, 1.1351370811462402, 1.1838483810424805, 1.2325596809387207, 1.281270980834961, 1.3299822807312012, 1.3786935806274414, 1.4274048805236816, 1.4761161804199219, 1.524827480316162]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 16.0, 16.0, 35.0, 49.0, 55.0, 97.0, 149.0, 262.0, 363.0, 628.0, 1054.0, 1788.0, 3155.0, 5302.0, 9695.0, 17341.0, 33286.0, 64913.0, 138774.0, 329430.0, 812590.0, 1324185.0, 834153.0, 339431.0, 139769.0, 65273.0, 32890.0, 17243.0, 9412.0, 5251.0, 3051.0, 1781.0, 1110.0, 638.0, 401.0, 239.0, 140.0, 99.0, 69.0, 43.0, 31.0, 26.0, 12.0, 8.0, 6.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2005615234375, -0.1939868927001953, -0.18741226196289062, -0.18083763122558594, -0.17426300048828125, -0.16768836975097656, -0.16111373901367188, -0.1545391082763672, -0.1479644775390625, -0.1413898468017578, -0.13481521606445312, -0.12824058532714844, -0.12166595458984375, -0.11509132385253906, -0.10851669311523438, -0.10194206237792969, -0.095367431640625, -0.08879280090332031, -0.08221817016601562, -0.07564353942871094, -0.06906890869140625, -0.06249427795410156, -0.055919647216796875, -0.04934501647949219, -0.0427703857421875, -0.03619575500488281, -0.029621124267578125, -0.023046493530273438, -0.01647186279296875, -0.009897232055664062, -0.003322601318359375, 0.0032520294189453125, 0.00982666015625, 0.016401290893554688, 0.022975921630859375, 0.029550552368164062, 0.03612518310546875, 0.04269981384277344, 0.049274444580078125, 0.05584907531738281, 0.0624237060546875, 0.06899833679199219, 0.07557296752929688, 0.08214759826660156, 0.08872222900390625, 0.09529685974121094, 0.10187149047851562, 0.10844612121582031, 0.115020751953125, 0.12159538269042969, 0.12817001342773438, 0.13474464416503906, 0.14131927490234375, 0.14789390563964844, 0.15446853637695312, 0.1610431671142578, 0.1676177978515625, 0.1741924285888672, 0.18076705932617188, 0.18734169006347656, 0.19391632080078125, 0.20049095153808594, 0.20706558227539062, 0.2136402130126953, 0.22021484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 7.0, 5.0, 7.0, 4.0, 12.0, 12.0, 18.0, 24.0, 28.0, 25.0, 25.0, 37.0, 29.0, 22.0, 34.0, 38.0, 27.0, 40.0, 42.0, 37.0, 44.0, 38.0, 40.0, 34.0, 42.0, 44.0, 37.0, 26.0, 26.0, 30.0, 25.0, 25.0, 28.0, 17.0, 8.0, 15.0, 12.0, 7.0, 6.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.170166015625, -0.16399765014648438, -0.15782928466796875, -0.15166091918945312, -0.1454925537109375, -0.13932418823242188, -0.13315582275390625, -0.12698745727539062, -0.120819091796875, -0.11465072631835938, -0.10848236083984375, -0.10231399536132812, -0.0961456298828125, -0.08997726440429688, -0.08380889892578125, -0.07764053344726562, -0.07147216796875, -0.06530380249023438, -0.05913543701171875, -0.052967071533203125, -0.0467987060546875, -0.040630340576171875, -0.03446197509765625, -0.028293609619140625, -0.022125244140625, -0.015956878662109375, -0.00978851318359375, -0.003620147705078125, 0.0025482177734375, 0.008716583251953125, 0.01488494873046875, 0.021053314208984375, 0.0272216796875, 0.033390045166015625, 0.03955841064453125, 0.045726776123046875, 0.0518951416015625, 0.058063507080078125, 0.06423187255859375, 0.07040023803710938, 0.076568603515625, 0.08273696899414062, 0.08890533447265625, 0.09507369995117188, 0.1012420654296875, 0.10741043090820312, 0.11357879638671875, 0.11974716186523438, 0.12591552734375, 0.13208389282226562, 0.13825225830078125, 0.14442062377929688, 0.1505889892578125, 0.15675735473632812, 0.16292572021484375, 0.16909408569335938, 0.175262451171875, 0.18143081665039062, 0.18759918212890625, 0.19376754760742188, 0.1999359130859375, 0.20610427856445312, 0.21227264404296875, 0.21844100952148438, 0.224609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 15.0, 27.0, 26.0, 44.0, 58.0, 98.0, 120.0, 163.0, 284.0, 409.0, 703.0, 1188.0, 2456.0, 5112.0, 12398.0, 34283.0, 104178.0, 350703.0, 1561199.0, 1597131.0, 358796.0, 106474.0, 34875.0, 12679.0, 5304.0, 2449.0, 1178.0, 676.0, 414.0, 265.0, 178.0, 129.0, 67.0, 47.0, 41.0, 31.0, 22.0, 14.0, 15.0, 6.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.431884765625, -0.4183921813964844, -0.40489959716796875, -0.3914070129394531, -0.3779144287109375, -0.3644218444824219, -0.35092926025390625, -0.3374366760253906, -0.323944091796875, -0.3104515075683594, -0.29695892333984375, -0.2834663391113281, -0.2699737548828125, -0.2564811706542969, -0.24298858642578125, -0.22949600219726562, -0.21600341796875, -0.20251083374023438, -0.18901824951171875, -0.17552566528320312, -0.1620330810546875, -0.14854049682617188, -0.13504791259765625, -0.12155532836914062, -0.108062744140625, -0.09457015991210938, -0.08107757568359375, -0.06758499145507812, -0.0540924072265625, -0.040599822998046875, -0.02710723876953125, -0.013614654541015625, -0.0001220703125, 0.013370513916015625, 0.02686309814453125, 0.040355682373046875, 0.0538482666015625, 0.06734085083007812, 0.08083343505859375, 0.09432601928710938, 0.107818603515625, 0.12131118774414062, 0.13480377197265625, 0.14829635620117188, 0.1617889404296875, 0.17528152465820312, 0.18877410888671875, 0.20226669311523438, 0.21575927734375, 0.22925186157226562, 0.24274444580078125, 0.2562370300292969, 0.2697296142578125, 0.2832221984863281, 0.29671478271484375, 0.3102073669433594, 0.323699951171875, 0.3371925354003906, 0.35068511962890625, 0.3641777038574219, 0.3776702880859375, 0.3911628723144531, 0.40465545654296875, 0.4181480407714844, 0.431640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 1.0, 3.0, 8.0, 8.0, 8.0, 11.0, 14.0, 11.0, 8.0, 22.0, 35.0, 32.0, 29.0, 33.0, 52.0, 71.0, 79.0, 107.0, 106.0, 141.0, 168.0, 226.0, 283.0, 365.0, 389.0, 325.0, 290.0, 237.0, 179.0, 157.0, 127.0, 97.0, 87.0, 71.0, 50.0, 44.0, 41.0, 31.0, 20.0, 16.0, 22.0, 8.0, 9.0, 12.0, 12.0, 10.0, 5.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.3193359375, -0.30954742431640625, -0.2997589111328125, -0.28997039794921875, -0.280181884765625, -0.27039337158203125, -0.2606048583984375, -0.25081634521484375, -0.24102783203125, -0.23123931884765625, -0.2214508056640625, -0.21166229248046875, -0.201873779296875, -0.19208526611328125, -0.1822967529296875, -0.17250823974609375, -0.1627197265625, -0.15293121337890625, -0.1431427001953125, -0.13335418701171875, -0.123565673828125, -0.11377716064453125, -0.1039886474609375, -0.09420013427734375, -0.08441162109375, -0.07462310791015625, -0.0648345947265625, -0.05504608154296875, -0.045257568359375, -0.03546905517578125, -0.0256805419921875, -0.01589202880859375, -0.006103515625, 0.00368499755859375, 0.0134735107421875, 0.02326202392578125, 0.033050537109375, 0.04283905029296875, 0.0526275634765625, 0.06241607666015625, 0.07220458984375, 0.08199310302734375, 0.0917816162109375, 0.10157012939453125, 0.111358642578125, 0.12114715576171875, 0.1309356689453125, 0.14072418212890625, 0.1505126953125, 0.16030120849609375, 0.1700897216796875, 0.17987823486328125, 0.189666748046875, 0.19945526123046875, 0.2092437744140625, 0.21903228759765625, 0.22882080078125, 0.23860931396484375, 0.2483978271484375, 0.25818634033203125, 0.267974853515625, 0.27776336669921875, 0.2875518798828125, 0.29734039306640625, 0.30712890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 8.0, 28.0, 37.0, 78.0, 117.0, 136.0, 192.0, 138.0, 116.0, 75.0, 28.0, 22.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.516013145446777, -4.381528854370117, -4.247044086456299, -4.112559795379639, -3.9780752658843994, -3.84359073638916, -3.7091064453125, -3.5746219158172607, -3.4401373863220215, -3.3056528568267822, -3.171168565750122, -3.036684036254883, -2.9021995067596436, -2.7677149772644043, -2.633230686187744, -2.498746156692505, -2.3642618656158447, -2.2297773361206055, -2.0952930450439453, -1.960808515548706, -1.8263239860534668, -1.691839575767517, -1.5573551654815674, -1.4228706359863281, -1.2883862257003784, -1.1539018154144287, -1.0194172859191895, -0.8849328756332397, -0.7504484057426453, -0.6159639358520508, -0.4814795255661011, -0.3469950556755066, -0.2125105857849121, -0.07802613079547882, 0.05645832419395447, 0.19094276428222656, 0.32542723417282104, 0.4599117040634155, 0.5943961143493652, 0.7288805842399597, 0.8633650541305542, 0.9978495240211487, 1.1323339939117432, 1.2668184041976929, 1.4013028144836426, 1.5357873439788818, 1.6702717542648315, 1.8047561645507812, 1.9392406940460205, 2.0737252235412598, 2.20820951461792, 2.342694044113159, 2.4771785736083984, 2.6116628646850586, 2.746147394180298, 2.880631923675537, 3.0151162147521973, 3.1496007442474365, 3.2840850353240967, 3.418569564819336, 3.553054094314575, 3.6875386238098145, 3.8220229148864746, 3.956507444381714, 4.090991973876953]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 9.0, 4.0, 7.0, 8.0, 11.0, 16.0, 15.0, 15.0, 20.0, 20.0, 24.0, 25.0, 22.0, 36.0, 31.0, 32.0, 30.0, 30.0, 38.0, 35.0, 44.0, 57.0, 33.0, 43.0, 37.0, 31.0, 29.0, 38.0, 22.0, 40.0, 20.0, 35.0, 22.0, 19.0, 10.0, 22.0, 12.0, 12.0, 7.0, 6.0, 3.0, 6.0, 6.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.4504894018173218, -1.4076894521713257, -1.36488938331604, -1.322089433670044, -1.2792894840240479, -1.2364894151687622, -1.1936894655227661, -1.1508893966674805, -1.1080894470214844, -1.0652894973754883, -1.0224894285202026, -0.9796894788742065, -0.9368894696235657, -0.8940894603729248, -0.8512895107269287, -0.8084895014762878, -0.7656895518302917, -0.7228895425796509, -0.6800895929336548, -0.6372895836830139, -0.594489574432373, -0.551689624786377, -0.5088896155357361, -0.4660896062850952, -0.42328962683677673, -0.38048964738845825, -0.3376896381378174, -0.2948896586894989, -0.2520896792411804, -0.20928966999053955, -0.16648969054222107, -0.1236896812915802, -0.08088970184326172, -0.03808971121907234, 0.004710279405117035, 0.04751026630401611, 0.09031026065349579, 0.13311025500297546, 0.17591023445129395, 0.21871024370193481, 0.2615102231502533, 0.3043102025985718, 0.34711021184921265, 0.38991019129753113, 0.4327101707458496, 0.4755101799964905, 0.5183101892471313, 0.5611101388931274, 0.6039101481437683, 0.6467101573944092, 0.6895101070404053, 0.7323101162910461, 0.775110125541687, 0.8179100751876831, 0.860710084438324, 0.9035100936889648, 0.9463100433349609, 0.9891100525856018, 1.0319100618362427, 1.0747100114822388, 1.1175099611282349, 1.1603100299835205, 1.2031099796295166, 1.2459099292755127, 1.2887099981307983]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 14.0, 22.0, 35.0, 63.0, 82.0, 138.0, 194.0, 327.0, 518.0, 925.0, 1622.0, 2916.0, 5078.0, 9421.0, 17713.0, 33509.0, 61700.0, 107216.0, 161197.0, 193751.0, 173283.0, 121252.0, 71924.0, 39145.0, 21061.0, 11280.0, 6134.0, 3361.0, 1919.0, 1072.0, 642.0, 379.0, 228.0, 162.0, 78.0, 62.0, 43.0, 19.0, 12.0, 6.0, 3.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22093772888183594, -0.21348190307617188, -0.2060260772705078, -0.19857025146484375, -0.1911144256591797, -0.18365859985351562, -0.17620277404785156, -0.1687469482421875, -0.16129112243652344, -0.15383529663085938, -0.1463794708251953, -0.13892364501953125, -0.1314678192138672, -0.12401199340820312, -0.11655616760253906, -0.109100341796875, -0.10164451599121094, -0.09418869018554688, -0.08673286437988281, -0.07927703857421875, -0.07182121276855469, -0.06436538696289062, -0.05690956115722656, -0.0494537353515625, -0.04199790954589844, -0.034542083740234375, -0.027086257934570312, -0.01963043212890625, -0.012174606323242188, -0.004718780517578125, 0.0027370452880859375, 0.01019287109375, 0.017648696899414062, 0.025104522705078125, 0.03256034851074219, 0.04001617431640625, 0.04747200012207031, 0.054927825927734375, 0.06238365173339844, 0.0698394775390625, 0.07729530334472656, 0.08475112915039062, 0.09220695495605469, 0.09966278076171875, 0.10711860656738281, 0.11457443237304688, 0.12203025817871094, 0.129486083984375, 0.13694190979003906, 0.14439773559570312, 0.1518535614013672, 0.15930938720703125, 0.1667652130126953, 0.17422103881835938, 0.18167686462402344, 0.1891326904296875, 0.19658851623535156, 0.20404434204101562, 0.2115001678466797, 0.21895599365234375, 0.2264118194580078, 0.23386764526367188, 0.24132347106933594, 0.248779296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 13.0, 13.0, 17.0, 12.0, 12.0, 25.0, 25.0, 29.0, 37.0, 22.0, 36.0, 34.0, 46.0, 42.0, 33.0, 46.0, 45.0, 46.0, 46.0, 43.0, 33.0, 36.0, 34.0, 37.0, 28.0, 33.0, 30.0, 19.0, 14.0, 15.0, 24.0, 12.0, 17.0, 9.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.1735706329345703, -0.16708755493164062, -0.16060447692871094, -0.15412139892578125, -0.14763832092285156, -0.14115524291992188, -0.1346721649169922, -0.1281890869140625, -0.12170600891113281, -0.11522293090820312, -0.10873985290527344, -0.10225677490234375, -0.09577369689941406, -0.08929061889648438, -0.08280754089355469, -0.076324462890625, -0.06984138488769531, -0.06335830688476562, -0.05687522888183594, -0.05039215087890625, -0.04390907287597656, -0.037425994873046875, -0.030942916870117188, -0.0244598388671875, -0.017976760864257812, -0.011493682861328125, -0.0050106048583984375, 0.00147247314453125, 0.007955551147460938, 0.014438629150390625, 0.020921707153320312, 0.02740478515625, 0.03388786315917969, 0.040370941162109375, 0.04685401916503906, 0.05333709716796875, 0.05982017517089844, 0.06630325317382812, 0.07278633117675781, 0.0792694091796875, 0.08575248718261719, 0.09223556518554688, 0.09871864318847656, 0.10520172119140625, 0.11168479919433594, 0.11816787719726562, 0.12465095520019531, 0.131134033203125, 0.1376171112060547, 0.14410018920898438, 0.15058326721191406, 0.15706634521484375, 0.16354942321777344, 0.17003250122070312, 0.1765155792236328, 0.1829986572265625, 0.1894817352294922, 0.19596481323242188, 0.20244789123535156, 0.20893096923828125, 0.21541404724121094, 0.22189712524414062, 0.2283802032470703, 0.23486328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 15.0, 20.0, 24.0, 38.0, 65.0, 105.0, 222.0, 504.0, 1119.0, 3552.0, 12621.0, 53089.0, 231107.0, 469576.0, 211662.0, 48124.0, 11421.0, 3288.0, 1111.0, 370.0, 226.0, 102.0, 56.0, 38.0, 32.0, 19.0, 8.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.572265625, -0.5534820556640625, -0.534698486328125, -0.5159149169921875, -0.49713134765625, -0.4783477783203125, -0.459564208984375, -0.4407806396484375, -0.4219970703125, -0.4032135009765625, -0.384429931640625, -0.3656463623046875, -0.34686279296875, -0.3280792236328125, -0.309295654296875, -0.2905120849609375, -0.271728515625, -0.2529449462890625, -0.234161376953125, -0.2153778076171875, -0.19659423828125, -0.1778106689453125, -0.159027099609375, -0.1402435302734375, -0.1214599609375, -0.1026763916015625, -0.083892822265625, -0.0651092529296875, -0.04632568359375, -0.0275421142578125, -0.008758544921875, 0.0100250244140625, 0.02880859375, 0.0475921630859375, 0.066375732421875, 0.0851593017578125, 0.10394287109375, 0.1227264404296875, 0.141510009765625, 0.1602935791015625, 0.1790771484375, 0.1978607177734375, 0.216644287109375, 0.2354278564453125, 0.25421142578125, 0.2729949951171875, 0.291778564453125, 0.3105621337890625, 0.329345703125, 0.3481292724609375, 0.366912841796875, 0.3856964111328125, 0.40447998046875, 0.4232635498046875, 0.442047119140625, 0.4608306884765625, 0.4796142578125, 0.4983978271484375, 0.517181396484375, 0.5359649658203125, 0.55474853515625, 0.5735321044921875, 0.592315673828125, 0.6110992431640625, 0.6298828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 4.0, 7.0, 9.0, 9.0, 15.0, 16.0, 21.0, 16.0, 27.0, 32.0, 26.0, 41.0, 32.0, 43.0, 43.0, 40.0, 43.0, 50.0, 49.0, 32.0, 51.0, 41.0, 48.0, 47.0, 25.0, 24.0, 31.0, 31.0, 21.0, 15.0, 29.0, 18.0, 6.0, 7.0, 13.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.65673828125, -0.6382064819335938, -0.6196746826171875, -0.6011428833007812, -0.582611083984375, -0.5640792846679688, -0.5455474853515625, -0.5270156860351562, -0.50848388671875, -0.48995208740234375, -0.4714202880859375, -0.45288848876953125, -0.434356689453125, -0.41582489013671875, -0.3972930908203125, -0.37876129150390625, -0.3602294921875, -0.34169769287109375, -0.3231658935546875, -0.30463409423828125, -0.286102294921875, -0.26757049560546875, -0.2490386962890625, -0.23050689697265625, -0.21197509765625, -0.19344329833984375, -0.1749114990234375, -0.15637969970703125, -0.137847900390625, -0.11931610107421875, -0.1007843017578125, -0.08225250244140625, -0.063720703125, -0.04518890380859375, -0.0266571044921875, -0.00812530517578125, 0.010406494140625, 0.02893829345703125, 0.0474700927734375, 0.06600189208984375, 0.08453369140625, 0.10306549072265625, 0.1215972900390625, 0.14012908935546875, 0.158660888671875, 0.17719268798828125, 0.1957244873046875, 0.21425628662109375, 0.2327880859375, 0.25131988525390625, 0.2698516845703125, 0.28838348388671875, 0.306915283203125, 0.32544708251953125, 0.3439788818359375, 0.36251068115234375, 0.38104248046875, 0.39957427978515625, 0.4181060791015625, 0.43663787841796875, 0.455169677734375, 0.47370147705078125, 0.4922332763671875, 0.5107650756835938, 0.529296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 18.0, 27.0, 36.0, 35.0, 49.0, 113.0, 142.0, 247.0, 330.0, 604.0, 1057.0, 1818.0, 3542.0, 7103.0, 15579.0, 36163.0, 85685.0, 183725.0, 274149.0, 227294.0, 118487.0, 50960.0, 21529.0, 9552.0, 4707.0, 2306.0, 1259.0, 784.0, 439.0, 282.0, 173.0, 120.0, 89.0, 45.0, 28.0, 26.0, 18.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.12944984436035156, -0.12523269653320312, -0.12101554870605469, -0.11679840087890625, -0.11258125305175781, -0.10836410522460938, -0.10414695739746094, -0.0999298095703125, -0.09571266174316406, -0.09149551391601562, -0.08727836608886719, -0.08306121826171875, -0.07884407043457031, -0.07462692260742188, -0.07040977478027344, -0.066192626953125, -0.06197547912597656, -0.057758331298828125, -0.05354118347167969, -0.04932403564453125, -0.04510688781738281, -0.040889739990234375, -0.03667259216308594, -0.0324554443359375, -0.028238296508789062, -0.024021148681640625, -0.019804000854492188, -0.01558685302734375, -0.011369705200195312, -0.007152557373046875, -0.0029354095458984375, 0.00128173828125, 0.0054988861083984375, 0.009716033935546875, 0.013933181762695312, 0.01815032958984375, 0.022367477416992188, 0.026584625244140625, 0.030801773071289062, 0.0350189208984375, 0.03923606872558594, 0.043453216552734375, 0.04767036437988281, 0.05188751220703125, 0.05610466003417969, 0.060321807861328125, 0.06453895568847656, 0.068756103515625, 0.07297325134277344, 0.07719039916992188, 0.08140754699707031, 0.08562469482421875, 0.08984184265136719, 0.09405899047851562, 0.09827613830566406, 0.1024932861328125, 0.10671043395996094, 0.11092758178710938, 0.11514472961425781, 0.11936187744140625, 0.12357902526855469, 0.12779617309570312, 0.13201332092285156, 0.13623046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 13.0, 11.0, 12.0, 25.0, 26.0, 38.0, 42.0, 43.0, 53.0, 66.0, 75.0, 70.0, 77.0, 72.0, 68.0, 60.0, 47.0, 47.0, 36.0, 23.0, 21.0, 16.0, 16.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3511390686035156e-05, -4.224199801683426e-05, -4.097260534763336e-05, -3.9703212678432465e-05, -3.843382000923157e-05, -3.716442734003067e-05, -3.589503467082977e-05, -3.4625642001628876e-05, -3.335624933242798e-05, -3.208685666322708e-05, -3.0817463994026184e-05, -2.9548071324825287e-05, -2.827867865562439e-05, -2.7009285986423492e-05, -2.5739893317222595e-05, -2.4470500648021698e-05, -2.32011079788208e-05, -2.1931715309619904e-05, -2.0662322640419006e-05, -1.939292997121811e-05, -1.8123537302017212e-05, -1.6854144632816315e-05, -1.5584751963615417e-05, -1.431535929441452e-05, -1.3045966625213623e-05, -1.1776573956012726e-05, -1.0507181286811829e-05, -9.237788617610931e-06, -7.968395948410034e-06, -6.699003279209137e-06, -5.42961061000824e-06, -4.1602179408073425e-06, -2.8908252716064453e-06, -1.621432602405548e-06, -3.520399332046509e-07, 9.173527359962463e-07, 2.1867454051971436e-06, 3.4561380743980408e-06, 4.725530743598938e-06, 5.994923412799835e-06, 7.264316082000732e-06, 8.53370875120163e-06, 9.803101420402527e-06, 1.1072494089603424e-05, 1.2341886758804321e-05, 1.3611279428005219e-05, 1.4880672097206116e-05, 1.6150064766407013e-05, 1.741945743560791e-05, 1.8688850104808807e-05, 1.9958242774009705e-05, 2.1227635443210602e-05, 2.24970281124115e-05, 2.3766420781612396e-05, 2.5035813450813293e-05, 2.630520612001419e-05, 2.7574598789215088e-05, 2.8843991458415985e-05, 3.0113384127616882e-05, 3.138277679681778e-05, 3.265216946601868e-05, 3.3921562135219574e-05, 3.519095480442047e-05, 3.646034747362137e-05, 3.7729740142822266e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 17.0, 24.0, 30.0, 38.0, 63.0, 98.0, 162.0, 308.0, 675.0, 1413.0, 3324.0, 9105.0, 26822.0, 86008.0, 238657.0, 358824.0, 213041.0, 73382.0, 23179.0, 7844.0, 2860.0, 1323.0, 594.0, 293.0, 167.0, 102.0, 55.0, 44.0, 33.0, 13.0, 13.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.17337989807128906, -0.16768264770507812, -0.1619853973388672, -0.15628814697265625, -0.1505908966064453, -0.14489364624023438, -0.13919639587402344, -0.1334991455078125, -0.12780189514160156, -0.12210464477539062, -0.11640739440917969, -0.11071014404296875, -0.10501289367675781, -0.09931564331054688, -0.09361839294433594, -0.087921142578125, -0.08222389221191406, -0.07652664184570312, -0.07082939147949219, -0.06513214111328125, -0.05943489074707031, -0.053737640380859375, -0.04804039001464844, -0.0423431396484375, -0.03664588928222656, -0.030948638916015625, -0.025251388549804688, -0.01955413818359375, -0.013856887817382812, -0.008159637451171875, -0.0024623870849609375, 0.00323486328125, 0.008932113647460938, 0.014629364013671875, 0.020326614379882812, 0.02602386474609375, 0.03172111511230469, 0.037418365478515625, 0.04311561584472656, 0.0488128662109375, 0.05451011657714844, 0.060207366943359375, 0.06590461730957031, 0.07160186767578125, 0.07729911804199219, 0.08299636840820312, 0.08869361877441406, 0.094390869140625, 0.10008811950683594, 0.10578536987304688, 0.11148262023925781, 0.11717987060546875, 0.12287712097167969, 0.12857437133789062, 0.13427162170410156, 0.1399688720703125, 0.14566612243652344, 0.15136337280273438, 0.1570606231689453, 0.16275787353515625, 0.1684551239013672, 0.17415237426757812, 0.17984962463378906, 0.185546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 4.0, 7.0, 11.0, 14.0, 20.0, 30.0, 43.0, 65.0, 65.0, 94.0, 95.0, 116.0, 102.0, 72.0, 73.0, 49.0, 39.0, 35.0, 28.0, 17.0, 7.0, 4.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.147125244140625, -0.13995361328125, -0.132781982421875, -0.1256103515625, -0.118438720703125, -0.11126708984375, -0.104095458984375, -0.096923828125, -0.089752197265625, -0.08258056640625, -0.075408935546875, -0.0682373046875, -0.061065673828125, -0.05389404296875, -0.046722412109375, -0.03955078125, -0.032379150390625, -0.02520751953125, -0.018035888671875, -0.0108642578125, -0.003692626953125, 0.00347900390625, 0.010650634765625, 0.017822265625, 0.024993896484375, 0.03216552734375, 0.039337158203125, 0.0465087890625, 0.053680419921875, 0.06085205078125, 0.068023681640625, 0.0751953125, 0.082366943359375, 0.08953857421875, 0.096710205078125, 0.1038818359375, 0.111053466796875, 0.11822509765625, 0.125396728515625, 0.132568359375, 0.139739990234375, 0.14691162109375, 0.154083251953125, 0.1612548828125, 0.168426513671875, 0.17559814453125, 0.182769775390625, 0.18994140625, 0.197113037109375, 0.20428466796875, 0.211456298828125, 0.2186279296875, 0.225799560546875, 0.23297119140625, 0.240142822265625, 0.247314453125, 0.254486083984375, 0.26165771484375, 0.268829345703125, 0.2760009765625, 0.283172607421875, 0.29034423828125, 0.297515869140625, 0.3046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 9.0, 24.0, 41.0, 81.0, 132.0, 162.0, 201.0, 149.0, 99.0, 41.0, 22.0, 13.0, 8.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5538761615753174, -2.4527816772460938, -2.35168719291687, -2.2505927085876465, -2.1494979858398438, -2.048403739929199, -1.9473090171813965, -1.8462145328521729, -1.7451200485229492, -1.6440255641937256, -1.542931079864502, -1.4418364763259888, -1.3407419919967651, -1.2396475076675415, -1.1385529041290283, -1.0374584197998047, -0.936363935470581, -0.8352694511413574, -0.734174907207489, -0.6330803632736206, -0.531985878944397, -0.43089139461517334, -0.32979685068130493, -0.22870230674743652, -0.1276078224182129, -0.02651330828666687, 0.07458120584487915, 0.17567571997642517, 0.2767702341079712, 0.3778647184371948, 0.47895926237106323, 0.5800538063049316, 0.6811485290527344, 0.782243013381958, 0.8833375573158264, 0.9844321012496948, 1.0855265855789185, 1.186621069908142, 1.2877156734466553, 1.388810157775879, 1.4899046421051025, 1.5909991264343262, 1.6920936107635498, 1.793188214302063, 1.8942826986312866, 1.9953771829605103, 2.0964717864990234, 2.197566270828247, 2.2986607551574707, 2.3997552394866943, 2.500849723815918, 2.6019442081451416, 2.7030386924743652, 2.804133415222168, 2.9052278995513916, 3.0063223838806152, 3.107416868209839, 3.2085113525390625, 3.309605836868286, 3.4107003211975098, 3.5117950439453125, 3.612889289855957, 3.7139840126037598, 3.8150784969329834, 3.916172981262207]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 8.0, 8.0, 5.0, 8.0, 20.0, 11.0, 17.0, 13.0, 21.0, 23.0, 32.0, 34.0, 36.0, 41.0, 25.0, 40.0, 37.0, 50.0, 41.0, 30.0, 45.0, 27.0, 40.0, 42.0, 44.0, 29.0, 31.0, 23.0, 27.0, 24.0, 27.0, 23.0, 24.0, 11.0, 16.0, 14.0, 11.0, 8.0, 7.0, 8.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.451817274093628, -1.4054875373840332, -1.359157681465149, -1.3128279447555542, -1.26649808883667, -1.2201683521270752, -1.1738386154174805, -1.1275087594985962, -1.081178903579712, -1.0348491668701172, -0.9885193109512329, -0.9421895742416382, -0.8958597183227539, -0.8495299816131592, -0.8032001852989197, -0.7568703889846802, -0.7105406522750854, -0.664210855960846, -0.6178810596466064, -0.5715513229370117, -0.5252214670181274, -0.4788917005062103, -0.4325619339942932, -0.3862321376800537, -0.3399023413658142, -0.2935725450515747, -0.2472427636384964, -0.2009129822254181, -0.1545831859111786, -0.10825338959693909, -0.06192362308502197, -0.01559382677078247, 0.03073596954345703, 0.07706575840711594, 0.12339554727077484, 0.16972532868385315, 0.21605512499809265, 0.26238492131233215, 0.30871468782424927, 0.35504448413848877, 0.40137428045272827, 0.4477040767669678, 0.4940338730812073, 0.5403636693954468, 0.5866934061050415, 0.6330232620239258, 0.6793529987335205, 0.72568279504776, 0.7720125913619995, 0.818342387676239, 0.8646721839904785, 0.9110019207000732, 0.9573317766189575, 1.0036615133285522, 1.0499913692474365, 1.0963211059570312, 1.142650842666626, 1.1889805793762207, 1.235310435295105, 1.2816401720046997, 1.327970027923584, 1.3742997646331787, 1.4206295013427734, 1.4669593572616577, 1.513289213180542]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 12.0, 9.0, 25.0, 36.0, 58.0, 84.0, 178.0, 266.0, 424.0, 680.0, 1236.0, 2322.0, 4716.0, 9583.0, 21164.0, 50126.0, 129925.0, 399204.0, 1253434.0, 1515429.0, 531111.0, 166073.0, 60398.0, 24973.0, 11049.0, 5450.0, 2716.0, 1460.0, 841.0, 465.0, 297.0, 198.0, 116.0, 71.0, 52.0, 37.0, 17.0, 14.0, 12.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20380020141601562, -0.19568634033203125, -0.18757247924804688, -0.1794586181640625, -0.17134475708007812, -0.16323089599609375, -0.15511703491210938, -0.147003173828125, -0.13888931274414062, -0.13077545166015625, -0.12266159057617188, -0.1145477294921875, -0.10643386840820312, -0.09832000732421875, -0.09020614624023438, -0.08209228515625, -0.07397842407226562, -0.06586456298828125, -0.057750701904296875, -0.0496368408203125, -0.041522979736328125, -0.03340911865234375, -0.025295257568359375, -0.017181396484375, -0.009067535400390625, -0.00095367431640625, 0.007160186767578125, 0.0152740478515625, 0.023387908935546875, 0.03150177001953125, 0.039615631103515625, 0.0477294921875, 0.055843353271484375, 0.06395721435546875, 0.07207107543945312, 0.0801849365234375, 0.08829879760742188, 0.09641265869140625, 0.10452651977539062, 0.112640380859375, 0.12075424194335938, 0.12886810302734375, 0.13698196411132812, 0.1450958251953125, 0.15320968627929688, 0.16132354736328125, 0.16943740844726562, 0.17755126953125, 0.18566513061523438, 0.19377899169921875, 0.20189285278320312, 0.2100067138671875, 0.21812057495117188, 0.22623443603515625, 0.23434829711914062, 0.242462158203125, 0.2505760192871094, 0.25868988037109375, 0.2668037414550781, 0.2749176025390625, 0.2830314636230469, 0.29114532470703125, 0.2992591857910156, 0.307373046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 10.0, 7.0, 10.0, 10.0, 19.0, 17.0, 21.0, 17.0, 27.0, 30.0, 30.0, 33.0, 37.0, 35.0, 42.0, 43.0, 35.0, 68.0, 45.0, 39.0, 43.0, 42.0, 39.0, 34.0, 31.0, 27.0, 27.0, 33.0, 29.0, 20.0, 20.0, 20.0, 10.0, 9.0, 6.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.1710681915283203, -0.16452407836914062, -0.15797996520996094, -0.15143585205078125, -0.14489173889160156, -0.13834762573242188, -0.1318035125732422, -0.1252593994140625, -0.11871528625488281, -0.11217117309570312, -0.10562705993652344, -0.09908294677734375, -0.09253883361816406, -0.08599472045898438, -0.07945060729980469, -0.072906494140625, -0.06636238098144531, -0.059818267822265625, -0.05327415466308594, -0.04673004150390625, -0.04018592834472656, -0.033641815185546875, -0.027097702026367188, -0.0205535888671875, -0.014009475708007812, -0.007465362548828125, -0.0009212493896484375, 0.00562286376953125, 0.012166976928710938, 0.018711090087890625, 0.025255203247070312, 0.03179931640625, 0.03834342956542969, 0.044887542724609375, 0.05143165588378906, 0.05797576904296875, 0.06451988220214844, 0.07106399536132812, 0.07760810852050781, 0.0841522216796875, 0.09069633483886719, 0.09724044799804688, 0.10378456115722656, 0.11032867431640625, 0.11687278747558594, 0.12341690063476562, 0.1299610137939453, 0.136505126953125, 0.1430492401123047, 0.14959335327148438, 0.15613746643066406, 0.16268157958984375, 0.16922569274902344, 0.17576980590820312, 0.1823139190673828, 0.1888580322265625, 0.1954021453857422, 0.20194625854492188, 0.20849037170410156, 0.21503448486328125, 0.22157859802246094, 0.22812271118164062, 0.2346668243408203, 0.2412109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 10.0, 10.0, 21.0, 31.0, 47.0, 75.0, 117.0, 234.0, 377.0, 733.0, 1586.0, 3614.0, 9974.0, 32123.0, 131044.0, 739088.0, 2640858.0, 499043.0, 97150.0, 24550.0, 7932.0, 2865.0, 1249.0, 669.0, 336.0, 175.0, 128.0, 80.0, 56.0, 34.0, 21.0, 15.0, 9.0, 9.0, 6.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5248146057128906, -0.5091018676757812, -0.4933891296386719, -0.4776763916015625, -0.4619636535644531, -0.44625091552734375, -0.4305381774902344, -0.414825439453125, -0.3991127014160156, -0.38339996337890625, -0.3676872253417969, -0.3519744873046875, -0.3362617492675781, -0.32054901123046875, -0.3048362731933594, -0.28912353515625, -0.2734107971191406, -0.25769805908203125, -0.24198532104492188, -0.2262725830078125, -0.21055984497070312, -0.19484710693359375, -0.17913436889648438, -0.163421630859375, -0.14770889282226562, -0.13199615478515625, -0.11628341674804688, -0.1005706787109375, -0.08485794067382812, -0.06914520263671875, -0.053432464599609375, -0.0377197265625, -0.022006988525390625, -0.00629425048828125, 0.009418487548828125, 0.0251312255859375, 0.040843963623046875, 0.05655670166015625, 0.07226943969726562, 0.087982177734375, 0.10369491577148438, 0.11940765380859375, 0.13512039184570312, 0.1508331298828125, 0.16654586791992188, 0.18225860595703125, 0.19797134399414062, 0.21368408203125, 0.22939682006835938, 0.24510955810546875, 0.2608222961425781, 0.2765350341796875, 0.2922477722167969, 0.30796051025390625, 0.3236732482910156, 0.339385986328125, 0.3550987243652344, 0.37081146240234375, 0.3865242004394531, 0.4022369384765625, 0.4179496765136719, 0.43366241455078125, 0.4493751525878906, 0.465087890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 7.0, 15.0, 8.0, 13.0, 24.0, 31.0, 39.0, 52.0, 70.0, 107.0, 146.0, 191.0, 277.0, 406.0, 599.0, 619.0, 438.0, 320.0, 208.0, 140.0, 98.0, 65.0, 58.0, 41.0, 19.0, 14.0, 15.0, 14.0, 8.0, 4.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3681640625, -0.3545684814453125, -0.340972900390625, -0.3273773193359375, -0.31378173828125, -0.3001861572265625, -0.286590576171875, -0.2729949951171875, -0.2593994140625, -0.2458038330078125, -0.232208251953125, -0.2186126708984375, -0.20501708984375, -0.1914215087890625, -0.177825927734375, -0.1642303466796875, -0.150634765625, -0.1370391845703125, -0.123443603515625, -0.1098480224609375, -0.09625244140625, -0.0826568603515625, -0.069061279296875, -0.0554656982421875, -0.0418701171875, -0.0282745361328125, -0.014678955078125, -0.0010833740234375, 0.01251220703125, 0.0261077880859375, 0.039703369140625, 0.0532989501953125, 0.06689453125, 0.0804901123046875, 0.094085693359375, 0.1076812744140625, 0.12127685546875, 0.1348724365234375, 0.148468017578125, 0.1620635986328125, 0.1756591796875, 0.1892547607421875, 0.202850341796875, 0.2164459228515625, 0.23004150390625, 0.2436370849609375, 0.257232666015625, 0.2708282470703125, 0.284423828125, 0.2980194091796875, 0.311614990234375, 0.3252105712890625, 0.33880615234375, 0.3524017333984375, 0.365997314453125, 0.3795928955078125, 0.3931884765625, 0.4067840576171875, 0.420379638671875, 0.4339752197265625, 0.44757080078125, 0.4611663818359375, 0.474761962890625, 0.4883575439453125, 0.501953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 12.0, 29.0, 40.0, 76.0, 123.0, 129.0, 143.0, 153.0, 119.0, 77.0, 45.0, 20.0, 14.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.283090114593506, -4.17725944519043, -4.0714287757873535, -3.9655983448028564, -3.8597679138183594, -3.753937244415283, -3.648106575012207, -3.54227614402771, -3.436445474624634, -3.3306148052215576, -3.2247843742370605, -3.1189537048339844, -3.0131232738494873, -2.907292604446411, -2.801462173461914, -2.695631504058838, -2.5898008346557617, -2.4839701652526855, -2.3781397342681885, -2.2723090648651123, -2.1664786338806152, -2.060647964477539, -1.9548174142837524, -1.8489868640899658, -1.7431564331054688, -1.6373258829116821, -1.5314953327178955, -1.4256646633148193, -1.3198341131210327, -1.214003562927246, -1.1081730127334595, -1.0023424625396729, -0.8965117931365967, -0.7906812429428101, -0.6848506331443787, -0.579020082950592, -0.47318950295448303, -0.367358922958374, -0.2615283727645874, -0.155697762966156, -0.049867212772369385, 0.05596335977315903, 0.16179393231868744, 0.26762449741363525, 0.37345507740974426, 0.47928565740585327, 0.5851162075996399, 0.6909468173980713, 0.7967773675918579, 0.9026079177856445, 1.0084384679794312, 1.1142690181732178, 1.220099687576294, 1.3259302377700806, 1.4317607879638672, 1.5375914573669434, 1.6434218883514404, 1.749252438545227, 1.8550829887390137, 1.9609136581420898, 2.066744089126587, 2.172574758529663, 2.27840518951416, 2.3842358589172363, 2.4900665283203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 5.0, 8.0, 7.0, 11.0, 14.0, 13.0, 30.0, 18.0, 28.0, 30.0, 21.0, 35.0, 26.0, 34.0, 34.0, 41.0, 28.0, 45.0, 45.0, 50.0, 38.0, 39.0, 39.0, 29.0, 35.0, 29.0, 30.0, 36.0, 25.0, 22.0, 30.0, 19.0, 16.0, 13.0, 13.0, 8.0, 6.0, 9.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.3442909717559814, -1.3058111667633057, -1.2673313617706299, -1.228851556777954, -1.1903717517852783, -1.1518919467926025, -1.1134121417999268, -1.074932336807251, -1.0364525318145752, -0.9979727268218994, -0.9594929218292236, -0.9210131168365479, -0.8825333118438721, -0.8440535068511963, -0.8055737018585205, -0.7670938968658447, -0.728614091873169, -0.6901342868804932, -0.6516544818878174, -0.6131746768951416, -0.5746948719024658, -0.53621506690979, -0.49773526191711426, -0.4592554569244385, -0.4207756519317627, -0.3822958469390869, -0.34381604194641113, -0.30533623695373535, -0.26685643196105957, -0.2283766269683838, -0.189896821975708, -0.15141701698303223, -0.11293721199035645, -0.07445740699768066, -0.03597760200500488, 0.0025022029876708984, 0.04098200798034668, 0.07946181297302246, 0.11794161796569824, 0.15642142295837402, 0.1949012279510498, 0.23338103294372559, 0.27186083793640137, 0.31034064292907715, 0.34882044792175293, 0.3873002529144287, 0.4257800579071045, 0.4642598628997803, 0.502739667892456, 0.5412194728851318, 0.5796992778778076, 0.6181790828704834, 0.6566588878631592, 0.695138692855835, 0.7336184978485107, 0.7720983028411865, 0.8105781078338623, 0.8490579128265381, 0.8875377178192139, 0.9260175228118896, 0.9644973278045654, 1.0029771327972412, 1.041456937789917, 1.0799367427825928, 1.1184165477752686]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 21.0, 30.0, 35.0, 56.0, 62.0, 107.0, 228.0, 350.0, 630.0, 1149.0, 2064.0, 3920.0, 7853.0, 17351.0, 42224.0, 111220.0, 253911.0, 313132.0, 175752.0, 68604.0, 26506.0, 11563.0, 5512.0, 2782.0, 1501.0, 777.0, 473.0, 266.0, 163.0, 90.0, 66.0, 43.0, 36.0, 19.0, 14.0, 13.0, 6.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.484130859375, -0.4711341857910156, -0.45813751220703125, -0.4451408386230469, -0.4321441650390625, -0.4191474914550781, -0.40615081787109375, -0.3931541442871094, -0.380157470703125, -0.3671607971191406, -0.35416412353515625, -0.3411674499511719, -0.3281707763671875, -0.3151741027832031, -0.30217742919921875, -0.2891807556152344, -0.27618408203125, -0.2631874084472656, -0.25019073486328125, -0.23719406127929688, -0.2241973876953125, -0.21120071411132812, -0.19820404052734375, -0.18520736694335938, -0.172210693359375, -0.15921401977539062, -0.14621734619140625, -0.13322067260742188, -0.1202239990234375, -0.10722732543945312, -0.09423065185546875, -0.08123397827148438, -0.0682373046875, -0.055240631103515625, -0.04224395751953125, -0.029247283935546875, -0.0162506103515625, -0.003253936767578125, 0.00974273681640625, 0.022739410400390625, 0.035736083984375, 0.048732757568359375, 0.06172943115234375, 0.07472610473632812, 0.0877227783203125, 0.10071945190429688, 0.11371612548828125, 0.12671279907226562, 0.13970947265625, 0.15270614624023438, 0.16570281982421875, 0.17869949340820312, 0.1916961669921875, 0.20469284057617188, 0.21768951416015625, 0.23068618774414062, 0.243682861328125, 0.2566795349121094, 0.26967620849609375, 0.2826728820800781, 0.2956695556640625, 0.3086662292480469, 0.32166290283203125, 0.3346595764160156, 0.34765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 16.0, 16.0, 15.0, 20.0, 23.0, 28.0, 28.0, 38.0, 36.0, 35.0, 40.0, 36.0, 50.0, 39.0, 41.0, 51.0, 45.0, 47.0, 49.0, 39.0, 36.0, 32.0, 30.0, 32.0, 29.0, 20.0, 23.0, 11.0, 11.0, 19.0, 10.0, 8.0, 4.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2005615234375, -0.19386672973632812, -0.18717193603515625, -0.18047714233398438, -0.1737823486328125, -0.16708755493164062, -0.16039276123046875, -0.15369796752929688, -0.147003173828125, -0.14030838012695312, -0.13361358642578125, -0.12691879272460938, -0.1202239990234375, -0.11352920532226562, -0.10683441162109375, -0.10013961791992188, -0.09344482421875, -0.08675003051757812, -0.08005523681640625, -0.07336044311523438, -0.0666656494140625, -0.059970855712890625, -0.05327606201171875, -0.046581268310546875, -0.039886474609375, -0.033191680908203125, -0.02649688720703125, -0.019802093505859375, -0.0131072998046875, -0.006412506103515625, 0.00028228759765625, 0.006977081298828125, 0.013671875, 0.020366668701171875, 0.02706146240234375, 0.033756256103515625, 0.0404510498046875, 0.047145843505859375, 0.05384063720703125, 0.060535430908203125, 0.067230224609375, 0.07392501831054688, 0.08061981201171875, 0.08731460571289062, 0.0940093994140625, 0.10070419311523438, 0.10739898681640625, 0.11409378051757812, 0.12078857421875, 0.12748336791992188, 0.13417816162109375, 0.14087295532226562, 0.1475677490234375, 0.15426254272460938, 0.16095733642578125, 0.16765213012695312, 0.174346923828125, 0.18104171752929688, 0.18773651123046875, 0.19443130493164062, 0.2011260986328125, 0.20782089233398438, 0.21451568603515625, 0.22121047973632812, 0.2279052734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 8.0, 8.0, 8.0, 15.0, 24.0, 42.0, 58.0, 78.0, 139.0, 237.0, 425.0, 834.0, 1514.0, 3121.0, 6021.0, 12834.0, 29181.0, 72781.0, 182088.0, 322079.0, 241483.0, 102290.0, 40069.0, 16912.0, 8112.0, 3911.0, 1931.0, 1009.0, 571.0, 306.0, 173.0, 94.0, 64.0, 37.0, 26.0, 18.0, 13.0, 5.0, 11.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3670845031738281, -0.35428619384765625, -0.3414878845214844, -0.3286895751953125, -0.3158912658691406, -0.30309295654296875, -0.2902946472167969, -0.277496337890625, -0.2646980285644531, -0.25189971923828125, -0.23910140991210938, -0.2263031005859375, -0.21350479125976562, -0.20070648193359375, -0.18790817260742188, -0.17510986328125, -0.16231155395507812, -0.14951324462890625, -0.13671493530273438, -0.1239166259765625, -0.11111831665039062, -0.09832000732421875, -0.08552169799804688, -0.072723388671875, -0.059925079345703125, -0.04712677001953125, -0.034328460693359375, -0.0215301513671875, -0.008731842041015625, 0.00406646728515625, 0.016864776611328125, 0.0296630859375, 0.042461395263671875, 0.05525970458984375, 0.06805801391601562, 0.0808563232421875, 0.09365463256835938, 0.10645294189453125, 0.11925125122070312, 0.132049560546875, 0.14484786987304688, 0.15764617919921875, 0.17044448852539062, 0.1832427978515625, 0.19604110717773438, 0.20883941650390625, 0.22163772583007812, 0.23443603515625, 0.24723434448242188, 0.26003265380859375, 0.2728309631347656, 0.2856292724609375, 0.2984275817871094, 0.31122589111328125, 0.3240242004394531, 0.336822509765625, 0.3496208190917969, 0.36241912841796875, 0.3752174377441406, 0.3880157470703125, 0.4008140563964844, 0.41361236572265625, 0.4264106750488281, 0.439208984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 7.0, 11.0, 6.0, 13.0, 13.0, 13.0, 17.0, 17.0, 28.0, 30.0, 27.0, 41.0, 41.0, 45.0, 35.0, 53.0, 48.0, 55.0, 49.0, 44.0, 52.0, 40.0, 44.0, 36.0, 33.0, 29.0, 27.0, 21.0, 31.0, 19.0, 20.0, 11.0, 12.0, 8.0, 9.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.677734375, -0.6579818725585938, -0.6382293701171875, -0.6184768676757812, -0.598724365234375, -0.5789718627929688, -0.5592193603515625, -0.5394668579101562, -0.51971435546875, -0.49996185302734375, -0.4802093505859375, -0.46045684814453125, -0.440704345703125, -0.42095184326171875, -0.4011993408203125, -0.38144683837890625, -0.3616943359375, -0.34194183349609375, -0.3221893310546875, -0.30243682861328125, -0.282684326171875, -0.26293182373046875, -0.2431793212890625, -0.22342681884765625, -0.20367431640625, -0.18392181396484375, -0.1641693115234375, -0.14441680908203125, -0.124664306640625, -0.10491180419921875, -0.0851593017578125, -0.06540679931640625, -0.045654296875, -0.02590179443359375, -0.0061492919921875, 0.01360321044921875, 0.033355712890625, 0.05310821533203125, 0.0728607177734375, 0.09261322021484375, 0.11236572265625, 0.13211822509765625, 0.1518707275390625, 0.17162322998046875, 0.191375732421875, 0.21112823486328125, 0.2308807373046875, 0.25063323974609375, 0.2703857421875, 0.29013824462890625, 0.3098907470703125, 0.32964324951171875, 0.349395751953125, 0.36914825439453125, 0.3889007568359375, 0.40865325927734375, 0.42840576171875, 0.44815826416015625, 0.4679107666015625, 0.48766326904296875, 0.507415771484375, 0.5271682739257812, 0.5469207763671875, 0.5666732788085938, 0.58642578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 6.0, 12.0, 25.0, 28.0, 49.0, 59.0, 113.0, 186.0, 294.0, 515.0, 929.0, 1774.0, 3399.0, 6590.0, 13699.0, 29905.0, 70039.0, 164068.0, 290699.0, 250128.0, 121722.0, 50820.0, 22160.0, 10473.0, 5167.0, 2568.0, 1349.0, 730.0, 402.0, 255.0, 151.0, 73.0, 59.0, 37.0, 18.0, 11.0, 9.0, 7.0, 5.0, 7.0, 3.0, 7.0, 2.0], "bins": [-0.1646728515625, -0.1605367660522461, -0.1564006805419922, -0.15226459503173828, -0.14812850952148438, -0.14399242401123047, -0.13985633850097656, -0.13572025299072266, -0.13158416748046875, -0.12744808197021484, -0.12331199645996094, -0.11917591094970703, -0.11503982543945312, -0.11090373992919922, -0.10676765441894531, -0.1026315689086914, -0.0984954833984375, -0.0943593978881836, -0.09022331237792969, -0.08608722686767578, -0.08195114135742188, -0.07781505584716797, -0.07367897033691406, -0.06954288482666016, -0.06540679931640625, -0.061270713806152344, -0.05713462829589844, -0.05299854278564453, -0.048862457275390625, -0.04472637176513672, -0.04059028625488281, -0.036454200744628906, -0.032318115234375, -0.028182029724121094, -0.024045944213867188, -0.01990985870361328, -0.015773773193359375, -0.011637687683105469, -0.0075016021728515625, -0.0033655166625976562, 0.00077056884765625, 0.004906654357910156, 0.009042739868164062, 0.013178825378417969, 0.017314910888671875, 0.02145099639892578, 0.025587081909179688, 0.029723167419433594, 0.0338592529296875, 0.037995338439941406, 0.04213142395019531, 0.04626750946044922, 0.050403594970703125, 0.05453968048095703, 0.05867576599121094, 0.06281185150146484, 0.06694793701171875, 0.07108402252197266, 0.07522010803222656, 0.07935619354248047, 0.08349227905273438, 0.08762836456298828, 0.09176445007324219, 0.0959005355834961, 0.10003662109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 9.0, 11.0, 13.0, 23.0, 27.0, 42.0, 61.0, 107.0, 120.0, 138.0, 137.0, 90.0, 62.0, 34.0, 33.0, 23.0, 15.0, 17.0, 12.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.751848220825195e-05, -5.5339187383651733e-05, -5.3159892559051514e-05, -5.0980597734451294e-05, -4.8801302909851074e-05, -4.6622008085250854e-05, -4.4442713260650635e-05, -4.2263418436050415e-05, -4.0084123611450195e-05, -3.7904828786849976e-05, -3.5725533962249756e-05, -3.3546239137649536e-05, -3.1366944313049316e-05, -2.9187649488449097e-05, -2.7008354663848877e-05, -2.4829059839248657e-05, -2.2649765014648438e-05, -2.0470470190048218e-05, -1.8291175365447998e-05, -1.611188054084778e-05, -1.3932585716247559e-05, -1.1753290891647339e-05, -9.573996067047119e-06, -7.394701242446899e-06, -5.21540641784668e-06, -3.03611159324646e-06, -8.568167686462402e-07, 1.3224780559539795e-06, 3.5017728805541992e-06, 5.681067705154419e-06, 7.860362529754639e-06, 1.0039657354354858e-05, 1.2218952178955078e-05, 1.4398247003555298e-05, 1.6577541828155518e-05, 1.8756836652755737e-05, 2.0936131477355957e-05, 2.3115426301956177e-05, 2.5294721126556396e-05, 2.7474015951156616e-05, 2.9653310775756836e-05, 3.1832605600357056e-05, 3.4011900424957275e-05, 3.6191195249557495e-05, 3.8370490074157715e-05, 4.0549784898757935e-05, 4.2729079723358154e-05, 4.4908374547958374e-05, 4.7087669372558594e-05, 4.9266964197158813e-05, 5.144625902175903e-05, 5.362555384635925e-05, 5.580484867095947e-05, 5.798414349555969e-05, 6.016343832015991e-05, 6.234273314476013e-05, 6.452202796936035e-05, 6.670132279396057e-05, 6.888061761856079e-05, 7.105991244316101e-05, 7.323920726776123e-05, 7.541850209236145e-05, 7.759779691696167e-05, 7.977709174156189e-05, 8.195638656616211e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 5.0, 17.0, 22.0, 29.0, 39.0, 52.0, 69.0, 127.0, 171.0, 263.0, 410.0, 740.0, 1429.0, 2812.0, 5442.0, 11232.0, 24141.0, 54925.0, 118129.0, 214855.0, 258346.0, 183274.0, 93112.0, 41746.0, 19084.0, 8754.0, 4257.0, 2136.0, 1147.0, 654.0, 416.0, 222.0, 155.0, 100.0, 55.0, 49.0, 39.0, 21.0, 20.0, 11.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1158447265625, -0.11202621459960938, -0.10820770263671875, -0.10438919067382812, -0.1005706787109375, -0.09675216674804688, -0.09293365478515625, -0.08911514282226562, -0.085296630859375, -0.08147811889648438, -0.07765960693359375, -0.07384109497070312, -0.0700225830078125, -0.06620407104492188, -0.06238555908203125, -0.058567047119140625, -0.05474853515625, -0.050930023193359375, -0.04711151123046875, -0.043292999267578125, -0.0394744873046875, -0.035655975341796875, -0.03183746337890625, -0.028018951416015625, -0.024200439453125, -0.020381927490234375, -0.01656341552734375, -0.012744903564453125, -0.0089263916015625, -0.005107879638671875, -0.00128936767578125, 0.002529144287109375, 0.00634765625, 0.010166168212890625, 0.01398468017578125, 0.017803192138671875, 0.0216217041015625, 0.025440216064453125, 0.02925872802734375, 0.033077239990234375, 0.036895751953125, 0.040714263916015625, 0.04453277587890625, 0.048351287841796875, 0.0521697998046875, 0.055988311767578125, 0.05980682373046875, 0.06362533569335938, 0.06744384765625, 0.07126235961914062, 0.07508087158203125, 0.07889938354492188, 0.0827178955078125, 0.08653640747070312, 0.09035491943359375, 0.09417343139648438, 0.097991943359375, 0.10181045532226562, 0.10562896728515625, 0.10944747924804688, 0.1132659912109375, 0.11708450317382812, 0.12090301513671875, 0.12472152709960938, 0.1285400390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 10.0, 16.0, 27.0, 35.0, 34.0, 52.0, 55.0, 75.0, 66.0, 76.0, 87.0, 62.0, 63.0, 61.0, 52.0, 41.0, 36.0, 26.0, 20.0, 14.0, 16.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.185791015625, -0.1803741455078125, -0.174957275390625, -0.1695404052734375, -0.16412353515625, -0.1587066650390625, -0.153289794921875, -0.1478729248046875, -0.1424560546875, -0.1370391845703125, -0.131622314453125, -0.1262054443359375, -0.12078857421875, -0.1153717041015625, -0.109954833984375, -0.1045379638671875, -0.09912109375, -0.0937042236328125, -0.088287353515625, -0.0828704833984375, -0.07745361328125, -0.0720367431640625, -0.066619873046875, -0.0612030029296875, -0.0557861328125, -0.0503692626953125, -0.044952392578125, -0.0395355224609375, -0.03411865234375, -0.0287017822265625, -0.023284912109375, -0.0178680419921875, -0.012451171875, -0.0070343017578125, -0.001617431640625, 0.0037994384765625, 0.00921630859375, 0.0146331787109375, 0.020050048828125, 0.0254669189453125, 0.0308837890625, 0.0363006591796875, 0.041717529296875, 0.0471343994140625, 0.05255126953125, 0.0579681396484375, 0.063385009765625, 0.0688018798828125, 0.07421875, 0.0796356201171875, 0.085052490234375, 0.0904693603515625, 0.09588623046875, 0.1013031005859375, 0.106719970703125, 0.1121368408203125, 0.1175537109375, 0.1229705810546875, 0.128387451171875, 0.1338043212890625, 0.13922119140625, 0.1446380615234375, 0.150054931640625, 0.1554718017578125, 0.160888671875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 11.0, 15.0, 55.0, 139.0, 252.0, 274.0, 150.0, 66.0, 22.0, 11.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9352967739105225, -2.771942615509033, -2.608588695526123, -2.445234537124634, -2.2818803787231445, -2.1185264587402344, -1.9551723003387451, -1.7918182611465454, -1.6284642219543457, -1.465110182762146, -1.3017561435699463, -1.138401985168457, -0.9750479459762573, -0.8116939067840576, -0.6483398079872131, -0.48498570919036865, -0.32163166999816895, -0.15827760100364685, 0.005076467990875244, 0.16843053698539734, 0.33178460597991943, 0.49513864517211914, 0.6584927439689636, 0.8218468427658081, 0.9852008819580078, 1.1485549211502075, 1.3119089603424072, 1.4752631187438965, 1.6386171579360962, 1.801971197128296, 1.9653253555297852, 2.1286792755126953, 2.2920331954956055, 2.4553873538970947, 2.618741273880005, 2.782095432281494, 2.9454493522644043, 3.1088035106658936, 3.272157669067383, 3.435511589050293, 3.5988657474517822, 3.7622199058532715, 3.9255738258361816, 4.088927745819092, 4.25228214263916, 4.41563606262207, 4.5789899826049805, 4.742344379425049, 4.905698299407959, 5.069052219390869, 5.2324066162109375, 5.395760536193848, 5.559114456176758, 5.722468376159668, 5.885822772979736, 6.0491766929626465, 6.212531089782715, 6.375885009765625, 6.539239406585693, 6.7025933265686035, 6.865947246551514, 7.029301643371582, 7.192655563354492, 7.356009483337402, 7.5193634033203125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 4.0, 6.0, 4.0, 7.0, 11.0, 18.0, 14.0, 15.0, 20.0, 21.0, 24.0, 24.0, 22.0, 40.0, 26.0, 32.0, 26.0, 40.0, 27.0, 24.0, 30.0, 46.0, 42.0, 43.0, 38.0, 36.0, 36.0, 34.0, 30.0, 25.0, 31.0, 29.0, 13.0, 30.0, 19.0, 16.0, 10.0, 12.0, 7.0, 10.0, 15.0, 9.0, 8.0, 11.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4249085187911987, -1.3807636499404907, -1.3366187810897827, -1.2924739122390747, -1.2483291625976562, -1.2041842937469482, -1.1600394248962402, -1.1158945560455322, -1.0717496871948242, -1.0276048183441162, -0.9834599494934082, -0.939315140247345, -0.895170271396637, -0.851025402545929, -0.8068805932998657, -0.7627357244491577, -0.7185908555984497, -0.6744459867477417, -0.6303011178970337, -0.5861563086509705, -0.5420114398002625, -0.49786657094955444, -0.4537217319011688, -0.4095768928527832, -0.3654320240020752, -0.3212871551513672, -0.27714231610298157, -0.23299746215343475, -0.18885260820388794, -0.14470775425434113, -0.10056290030479431, -0.05641806125640869, -0.012273311614990234, 0.03187154233455658, 0.0760163962841034, 0.12016125023365021, 0.16430610418319702, 0.20845095813274384, 0.25259581208229065, 0.29674065113067627, 0.3408855199813843, 0.3850303888320923, 0.4291752278804779, 0.4733200669288635, 0.5174649357795715, 0.5616098046302795, 0.6057546138763428, 0.6498994827270508, 0.6940443515777588, 0.7381892204284668, 0.7823340892791748, 0.826478898525238, 0.870623767375946, 0.914768636226654, 0.9589134454727173, 1.0030583143234253, 1.0472031831741333, 1.0913480520248413, 1.1354929208755493, 1.1796377897262573, 1.2237825393676758, 1.2679274082183838, 1.3120722770690918, 1.3562171459197998, 1.4003620147705078]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 16.0, 21.0, 35.0, 45.0, 83.0, 124.0, 192.0, 244.0, 421.0, 704.0, 1084.0, 1935.0, 3224.0, 5390.0, 9608.0, 17428.0, 33312.0, 66206.0, 136676.0, 302434.0, 662435.0, 1139512.0, 942053.0, 466947.0, 208195.0, 95385.0, 46223.0, 23999.0, 12694.0, 7178.0, 4034.0, 2420.0, 1551.0, 933.0, 544.0, 312.0, 216.0, 129.0, 92.0, 79.0, 44.0, 35.0, 27.0, 22.0, 7.0, 4.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.17626953125, -0.17053985595703125, -0.1648101806640625, -0.15908050537109375, -0.153350830078125, -0.14762115478515625, -0.1418914794921875, -0.13616180419921875, -0.13043212890625, -0.12470245361328125, -0.1189727783203125, -0.11324310302734375, -0.107513427734375, -0.10178375244140625, -0.0960540771484375, -0.09032440185546875, -0.0845947265625, -0.07886505126953125, -0.0731353759765625, -0.06740570068359375, -0.061676025390625, -0.05594635009765625, -0.0502166748046875, -0.04448699951171875, -0.03875732421875, -0.03302764892578125, -0.0272979736328125, -0.02156829833984375, -0.015838623046875, -0.01010894775390625, -0.0043792724609375, 0.00135040283203125, 0.007080078125, 0.01280975341796875, 0.0185394287109375, 0.02426910400390625, 0.029998779296875, 0.03572845458984375, 0.0414581298828125, 0.04718780517578125, 0.05291748046875, 0.05864715576171875, 0.0643768310546875, 0.07010650634765625, 0.075836181640625, 0.08156585693359375, 0.0872955322265625, 0.09302520751953125, 0.0987548828125, 0.10448455810546875, 0.1102142333984375, 0.11594390869140625, 0.121673583984375, 0.12740325927734375, 0.1331329345703125, 0.13886260986328125, 0.14459228515625, 0.15032196044921875, 0.1560516357421875, 0.16178131103515625, 0.167510986328125, 0.17324066162109375, 0.1789703369140625, 0.18470001220703125, 0.1904296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 10.0, 12.0, 7.0, 15.0, 18.0, 15.0, 15.0, 22.0, 22.0, 36.0, 31.0, 33.0, 41.0, 41.0, 50.0, 42.0, 53.0, 53.0, 60.0, 35.0, 55.0, 40.0, 46.0, 44.0, 31.0, 28.0, 29.0, 26.0, 20.0, 20.0, 21.0, 10.0, 4.0, 4.0, 1.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23779296875, -0.2305450439453125, -0.223297119140625, -0.2160491943359375, -0.20880126953125, -0.2015533447265625, -0.194305419921875, -0.1870574951171875, -0.1798095703125, -0.1725616455078125, -0.165313720703125, -0.1580657958984375, -0.15081787109375, -0.1435699462890625, -0.136322021484375, -0.1290740966796875, -0.121826171875, -0.1145782470703125, -0.107330322265625, -0.1000823974609375, -0.09283447265625, -0.0855865478515625, -0.078338623046875, -0.0710906982421875, -0.0638427734375, -0.0565948486328125, -0.049346923828125, -0.0420989990234375, -0.03485107421875, -0.0276031494140625, -0.020355224609375, -0.0131072998046875, -0.005859375, 0.0013885498046875, 0.008636474609375, 0.0158843994140625, 0.02313232421875, 0.0303802490234375, 0.037628173828125, 0.0448760986328125, 0.0521240234375, 0.0593719482421875, 0.066619873046875, 0.0738677978515625, 0.08111572265625, 0.0883636474609375, 0.095611572265625, 0.1028594970703125, 0.110107421875, 0.1173553466796875, 0.124603271484375, 0.1318511962890625, 0.13909912109375, 0.1463470458984375, 0.153594970703125, 0.1608428955078125, 0.1680908203125, 0.1753387451171875, 0.182586669921875, 0.1898345947265625, 0.19708251953125, 0.2043304443359375, 0.211578369140625, 0.2188262939453125, 0.22607421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 7.0, 15.0, 11.0, 34.0, 35.0, 54.0, 123.0, 165.0, 304.0, 605.0, 1310.0, 3393.0, 10106.0, 37172.0, 174952.0, 1193251.0, 2330249.0, 351298.0, 66125.0, 16380.0, 5031.0, 1942.0, 808.0, 395.0, 187.0, 121.0, 83.0, 33.0, 28.0, 19.0, 12.0, 12.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3784599304199219, -0.36214447021484375, -0.3458290100097656, -0.3295135498046875, -0.3131980895996094, -0.29688262939453125, -0.2805671691894531, -0.264251708984375, -0.24793624877929688, -0.23162078857421875, -0.21530532836914062, -0.1989898681640625, -0.18267440795898438, -0.16635894775390625, -0.15004348754882812, -0.13372802734375, -0.11741256713867188, -0.10109710693359375, -0.08478164672851562, -0.0684661865234375, -0.052150726318359375, -0.03583526611328125, -0.019519805908203125, -0.003204345703125, 0.013111114501953125, 0.02942657470703125, 0.045742034912109375, 0.0620574951171875, 0.07837295532226562, 0.09468841552734375, 0.11100387573242188, 0.1273193359375, 0.14363479614257812, 0.15995025634765625, 0.17626571655273438, 0.1925811767578125, 0.20889663696289062, 0.22521209716796875, 0.24152755737304688, 0.257843017578125, 0.2741584777832031, 0.29047393798828125, 0.3067893981933594, 0.3231048583984375, 0.3394203186035156, 0.35573577880859375, 0.3720512390136719, 0.38836669921875, 0.4046821594238281, 0.42099761962890625, 0.4373130798339844, 0.4536285400390625, 0.4699440002441406, 0.48625946044921875, 0.5025749206542969, 0.518890380859375, 0.5352058410644531, 0.5515213012695312, 0.5678367614746094, 0.5841522216796875, 0.6004676818847656, 0.6167831420898438, 0.6330986022949219, 0.6494140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 5.0, 6.0, 10.0, 13.0, 15.0, 16.0, 26.0, 36.0, 55.0, 68.0, 99.0, 143.0, 174.0, 228.0, 363.0, 431.0, 548.0, 424.0, 391.0, 262.0, 189.0, 146.0, 104.0, 75.0, 64.0, 48.0, 30.0, 18.0, 13.0, 15.0, 14.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3437004089355469, -0.33119964599609375, -0.3186988830566406, -0.3061981201171875, -0.2936973571777344, -0.28119659423828125, -0.2686958312988281, -0.256195068359375, -0.24369430541992188, -0.23119354248046875, -0.21869277954101562, -0.2061920166015625, -0.19369125366210938, -0.18119049072265625, -0.16868972778320312, -0.15618896484375, -0.14368820190429688, -0.13118743896484375, -0.11868667602539062, -0.1061859130859375, -0.09368515014648438, -0.08118438720703125, -0.06868362426757812, -0.056182861328125, -0.043682098388671875, -0.03118133544921875, -0.018680572509765625, -0.0061798095703125, 0.006320953369140625, 0.01882171630859375, 0.031322479248046875, 0.0438232421875, 0.056324005126953125, 0.06882476806640625, 0.08132553100585938, 0.0938262939453125, 0.10632705688476562, 0.11882781982421875, 0.13132858276367188, 0.143829345703125, 0.15633010864257812, 0.16883087158203125, 0.18133163452148438, 0.1938323974609375, 0.20633316040039062, 0.21883392333984375, 0.23133468627929688, 0.24383544921875, 0.2563362121582031, 0.26883697509765625, 0.2813377380371094, 0.2938385009765625, 0.3063392639160156, 0.31884002685546875, 0.3313407897949219, 0.343841552734375, 0.3563423156738281, 0.36884307861328125, 0.3813438415527344, 0.3938446044921875, 0.4063453674316406, 0.41884613037109375, 0.4313468933105469, 0.44384765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 9.0, 15.0, 25.0, 53.0, 68.0, 86.0, 115.0, 143.0, 139.0, 109.0, 89.0, 50.0, 32.0, 21.0, 17.0, 6.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.999173164367676, -2.9131922721862793, -2.827211380004883, -2.7412302494049072, -2.6552493572235107, -2.5692684650421143, -2.4832873344421387, -2.397306442260742, -2.3113255500793457, -2.225344657897949, -2.1393637657165527, -2.053382635116577, -1.9674017429351807, -1.8814208507537842, -1.7954398393630981, -1.709458827972412, -1.6234779357910156, -1.5374970436096191, -1.451516032218933, -1.365535020828247, -1.2795541286468506, -1.193573236465454, -1.107592225074768, -1.021611213684082, -0.9356303215026855, -0.8496493697166443, -0.763668417930603, -0.6776874661445618, -0.5917065143585205, -0.5057255625724792, -0.419744610786438, -0.33376365900039673, -0.24778270721435547, -0.1618017554283142, -0.07582080364227295, 0.01016014814376831, 0.09614109992980957, 0.18212205171585083, 0.2681030035018921, 0.35408395528793335, 0.4400649070739746, 0.5260458588600159, 0.6120268106460571, 0.6980077624320984, 0.7839887142181396, 0.8699696660041809, 0.9559506177902222, 1.0419316291809082, 1.1279125213623047, 1.2138934135437012, 1.2998744249343872, 1.3858554363250732, 1.4718363285064697, 1.5578172206878662, 1.6437982320785522, 1.7297792434692383, 1.8157601356506348, 1.9017410278320312, 1.9877220392227173, 2.0737030506134033, 2.1596839427948, 2.2456648349761963, 2.331645965576172, 2.4176268577575684, 2.503607749938965]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 6.0, 6.0, 11.0, 9.0, 15.0, 18.0, 9.0, 12.0, 20.0, 20.0, 26.0, 35.0, 21.0, 28.0, 31.0, 47.0, 46.0, 38.0, 41.0, 44.0, 45.0, 46.0, 60.0, 43.0, 49.0, 29.0, 25.0, 39.0, 30.0, 26.0, 26.0, 14.0, 18.0, 18.0, 9.0, 9.0, 5.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7047348022460938, -1.6578364372253418, -1.6109380722045898, -1.564039707183838, -1.5171414613723755, -1.4702430963516235, -1.4233447313308716, -1.3764463663101196, -1.3295480012893677, -1.2826496362686157, -1.2357512712478638, -1.1888530254364014, -1.1419546604156494, -1.0950562953948975, -1.0481579303741455, -1.0012595653533936, -0.9543612599372864, -0.9074628949165344, -0.8605645895004272, -0.8136662244796753, -0.7667678594589233, -0.7198694944381714, -0.6729711890220642, -0.6260728240013123, -0.5791745185852051, -0.5322761535644531, -0.48537781834602356, -0.438479483127594, -0.39158111810684204, -0.3446827828884125, -0.2977844476699829, -0.25088608264923096, -0.203987717628479, -0.15708936750888824, -0.11019102483987808, -0.06329268217086792, -0.01639433205127716, 0.0305040180683136, 0.07740235328674316, 0.12430071830749512, 0.17119905352592468, 0.21809740364551544, 0.2649957537651062, 0.31189408898353577, 0.35879242420196533, 0.4056907892227173, 0.45258912444114685, 0.4994874894618988, 0.5463858246803284, 0.5932841897010803, 0.6401824951171875, 0.6870808601379395, 0.7339792251586914, 0.7808775901794434, 0.8277758955955505, 0.8746742606163025, 0.9215725660324097, 0.9684709310531616, 1.0153692960739136, 1.062267541885376, 1.109165906906128, 1.1560642719268799, 1.2029626369476318, 1.2498610019683838, 1.2967593669891357]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 14.0, 33.0, 45.0, 84.0, 139.0, 241.0, 447.0, 893.0, 1679.0, 3324.0, 6948.0, 14865.0, 35873.0, 96663.0, 235101.0, 321310.0, 199470.0, 77992.0, 29021.0, 12513.0, 5767.0, 2949.0, 1504.0, 777.0, 374.0, 227.0, 100.0, 70.0, 45.0, 18.0, 15.0, 16.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444091796875, -0.4289817810058594, -0.41387176513671875, -0.3987617492675781, -0.3836517333984375, -0.3685417175292969, -0.35343170166015625, -0.3383216857910156, -0.323211669921875, -0.3081016540527344, -0.29299163818359375, -0.2778816223144531, -0.2627716064453125, -0.24766159057617188, -0.23255157470703125, -0.21744155883789062, -0.20233154296875, -0.18722152709960938, -0.17211151123046875, -0.15700149536132812, -0.1418914794921875, -0.12678146362304688, -0.11167144775390625, -0.09656143188476562, -0.081451416015625, -0.06634140014648438, -0.05123138427734375, -0.036121368408203125, -0.0210113525390625, -0.005901336669921875, 0.00920867919921875, 0.024318695068359375, 0.0394287109375, 0.054538726806640625, 0.06964874267578125, 0.08475875854492188, 0.0998687744140625, 0.11497879028320312, 0.13008880615234375, 0.14519882202148438, 0.160308837890625, 0.17541885375976562, 0.19052886962890625, 0.20563888549804688, 0.2207489013671875, 0.23585891723632812, 0.25096893310546875, 0.2660789489746094, 0.28118896484375, 0.2962989807128906, 0.31140899658203125, 0.3265190124511719, 0.3416290283203125, 0.3567390441894531, 0.37184906005859375, 0.3869590759277344, 0.402069091796875, 0.4171791076660156, 0.43228912353515625, 0.4473991394042969, 0.4625091552734375, 0.4776191711425781, 0.49272918701171875, 0.5078392028808594, 0.52294921875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 8.0, 13.0, 12.0, 10.0, 10.0, 17.0, 14.0, 12.0, 24.0, 31.0, 30.0, 29.0, 31.0, 37.0, 33.0, 41.0, 36.0, 45.0, 43.0, 48.0, 41.0, 37.0, 54.0, 33.0, 37.0, 34.0, 28.0, 22.0, 24.0, 27.0, 18.0, 20.0, 16.0, 14.0, 8.0, 10.0, 11.0, 10.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.1758136749267578, -0.16937637329101562, -0.16293907165527344, -0.15650177001953125, -0.15006446838378906, -0.14362716674804688, -0.1371898651123047, -0.1307525634765625, -0.12431526184082031, -0.11787796020507812, -0.11144065856933594, -0.10500335693359375, -0.09856605529785156, -0.09212875366210938, -0.08569145202636719, -0.079254150390625, -0.07281684875488281, -0.06637954711914062, -0.05994224548339844, -0.05350494384765625, -0.04706764221191406, -0.040630340576171875, -0.03419303894042969, -0.0277557373046875, -0.021318435668945312, -0.014881134033203125, -0.008443832397460938, -0.00200653076171875, 0.0044307708740234375, 0.010868072509765625, 0.017305374145507812, 0.02374267578125, 0.030179977416992188, 0.036617279052734375, 0.04305458068847656, 0.04949188232421875, 0.05592918395996094, 0.062366485595703125, 0.06880378723144531, 0.0752410888671875, 0.08167839050292969, 0.08811569213867188, 0.09455299377441406, 0.10099029541015625, 0.10742759704589844, 0.11386489868164062, 0.12030220031738281, 0.126739501953125, 0.1331768035888672, 0.13961410522460938, 0.14605140686035156, 0.15248870849609375, 0.15892601013183594, 0.16536331176757812, 0.1718006134033203, 0.1782379150390625, 0.1846752166748047, 0.19111251831054688, 0.19754981994628906, 0.20398712158203125, 0.21042442321777344, 0.21686172485351562, 0.2232990264892578, 0.229736328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 8.0, 15.0, 8.0, 19.0, 31.0, 35.0, 75.0, 117.0, 227.0, 438.0, 1135.0, 3037.0, 9037.0, 29719.0, 124726.0, 434887.0, 334296.0, 79950.0, 20261.0, 6487.0, 2277.0, 863.0, 385.0, 191.0, 124.0, 71.0, 38.0, 35.0, 19.0, 9.0, 7.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80908203125, -0.784454345703125, -0.75982666015625, -0.735198974609375, -0.7105712890625, -0.685943603515625, -0.66131591796875, -0.636688232421875, -0.612060546875, -0.587432861328125, -0.56280517578125, -0.538177490234375, -0.5135498046875, -0.488922119140625, -0.46429443359375, -0.439666748046875, -0.4150390625, -0.390411376953125, -0.36578369140625, -0.341156005859375, -0.3165283203125, -0.291900634765625, -0.26727294921875, -0.242645263671875, -0.218017578125, -0.193389892578125, -0.16876220703125, -0.144134521484375, -0.1195068359375, -0.094879150390625, -0.07025146484375, -0.045623779296875, -0.02099609375, 0.003631591796875, 0.02825927734375, 0.052886962890625, 0.0775146484375, 0.102142333984375, 0.12677001953125, 0.151397705078125, 0.176025390625, 0.200653076171875, 0.22528076171875, 0.249908447265625, 0.2745361328125, 0.299163818359375, 0.32379150390625, 0.348419189453125, 0.373046875, 0.397674560546875, 0.42230224609375, 0.446929931640625, 0.4715576171875, 0.496185302734375, 0.52081298828125, 0.545440673828125, 0.570068359375, 0.594696044921875, 0.61932373046875, 0.643951416015625, 0.6685791015625, 0.693206787109375, 0.71783447265625, 0.742462158203125, 0.76708984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 10.0, 13.0, 7.0, 21.0, 18.0, 27.0, 24.0, 16.0, 33.0, 31.0, 24.0, 51.0, 48.0, 41.0, 46.0, 36.0, 49.0, 49.0, 43.0, 45.0, 45.0, 38.0, 37.0, 30.0, 36.0, 23.0, 16.0, 23.0, 20.0, 19.0, 16.0, 12.0, 10.0, 9.0, 3.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6669921875, -0.6449661254882812, -0.6229400634765625, -0.6009140014648438, -0.578887939453125, -0.5568618774414062, -0.5348358154296875, -0.5128097534179688, -0.49078369140625, -0.46875762939453125, -0.4467315673828125, -0.42470550537109375, -0.402679443359375, -0.38065338134765625, -0.3586273193359375, -0.33660125732421875, -0.3145751953125, -0.29254913330078125, -0.2705230712890625, -0.24849700927734375, -0.226470947265625, -0.20444488525390625, -0.1824188232421875, -0.16039276123046875, -0.13836669921875, -0.11634063720703125, -0.0943145751953125, -0.07228851318359375, -0.050262451171875, -0.02823638916015625, -0.0062103271484375, 0.01581573486328125, 0.037841796875, 0.05986785888671875, 0.0818939208984375, 0.10391998291015625, 0.125946044921875, 0.14797210693359375, 0.1699981689453125, 0.19202423095703125, 0.21405029296875, 0.23607635498046875, 0.2581024169921875, 0.28012847900390625, 0.302154541015625, 0.32418060302734375, 0.3462066650390625, 0.36823272705078125, 0.3902587890625, 0.41228485107421875, 0.4343109130859375, 0.45633697509765625, 0.478363037109375, 0.5003890991210938, 0.5224151611328125, 0.5444412231445312, 0.56646728515625, 0.5884933471679688, 0.6105194091796875, 0.6325454711914062, 0.654571533203125, 0.6765975952148438, 0.6986236572265625, 0.7206497192382812, 0.74267578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 14.0, 12.0, 25.0, 49.0, 71.0, 111.0, 167.0, 270.0, 492.0, 837.0, 1399.0, 2460.0, 4692.0, 9055.0, 18211.0, 43110.0, 111206.0, 253851.0, 309037.0, 172691.0, 67226.0, 26795.0, 12434.0, 6409.0, 3443.0, 1964.0, 988.0, 578.0, 338.0, 218.0, 122.0, 93.0, 52.0, 31.0, 33.0, 24.0, 8.0, 7.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1573486328125, -0.15261459350585938, -0.14788055419921875, -0.14314651489257812, -0.1384124755859375, -0.13367843627929688, -0.12894439697265625, -0.12421035766601562, -0.119476318359375, -0.11474227905273438, -0.11000823974609375, -0.10527420043945312, -0.1005401611328125, -0.09580612182617188, -0.09107208251953125, -0.08633804321289062, -0.08160400390625, -0.07686996459960938, -0.07213592529296875, -0.06740188598632812, -0.0626678466796875, -0.057933807373046875, -0.05319976806640625, -0.048465728759765625, -0.043731689453125, -0.038997650146484375, -0.03426361083984375, -0.029529571533203125, -0.0247955322265625, -0.020061492919921875, -0.01532745361328125, -0.010593414306640625, -0.005859375, -0.001125335693359375, 0.00360870361328125, 0.008342742919921875, 0.0130767822265625, 0.017810821533203125, 0.02254486083984375, 0.027278900146484375, 0.032012939453125, 0.036746978759765625, 0.04148101806640625, 0.046215057373046875, 0.0509490966796875, 0.055683135986328125, 0.06041717529296875, 0.06515121459960938, 0.06988525390625, 0.07461929321289062, 0.07935333251953125, 0.08408737182617188, 0.0888214111328125, 0.09355545043945312, 0.09828948974609375, 0.10302352905273438, 0.107757568359375, 0.11249160766601562, 0.11722564697265625, 0.12195968627929688, 0.1266937255859375, 0.13142776489257812, 0.13616180419921875, 0.14089584350585938, 0.1456298828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 12.0, 19.0, 28.0, 34.0, 50.0, 67.0, 83.0, 104.0, 118.0, 97.0, 87.0, 70.0, 69.0, 34.0, 27.0, 21.0, 16.0, 5.0, 8.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.312131881713867e-05, -6.10649585723877e-05, -5.900859832763672e-05, -5.695223808288574e-05, -5.4895877838134766e-05, -5.283951759338379e-05, -5.078315734863281e-05, -4.8726797103881836e-05, -4.667043685913086e-05, -4.461407661437988e-05, -4.2557716369628906e-05, -4.050135612487793e-05, -3.844499588012695e-05, -3.6388635635375977e-05, -3.4332275390625e-05, -3.2275915145874023e-05, -3.0219554901123047e-05, -2.816319465637207e-05, -2.6106834411621094e-05, -2.4050474166870117e-05, -2.199411392211914e-05, -1.9937753677368164e-05, -1.7881393432617188e-05, -1.582503318786621e-05, -1.3768672943115234e-05, -1.1712312698364258e-05, -9.655952453613281e-06, -7.599592208862305e-06, -5.543231964111328e-06, -3.4868717193603516e-06, -1.430511474609375e-06, 6.258487701416016e-07, 2.682209014892578e-06, 4.738569259643555e-06, 6.794929504394531e-06, 8.851289749145508e-06, 1.0907649993896484e-05, 1.2964010238647461e-05, 1.5020370483398438e-05, 1.7076730728149414e-05, 1.913309097290039e-05, 2.1189451217651367e-05, 2.3245811462402344e-05, 2.530217170715332e-05, 2.7358531951904297e-05, 2.9414892196655273e-05, 3.147125244140625e-05, 3.3527612686157227e-05, 3.55839729309082e-05, 3.764033317565918e-05, 3.9696693420410156e-05, 4.175305366516113e-05, 4.380941390991211e-05, 4.5865774154663086e-05, 4.792213439941406e-05, 4.997849464416504e-05, 5.2034854888916016e-05, 5.409121513366699e-05, 5.614757537841797e-05, 5.8203935623168945e-05, 6.026029586791992e-05, 6.23166561126709e-05, 6.437301635742188e-05, 6.642937660217285e-05, 6.848573684692383e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 6.0, 8.0, 15.0, 16.0, 27.0, 41.0, 99.0, 132.0, 256.0, 442.0, 989.0, 2198.0, 5811.0, 16260.0, 49573.0, 149797.0, 327879.0, 303718.0, 127480.0, 41128.0, 13827.0, 4995.0, 1913.0, 880.0, 444.0, 247.0, 155.0, 67.0, 57.0, 32.0, 16.0, 12.0, 8.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.187255859375, -0.18156814575195312, -0.17588043212890625, -0.17019271850585938, -0.1645050048828125, -0.15881729125976562, -0.15312957763671875, -0.14744186401367188, -0.141754150390625, -0.13606643676757812, -0.13037872314453125, -0.12469100952148438, -0.1190032958984375, -0.11331558227539062, -0.10762786865234375, -0.10194015502929688, -0.09625244140625, -0.09056472778320312, -0.08487701416015625, -0.07918930053710938, -0.0735015869140625, -0.06781387329101562, -0.06212615966796875, -0.056438446044921875, -0.050750732421875, -0.045063018798828125, -0.03937530517578125, -0.033687591552734375, -0.0279998779296875, -0.022312164306640625, -0.01662445068359375, -0.010936737060546875, -0.0052490234375, 0.000438690185546875, 0.00612640380859375, 0.011814117431640625, 0.0175018310546875, 0.023189544677734375, 0.02887725830078125, 0.034564971923828125, 0.040252685546875, 0.045940399169921875, 0.05162811279296875, 0.057315826416015625, 0.0630035400390625, 0.06869125366210938, 0.07437896728515625, 0.08006668090820312, 0.08575439453125, 0.09144210815429688, 0.09712982177734375, 0.10281753540039062, 0.1085052490234375, 0.11419296264648438, 0.11988067626953125, 0.12556838989257812, 0.131256103515625, 0.13694381713867188, 0.14263153076171875, 0.14831924438476562, 0.1540069580078125, 0.15969467163085938, 0.16538238525390625, 0.17107009887695312, 0.1767578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 12.0, 14.0, 11.0, 16.0, 17.0, 36.0, 33.0, 33.0, 31.0, 46.0, 46.0, 43.0, 44.0, 68.0, 61.0, 65.0, 74.0, 64.0, 39.0, 35.0, 38.0, 32.0, 22.0, 21.0, 18.0, 13.0, 12.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12562179565429688, -0.12062835693359375, -0.11563491821289062, -0.1106414794921875, -0.10564804077148438, -0.10065460205078125, -0.09566116333007812, -0.090667724609375, -0.08567428588867188, -0.08068084716796875, -0.07568740844726562, -0.0706939697265625, -0.06570053100585938, -0.06070709228515625, -0.055713653564453125, -0.05072021484375, -0.045726776123046875, -0.04073333740234375, -0.035739898681640625, -0.0307464599609375, -0.025753021240234375, -0.02075958251953125, -0.015766143798828125, -0.010772705078125, -0.005779266357421875, -0.00078582763671875, 0.004207611083984375, 0.0092010498046875, 0.014194488525390625, 0.01918792724609375, 0.024181365966796875, 0.0291748046875, 0.034168243408203125, 0.03916168212890625, 0.044155120849609375, 0.0491485595703125, 0.054141998291015625, 0.05913543701171875, 0.06412887573242188, 0.069122314453125, 0.07411575317382812, 0.07910919189453125, 0.08410263061523438, 0.0890960693359375, 0.09408950805664062, 0.09908294677734375, 0.10407638549804688, 0.10906982421875, 0.11406326293945312, 0.11905670166015625, 0.12405014038085938, 0.1290435791015625, 0.13403701782226562, 0.13903045654296875, 0.14402389526367188, 0.149017333984375, 0.15401077270507812, 0.15900421142578125, 0.16399765014648438, 0.1689910888671875, 0.17398452758789062, 0.17897796630859375, 0.18397140502929688, 0.18896484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 0.0, 6.0, 9.0, 19.0, 31.0, 55.0, 75.0, 120.0, 153.0, 170.0, 140.0, 81.0, 63.0, 37.0, 17.0, 13.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9310479164123535, -2.8197879791259766, -2.7085282802581787, -2.5972683429718018, -2.486008644104004, -2.374748706817627, -2.26348876953125, -2.152229070663452, -2.0409693717956543, -1.929709553718567, -1.8184497356414795, -1.7071897983551025, -1.5959300994873047, -1.4846701622009277, -1.3734103441238403, -1.262150526046753, -1.150890588760376, -1.0396307706832886, -0.9283709526062012, -0.817111074924469, -0.7058512568473816, -0.5945914387702942, -0.483331561088562, -0.3720717430114746, -0.2608119249343872, -0.1495520919561386, -0.038292258977890015, 0.07296758890151978, 0.18422740697860718, 0.2954872250556946, 0.40674710273742676, 0.5180069208145142, 0.6292667388916016, 0.740526556968689, 0.8517863750457764, 0.9630462527275085, 1.0743060111999512, 1.1855659484863281, 1.2968257665634155, 1.408085584640503, 1.5193454027175903, 1.6306052207946777, 1.7418650388717651, 1.8531248569488525, 1.9643847942352295, 2.0756444931030273, 2.1869044303894043, 2.2981643676757812, 2.409424066543579, 2.520684003829956, 2.631943702697754, 2.743203639984131, 2.8544633388519287, 2.9657232761383057, 3.0769829750061035, 3.1882429122924805, 3.2995028495788574, 3.4107627868652344, 3.5220224857330322, 3.633282423019409, 3.744542121887207, 3.855802059173584, 3.967061996459961, 4.07832145690918, 4.189581394195557]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 11.0, 10.0, 17.0, 17.0, 13.0, 19.0, 21.0, 27.0, 24.0, 27.0, 32.0, 28.0, 32.0, 34.0, 34.0, 41.0, 44.0, 39.0, 44.0, 38.0, 35.0, 41.0, 46.0, 44.0, 24.0, 31.0, 37.0, 35.0, 16.0, 26.0, 15.0, 14.0, 16.0, 10.0, 13.0, 8.0, 10.0, 2.0, 9.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.9154976606369019, -1.8640453815460205, -1.8125929832458496, -1.7611405849456787, -1.7096883058547974, -1.658236026763916, -1.6067836284637451, -1.5553312301635742, -1.5038789510726929, -1.4524266719818115, -1.4009742736816406, -1.3495218753814697, -1.2980695962905884, -1.246617317199707, -1.1951649188995361, -1.1437125205993652, -1.0922602415084839, -1.0408079624176025, -0.9893555641174316, -0.9379032254219055, -0.8864508867263794, -0.8349985480308533, -0.7835462093353271, -0.732093870639801, -0.6806415319442749, -0.6291891932487488, -0.5777368545532227, -0.5262845158576965, -0.4748321771621704, -0.4233798384666443, -0.37192749977111816, -0.32047516107559204, -0.26902270317077637, -0.21757036447525024, -0.16611802577972412, -0.114665687084198, -0.06321334838867188, -0.011761009693145752, 0.03969132900238037, 0.0911436676979065, 0.14259600639343262, 0.19404834508895874, 0.24550068378448486, 0.296953022480011, 0.3484053611755371, 0.39985769987106323, 0.45131003856658936, 0.5027623772621155, 0.5542147159576416, 0.6056670546531677, 0.6571193933486938, 0.70857173204422, 0.7600240707397461, 0.8114764094352722, 0.8629287481307983, 0.9143810868263245, 0.9658334255218506, 1.0172858238220215, 1.0687381029129028, 1.1201903820037842, 1.171642780303955, 1.223095178604126, 1.2745474576950073, 1.3259997367858887, 1.3774521350860596]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 10.0, 19.0, 16.0, 34.0, 42.0, 71.0, 126.0, 158.0, 231.0, 432.0, 711.0, 1213.0, 2031.0, 3451.0, 6076.0, 11007.0, 21756.0, 43937.0, 96380.0, 221005.0, 501852.0, 989783.0, 1135452.0, 645504.0, 285541.0, 119807.0, 53043.0, 25284.0, 13088.0, 6781.0, 3847.0, 2141.0, 1265.0, 825.0, 500.0, 286.0, 200.0, 136.0, 80.0, 56.0, 33.0, 21.0, 23.0, 9.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.17130088806152344, -0.16498947143554688, -0.1586780548095703, -0.15236663818359375, -0.1460552215576172, -0.13974380493164062, -0.13343238830566406, -0.1271209716796875, -0.12080955505371094, -0.11449813842773438, -0.10818672180175781, -0.10187530517578125, -0.09556388854980469, -0.08925247192382812, -0.08294105529785156, -0.076629638671875, -0.07031822204589844, -0.06400680541992188, -0.05769538879394531, -0.05138397216796875, -0.04507255554199219, -0.038761138916015625, -0.03244972229003906, -0.0261383056640625, -0.019826889038085938, -0.013515472412109375, -0.0072040557861328125, -0.00089263916015625, 0.0054187774658203125, 0.011730194091796875, 0.018041610717773438, 0.02435302734375, 0.030664443969726562, 0.036975860595703125, 0.04328727722167969, 0.04959869384765625, 0.05591011047363281, 0.062221527099609375, 0.06853294372558594, 0.0748443603515625, 0.08115577697753906, 0.08746719360351562, 0.09377861022949219, 0.10009002685546875, 0.10640144348144531, 0.11271286010742188, 0.11902427673339844, 0.125335693359375, 0.13164710998535156, 0.13795852661132812, 0.1442699432373047, 0.15058135986328125, 0.1568927764892578, 0.16320419311523438, 0.16951560974121094, 0.1758270263671875, 0.18213844299316406, 0.18844985961914062, 0.1947612762451172, 0.20107269287109375, 0.2073841094970703, 0.21369552612304688, 0.22000694274902344, 0.226318359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 14.0, 13.0, 5.0, 11.0, 24.0, 20.0, 21.0, 18.0, 24.0, 20.0, 32.0, 35.0, 40.0, 38.0, 50.0, 42.0, 48.0, 47.0, 43.0, 36.0, 38.0, 38.0, 37.0, 39.0, 23.0, 30.0, 26.0, 23.0, 22.0, 18.0, 18.0, 14.0, 7.0, 12.0, 11.0, 6.0, 6.0, 10.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1881103515625, -0.18162155151367188, -0.17513275146484375, -0.16864395141601562, -0.1621551513671875, -0.15566635131835938, -0.14917755126953125, -0.14268875122070312, -0.136199951171875, -0.12971115112304688, -0.12322235107421875, -0.11673355102539062, -0.1102447509765625, -0.10375595092773438, -0.09726715087890625, -0.09077835083007812, -0.08428955078125, -0.07780075073242188, -0.07131195068359375, -0.06482315063476562, -0.0583343505859375, -0.051845550537109375, -0.04535675048828125, -0.038867950439453125, -0.032379150390625, -0.025890350341796875, -0.01940155029296875, -0.012912750244140625, -0.0064239501953125, 6.4849853515625e-05, 0.00655364990234375, 0.013042449951171875, 0.01953125, 0.026020050048828125, 0.03250885009765625, 0.038997650146484375, 0.0454864501953125, 0.051975250244140625, 0.05846405029296875, 0.06495285034179688, 0.071441650390625, 0.07793045043945312, 0.08441925048828125, 0.09090805053710938, 0.0973968505859375, 0.10388565063476562, 0.11037445068359375, 0.11686325073242188, 0.12335205078125, 0.12984085083007812, 0.13632965087890625, 0.14281845092773438, 0.1493072509765625, 0.15579605102539062, 0.16228485107421875, 0.16877365112304688, 0.175262451171875, 0.18175125122070312, 0.18824005126953125, 0.19472885131835938, 0.2012176513671875, 0.20770645141601562, 0.21419525146484375, 0.22068405151367188, 0.2271728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 10.0, 10.0, 17.0, 33.0, 48.0, 69.0, 131.0, 249.0, 436.0, 968.0, 2332.0, 6455.0, 20357.0, 80436.0, 421312.0, 2449237.0, 1000042.0, 159054.0, 36237.0, 10414.0, 3677.0, 1414.0, 616.0, 293.0, 197.0, 87.0, 60.0, 34.0, 21.0, 13.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3900489807128906, -0.37360382080078125, -0.3571586608886719, -0.3407135009765625, -0.3242683410644531, -0.30782318115234375, -0.2913780212402344, -0.274932861328125, -0.2584877014160156, -0.24204254150390625, -0.22559738159179688, -0.2091522216796875, -0.19270706176757812, -0.17626190185546875, -0.15981674194335938, -0.14337158203125, -0.12692642211914062, -0.11048126220703125, -0.09403610229492188, -0.0775909423828125, -0.061145782470703125, -0.04470062255859375, -0.028255462646484375, -0.011810302734375, 0.004634857177734375, 0.02108001708984375, 0.037525177001953125, 0.0539703369140625, 0.07041549682617188, 0.08686065673828125, 0.10330581665039062, 0.1197509765625, 0.13619613647460938, 0.15264129638671875, 0.16908645629882812, 0.1855316162109375, 0.20197677612304688, 0.21842193603515625, 0.23486709594726562, 0.251312255859375, 0.2677574157714844, 0.28420257568359375, 0.3006477355957031, 0.3170928955078125, 0.3335380554199219, 0.34998321533203125, 0.3664283752441406, 0.38287353515625, 0.3993186950683594, 0.41576385498046875, 0.4322090148925781, 0.4486541748046875, 0.4650993347167969, 0.48154449462890625, 0.4979896545410156, 0.514434814453125, 0.5308799743652344, 0.5473251342773438, 0.5637702941894531, 0.5802154541015625, 0.5966606140136719, 0.6131057739257812, 0.6295509338378906, 0.64599609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 12.0, 15.0, 23.0, 34.0, 43.0, 74.0, 109.0, 133.0, 277.0, 408.0, 610.0, 696.0, 519.0, 388.0, 223.0, 168.0, 113.0, 74.0, 51.0, 28.0, 22.0, 17.0, 16.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3515625, -0.33330535888671875, -0.3150482177734375, -0.29679107666015625, -0.278533935546875, -0.26027679443359375, -0.2420196533203125, -0.22376251220703125, -0.20550537109375, -0.18724822998046875, -0.1689910888671875, -0.15073394775390625, -0.132476806640625, -0.11421966552734375, -0.0959625244140625, -0.07770538330078125, -0.0594482421875, -0.04119110107421875, -0.0229339599609375, -0.00467681884765625, 0.013580322265625, 0.03183746337890625, 0.0500946044921875, 0.06835174560546875, 0.08660888671875, 0.10486602783203125, 0.1231231689453125, 0.14138031005859375, 0.159637451171875, 0.17789459228515625, 0.1961517333984375, 0.21440887451171875, 0.232666015625, 0.25092315673828125, 0.2691802978515625, 0.28743743896484375, 0.305694580078125, 0.32395172119140625, 0.3422088623046875, 0.36046600341796875, 0.37872314453125, 0.39698028564453125, 0.4152374267578125, 0.43349456787109375, 0.451751708984375, 0.47000885009765625, 0.4882659912109375, 0.5065231323242188, 0.5247802734375, 0.5430374145507812, 0.5612945556640625, 0.5795516967773438, 0.597808837890625, 0.6160659790039062, 0.6343231201171875, 0.6525802612304688, 0.67083740234375, 0.6890945434570312, 0.7073516845703125, 0.7256088256835938, 0.743865966796875, 0.7621231079101562, 0.7803802490234375, 0.7986373901367188, 0.81689453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 7.0, 33.0, 83.0, 179.0, 297.0, 211.0, 121.0, 43.0, 15.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668066024780273, -6.467572212219238, -6.267077922821045, -6.06658411026001, -5.866089820861816, -5.665596008300781, -5.465102195739746, -5.264607906341553, -5.064113616943359, -4.863619804382324, -4.663125514984131, -4.462631702423096, -4.262137413024902, -4.061643600463867, -3.861149549484253, -3.6606554985046387, -3.4601616859436035, -3.2596676349639893, -3.059173583984375, -2.85867977142334, -2.6581854820251465, -2.4576916694641113, -2.257197618484497, -2.056703567504883, -1.8562095165252686, -1.6557154655456543, -1.45522141456604, -1.2547274827957153, -1.054233431816101, -0.8537393808364868, -0.6532454490661621, -0.45275139808654785, -0.2522573471069336, -0.051763325929641724, 0.14873069524765015, 0.34922468662261963, 0.5497187376022339, 0.7502127885818481, 0.9507067203521729, 1.151200771331787, 1.3516948223114014, 1.5521888732910156, 1.7526829242706299, 1.9531768560409546, 2.1536707878112793, 2.3541650772094727, 2.554658889770508, 2.755152940750122, 2.9556469917297363, 3.1561410427093506, 3.356635093688965, 3.55712890625, 3.7576231956481934, 3.9581170082092285, 4.158611297607422, 4.359105110168457, 4.559598922729492, 4.760092735290527, 4.960587024688721, 5.161080837249756, 5.361575126647949, 5.562068939208984, 5.7625627517700195, 5.963057041168213, 6.163551330566406]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 4.0, 3.0, 8.0, 7.0, 6.0, 10.0, 10.0, 13.0, 16.0, 18.0, 18.0, 28.0, 22.0, 34.0, 33.0, 22.0, 28.0, 35.0, 43.0, 41.0, 40.0, 33.0, 45.0, 40.0, 41.0, 43.0, 36.0, 39.0, 32.0, 24.0, 24.0, 21.0, 29.0, 26.0, 19.0, 17.0, 11.0, 17.0, 11.0, 13.0, 9.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-1.6624239683151245, -1.6147022247314453, -1.5669806003570557, -1.5192588567733765, -1.4715372323989868, -1.4238154888153076, -1.376093864440918, -1.3283721208572388, -1.2806503772735596, -1.2329286336898804, -1.1852070093154907, -1.1374852657318115, -1.0897636413574219, -1.0420418977737427, -0.9943202137947083, -0.9465985298156738, -0.8988768458366394, -0.851155161857605, -0.8034334778785706, -0.7557117938995361, -0.7079900503158569, -0.6602683663368225, -0.6125466823577881, -0.5648249387741089, -0.5171033143997192, -0.4693816304206848, -0.421659916639328, -0.3739382326602936, -0.32621651887893677, -0.27849483489990234, -0.23077315092086792, -0.1830514371395111, -0.1353297233581543, -0.08760802447795868, -0.03988633304834366, 0.007835358381271362, 0.05555705726146698, 0.1032787561416626, 0.15100044012069702, 0.19872215390205383, 0.24644383788108826, 0.2941655218601227, 0.3418872356414795, 0.3896089196205139, 0.43733060359954834, 0.48505231738090515, 0.5327739715576172, 0.5804957151412964, 0.6282173991203308, 0.6759390830993652, 0.7236607670783997, 0.7713824510574341, 0.8191041946411133, 0.8668258786201477, 0.9145475625991821, 0.9622693061828613, 1.009990930557251, 1.0577126741409302, 1.1054342985153198, 1.153156042098999, 1.2008776664733887, 1.2485994100570679, 1.296321153640747, 1.3440427780151367, 1.391764521598816]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 5.0, 10.0, 26.0, 16.0, 26.0, 40.0, 73.0, 80.0, 122.0, 234.0, 377.0, 584.0, 1002.0, 1875.0, 3620.0, 7460.0, 16431.0, 39754.0, 95109.0, 194353.0, 268755.0, 217967.0, 113809.0, 48890.0, 19918.0, 8714.0, 4076.0, 2186.0, 1171.0, 731.0, 415.0, 250.0, 153.0, 111.0, 73.0, 37.0, 23.0, 21.0, 19.0, 14.0, 11.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.397216796875, -0.38465118408203125, -0.3720855712890625, -0.35951995849609375, -0.346954345703125, -0.33438873291015625, -0.3218231201171875, -0.30925750732421875, -0.29669189453125, -0.28412628173828125, -0.2715606689453125, -0.25899505615234375, -0.246429443359375, -0.23386383056640625, -0.2212982177734375, -0.20873260498046875, -0.1961669921875, -0.18360137939453125, -0.1710357666015625, -0.15847015380859375, -0.145904541015625, -0.13333892822265625, -0.1207733154296875, -0.10820770263671875, -0.09564208984375, -0.08307647705078125, -0.0705108642578125, -0.05794525146484375, -0.045379638671875, -0.03281402587890625, -0.0202484130859375, -0.00768280029296875, 0.0048828125, 0.01744842529296875, 0.0300140380859375, 0.04257965087890625, 0.055145263671875, 0.06771087646484375, 0.0802764892578125, 0.09284210205078125, 0.10540771484375, 0.11797332763671875, 0.1305389404296875, 0.14310455322265625, 0.155670166015625, 0.16823577880859375, 0.1808013916015625, 0.19336700439453125, 0.2059326171875, 0.21849822998046875, 0.2310638427734375, 0.24362945556640625, 0.256195068359375, 0.26876068115234375, 0.2813262939453125, 0.29389190673828125, 0.30645751953125, 0.31902313232421875, 0.3315887451171875, 0.34415435791015625, 0.356719970703125, 0.36928558349609375, 0.3818511962890625, 0.39441680908203125, 0.406982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 7.0, 13.0, 8.0, 17.0, 14.0, 19.0, 22.0, 23.0, 32.0, 25.0, 38.0, 37.0, 53.0, 30.0, 34.0, 33.0, 39.0, 39.0, 43.0, 41.0, 47.0, 47.0, 42.0, 33.0, 38.0, 34.0, 24.0, 27.0, 22.0, 20.0, 16.0, 11.0, 14.0, 9.0, 9.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2294921875, -0.22152328491210938, -0.21355438232421875, -0.20558547973632812, -0.1976165771484375, -0.18964767456054688, -0.18167877197265625, -0.17370986938476562, -0.165740966796875, -0.15777206420898438, -0.14980316162109375, -0.14183425903320312, -0.1338653564453125, -0.12589645385742188, -0.11792755126953125, -0.10995864868164062, -0.10198974609375, -0.09402084350585938, -0.08605194091796875, -0.07808303833007812, -0.0701141357421875, -0.062145233154296875, -0.05417633056640625, -0.046207427978515625, -0.038238525390625, -0.030269622802734375, -0.02230072021484375, -0.014331817626953125, -0.0063629150390625, 0.001605987548828125, 0.00957489013671875, 0.017543792724609375, 0.0255126953125, 0.033481597900390625, 0.04145050048828125, 0.049419403076171875, 0.0573883056640625, 0.06535720825195312, 0.07332611083984375, 0.08129501342773438, 0.089263916015625, 0.09723281860351562, 0.10520172119140625, 0.11317062377929688, 0.1211395263671875, 0.12910842895507812, 0.13707733154296875, 0.14504623413085938, 0.15301513671875, 0.16098403930664062, 0.16895294189453125, 0.17692184448242188, 0.1848907470703125, 0.19285964965820312, 0.20082855224609375, 0.20879745483398438, 0.216766357421875, 0.22473526000976562, 0.23270416259765625, 0.24067306518554688, 0.2486419677734375, 0.2566108703613281, 0.26457977294921875, 0.2725486755371094, 0.280517578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 13.0, 22.0, 43.0, 52.0, 104.0, 164.0, 327.0, 666.0, 1192.0, 2603.0, 5693.0, 13766.0, 38079.0, 111645.0, 280261.0, 337954.0, 164645.0, 56356.0, 20058.0, 8064.0, 3580.0, 1578.0, 764.0, 377.0, 226.0, 137.0, 74.0, 26.0, 18.0, 16.0, 15.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5810546875, -0.5654296875, -0.5498046875, -0.5341796875, -0.5185546875, -0.5029296875, -0.4873046875, -0.4716796875, -0.4560546875, -0.4404296875, -0.4248046875, -0.4091796875, -0.3935546875, -0.3779296875, -0.3623046875, -0.3466796875, -0.3310546875, -0.3154296875, -0.2998046875, -0.2841796875, -0.2685546875, -0.2529296875, -0.2373046875, -0.2216796875, -0.2060546875, -0.1904296875, -0.1748046875, -0.1591796875, -0.1435546875, -0.1279296875, -0.1123046875, -0.0966796875, -0.0810546875, -0.0654296875, -0.0498046875, -0.0341796875, -0.0185546875, -0.0029296875, 0.0126953125, 0.0283203125, 0.0439453125, 0.0595703125, 0.0751953125, 0.0908203125, 0.1064453125, 0.1220703125, 0.1376953125, 0.1533203125, 0.1689453125, 0.1845703125, 0.2001953125, 0.2158203125, 0.2314453125, 0.2470703125, 0.2626953125, 0.2783203125, 0.2939453125, 0.3095703125, 0.3251953125, 0.3408203125, 0.3564453125, 0.3720703125, 0.3876953125, 0.4033203125, 0.4189453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 11.0, 14.0, 13.0, 9.0, 17.0, 17.0, 22.0, 22.0, 23.0, 31.0, 48.0, 47.0, 56.0, 49.0, 46.0, 45.0, 41.0, 46.0, 61.0, 39.0, 43.0, 36.0, 34.0, 35.0, 41.0, 19.0, 21.0, 17.0, 16.0, 15.0, 8.0, 8.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6678314208984375, -0.644744873046875, -0.6216583251953125, -0.59857177734375, -0.5754852294921875, -0.552398681640625, -0.5293121337890625, -0.5062255859375, -0.4831390380859375, -0.460052490234375, -0.4369659423828125, -0.41387939453125, -0.3907928466796875, -0.367706298828125, -0.3446197509765625, -0.321533203125, -0.2984466552734375, -0.275360107421875, -0.2522735595703125, -0.22918701171875, -0.2061004638671875, -0.183013916015625, -0.1599273681640625, -0.1368408203125, -0.1137542724609375, -0.090667724609375, -0.0675811767578125, -0.04449462890625, -0.0214080810546875, 0.001678466796875, 0.0247650146484375, 0.0478515625, 0.0709381103515625, 0.094024658203125, 0.1171112060546875, 0.14019775390625, 0.1632843017578125, 0.186370849609375, 0.2094573974609375, 0.2325439453125, 0.2556304931640625, 0.278717041015625, 0.3018035888671875, 0.32489013671875, 0.3479766845703125, 0.371063232421875, 0.3941497802734375, 0.417236328125, 0.4403228759765625, 0.463409423828125, 0.4864959716796875, 0.50958251953125, 0.5326690673828125, 0.555755615234375, 0.5788421630859375, 0.6019287109375, 0.6250152587890625, 0.648101806640625, 0.6711883544921875, 0.69427490234375, 0.7173614501953125, 0.740447998046875, 0.7635345458984375, 0.78662109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 16.0, 28.0, 59.0, 107.0, 161.0, 363.0, 787.0, 1724.0, 4557.0, 11837.0, 32471.0, 88906.0, 213075.0, 320852.0, 222534.0, 95113.0, 34913.0, 12619.0, 4830.0, 1985.0, 862.0, 363.0, 155.0, 90.0, 53.0, 39.0, 14.0, 3.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10772705078125, -0.1036672592163086, -0.09960746765136719, -0.09554767608642578, -0.09148788452148438, -0.08742809295654297, -0.08336830139160156, -0.07930850982666016, -0.07524871826171875, -0.07118892669677734, -0.06712913513183594, -0.06306934356689453, -0.059009552001953125, -0.05494976043701172, -0.05088996887207031, -0.046830177307128906, -0.0427703857421875, -0.038710594177246094, -0.03465080261230469, -0.03059101104736328, -0.026531219482421875, -0.02247142791748047, -0.018411636352539062, -0.014351844787597656, -0.01029205322265625, -0.006232261657714844, -0.0021724700927734375, 0.0018873214721679688, 0.005947113037109375, 0.010006904602050781, 0.014066696166992188, 0.018126487731933594, 0.022186279296875, 0.026246070861816406, 0.030305862426757812, 0.03436565399169922, 0.038425445556640625, 0.04248523712158203, 0.04654502868652344, 0.050604820251464844, 0.05466461181640625, 0.058724403381347656, 0.06278419494628906, 0.06684398651123047, 0.07090377807617188, 0.07496356964111328, 0.07902336120605469, 0.0830831527709961, 0.0871429443359375, 0.0912027359008789, 0.09526252746582031, 0.09932231903076172, 0.10338211059570312, 0.10744190216064453, 0.11150169372558594, 0.11556148529052734, 0.11962127685546875, 0.12368106842041016, 0.12774085998535156, 0.13180065155029297, 0.13586044311523438, 0.13992023468017578, 0.1439800262451172, 0.1480398178100586, 0.152099609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 7.0, 4.0, 5.0, 14.0, 18.0, 26.0, 28.0, 41.0, 37.0, 49.0, 66.0, 69.0, 89.0, 75.0, 72.0, 71.0, 55.0, 47.0, 50.0, 35.0, 39.0, 24.0, 16.0, 12.0, 7.0, 4.0, 9.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.2928924560546875e-05, -5.1480717957019806e-05, -5.003251135349274e-05, -4.858430474996567e-05, -4.71360981464386e-05, -4.568789154291153e-05, -4.423968493938446e-05, -4.279147833585739e-05, -4.134327173233032e-05, -3.989506512880325e-05, -3.8446858525276184e-05, -3.6998651921749115e-05, -3.5550445318222046e-05, -3.410223871469498e-05, -3.265403211116791e-05, -3.120582550764084e-05, -2.975761890411377e-05, -2.83094123005867e-05, -2.686120569705963e-05, -2.5412999093532562e-05, -2.3964792490005493e-05, -2.2516585886478424e-05, -2.1068379282951355e-05, -1.9620172679424286e-05, -1.8171966075897217e-05, -1.6723759472370148e-05, -1.527555286884308e-05, -1.382734626531601e-05, -1.237913966178894e-05, -1.0930933058261871e-05, -9.482726454734802e-06, -8.034519851207733e-06, -6.586313247680664e-06, -5.138106644153595e-06, -3.689900040626526e-06, -2.2416934370994568e-06, -7.934868335723877e-07, 6.547197699546814e-07, 2.1029263734817505e-06, 3.5511329770088196e-06, 4.999339580535889e-06, 6.447546184062958e-06, 7.895752787590027e-06, 9.343959391117096e-06, 1.0792165994644165e-05, 1.2240372598171234e-05, 1.3688579201698303e-05, 1.5136785805225372e-05, 1.658499240875244e-05, 1.803319901227951e-05, 1.948140561580658e-05, 2.092961221933365e-05, 2.2377818822860718e-05, 2.3826025426387787e-05, 2.5274232029914856e-05, 2.6722438633441925e-05, 2.8170645236968994e-05, 2.9618851840496063e-05, 3.106705844402313e-05, 3.25152650475502e-05, 3.396347165107727e-05, 3.541167825460434e-05, 3.685988485813141e-05, 3.830809146165848e-05, 3.975629806518555e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 3.0, 14.0, 11.0, 13.0, 43.0, 58.0, 75.0, 113.0, 181.0, 323.0, 604.0, 1028.0, 2024.0, 4187.0, 9307.0, 21142.0, 49221.0, 109415.0, 204692.0, 263349.0, 197124.0, 103052.0, 45832.0, 19797.0, 8690.0, 3989.0, 1918.0, 996.0, 531.0, 306.0, 206.0, 88.0, 71.0, 52.0, 32.0, 18.0, 9.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.12481689453125, -0.12129688262939453, -0.11777687072753906, -0.1142568588256836, -0.11073684692382812, -0.10721683502197266, -0.10369682312011719, -0.10017681121826172, -0.09665679931640625, -0.09313678741455078, -0.08961677551269531, -0.08609676361083984, -0.08257675170898438, -0.0790567398071289, -0.07553672790527344, -0.07201671600341797, -0.0684967041015625, -0.06497669219970703, -0.06145668029785156, -0.057936668395996094, -0.054416656494140625, -0.050896644592285156, -0.04737663269042969, -0.04385662078857422, -0.04033660888671875, -0.03681659698486328, -0.03329658508300781, -0.029776573181152344, -0.026256561279296875, -0.022736549377441406, -0.019216537475585938, -0.01569652557373047, -0.012176513671875, -0.008656501770019531, -0.0051364898681640625, -0.0016164779663085938, 0.001903533935546875, 0.005423545837402344, 0.008943557739257812, 0.012463569641113281, 0.01598358154296875, 0.01950359344482422, 0.023023605346679688, 0.026543617248535156, 0.030063629150390625, 0.033583641052246094, 0.03710365295410156, 0.04062366485595703, 0.0441436767578125, 0.04766368865966797, 0.05118370056152344, 0.054703712463378906, 0.058223724365234375, 0.061743736267089844, 0.06526374816894531, 0.06878376007080078, 0.07230377197265625, 0.07582378387451172, 0.07934379577636719, 0.08286380767822266, 0.08638381958007812, 0.0899038314819336, 0.09342384338378906, 0.09694385528564453, 0.1004638671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 10.0, 7.0, 13.0, 11.0, 12.0, 14.0, 17.0, 26.0, 32.0, 28.0, 46.0, 43.0, 46.0, 54.0, 65.0, 63.0, 47.0, 57.0, 51.0, 53.0, 40.0, 39.0, 41.0, 44.0, 30.0, 20.0, 20.0, 16.0, 15.0, 12.0, 8.0, 7.0, 9.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14590072631835938, -0.14153289794921875, -0.13716506958007812, -0.1327972412109375, -0.12842941284179688, -0.12406158447265625, -0.11969375610351562, -0.115325927734375, -0.11095809936523438, -0.10659027099609375, -0.10222244262695312, -0.0978546142578125, -0.09348678588867188, -0.08911895751953125, -0.08475112915039062, -0.08038330078125, -0.07601547241210938, -0.07164764404296875, -0.06727981567382812, -0.0629119873046875, -0.058544158935546875, -0.05417633056640625, -0.049808502197265625, -0.045440673828125, -0.041072845458984375, -0.03670501708984375, -0.032337188720703125, -0.0279693603515625, -0.023601531982421875, -0.01923370361328125, -0.014865875244140625, -0.010498046875, -0.006130218505859375, -0.00176239013671875, 0.002605438232421875, 0.0069732666015625, 0.011341094970703125, 0.01570892333984375, 0.020076751708984375, 0.024444580078125, 0.028812408447265625, 0.03318023681640625, 0.037548065185546875, 0.0419158935546875, 0.046283721923828125, 0.05065155029296875, 0.055019378662109375, 0.05938720703125, 0.06375503540039062, 0.06812286376953125, 0.07249069213867188, 0.0768585205078125, 0.08122634887695312, 0.08559417724609375, 0.08996200561523438, 0.094329833984375, 0.09869766235351562, 0.10306549072265625, 0.10743331909179688, 0.1118011474609375, 0.11616897583007812, 0.12053680419921875, 0.12490463256835938, 0.1292724609375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 5.0, 5.0, 27.0, 35.0, 38.0, 74.0, 94.0, 146.0, 145.0, 156.0, 97.0, 65.0, 46.0, 28.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0944294929504395, -1.9904919862747192, -1.8865545988082886, -1.7826170921325684, -1.6786795854568481, -1.574742078781128, -1.4708046913146973, -1.366867184638977, -1.2629296779632568, -1.1589921712875366, -1.055054783821106, -0.9511172771453857, -0.8471797704696655, -0.7432423233985901, -0.6393048763275146, -0.5353673696517944, -0.43142998218536377, -0.32749250531196594, -0.2235550433397293, -0.11961758136749268, -0.01568010449409485, 0.08825737237930298, 0.19219481945037842, 0.29613232612609863, 0.4000697731971741, 0.5040072202682495, 0.6079447269439697, 0.7118821740150452, 0.8158196210861206, 0.9197571277618408, 1.0236945152282715, 1.1276321411132812, 1.231569528579712, 1.3355070352554321, 1.4394444227218628, 1.543381929397583, 1.6473194360733032, 1.7512569427490234, 1.855194330215454, 1.9591318368911743, 2.0630693435668945, 2.167006731033325, 2.270944356918335, 2.3748817443847656, 2.4788191318511963, 2.582756757736206, 2.6866941452026367, 2.7906317710876465, 2.894568920135498, 2.9985063076019287, 3.1024439334869385, 3.206381320953369, 3.3103187084198, 3.4142563343048096, 3.5181937217712402, 3.62213134765625, 3.7260687351226807, 3.8300061225891113, 3.933943748474121, 4.037880897521973, 4.141818523406982, 4.245756149291992, 4.349693298339844, 4.4536309242248535, 4.557568550109863]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 11.0, 13.0, 7.0, 4.0, 14.0, 11.0, 13.0, 17.0, 10.0, 19.0, 23.0, 24.0, 23.0, 22.0, 22.0, 30.0, 35.0, 29.0, 37.0, 46.0, 24.0, 44.0, 40.0, 46.0, 31.0, 37.0, 33.0, 40.0, 40.0, 27.0, 31.0, 28.0, 25.0, 21.0, 19.0, 12.0, 13.0, 15.0, 14.0, 10.0, 12.0, 7.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7009193897247314, -1.646073341369629, -1.5912272930145264, -1.5363812446594238, -1.4815351963043213, -1.4266891479492188, -1.3718432188034058, -1.3169971704483032, -1.2621511220932007, -1.2073050737380981, -1.1524590253829956, -1.097612977027893, -1.04276704788208, -0.9879209399223328, -0.933074951171875, -0.8782289028167725, -0.8233828544616699, -0.7685368061065674, -0.7136907577514648, -0.6588447690010071, -0.6039987206459045, -0.549152672290802, -0.49430665373802185, -0.4394606351852417, -0.38461458683013916, -0.3297685384750366, -0.27492251992225647, -0.22007648646831512, -0.16523045301437378, -0.11038440465927124, -0.05553838610649109, -0.0006923675537109375, 0.05415356159210205, 0.1089995950460434, 0.16384562849998474, 0.2186916619539261, 0.27353769540786743, 0.32838374376296997, 0.3832297623157501, 0.4380757808685303, 0.4929218292236328, 0.5477678775787354, 0.6026139259338379, 0.6574599146842957, 0.7123059630393982, 0.7671520113945007, 0.8219980001449585, 0.876844048500061, 0.9316900968551636, 0.9865361452102661, 1.0413821935653687, 1.0962282419204712, 1.1510741710662842, 1.2059202194213867, 1.2607662677764893, 1.3156123161315918, 1.3704583644866943, 1.4253044128417969, 1.4801504611968994, 1.534996509552002, 1.5898425579071045, 1.644688606262207, 1.69953453540802, 1.7543805837631226, 1.809226632118225]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 26.0, 23.0, 52.0, 79.0, 160.0, 275.0, 435.0, 782.0, 1383.0, 2545.0, 4511.0, 8838.0, 18549.0, 43714.0, 116084.0, 356995.0, 1063370.0, 1566267.0, 674976.0, 208242.0, 71182.0, 28629.0, 12887.0, 6535.0, 3357.0, 1892.0, 1041.0, 596.0, 338.0, 197.0, 131.0, 74.0, 42.0, 22.0, 20.0, 5.0, 7.0, 8.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.21488571166992188, -0.20565032958984375, -0.19641494750976562, -0.1871795654296875, -0.17794418334960938, -0.16870880126953125, -0.15947341918945312, -0.150238037109375, -0.14100265502929688, -0.13176727294921875, -0.12253189086914062, -0.1132965087890625, -0.10406112670898438, -0.09482574462890625, -0.08559036254882812, -0.07635498046875, -0.06711959838867188, -0.05788421630859375, -0.048648834228515625, -0.0394134521484375, -0.030178070068359375, -0.02094268798828125, -0.011707305908203125, -0.002471923828125, 0.006763458251953125, 0.01599884033203125, 0.025234222412109375, 0.0344696044921875, 0.043704986572265625, 0.05294036865234375, 0.062175750732421875, 0.0714111328125, 0.08064651489257812, 0.08988189697265625, 0.09911727905273438, 0.1083526611328125, 0.11758804321289062, 0.12682342529296875, 0.13605880737304688, 0.145294189453125, 0.15452957153320312, 0.16376495361328125, 0.17300033569335938, 0.1822357177734375, 0.19147109985351562, 0.20070648193359375, 0.20994186401367188, 0.21917724609375, 0.22841262817382812, 0.23764801025390625, 0.24688339233398438, 0.2561187744140625, 0.2653541564941406, 0.27458953857421875, 0.2838249206542969, 0.293060302734375, 0.3022956848144531, 0.31153106689453125, 0.3207664489746094, 0.3300018310546875, 0.3392372131347656, 0.34847259521484375, 0.3577079772949219, 0.366943359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 6.0, 4.0, 13.0, 17.0, 11.0, 11.0, 17.0, 18.0, 25.0, 35.0, 28.0, 28.0, 34.0, 27.0, 38.0, 45.0, 37.0, 34.0, 41.0, 44.0, 43.0, 33.0, 25.0, 42.0, 34.0, 29.0, 26.0, 25.0, 26.0, 20.0, 27.0, 18.0, 18.0, 20.0, 12.0, 9.0, 9.0, 8.0, 6.0, 9.0, 4.0, 8.0, 5.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1768798828125, -0.17090415954589844, -0.16492843627929688, -0.1589527130126953, -0.15297698974609375, -0.1470012664794922, -0.14102554321289062, -0.13504981994628906, -0.1290740966796875, -0.12309837341308594, -0.11712265014648438, -0.11114692687988281, -0.10517120361328125, -0.09919548034667969, -0.09321975708007812, -0.08724403381347656, -0.081268310546875, -0.07529258728027344, -0.06931686401367188, -0.06334114074707031, -0.05736541748046875, -0.05138969421386719, -0.045413970947265625, -0.03943824768066406, -0.0334625244140625, -0.027486801147460938, -0.021511077880859375, -0.015535354614257812, -0.00955963134765625, -0.0035839080810546875, 0.002391815185546875, 0.008367538452148438, 0.01434326171875, 0.020318984985351562, 0.026294708251953125, 0.03227043151855469, 0.03824615478515625, 0.04422187805175781, 0.050197601318359375, 0.05617332458496094, 0.0621490478515625, 0.06812477111816406, 0.07410049438476562, 0.08007621765136719, 0.08605194091796875, 0.09202766418457031, 0.09800338745117188, 0.10397911071777344, 0.109954833984375, 0.11593055725097656, 0.12190628051757812, 0.1278820037841797, 0.13385772705078125, 0.1398334503173828, 0.14580917358398438, 0.15178489685058594, 0.1577606201171875, 0.16373634338378906, 0.16971206665039062, 0.1756877899169922, 0.18166351318359375, 0.1876392364501953, 0.19361495971679688, 0.19959068298339844, 0.20556640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 26.0, 20.0, 42.0, 53.0, 106.0, 186.0, 353.0, 558.0, 1013.0, 1871.0, 3682.0, 7552.0, 16981.0, 42101.0, 123714.0, 458745.0, 2061875.0, 1108216.0, 242554.0, 74064.0, 27408.0, 11802.0, 5392.0, 2694.0, 1412.0, 767.0, 432.0, 270.0, 145.0, 94.0, 61.0, 29.0, 13.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.46337890625, -0.45111083984375, -0.4388427734375, -0.42657470703125, -0.414306640625, -0.40203857421875, -0.3897705078125, -0.37750244140625, -0.365234375, -0.35296630859375, -0.3406982421875, -0.32843017578125, -0.316162109375, -0.30389404296875, -0.2916259765625, -0.27935791015625, -0.26708984375, -0.25482177734375, -0.2425537109375, -0.23028564453125, -0.218017578125, -0.20574951171875, -0.1934814453125, -0.18121337890625, -0.1689453125, -0.15667724609375, -0.1444091796875, -0.13214111328125, -0.119873046875, -0.10760498046875, -0.0953369140625, -0.08306884765625, -0.07080078125, -0.05853271484375, -0.0462646484375, -0.03399658203125, -0.021728515625, -0.00946044921875, 0.0028076171875, 0.01507568359375, 0.02734375, 0.03961181640625, 0.0518798828125, 0.06414794921875, 0.076416015625, 0.08868408203125, 0.1009521484375, 0.11322021484375, 0.12548828125, 0.13775634765625, 0.1500244140625, 0.16229248046875, 0.174560546875, 0.18682861328125, 0.1990966796875, 0.21136474609375, 0.2236328125, 0.23590087890625, 0.2481689453125, 0.26043701171875, 0.272705078125, 0.28497314453125, 0.2972412109375, 0.30950927734375, 0.32177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 6.0, 6.0, 6.0, 13.0, 15.0, 22.0, 24.0, 36.0, 53.0, 67.0, 80.0, 94.0, 175.0, 198.0, 313.0, 430.0, 571.0, 504.0, 391.0, 288.0, 216.0, 146.0, 102.0, 74.0, 55.0, 41.0, 37.0, 27.0, 20.0, 14.0, 8.0, 4.0, 5.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.497802734375, -0.4835548400878906, -0.46930694580078125, -0.4550590515136719, -0.4408111572265625, -0.4265632629394531, -0.41231536865234375, -0.3980674743652344, -0.383819580078125, -0.3695716857910156, -0.35532379150390625, -0.3410758972167969, -0.3268280029296875, -0.3125801086425781, -0.29833221435546875, -0.2840843200683594, -0.26983642578125, -0.2555885314941406, -0.24134063720703125, -0.22709274291992188, -0.2128448486328125, -0.19859695434570312, -0.18434906005859375, -0.17010116577148438, -0.155853271484375, -0.14160537719726562, -0.12735748291015625, -0.11310958862304688, -0.0988616943359375, -0.08461380004882812, -0.07036590576171875, -0.056118011474609375, -0.0418701171875, -0.027622222900390625, -0.01337432861328125, 0.000873565673828125, 0.0151214599609375, 0.029369354248046875, 0.04361724853515625, 0.057865142822265625, 0.072113037109375, 0.08636093139648438, 0.10060882568359375, 0.11485671997070312, 0.1291046142578125, 0.14335250854492188, 0.15760040283203125, 0.17184829711914062, 0.18609619140625, 0.20034408569335938, 0.21459197998046875, 0.22883987426757812, 0.2430877685546875, 0.2573356628417969, 0.27158355712890625, 0.2858314514160156, 0.300079345703125, 0.3143272399902344, 0.32857513427734375, 0.3428230285644531, 0.3570709228515625, 0.3713188171386719, 0.38556671142578125, 0.3998146057128906, 0.4140625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 1.0, 8.0, 25.0, 57.0, 155.0, 292.0, 284.0, 115.0, 42.0, 12.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.028602600097656, -9.77835750579834, -9.528112411499023, -9.277868270874023, -9.027623176574707, -8.77737808227539, -8.527132987976074, -8.276887893676758, -8.026643753051758, -7.776398658752441, -7.526154041290283, -7.275908946990967, -7.025664329528809, -6.775419235229492, -6.525174140930176, -6.274929046630859, -6.024683952331543, -5.774438858032227, -5.524194240570068, -5.273949146270752, -5.023704528808594, -4.773459434509277, -4.523214340209961, -4.2729692459106445, -4.022724628448486, -3.772479772567749, -3.5222349166870117, -3.2719898223876953, -3.021744966506958, -2.7715001106262207, -2.5212550163269043, -2.271010160446167, -2.020766258239746, -1.7705214023590088, -1.520276427268982, -1.270031452178955, -1.0197865962982178, -0.7695417404174805, -0.5192967653274536, -0.26905179023742676, -0.018806934356689453, 0.23143798112869263, 0.4816828966140747, 0.7319278120994568, 0.9821727275848389, 1.2324175834655762, 1.482662558555603, 1.7329075336456299, 1.9831523895263672, 2.2333972454071045, 2.483642101287842, 2.733887195587158, 2.9841320514678955, 3.234376907348633, 3.484622001647949, 3.7348668575286865, 3.985111713409424, 4.23535680770874, 4.485601425170898, 4.735846519470215, 4.986091613769531, 5.2363362312316895, 5.486581325531006, 5.736825942993164, 5.9870710372924805]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 10.0, 7.0, 7.0, 8.0, 18.0, 20.0, 25.0, 20.0, 35.0, 33.0, 46.0, 44.0, 36.0, 39.0, 50.0, 45.0, 59.0, 53.0, 36.0, 34.0, 52.0, 45.0, 50.0, 38.0, 24.0, 23.0, 33.0, 24.0, 15.0, 15.0, 15.0, 7.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7441456317901611, -1.6884320974349976, -1.632718563079834, -1.5770050287246704, -1.5212914943695068, -1.4655779600143433, -1.4098644256591797, -1.3541508913040161, -1.2984373569488525, -1.242723822593689, -1.1870102882385254, -1.1312967538833618, -1.0755832195281982, -1.0198696851730347, -0.9641561508178711, -0.9084426164627075, -0.8527290225028992, -0.7970154881477356, -0.741301953792572, -0.6855884194374084, -0.6298748850822449, -0.5741612911224365, -0.518447756767273, -0.46273425221443176, -0.4070207178592682, -0.3513071835041046, -0.29559364914894104, -0.23988009989261627, -0.1841665655374527, -0.12845301628112793, -0.07273948192596436, -0.01702594757080078, 0.03868758678436279, 0.09440112113952637, 0.15011465549468994, 0.2058282047510147, 0.2615417242050171, 0.31725528836250305, 0.3729688227176666, 0.4286823570728302, 0.4843958914279938, 0.5401094555854797, 0.5958229899406433, 0.6515365242958069, 0.7072500586509705, 0.762963593006134, 0.8186771273612976, 0.8743906617164612, 0.9301041960716248, 0.9858177304267883, 1.0415313243865967, 1.0972448587417603, 1.1529583930969238, 1.2086719274520874, 1.264385461807251, 1.3200989961624146, 1.3758125305175781, 1.4315260648727417, 1.4872395992279053, 1.5429531335830688, 1.5986666679382324, 1.654380202293396, 1.7100937366485596, 1.7658072710037231, 1.8215208053588867]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 18.0, 19.0, 22.0, 33.0, 49.0, 75.0, 121.0, 187.0, 293.0, 478.0, 775.0, 1185.0, 2024.0, 3526.0, 5638.0, 9983.0, 17431.0, 30186.0, 50777.0, 81988.0, 121059.0, 155436.0, 163133.0, 141129.0, 101836.0, 66133.0, 39902.0, 23056.0, 13298.0, 7614.0, 4423.0, 2599.0, 1602.0, 875.0, 553.0, 374.0, 246.0, 162.0, 89.0, 63.0, 53.0, 30.0, 19.0, 17.0, 12.0, 6.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1995849609375, -0.19298934936523438, -0.18639373779296875, -0.17979812622070312, -0.1732025146484375, -0.16660690307617188, -0.16001129150390625, -0.15341567993164062, -0.146820068359375, -0.14022445678710938, -0.13362884521484375, -0.12703323364257812, -0.1204376220703125, -0.11384201049804688, -0.10724639892578125, -0.10065078735351562, -0.09405517578125, -0.08745956420898438, -0.08086395263671875, -0.07426834106445312, -0.0676727294921875, -0.061077117919921875, -0.05448150634765625, -0.047885894775390625, -0.041290283203125, -0.034694671630859375, -0.02809906005859375, -0.021503448486328125, -0.0149078369140625, -0.008312225341796875, -0.00171661376953125, 0.004878997802734375, 0.011474609375, 0.018070220947265625, 0.02466583251953125, 0.031261444091796875, 0.0378570556640625, 0.044452667236328125, 0.05104827880859375, 0.057643890380859375, 0.064239501953125, 0.07083511352539062, 0.07743072509765625, 0.08402633666992188, 0.0906219482421875, 0.09721755981445312, 0.10381317138671875, 0.11040878295898438, 0.11700439453125, 0.12360000610351562, 0.13019561767578125, 0.13679122924804688, 0.1433868408203125, 0.14998245239257812, 0.15657806396484375, 0.16317367553710938, 0.169769287109375, 0.17636489868164062, 0.18296051025390625, 0.18955612182617188, 0.1961517333984375, 0.20274734497070312, 0.20934295654296875, 0.21593856811523438, 0.2225341796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 2.0, 6.0, 6.0, 9.0, 7.0, 16.0, 16.0, 16.0, 24.0, 19.0, 25.0, 24.0, 24.0, 34.0, 38.0, 29.0, 26.0, 34.0, 41.0, 46.0, 40.0, 31.0, 37.0, 38.0, 39.0, 38.0, 40.0, 41.0, 20.0, 23.0, 29.0, 20.0, 25.0, 18.0, 20.0, 9.0, 8.0, 13.0, 15.0, 12.0, 10.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.21240234375, -0.20580101013183594, -0.19919967651367188, -0.1925983428955078, -0.18599700927734375, -0.1793956756591797, -0.17279434204101562, -0.16619300842285156, -0.1595916748046875, -0.15299034118652344, -0.14638900756835938, -0.1397876739501953, -0.13318634033203125, -0.1265850067138672, -0.11998367309570312, -0.11338233947753906, -0.106781005859375, -0.10017967224121094, -0.09357833862304688, -0.08697700500488281, -0.08037567138671875, -0.07377433776855469, -0.06717300415039062, -0.06057167053222656, -0.0539703369140625, -0.04736900329589844, -0.040767669677734375, -0.03416633605957031, -0.02756500244140625, -0.020963668823242188, -0.014362335205078125, -0.0077610015869140625, -0.00115966796875, 0.0054416656494140625, 0.012042999267578125, 0.018644332885742188, 0.02524566650390625, 0.03184700012207031, 0.038448333740234375, 0.04504966735839844, 0.0516510009765625, 0.05825233459472656, 0.06485366821289062, 0.07145500183105469, 0.07805633544921875, 0.08465766906738281, 0.09125900268554688, 0.09786033630371094, 0.104461669921875, 0.11106300354003906, 0.11766433715820312, 0.12426567077636719, 0.13086700439453125, 0.1374683380126953, 0.14406967163085938, 0.15067100524902344, 0.1572723388671875, 0.16387367248535156, 0.17047500610351562, 0.1770763397216797, 0.18367767333984375, 0.1902790069580078, 0.19688034057617188, 0.20348167419433594, 0.2100830078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 13.0, 10.0, 13.0, 32.0, 43.0, 52.0, 78.0, 99.0, 153.0, 241.0, 379.0, 629.0, 1003.0, 1647.0, 2832.0, 4971.0, 9120.0, 17262.0, 32962.0, 61620.0, 111686.0, 181553.0, 246692.0, 163073.0, 97808.0, 53100.0, 28125.0, 14563.0, 8031.0, 4397.0, 2473.0, 1490.0, 832.0, 543.0, 327.0, 214.0, 133.0, 87.0, 78.0, 54.0, 38.0, 33.0, 11.0, 16.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.260498046875, -0.2524528503417969, -0.24440765380859375, -0.23636245727539062, -0.2283172607421875, -0.22027206420898438, -0.21222686767578125, -0.20418167114257812, -0.196136474609375, -0.18809127807617188, -0.18004608154296875, -0.17200088500976562, -0.1639556884765625, -0.15591049194335938, -0.14786529541015625, -0.13982009887695312, -0.13177490234375, -0.12372970581054688, -0.11568450927734375, -0.10763931274414062, -0.0995941162109375, -0.09154891967773438, -0.08350372314453125, -0.07545852661132812, -0.067413330078125, -0.059368133544921875, -0.05132293701171875, -0.043277740478515625, -0.0352325439453125, -0.027187347412109375, -0.01914215087890625, -0.011096954345703125, -0.0030517578125, 0.004993438720703125, 0.01303863525390625, 0.021083831787109375, 0.0291290283203125, 0.037174224853515625, 0.04521942138671875, 0.053264617919921875, 0.061309814453125, 0.06935501098632812, 0.07740020751953125, 0.08544540405273438, 0.0934906005859375, 0.10153579711914062, 0.10958099365234375, 0.11762619018554688, 0.12567138671875, 0.13371658325195312, 0.14176177978515625, 0.14980697631835938, 0.1578521728515625, 0.16589736938476562, 0.17394256591796875, 0.18198776245117188, 0.190032958984375, 0.19807815551757812, 0.20612335205078125, 0.21416854858398438, 0.2222137451171875, 0.23025894165039062, 0.23830413818359375, 0.24634933471679688, 0.25439453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 9.0, 6.0, 12.0, 13.0, 25.0, 33.0, 21.0, 31.0, 38.0, 57.0, 37.0, 66.0, 51.0, 75.0, 68.0, 59.0, 52.0, 54.0, 54.0, 37.0, 28.0, 37.0, 25.0, 27.0, 18.0, 16.0, 14.0, 14.0, 7.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.7985000610351562, -0.7718048095703125, -0.7451095581054688, -0.718414306640625, -0.6917190551757812, -0.6650238037109375, -0.6383285522460938, -0.61163330078125, -0.5849380493164062, -0.5582427978515625, -0.5315475463867188, -0.504852294921875, -0.47815704345703125, -0.4514617919921875, -0.42476654052734375, -0.3980712890625, -0.37137603759765625, -0.3446807861328125, -0.31798553466796875, -0.291290283203125, -0.26459503173828125, -0.2378997802734375, -0.21120452880859375, -0.18450927734375, -0.15781402587890625, -0.1311187744140625, -0.10442352294921875, -0.077728271484375, -0.05103302001953125, -0.0243377685546875, 0.00235748291015625, 0.029052734375, 0.05574798583984375, 0.0824432373046875, 0.10913848876953125, 0.135833740234375, 0.16252899169921875, 0.1892242431640625, 0.21591949462890625, 0.24261474609375, 0.26930999755859375, 0.2960052490234375, 0.32270050048828125, 0.349395751953125, 0.37609100341796875, 0.4027862548828125, 0.42948150634765625, 0.4561767578125, 0.48287200927734375, 0.5095672607421875, 0.5362625122070312, 0.562957763671875, 0.5896530151367188, 0.6163482666015625, 0.6430435180664062, 0.66973876953125, 0.6964340209960938, 0.7231292724609375, 0.7498245239257812, 0.776519775390625, 0.8032150268554688, 0.8299102783203125, 0.8566055297851562, 0.88330078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 14.0, 26.0, 27.0, 43.0, 48.0, 73.0, 101.0, 153.0, 228.0, 310.0, 463.0, 684.0, 1026.0, 1556.0, 2425.0, 4007.0, 6370.0, 10949.0, 18780.0, 31772.0, 54155.0, 88833.0, 137680.0, 208709.0, 174886.0, 119361.0, 74959.0, 44869.0, 26616.0, 15351.0, 9147.0, 5384.0, 3283.0, 2087.0, 1385.0, 891.0, 576.0, 364.0, 282.0, 204.0, 135.0, 87.0, 61.0, 49.0, 50.0, 22.0, 23.0, 16.0, 6.0, 8.0, 1.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.05047607421875, -0.04893827438354492, -0.047400474548339844, -0.045862674713134766, -0.04432487487792969, -0.04278707504272461, -0.04124927520751953, -0.03971147537231445, -0.038173675537109375, -0.0366358757019043, -0.03509807586669922, -0.03356027603149414, -0.03202247619628906, -0.030484676361083984, -0.028946876525878906, -0.027409076690673828, -0.02587127685546875, -0.024333477020263672, -0.022795677185058594, -0.021257877349853516, -0.019720077514648438, -0.01818227767944336, -0.01664447784423828, -0.015106678009033203, -0.013568878173828125, -0.012031078338623047, -0.010493278503417969, -0.00895547866821289, -0.0074176788330078125, -0.005879878997802734, -0.004342079162597656, -0.002804279327392578, -0.0012664794921875, 0.0002713203430175781, 0.0018091201782226562, 0.0033469200134277344, 0.0048847198486328125, 0.006422519683837891, 0.007960319519042969, 0.009498119354248047, 0.011035919189453125, 0.012573719024658203, 0.014111518859863281, 0.01564931869506836, 0.017187118530273438, 0.018724918365478516, 0.020262718200683594, 0.021800518035888672, 0.02333831787109375, 0.024876117706298828, 0.026413917541503906, 0.027951717376708984, 0.029489517211914062, 0.03102731704711914, 0.03256511688232422, 0.0341029167175293, 0.035640716552734375, 0.03717851638793945, 0.03871631622314453, 0.04025411605834961, 0.04179191589355469, 0.043329715728759766, 0.044867515563964844, 0.04640531539916992, 0.047943115234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 12.0, 7.0, 12.0, 14.0, 15.0, 11.0, 23.0, 29.0, 20.0, 24.0, 42.0, 40.0, 37.0, 47.0, 40.0, 46.0, 60.0, 65.0, 42.0, 41.0, 39.0, 36.0, 34.0, 31.0, 32.0, 17.0, 20.0, 24.0, 17.0, 16.0, 15.0, 9.0, 10.0, 9.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.580881118774414e-05, -2.5054439902305603e-05, -2.4300068616867065e-05, -2.3545697331428528e-05, -2.279132604598999e-05, -2.2036954760551453e-05, -2.1282583475112915e-05, -2.0528212189674377e-05, -1.977384090423584e-05, -1.9019469618797302e-05, -1.8265098333358765e-05, -1.7510727047920227e-05, -1.675635576248169e-05, -1.6001984477043152e-05, -1.5247613191604614e-05, -1.4493241906166077e-05, -1.3738870620727539e-05, -1.2984499335289001e-05, -1.2230128049850464e-05, -1.1475756764411926e-05, -1.0721385478973389e-05, -9.967014193534851e-06, -9.212642908096313e-06, -8.458271622657776e-06, -7.703900337219238e-06, -6.949529051780701e-06, -6.195157766342163e-06, -5.4407864809036255e-06, -4.686415195465088e-06, -3.93204391002655e-06, -3.1776726245880127e-06, -2.423301339149475e-06, -1.6689300537109375e-06, -9.145587682723999e-07, -1.601874828338623e-07, 5.941838026046753e-07, 1.3485550880432129e-06, 2.1029263734817505e-06, 2.857297658920288e-06, 3.6116689443588257e-06, 4.366040229797363e-06, 5.120411515235901e-06, 5.8747828006744385e-06, 6.629154086112976e-06, 7.383525371551514e-06, 8.137896656990051e-06, 8.892267942428589e-06, 9.646639227867126e-06, 1.0401010513305664e-05, 1.1155381798744202e-05, 1.190975308418274e-05, 1.2664124369621277e-05, 1.3418495655059814e-05, 1.4172866940498352e-05, 1.492723822593689e-05, 1.5681609511375427e-05, 1.6435980796813965e-05, 1.7190352082252502e-05, 1.794472336769104e-05, 1.8699094653129578e-05, 1.9453465938568115e-05, 2.0207837224006653e-05, 2.096220850944519e-05, 2.1716579794883728e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 9.0, 5.0, 12.0, 10.0, 20.0, 26.0, 34.0, 68.0, 139.0, 188.0, 306.0, 530.0, 965.0, 1757.0, 3351.0, 6230.0, 12728.0, 25073.0, 51516.0, 101355.0, 183061.0, 274419.0, 183409.0, 101122.0, 50680.0, 25435.0, 12405.0, 6360.0, 3209.0, 1708.0, 1014.0, 590.0, 313.0, 174.0, 122.0, 71.0, 59.0, 25.0, 19.0, 17.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.07958984375, -0.07740926742553711, -0.07522869110107422, -0.07304811477661133, -0.07086753845214844, -0.06868696212768555, -0.06650638580322266, -0.06432580947875977, -0.062145233154296875, -0.059964656829833984, -0.057784080505371094, -0.0556035041809082, -0.05342292785644531, -0.05124235153198242, -0.04906177520751953, -0.04688119888305664, -0.04470062255859375, -0.04252004623413086, -0.04033946990966797, -0.03815889358520508, -0.03597831726074219, -0.0337977409362793, -0.031617164611816406, -0.029436588287353516, -0.027256011962890625, -0.025075435638427734, -0.022894859313964844, -0.020714282989501953, -0.018533706665039062, -0.016353130340576172, -0.014172554016113281, -0.01199197769165039, -0.0098114013671875, -0.007630825042724609, -0.005450248718261719, -0.003269672393798828, -0.0010890960693359375, 0.0010914802551269531, 0.0032720565795898438, 0.005452632904052734, 0.007633209228515625, 0.009813785552978516, 0.011994361877441406, 0.014174938201904297, 0.016355514526367188, 0.018536090850830078, 0.02071666717529297, 0.02289724349975586, 0.02507781982421875, 0.02725839614868164, 0.02943897247314453, 0.03161954879760742, 0.03380012512207031, 0.0359807014465332, 0.038161277770996094, 0.040341854095458984, 0.042522430419921875, 0.044703006744384766, 0.046883583068847656, 0.04906415939331055, 0.05124473571777344, 0.05342531204223633, 0.05560588836669922, 0.05778646469116211, 0.059967041015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 11.0, 7.0, 9.0, 19.0, 22.0, 13.0, 23.0, 27.0, 36.0, 31.0, 49.0, 52.0, 59.0, 64.0, 64.0, 70.0, 70.0, 56.0, 42.0, 49.0, 43.0, 41.0, 31.0, 30.0, 13.0, 10.0, 12.0, 7.0, 4.0, 9.0, 7.0, 6.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10845947265625, -0.10482215881347656, -0.10118484497070312, -0.09754753112792969, -0.09391021728515625, -0.09027290344238281, -0.08663558959960938, -0.08299827575683594, -0.0793609619140625, -0.07572364807128906, -0.07208633422851562, -0.06844902038574219, -0.06481170654296875, -0.06117439270019531, -0.057537078857421875, -0.05389976501464844, -0.050262451171875, -0.04662513732910156, -0.042987823486328125, -0.03935050964355469, -0.03571319580078125, -0.03207588195800781, -0.028438568115234375, -0.024801254272460938, -0.0211639404296875, -0.017526626586914062, -0.013889312744140625, -0.010251998901367188, -0.00661468505859375, -0.0029773712158203125, 0.000659942626953125, 0.0042972564697265625, 0.0079345703125, 0.011571884155273438, 0.015209197998046875, 0.018846511840820312, 0.02248382568359375, 0.026121139526367188, 0.029758453369140625, 0.03339576721191406, 0.0370330810546875, 0.04067039489746094, 0.044307708740234375, 0.04794502258300781, 0.05158233642578125, 0.05521965026855469, 0.058856964111328125, 0.06249427795410156, 0.066131591796875, 0.06976890563964844, 0.07340621948242188, 0.07704353332519531, 0.08068084716796875, 0.08431816101074219, 0.08795547485351562, 0.09159278869628906, 0.0952301025390625, 0.09886741638183594, 0.10250473022460938, 0.10614204406738281, 0.10977935791015625, 0.11341667175292969, 0.11705398559570312, 0.12069129943847656, 0.12432861328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 18.0, 22.0, 43.0, 60.0, 96.0, 115.0, 117.0, 151.0, 117.0, 84.0, 59.0, 43.0, 19.0, 11.0, 9.0, 10.0, 5.0, 4.0, 4.0, 0.0, 2.0], "bins": [-4.130890369415283, -4.047792434692383, -3.9646944999694824, -3.881596565246582, -3.7984986305236816, -3.715400457382202, -3.6323025226593018, -3.5492045879364014, -3.466106653213501, -3.3830087184906006, -3.2999107837677, -3.2168128490448, -3.1337146759033203, -3.05061674118042, -2.9675188064575195, -2.884420871734619, -2.8013229370117188, -2.7182250022888184, -2.635127067565918, -2.5520291328430176, -2.468931198120117, -2.3858330249786377, -2.3027350902557373, -2.219637155532837, -2.1365392208099365, -2.053441286087036, -1.9703433513641357, -1.8872452974319458, -1.8041473627090454, -1.721049427986145, -1.637951374053955, -1.5548534393310547, -1.4717552661895752, -1.3886573314666748, -1.3055593967437744, -1.2224613428115845, -1.139363408088684, -1.0562654733657837, -0.9731674790382385, -0.8900694847106934, -0.806971549987793, -0.7238736152648926, -0.6407756209373474, -0.5576776266098022, -0.47457969188690186, -0.3914817273616791, -0.3083837628364563, -0.22528576850891113, -0.14218783378601074, -0.059089869260787964, 0.024008095264434814, 0.10710605978965759, 0.19020402431488037, 0.27330198884010315, 0.3563999533653259, 0.4394979476928711, 0.5225958824157715, 0.6056938171386719, 0.688791811466217, 0.7718898057937622, 0.8549877405166626, 0.938085675239563, 1.021183729171753, 1.1042816638946533, 1.1873795986175537]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 10.0, 8.0, 4.0, 13.0, 14.0, 11.0, 17.0, 18.0, 25.0, 26.0, 24.0, 32.0, 39.0, 40.0, 40.0, 29.0, 41.0, 38.0, 32.0, 49.0, 50.0, 49.0, 48.0, 26.0, 25.0, 35.0, 27.0, 24.0, 29.0, 24.0, 23.0, 22.0, 17.0, 13.0, 8.0, 12.0, 8.0, 8.0, 8.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6128857135772705, -1.564487338066101, -1.516088843345642, -1.4676904678344727, -1.4192919731140137, -1.3708935976028442, -1.3224952220916748, -1.2740967273712158, -1.2256983518600464, -1.177299976348877, -1.128901481628418, -1.0805031061172485, -1.032104730606079, -0.9837062358856201, -0.9353078603744507, -0.8869094252586365, -0.8385109901428223, -0.7901125550270081, -0.7417141199111938, -0.6933157444000244, -0.6449173092842102, -0.596518874168396, -0.5481204986572266, -0.49972206354141235, -0.45132362842559814, -0.40292519330978394, -0.3545267879962921, -0.3061283826828003, -0.2577299475669861, -0.20933152735233307, -0.16093310713768005, -0.11253470182418823, -0.06413626670837402, -0.01573784649372101, 0.03266057372093201, 0.08105899393558502, 0.12945741415023804, 0.17785583436489105, 0.22625425457954407, 0.2746526598930359, 0.3230510950088501, 0.3714495301246643, 0.41984793543815613, 0.46824634075164795, 0.5166447758674622, 0.5650432109832764, 0.6134415864944458, 0.66184002161026, 0.7102384567260742, 0.7586368918418884, 0.8070353269577026, 0.8554337024688721, 0.9038321375846863, 0.9522305727005005, 1.00062894821167, 1.049027442932129, 1.0974258184432983, 1.1458241939544678, 1.1942226886749268, 1.2426210641860962, 1.2910194396972656, 1.3394179344177246, 1.387816309928894, 1.4362146854400635, 1.4846131801605225]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 11.0, 12.0, 11.0, 26.0, 37.0, 58.0, 77.0, 119.0, 212.0, 376.0, 722.0, 1543.0, 3463.0, 8239.0, 21265.0, 63758.0, 237497.0, 760903.0, 1392295.0, 1112261.0, 422194.0, 112685.0, 34297.0, 12438.0, 5148.0, 2295.0, 1071.0, 538.0, 301.0, 166.0, 84.0, 65.0, 36.0, 29.0, 19.0, 10.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2169189453125, -0.2077770233154297, -0.19863510131835938, -0.18949317932128906, -0.18035125732421875, -0.17120933532714844, -0.16206741333007812, -0.1529254913330078, -0.1437835693359375, -0.1346416473388672, -0.12549972534179688, -0.11635780334472656, -0.10721588134765625, -0.09807395935058594, -0.08893203735351562, -0.07979011535644531, -0.070648193359375, -0.06150627136230469, -0.052364349365234375, -0.04322242736816406, -0.03408050537109375, -0.024938583374023438, -0.015796661376953125, -0.0066547393798828125, 0.0024871826171875, 0.011629104614257812, 0.020771026611328125, 0.029912948608398438, 0.03905487060546875, 0.04819679260253906, 0.057338714599609375, 0.06648063659667969, 0.07562255859375, 0.08476448059082031, 0.09390640258789062, 0.10304832458496094, 0.11219024658203125, 0.12133216857910156, 0.13047409057617188, 0.1396160125732422, 0.1487579345703125, 0.1578998565673828, 0.16704177856445312, 0.17618370056152344, 0.18532562255859375, 0.19446754455566406, 0.20360946655273438, 0.2127513885498047, 0.221893310546875, 0.2310352325439453, 0.24017715454101562, 0.24931907653808594, 0.25846099853515625, 0.26760292053222656, 0.2767448425292969, 0.2858867645263672, 0.2950286865234375, 0.3041706085205078, 0.3133125305175781, 0.32245445251464844, 0.33159637451171875, 0.34073829650878906, 0.3498802185058594, 0.3590221405029297, 0.3681640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 6.0, 9.0, 4.0, 14.0, 13.0, 14.0, 18.0, 22.0, 26.0, 18.0, 28.0, 28.0, 38.0, 31.0, 38.0, 40.0, 35.0, 29.0, 40.0, 49.0, 40.0, 35.0, 38.0, 35.0, 41.0, 37.0, 35.0, 24.0, 23.0, 26.0, 23.0, 23.0, 23.0, 14.0, 11.0, 12.0, 12.0, 10.0, 10.0, 5.0, 7.0, 6.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.19677734375, -0.1908130645751953, -0.18484878540039062, -0.17888450622558594, -0.17292022705078125, -0.16695594787597656, -0.16099166870117188, -0.1550273895263672, -0.1490631103515625, -0.1430988311767578, -0.13713455200195312, -0.13117027282714844, -0.12520599365234375, -0.11924171447753906, -0.11327743530273438, -0.10731315612792969, -0.101348876953125, -0.09538459777832031, -0.08942031860351562, -0.08345603942871094, -0.07749176025390625, -0.07152748107910156, -0.06556320190429688, -0.05959892272949219, -0.0536346435546875, -0.04767036437988281, -0.041706085205078125, -0.03574180603027344, -0.02977752685546875, -0.023813247680664062, -0.017848968505859375, -0.011884689331054688, -0.00592041015625, 4.38690185546875e-05, 0.006008148193359375, 0.011972427368164062, 0.01793670654296875, 0.023900985717773438, 0.029865264892578125, 0.03582954406738281, 0.0417938232421875, 0.04775810241699219, 0.053722381591796875, 0.05968666076660156, 0.06565093994140625, 0.07161521911621094, 0.07757949829101562, 0.08354377746582031, 0.089508056640625, 0.09547233581542969, 0.10143661499023438, 0.10740089416503906, 0.11336517333984375, 0.11932945251464844, 0.12529373168945312, 0.1312580108642578, 0.1372222900390625, 0.1431865692138672, 0.14915084838867188, 0.15511512756347656, 0.16107940673828125, 0.16704368591308594, 0.17300796508789062, 0.1789722442626953, 0.1849365234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 4.0, 11.0, 12.0, 14.0, 27.0, 37.0, 45.0, 78.0, 109.0, 147.0, 283.0, 476.0, 830.0, 1854.0, 4171.0, 12384.0, 50770.0, 346683.0, 2881796.0, 775854.0, 89562.0, 18721.0, 5716.0, 2191.0, 1063.0, 553.0, 315.0, 176.0, 121.0, 79.0, 47.0, 47.0, 29.0, 27.0, 19.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.6123046875, -0.5956039428710938, -0.5789031982421875, -0.5622024536132812, -0.545501708984375, -0.5288009643554688, -0.5121002197265625, -0.49539947509765625, -0.47869873046875, -0.46199798583984375, -0.4452972412109375, -0.42859649658203125, -0.411895751953125, -0.39519500732421875, -0.3784942626953125, -0.36179351806640625, -0.3450927734375, -0.32839202880859375, -0.3116912841796875, -0.29499053955078125, -0.278289794921875, -0.26158905029296875, -0.2448883056640625, -0.22818756103515625, -0.21148681640625, -0.19478607177734375, -0.1780853271484375, -0.16138458251953125, -0.144683837890625, -0.12798309326171875, -0.1112823486328125, -0.09458160400390625, -0.077880859375, -0.06118011474609375, -0.0444793701171875, -0.02777862548828125, -0.011077880859375, 0.00562286376953125, 0.0223236083984375, 0.03902435302734375, 0.05572509765625, 0.07242584228515625, 0.0891265869140625, 0.10582733154296875, 0.122528076171875, 0.13922882080078125, 0.1559295654296875, 0.17263031005859375, 0.1893310546875, 0.20603179931640625, 0.2227325439453125, 0.23943328857421875, 0.256134033203125, 0.27283477783203125, 0.2895355224609375, 0.30623626708984375, 0.32293701171875, 0.33963775634765625, 0.3563385009765625, 0.37303924560546875, 0.389739990234375, 0.40644073486328125, 0.4231414794921875, 0.43984222412109375, 0.45654296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 15.0, 17.0, 20.0, 24.0, 32.0, 63.0, 73.0, 94.0, 133.0, 185.0, 245.0, 321.0, 409.0, 434.0, 429.0, 371.0, 331.0, 234.0, 164.0, 121.0, 107.0, 59.0, 44.0, 26.0, 28.0, 19.0, 17.0, 9.0, 6.0, 2.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414794921875, -0.3998985290527344, -0.38500213623046875, -0.3701057434082031, -0.3552093505859375, -0.3403129577636719, -0.32541656494140625, -0.3105201721191406, -0.295623779296875, -0.2807273864746094, -0.26583099365234375, -0.2509346008300781, -0.2360382080078125, -0.22114181518554688, -0.20624542236328125, -0.19134902954101562, -0.17645263671875, -0.16155624389648438, -0.14665985107421875, -0.13176345825195312, -0.1168670654296875, -0.10197067260742188, -0.08707427978515625, -0.07217788696289062, -0.057281494140625, -0.042385101318359375, -0.02748870849609375, -0.012592315673828125, 0.0023040771484375, 0.017200469970703125, 0.03209686279296875, 0.046993255615234375, 0.0618896484375, 0.07678604125976562, 0.09168243408203125, 0.10657882690429688, 0.1214752197265625, 0.13637161254882812, 0.15126800537109375, 0.16616439819335938, 0.181060791015625, 0.19595718383789062, 0.21085357666015625, 0.22574996948242188, 0.2406463623046875, 0.2555427551269531, 0.27043914794921875, 0.2853355407714844, 0.30023193359375, 0.3151283264160156, 0.33002471923828125, 0.3449211120605469, 0.3598175048828125, 0.3747138977050781, 0.38961029052734375, 0.4045066833496094, 0.419403076171875, 0.4342994689941406, 0.44919586181640625, 0.4640922546386719, 0.4789886474609375, 0.4938850402832031, 0.5087814331054688, 0.5236778259277344, 0.53857421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 18.0, 14.0, 27.0, 40.0, 56.0, 70.0, 91.0, 101.0, 121.0, 118.0, 104.0, 62.0, 49.0, 41.0, 22.0, 16.0, 7.0, 3.0, 5.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986452102661133, -2.839566469192505, -2.692681074142456, -2.545795440673828, -2.3989100456237793, -2.2520244121551514, -2.1051387786865234, -1.958253264427185, -1.8113677501678467, -1.6644822359085083, -1.51759672164917, -1.370711088180542, -1.2238255739212036, -1.0769400596618652, -0.9300544857978821, -0.7831689119338989, -0.6362833976745605, -0.4893978536128998, -0.342512309551239, -0.19562676548957825, -0.04874122142791748, 0.0981442928314209, 0.24502986669540405, 0.3919154405593872, 0.5388009548187256, 0.685686469078064, 0.8325720429420471, 0.9794576168060303, 1.1263431310653687, 1.273228645324707, 1.420114278793335, 1.5669997930526733, 1.7138848304748535, 1.860770344734192, 2.0076558589935303, 2.154541492462158, 2.301426887512207, 2.448312520980835, 2.595198154449463, 2.7420835494995117, 2.8889691829681396, 3.0358548164367676, 3.1827402114868164, 3.3296258449554443, 3.4765114784240723, 3.623396873474121, 3.770282506942749, 3.917168140411377, 4.064053535461426, 4.210938930511475, 4.357824802398682, 4.5047101974487305, 4.651595592498779, 4.798480987548828, 4.945366859436035, 5.092252254486084, 5.239137649536133, 5.386023044586182, 5.532908916473389, 5.6797943115234375, 5.826679706573486, 5.973565101623535, 6.120450973510742, 6.267336368560791, 6.414222240447998]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 11.0, 7.0, 12.0, 21.0, 18.0, 15.0, 25.0, 30.0, 35.0, 39.0, 45.0, 44.0, 56.0, 54.0, 46.0, 60.0, 51.0, 46.0, 55.0, 49.0, 30.0, 52.0, 33.0, 34.0, 30.0, 19.0, 17.0, 14.0, 7.0, 13.0, 7.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.424018621444702, -2.350886583328247, -2.277754545211792, -2.204622507095337, -2.131490707397461, -2.058358669281006, -1.9852266311645508, -1.9120945930480957, -1.8389625549316406, -1.7658305168151855, -1.6926984786987305, -1.619566559791565, -1.5464345216751099, -1.4733024835586548, -1.4001705646514893, -1.3270385265350342, -1.253906488418579, -1.180774450302124, -1.107642412185669, -1.0345104932785034, -0.9613784551620483, -0.8882464170455933, -0.815114438533783, -0.7419824600219727, -0.6688504219055176, -0.5957183837890625, -0.5225864052772522, -0.4494543969631195, -0.3763223886489868, -0.3031903803348541, -0.23005837202072144, -0.15692639350891113, -0.08379459381103516, -0.010662585496902466, 0.062469422817230225, 0.13560143113136292, 0.2087334394454956, 0.2818654477596283, 0.354997456073761, 0.4281294345855713, 0.5012614727020264, 0.5743935108184814, 0.6475254893302917, 0.720657467842102, 0.7937895059585571, 0.8669215440750122, 0.9400535225868225, 1.0131855010986328, 1.086317539215088, 1.159449577331543, 1.232581615447998, 1.3057135343551636, 1.3788455724716187, 1.4519776105880737, 1.5251095294952393, 1.5982415676116943, 1.6713736057281494, 1.7445056438446045, 1.8176376819610596, 1.890769600868225, 1.9639016389846802, 2.0370335578918457, 2.110165596008301, 2.183297634124756, 2.256429672241211]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 20.0, 26.0, 29.0, 53.0, 75.0, 116.0, 174.0, 266.0, 464.0, 712.0, 1261.0, 2223.0, 4181.0, 8475.0, 17478.0, 40869.0, 96047.0, 212725.0, 301375.0, 201031.0, 89548.0, 37684.0, 16849.0, 7787.0, 3874.0, 2088.0, 1232.0, 668.0, 416.0, 288.0, 151.0, 106.0, 75.0, 61.0, 31.0, 22.0, 19.0, 15.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21106910705566406, -0.20277786254882812, -0.1944866180419922, -0.18619537353515625, -0.1779041290283203, -0.16961288452148438, -0.16132164001464844, -0.1530303955078125, -0.14473915100097656, -0.13644790649414062, -0.1281566619873047, -0.11986541748046875, -0.11157417297363281, -0.10328292846679688, -0.09499168395996094, -0.086700439453125, -0.07840919494628906, -0.07011795043945312, -0.06182670593261719, -0.05353546142578125, -0.04524421691894531, -0.036952972412109375, -0.028661727905273438, -0.0203704833984375, -0.012079238891601562, -0.003787994384765625, 0.0045032501220703125, 0.01279449462890625, 0.021085739135742188, 0.029376983642578125, 0.03766822814941406, 0.04595947265625, 0.05425071716308594, 0.06254196166992188, 0.07083320617675781, 0.07912445068359375, 0.08741569519042969, 0.09570693969726562, 0.10399818420410156, 0.1122894287109375, 0.12058067321777344, 0.12887191772460938, 0.1371631622314453, 0.14545440673828125, 0.1537456512451172, 0.16203689575195312, 0.17032814025878906, 0.178619384765625, 0.18691062927246094, 0.19520187377929688, 0.2034931182861328, 0.21178436279296875, 0.2200756072998047, 0.22836685180664062, 0.23665809631347656, 0.2449493408203125, 0.25324058532714844, 0.2615318298339844, 0.2698230743408203, 0.27811431884765625, 0.2864055633544922, 0.2946968078613281, 0.30298805236816406, 0.311279296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 11.0, 10.0, 12.0, 12.0, 15.0, 19.0, 37.0, 32.0, 33.0, 28.0, 52.0, 37.0, 49.0, 43.0, 47.0, 54.0, 60.0, 48.0, 33.0, 46.0, 41.0, 34.0, 38.0, 34.0, 31.0, 23.0, 29.0, 29.0, 16.0, 14.0, 8.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2524833679199219, -0.24349212646484375, -0.23450088500976562, -0.2255096435546875, -0.21651840209960938, -0.20752716064453125, -0.19853591918945312, -0.189544677734375, -0.18055343627929688, -0.17156219482421875, -0.16257095336914062, -0.1535797119140625, -0.14458847045898438, -0.13559722900390625, -0.12660598754882812, -0.11761474609375, -0.10862350463867188, -0.09963226318359375, -0.09064102172851562, -0.0816497802734375, -0.07265853881835938, -0.06366729736328125, -0.054676055908203125, -0.045684814453125, -0.036693572998046875, -0.02770233154296875, -0.018711090087890625, -0.0097198486328125, -0.000728607177734375, 0.00826263427734375, 0.017253875732421875, 0.0262451171875, 0.035236358642578125, 0.04422760009765625, 0.053218841552734375, 0.0622100830078125, 0.07120132446289062, 0.08019256591796875, 0.08918380737304688, 0.098175048828125, 0.10716629028320312, 0.11615753173828125, 0.12514877319335938, 0.1341400146484375, 0.14313125610351562, 0.15212249755859375, 0.16111373901367188, 0.17010498046875, 0.17909622192382812, 0.18808746337890625, 0.19707870483398438, 0.2060699462890625, 0.21506118774414062, 0.22405242919921875, 0.23304367065429688, 0.242034912109375, 0.2510261535644531, 0.26001739501953125, 0.2690086364746094, 0.2779998779296875, 0.2869911193847656, 0.29598236083984375, 0.3049736022949219, 0.31396484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 0.0, 7.0, 7.0, 10.0, 13.0, 14.0, 21.0, 27.0, 50.0, 60.0, 77.0, 136.0, 272.0, 561.0, 1287.0, 3541.0, 13048.0, 77235.0, 675398.0, 237287.0, 29301.0, 6357.0, 2065.0, 823.0, 374.0, 223.0, 129.0, 74.0, 55.0, 31.0, 12.0, 14.0, 11.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.51708984375, -0.5013008117675781, -0.48551177978515625, -0.4697227478027344, -0.4539337158203125, -0.4381446838378906, -0.42235565185546875, -0.4065666198730469, -0.390777587890625, -0.3749885559082031, -0.35919952392578125, -0.3434104919433594, -0.3276214599609375, -0.3118324279785156, -0.29604339599609375, -0.2802543640136719, -0.26446533203125, -0.24867630004882812, -0.23288726806640625, -0.21709823608398438, -0.2013092041015625, -0.18552017211914062, -0.16973114013671875, -0.15394210815429688, -0.138153076171875, -0.12236404418945312, -0.10657501220703125, -0.09078598022460938, -0.0749969482421875, -0.059207916259765625, -0.04341888427734375, -0.027629852294921875, -0.0118408203125, 0.003948211669921875, 0.01973724365234375, 0.035526275634765625, 0.0513153076171875, 0.06710433959960938, 0.08289337158203125, 0.09868240356445312, 0.114471435546875, 0.13026046752929688, 0.14604949951171875, 0.16183853149414062, 0.1776275634765625, 0.19341659545898438, 0.20920562744140625, 0.22499465942382812, 0.24078369140625, 0.2565727233886719, 0.27236175537109375, 0.2881507873535156, 0.3039398193359375, 0.3197288513183594, 0.33551788330078125, 0.3513069152832031, 0.367095947265625, 0.3828849792480469, 0.39867401123046875, 0.4144630432128906, 0.4302520751953125, 0.4460411071777344, 0.46183013916015625, 0.4776191711425781, 0.493408203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 7.0, 13.0, 14.0, 19.0, 22.0, 18.0, 24.0, 38.0, 53.0, 39.0, 45.0, 38.0, 43.0, 56.0, 44.0, 60.0, 40.0, 66.0, 39.0, 41.0, 50.0, 40.0, 27.0, 34.0, 24.0, 9.0, 25.0, 10.0, 14.0, 11.0, 8.0, 1.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.69580078125, -0.6740951538085938, -0.6523895263671875, -0.6306838989257812, -0.608978271484375, -0.5872726440429688, -0.5655670166015625, -0.5438613891601562, -0.52215576171875, -0.5004501342773438, -0.4787445068359375, -0.45703887939453125, -0.435333251953125, -0.41362762451171875, -0.3919219970703125, -0.37021636962890625, -0.3485107421875, -0.32680511474609375, -0.3050994873046875, -0.28339385986328125, -0.261688232421875, -0.23998260498046875, -0.2182769775390625, -0.19657135009765625, -0.17486572265625, -0.15316009521484375, -0.1314544677734375, -0.10974884033203125, -0.088043212890625, -0.06633758544921875, -0.0446319580078125, -0.02292633056640625, -0.001220703125, 0.02048492431640625, 0.0421905517578125, 0.06389617919921875, 0.085601806640625, 0.10730743408203125, 0.1290130615234375, 0.15071868896484375, 0.17242431640625, 0.19412994384765625, 0.2158355712890625, 0.23754119873046875, 0.259246826171875, 0.28095245361328125, 0.3026580810546875, 0.32436370849609375, 0.3460693359375, 0.36777496337890625, 0.3894805908203125, 0.41118621826171875, 0.432891845703125, 0.45459747314453125, 0.4763031005859375, 0.49800872802734375, 0.51971435546875, 0.5414199829101562, 0.5631256103515625, 0.5848312377929688, 0.606536865234375, 0.6282424926757812, 0.6499481201171875, 0.6716537475585938, 0.693359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 6.0, 16.0, 15.0, 44.0, 65.0, 99.0, 162.0, 335.0, 1063.0, 7554.0, 710396.0, 321567.0, 5695.0, 884.0, 260.0, 132.0, 89.0, 64.0, 35.0, 18.0, 11.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4278221130371094, -0.41399383544921875, -0.4001655578613281, -0.3863372802734375, -0.3725090026855469, -0.35868072509765625, -0.3448524475097656, -0.331024169921875, -0.3171958923339844, -0.30336761474609375, -0.2895393371582031, -0.2757110595703125, -0.2618827819824219, -0.24805450439453125, -0.23422622680664062, -0.22039794921875, -0.20656967163085938, -0.19274139404296875, -0.17891311645507812, -0.1650848388671875, -0.15125656127929688, -0.13742828369140625, -0.12360000610351562, -0.109771728515625, -0.09594345092773438, -0.08211517333984375, -0.06828689575195312, -0.0544586181640625, -0.040630340576171875, -0.02680206298828125, -0.012973785400390625, 0.0008544921875, 0.014682769775390625, 0.02851104736328125, 0.042339324951171875, 0.0561676025390625, 0.06999588012695312, 0.08382415771484375, 0.09765243530273438, 0.111480712890625, 0.12530899047851562, 0.13913726806640625, 0.15296554565429688, 0.1667938232421875, 0.18062210083007812, 0.19445037841796875, 0.20827865600585938, 0.22210693359375, 0.23593521118164062, 0.24976348876953125, 0.2635917663574219, 0.2774200439453125, 0.2912483215332031, 0.30507659912109375, 0.3189048767089844, 0.332733154296875, 0.3465614318847656, 0.36038970947265625, 0.3742179870605469, 0.3880462646484375, 0.4018745422363281, 0.41570281982421875, 0.4295310974121094, 0.443359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 9.0, 14.0, 17.0, 26.0, 40.0, 42.0, 74.0, 88.0, 104.0, 116.0, 108.0, 83.0, 65.0, 60.0, 44.0, 36.0, 21.0, 14.0, 7.0, 2.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5462359189987183e-05, -2.4281442165374756e-05, -2.310052514076233e-05, -2.1919608116149902e-05, -2.0738691091537476e-05, -1.955777406692505e-05, -1.8376857042312622e-05, -1.7195940017700195e-05, -1.601502299308777e-05, -1.4834105968475342e-05, -1.3653188943862915e-05, -1.2472271919250488e-05, -1.1291354894638062e-05, -1.0110437870025635e-05, -8.929520845413208e-06, -7.748603820800781e-06, -6.5676867961883545e-06, -5.386769771575928e-06, -4.205852746963501e-06, -3.0249357223510742e-06, -1.8440186977386475e-06, -6.631016731262207e-07, 5.178153514862061e-07, 1.6987323760986328e-06, 2.8796494007110596e-06, 4.060566425323486e-06, 5.241483449935913e-06, 6.42240047454834e-06, 7.603317499160767e-06, 8.784234523773193e-06, 9.96515154838562e-06, 1.1146068572998047e-05, 1.2326985597610474e-05, 1.35079026222229e-05, 1.4688819646835327e-05, 1.5869736671447754e-05, 1.705065369606018e-05, 1.8231570720672607e-05, 1.9412487745285034e-05, 2.059340476989746e-05, 2.1774321794509888e-05, 2.2955238819122314e-05, 2.413615584373474e-05, 2.5317072868347168e-05, 2.6497989892959595e-05, 2.767890691757202e-05, 2.8859823942184448e-05, 3.0040740966796875e-05, 3.12216579914093e-05, 3.240257501602173e-05, 3.3583492040634155e-05, 3.476440906524658e-05, 3.594532608985901e-05, 3.7126243114471436e-05, 3.830716013908386e-05, 3.948807716369629e-05, 4.0668994188308716e-05, 4.184991121292114e-05, 4.303082823753357e-05, 4.4211745262145996e-05, 4.539266228675842e-05, 4.657357931137085e-05, 4.7754496335983276e-05, 4.89354133605957e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 12.0, 27.0, 55.0, 95.0, 244.0, 705.0, 3029.0, 44103.0, 959052.0, 37312.0, 2718.0, 687.0, 240.0, 115.0, 78.0, 36.0, 19.0, 17.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.437744140625, -0.4242668151855469, -0.41078948974609375, -0.3973121643066406, -0.3838348388671875, -0.3703575134277344, -0.35688018798828125, -0.3434028625488281, -0.329925537109375, -0.3164482116699219, -0.30297088623046875, -0.2894935607910156, -0.2760162353515625, -0.2625389099121094, -0.24906158447265625, -0.23558425903320312, -0.22210693359375, -0.20862960815429688, -0.19515228271484375, -0.18167495727539062, -0.1681976318359375, -0.15472030639648438, -0.14124298095703125, -0.12776565551757812, -0.114288330078125, -0.10081100463867188, -0.08733367919921875, -0.07385635375976562, -0.0603790283203125, -0.046901702880859375, -0.03342437744140625, -0.019947052001953125, -0.0064697265625, 0.007007598876953125, 0.02048492431640625, 0.033962249755859375, 0.0474395751953125, 0.060916900634765625, 0.07439422607421875, 0.08787155151367188, 0.101348876953125, 0.11482620239257812, 0.12830352783203125, 0.14178085327148438, 0.1552581787109375, 0.16873550415039062, 0.18221282958984375, 0.19569015502929688, 0.20916748046875, 0.22264480590820312, 0.23612213134765625, 0.24959945678710938, 0.2630767822265625, 0.2765541076660156, 0.29003143310546875, 0.3035087585449219, 0.316986083984375, 0.3304634094238281, 0.34394073486328125, 0.3574180603027344, 0.3708953857421875, 0.3843727111816406, 0.39785003662109375, 0.4113273620605469, 0.4248046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 15.0, 26.0, 45.0, 81.0, 156.0, 230.0, 217.0, 94.0, 56.0, 31.0, 12.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4721260070800781, -0.45719146728515625, -0.4422569274902344, -0.4273223876953125, -0.4123878479003906, -0.39745330810546875, -0.3825187683105469, -0.367584228515625, -0.3526496887207031, -0.33771514892578125, -0.3227806091308594, -0.3078460693359375, -0.2929115295410156, -0.27797698974609375, -0.2630424499511719, -0.24810791015625, -0.23317337036132812, -0.21823883056640625, -0.20330429077148438, -0.1883697509765625, -0.17343521118164062, -0.15850067138671875, -0.14356613159179688, -0.128631591796875, -0.11369705200195312, -0.09876251220703125, -0.08382797241210938, -0.0688934326171875, -0.053958892822265625, -0.03902435302734375, -0.024089813232421875, -0.0091552734375, 0.005779266357421875, 0.02071380615234375, 0.035648345947265625, 0.0505828857421875, 0.06551742553710938, 0.08045196533203125, 0.09538650512695312, 0.110321044921875, 0.12525558471679688, 0.14019012451171875, 0.15512466430664062, 0.1700592041015625, 0.18499374389648438, 0.19992828369140625, 0.21486282348632812, 0.22979736328125, 0.24473190307617188, 0.25966644287109375, 0.2746009826660156, 0.2895355224609375, 0.3044700622558594, 0.31940460205078125, 0.3343391418457031, 0.349273681640625, 0.3642082214355469, 0.37914276123046875, 0.3940773010253906, 0.4090118408203125, 0.4239463806152344, 0.43888092041015625, 0.4538154602050781, 0.46875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 16.0, 21.0, 24.0, 41.0, 72.0, 77.0, 134.0, 148.0, 128.0, 95.0, 79.0, 49.0, 39.0, 21.0, 14.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.244434356689453, -2.130798578262329, -2.017162799835205, -1.903527021408081, -1.7898913621902466, -1.6762555837631226, -1.5626198053359985, -1.448984146118164, -1.33534836769104, -1.221712589263916, -1.108076810836792, -0.9944410920143127, -0.8808053731918335, -0.7671695947647095, -0.6535338163375854, -0.5398980975151062, -0.4262622594833374, -0.31262651085853577, -0.19899074733257294, -0.08535498380661011, 0.02828076481819153, 0.14191651344299316, 0.2555522918701172, 0.36918801069259644, 0.48282378911972046, 0.5964595675468445, 0.7100952863693237, 0.8237310647964478, 0.9373668432235718, 1.0510025024414062, 1.1646382808685303, 1.2782740592956543, 1.3919098377227783, 1.5055456161499023, 1.6191813945770264, 1.7328171730041504, 1.8464528322219849, 1.9600886106491089, 2.0737242698669434, 2.1873600482940674, 2.3009958267211914, 2.4146316051483154, 2.5282673835754395, 2.6419031620025635, 2.7555389404296875, 2.8691744804382324, 2.9828104972839355, 3.0964460372924805, 3.2100820541381836, 3.3237178325653076, 3.4373536109924316, 3.5509893894195557, 3.6646251678466797, 3.7782607078552246, 3.8918967247009277, 4.005532264709473, 4.119167804718018, 4.2328033447265625, 4.346439361572266, 4.4600749015808105, 4.573710918426514, 4.687346458435059, 4.800982475280762, 4.914618015289307, 5.02825403213501]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 10.0, 19.0, 14.0, 16.0, 19.0, 19.0, 42.0, 47.0, 48.0, 74.0, 70.0, 68.0, 75.0, 69.0, 64.0, 66.0, 40.0, 50.0, 33.0, 30.0, 36.0, 24.0, 14.0, 11.0, 6.0, 8.0, 7.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9931352138519287, -2.894886016845703, -2.7966365814208984, -2.6983871459960938, -2.600137948989868, -2.5018887519836426, -2.403639316558838, -2.305389881134033, -2.2071406841278076, -2.108891487121582, -2.0106420516967773, -1.9123927354812622, -1.814143419265747, -1.715894103050232, -1.6176447868347168, -1.5193954706192017, -1.4211461544036865, -1.3228968381881714, -1.2246475219726562, -1.1263982057571411, -1.028148889541626, -0.9298995733261108, -0.8316502571105957, -0.7334009408950806, -0.6351516246795654, -0.5369023084640503, -0.43865299224853516, -0.34040367603302, -0.24215435981750488, -0.14390504360198975, -0.04565572738647461, 0.05259358882904053, 0.15084266662597656, 0.2490919828414917, 0.34734129905700684, 0.445590615272522, 0.5438399314880371, 0.6420892477035522, 0.7403385639190674, 0.8385878801345825, 0.9368371963500977, 1.0350865125656128, 1.133335828781128, 1.231585144996643, 1.3298344612121582, 1.4280837774276733, 1.5263330936431885, 1.6245824098587036, 1.7228317260742188, 1.8210810422897339, 1.919330358505249, 2.0175795555114746, 2.1158289909362793, 2.214078426361084, 2.3123276233673096, 2.410576820373535, 2.50882625579834, 2.6070756912231445, 2.70532488822937, 2.8035740852355957, 2.9018235206604004, 3.000072956085205, 3.0983221530914307, 3.1965713500976562, 3.294820785522461]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 14.0, 9.0, 6.0, 9.0, 14.0, 14.0, 26.0, 28.0, 31.0, 42.0, 52.0, 71.0, 148.0, 227.0, 80.0, 55.0, 32.0, 31.0, 28.0, 19.0, 8.0, 10.0, 8.0, 6.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.381103515625, -0.3696098327636719, -0.35811614990234375, -0.3466224670410156, -0.3351287841796875, -0.3236351013183594, -0.31214141845703125, -0.3006477355957031, -0.289154052734375, -0.2776603698730469, -0.26616668701171875, -0.2546730041503906, -0.2431793212890625, -0.23168563842773438, -0.22019195556640625, -0.20869827270507812, -0.19720458984375, -0.18571090698242188, -0.17421722412109375, -0.16272354125976562, -0.1512298583984375, -0.13973617553710938, -0.12824249267578125, -0.11674880981445312, -0.105255126953125, -0.09376144409179688, -0.08226776123046875, -0.07077407836914062, -0.0592803955078125, -0.047786712646484375, -0.03629302978515625, -0.024799346923828125, -0.0133056640625, -0.001811981201171875, 0.00968170166015625, 0.021175384521484375, 0.0326690673828125, 0.044162750244140625, 0.05565643310546875, 0.06715011596679688, 0.078643798828125, 0.09013748168945312, 0.10163116455078125, 0.11312484741210938, 0.1246185302734375, 0.13611221313476562, 0.14760589599609375, 0.15909957885742188, 0.17059326171875, 0.18208694458007812, 0.19358062744140625, 0.20507431030273438, 0.2165679931640625, 0.22806167602539062, 0.23955535888671875, 0.2510490417480469, 0.262542724609375, 0.2740364074707031, 0.28553009033203125, 0.2970237731933594, 0.3085174560546875, 0.3200111389160156, 0.33150482177734375, 0.3429985046386719, 0.3544921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 8.0, 21.0, 22.0, 42.0, 65.0, 133.0, 228.0, 565.0, 1584.0, 6420.0, 74690.0, 8283641.0, 16336.0, 3053.0, 920.0, 371.0, 204.0, 114.0, 51.0, 38.0, 19.0, 14.0, 17.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9379535913467407, -1.8796736001968384, -1.8213937282562256, -1.7631137371063232, -1.7048338651657104, -1.646553874015808, -1.5882740020751953, -1.529994010925293, -1.4717140197753906, -1.4134340286254883, -1.3551541566848755, -1.2968741655349731, -1.2385942935943604, -1.180314302444458, -1.1220343112945557, -1.0637544393539429, -1.00547456741333, -0.9471946358680725, -0.8889147043228149, -0.8306347131729126, -0.772354781627655, -0.7140748500823975, -0.6557949185371399, -0.5975149869918823, -0.53923499584198, -0.4809550642967224, -0.42267510294914246, -0.3643951714038849, -0.30611521005630493, -0.24783527851104736, -0.1895553469657898, -0.13127538561820984, -0.07299542427062988, -0.014715481549501419, 0.043564461171627045, 0.10184440016746521, 0.16012434661388397, 0.21840429306030273, 0.2766842246055603, 0.33496418595314026, 0.3932441174983978, 0.4515240490436554, 0.5098040103912354, 0.5680839419364929, 0.6263638734817505, 0.6846438646316528, 0.7429237365722656, 0.801203727722168, 0.8594836592674255, 0.9177635908126831, 0.9760435223579407, 1.0343234539031982, 1.0926034450531006, 1.150883436203003, 1.2091633081436157, 1.267443299293518, 1.3257231712341309, 1.3840031623840332, 1.442283034324646, 1.5005630254745483, 1.5588428974151611, 1.6171228885650635, 1.6754028797149658, 1.7336827516555786, 1.791962742805481]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4320980310440063, -1.3883832693099976, -1.3446685075759888, -1.3009538650512695, -1.2572391033172607, -1.213524341583252, -1.1698095798492432, -1.1260948181152344, -1.0823800563812256, -1.0386652946472168, -0.9949505925178528, -0.951235830783844, -0.90752112865448, -0.8638063669204712, -0.8200916051864624, -0.7763768434524536, -0.7326622009277344, -0.6889474391937256, -0.6452327370643616, -0.6015179753303528, -0.5578032732009888, -0.51408851146698, -0.4703737497329712, -0.4266590178012848, -0.3829442858695984, -0.339229553937912, -0.2955148220062256, -0.2518000602722168, -0.2080853283405304, -0.164370596408844, -0.1206558346748352, -0.0769411027431488, -0.03322649002075195, 0.010488249361515045, 0.05420298874378204, 0.09791773557662964, 0.14163246750831604, 0.18534719944000244, 0.22906196117401123, 0.27277669310569763, 0.31649142503738403, 0.36020615696907043, 0.40392088890075684, 0.4476356506347656, 0.491350382566452, 0.5350651144981384, 0.5787798762321472, 0.6224945783615112, 0.66620934009552, 0.7099241018295288, 0.7536388039588928, 0.7973535656929016, 0.8410682678222656, 0.8847830295562744, 0.9284977912902832, 0.972212553024292, 1.0159273147583008, 1.0596420764923096, 1.1033568382263184, 1.1470715999603271, 1.1907862424850464, 1.2345010042190552, 1.278215765953064, 1.3219305276870728, 1.365645170211792]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 8.0, 7.0, 16.0, 15.0, 20.0, 23.0, 31.0, 35.0, 37.0, 74.0, 57.0, 62.0, 68.0, 87.0, 70.0, 58.0, 78.0, 44.0, 46.0, 35.0, 37.0, 25.0, 17.0, 12.0, 7.0, 1.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.27188873291015625, -0.2642364501953125, -0.25658416748046875, -0.248931884765625, -0.24127960205078125, -0.2336273193359375, -0.22597503662109375, -0.21832275390625, -0.21067047119140625, -0.2030181884765625, -0.19536590576171875, -0.187713623046875, -0.18006134033203125, -0.1724090576171875, -0.16475677490234375, -0.1571044921875, -0.14945220947265625, -0.1417999267578125, -0.13414764404296875, -0.126495361328125, -0.11884307861328125, -0.1111907958984375, -0.10353851318359375, -0.09588623046875, -0.08823394775390625, -0.0805816650390625, -0.07292938232421875, -0.065277099609375, -0.05762481689453125, -0.0499725341796875, -0.04232025146484375, -0.03466796875, -0.02701568603515625, -0.0193634033203125, -0.01171112060546875, -0.004058837890625, 0.00359344482421875, 0.0112457275390625, 0.01889801025390625, 0.02655029296875, 0.03420257568359375, 0.0418548583984375, 0.04950714111328125, 0.057159423828125, 0.06481170654296875, 0.0724639892578125, 0.08011627197265625, 0.0877685546875, 0.09542083740234375, 0.1030731201171875, 0.11072540283203125, 0.118377685546875, 0.12602996826171875, 0.1336822509765625, 0.14133453369140625, 0.14898681640625, 0.15663909912109375, 0.1642913818359375, 0.17194366455078125, 0.179595947265625, 0.18724822998046875, 0.1949005126953125, 0.20255279541015625, 0.210205078125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 13.0, 17.0, 29.0, 34.0, 54.0, 76.0, 122.0, 180.0, 311.0, 540.0, 966.0, 1754.0, 3615.0, 7624.0, 17935.0, 50805.0, 192073.0, 172171.0, 45460.0, 16354.0, 6953.0, 3319.0, 1690.0, 894.0, 477.0, 298.0, 168.0, 124.0, 78.0, 37.0, 29.0, 16.0, 13.0, 8.0, 11.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.532928466796875, -2.42718505859375, -2.321441650390625, -2.2156982421875, -2.109954833984375, -2.00421142578125, -1.898468017578125, -1.792724609375, -1.686981201171875, -1.58123779296875, -1.475494384765625, -1.3697509765625, -1.264007568359375, -1.15826416015625, -1.052520751953125, -0.94677734375, -0.841033935546875, -0.73529052734375, -0.629547119140625, -0.5238037109375, -0.418060302734375, -0.31231689453125, -0.206573486328125, -0.100830078125, 0.004913330078125, 0.11065673828125, 0.216400146484375, 0.3221435546875, 0.427886962890625, 0.53363037109375, 0.639373779296875, 0.7451171875, 0.850860595703125, 0.95660400390625, 1.062347412109375, 1.1680908203125, 1.273834228515625, 1.37957763671875, 1.485321044921875, 1.591064453125, 1.696807861328125, 1.80255126953125, 1.908294677734375, 2.0140380859375, 2.119781494140625, 2.22552490234375, 2.331268310546875, 2.43701171875, 2.542755126953125, 2.64849853515625, 2.754241943359375, 2.8599853515625, 2.965728759765625, 3.07147216796875, 3.177215576171875, 3.282958984375, 3.388702392578125, 3.49444580078125, 3.600189208984375, 3.7059326171875, 3.811676025390625, 3.91741943359375, 4.023162841796875, 4.12890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 13.0, 17.0, 15.0, 17.0, 18.0, 18.0, 27.0, 27.0, 34.0, 33.0, 37.0, 56.0, 49.0, 59.0, 51.0, 52.0, 61.0, 44.0, 51.0, 33.0, 36.0, 29.0, 37.0, 24.0, 21.0, 24.0, 24.0, 22.0, 10.0, 13.0, 11.0, 4.0, 2.0, 9.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2611961364746094, -0.25237274169921875, -0.24354934692382812, -0.2347259521484375, -0.22590255737304688, -0.21707916259765625, -0.20825576782226562, -0.199432373046875, -0.19060897827148438, -0.18178558349609375, -0.17296218872070312, -0.1641387939453125, -0.15531539916992188, -0.14649200439453125, -0.13766860961914062, -0.12884521484375, -0.12002182006835938, -0.11119842529296875, -0.10237503051757812, -0.0935516357421875, -0.08472824096679688, -0.07590484619140625, -0.06708145141601562, -0.058258056640625, -0.049434661865234375, -0.04061126708984375, -0.031787872314453125, -0.0229644775390625, -0.014141082763671875, -0.00531768798828125, 0.003505706787109375, 0.0123291015625, 0.021152496337890625, 0.02997589111328125, 0.038799285888671875, 0.0476226806640625, 0.056446075439453125, 0.06526947021484375, 0.07409286499023438, 0.082916259765625, 0.09173965454101562, 0.10056304931640625, 0.10938644409179688, 0.1182098388671875, 0.12703323364257812, 0.13585662841796875, 0.14468002319335938, 0.15350341796875, 0.16232681274414062, 0.17115020751953125, 0.17997360229492188, 0.1887969970703125, 0.19762039184570312, 0.20644378662109375, 0.21526718139648438, 0.224090576171875, 0.23291397094726562, 0.24173736572265625, 0.2505607604980469, 0.2593841552734375, 0.2682075500488281, 0.27703094482421875, 0.2858543395996094, 0.294677734375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 11.0, 8.0, 18.0, 12.0, 11.0, 21.0, 22.0, 33.0, 41.0, 37.0, 52.0, 43.0, 39.0, 30.0, 22.0, 20.0, 13.0, 6.0, 13.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0747687816619873, -1.0402421951293945, -1.0057154893875122, -0.9711889028549194, -0.9366622567176819, -0.9021356105804443, -0.8676090240478516, -0.833082377910614, -0.7985557317733765, -0.7640290856361389, -0.7295024991035461, -0.6949758529663086, -0.660449206829071, -0.6259225606918335, -0.5913959741592407, -0.5568693280220032, -0.5223427414894104, -0.48781612515449524, -0.4532894790172577, -0.41876286268234253, -0.384236216545105, -0.3497096002101898, -0.31518298387527466, -0.2806563377380371, -0.24612972140312195, -0.2116030901670456, -0.17707645893096924, -0.14254984259605408, -0.10802321135997772, -0.07349658012390137, -0.038969963788986206, -0.004443332552909851, 0.030083298683166504, 0.06460992991924286, 0.09913655370473862, 0.13366317749023438, 0.16818980872631073, 0.20271643996238708, 0.23724305629730225, 0.2717697024345398, 0.30629631876945496, 0.3408229351043701, 0.37534958124160767, 0.4098761975765228, 0.444402813911438, 0.47892946004867554, 0.5134561061859131, 0.5479826927185059, 0.5825093388557434, 0.617035984992981, 0.6515625715255737, 0.6860892176628113, 0.7206158638000488, 0.7551424503326416, 0.7896690964698792, 0.8241957426071167, 0.8587223291397095, 0.893248975276947, 0.9277755618095398, 0.9623022079467773, 0.9968288540840149, 1.0313555002212524, 1.0658820867538452, 1.100408673286438, 1.1349353790283203]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 5.0, 1.0, 13.0, 1.0, 9.0, 11.0, 15.0, 16.0, 19.0, 23.0, 35.0, 34.0, 47.0, 40.0, 52.0, 33.0, 27.0, 17.0, 15.0, 8.0, 8.0, 4.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.28456449508667, -1.245125412940979, -1.205686330795288, -1.1662472486495972, -1.1268081665039062, -1.0873689651489258, -1.0479298830032349, -1.008490800857544, -0.969051718711853, -0.9296126365661621, -0.8901735544204712, -0.8507344126701355, -0.8112953305244446, -0.7718562483787537, -0.732417106628418, -0.692978024482727, -0.6535389423370361, -0.6140998601913452, -0.5746607780456543, -0.5352216362953186, -0.4957825541496277, -0.45634347200393677, -0.41690436005592346, -0.37746524810791016, -0.33802616596221924, -0.2985870838165283, -0.259147971868515, -0.2197088748216629, -0.1802697777748108, -0.14083068072795868, -0.10139158368110657, -0.06195247173309326, -0.022513389587402344, 0.016925707459449768, 0.05636480450630188, 0.09580390155315399, 0.1352429986000061, 0.17468209564685822, 0.21412119269371033, 0.25356030464172363, 0.29299938678741455, 0.33243846893310547, 0.3718775808811188, 0.4113166928291321, 0.450755774974823, 0.4901948571205139, 0.5296339988708496, 0.5690730810165405, 0.6085121631622314, 0.6479512453079224, 0.6873903274536133, 0.726829469203949, 0.7662685513496399, 0.8057076334953308, 0.8451467752456665, 0.8845858573913574, 0.9240249395370483, 0.9634640216827393, 1.0029031038284302, 1.042342185974121, 1.0817813873291016, 1.1212204694747925, 1.1606595516204834, 1.2000986337661743, 1.2395377159118652]}, "eval/loss": 3.0510671138763428, "eval/bleu": 1.5827445667544166e-18, "eval/runtime": 2619.9089, "eval/samples_per_second": 5.634, "eval/steps_per_second": 0.704, "train/train_runtime": 93795.5595, "train/train_samples_per_second": 6.633, "train/train_steps_per_second": 0.104, "train/total_flos": 0.0, "train/train_loss": 3.260483605049765} \ No newline at end of file