diff --git "a/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" "b/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" --- "a/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" +++ "b/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.2698, "train/learning_rate": 1.8436619718309862e-06, "train/epoch": 23.54, "train/global_step": 21000, "_runtime": 28161, "_timestamp": 1648169501, "_step": 4502, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 5.0, 4.0, 5.0, 13.0, 9.0, 10.0, 10.0, 18.0, 13.0, 20.0, 20.0, 37.0, 28.0, 49.0, 40.0, 44.0, 46.0, 46.0, 47.0, 44.0, 46.0, 56.0, 44.0, 46.0, 55.0, 45.0, 30.0, 29.0, 31.0, 14.0, 12.0, 18.0, 18.0, 12.0, 8.0, 6.0, 7.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.981430053710938, -12.646739959716797, -12.312049865722656, -11.977359771728516, -11.642669677734375, -11.307978630065918, -10.973288536071777, -10.638598442077637, -10.303908348083496, -9.969218254089355, -9.634528160095215, -9.299838066101074, -8.965147018432617, -8.630456924438477, -8.295766830444336, -7.961076736450195, -7.626386642456055, -7.291696548461914, -6.957006454467773, -6.622315883636475, -6.287625789642334, -5.952935695648193, -5.6182451248168945, -5.283555030822754, -4.948864936828613, -4.614174842834473, -4.279484748840332, -3.944794178009033, -3.6101040840148926, -3.275413990020752, -2.9407236576080322, -2.6060333251953125, -2.271343231201172, -1.9366530179977417, -1.6019628047943115, -1.2672725915908813, -0.9325823783874512, -0.597892165184021, -0.2632019519805908, 0.0714883804321289, 0.40617847442626953, 0.7408686876296997, 1.0755589008331299, 1.41024911403656, 1.7449393272399902, 2.079629421234131, 2.4143197536468506, 2.7490100860595703, 3.083700180053711, 3.4183902740478516, 3.7530806064605713, 4.087770938873291, 4.422461032867432, 4.757151126861572, 5.091841697692871, 5.426531791687012, 5.761221885681152, 6.095911979675293, 6.430602073669434, 6.765292644500732, 7.099982738494873, 7.434672832489014, 7.7693634033203125, 8.104053497314453, 8.438743591308594]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 15.0, 12.0, 17.0, 16.0, 22.0, 26.0, 19.0, 22.0, 23.0, 38.0, 37.0, 37.0, 29.0, 50.0, 33.0, 44.0, 49.0, 35.0, 28.0, 52.0, 36.0, 30.0, 39.0, 41.0, 34.0, 33.0, 26.0, 15.0, 25.0, 17.0, 11.0, 13.0, 13.0, 11.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.618212699890137, -9.323406219482422, -9.028599739074707, -8.733793258666992, -8.438987731933594, -8.144181251525879, -7.849374771118164, -7.554568290710449, -7.259761810302734, -6.9649553298950195, -6.670148849487305, -6.375342845916748, -6.080536365509033, -5.785729885101318, -5.490923881530762, -5.196117401123047, -4.901310920715332, -4.606504440307617, -4.311697959899902, -4.016891956329346, -3.722085475921631, -3.427278995513916, -3.1324727535247803, -2.8376665115356445, -2.5428600311279297, -2.248053550720215, -1.953247308731079, -1.6584409475326538, -1.3636345863342285, -1.0688282251358032, -0.7740218639373779, -0.4792156219482422, -0.18440914154052734, 0.11039721965789795, 0.40520358085632324, 0.7000099420547485, 0.9948163032531738, 1.2896226644515991, 1.5844290256500244, 1.8792352676391602, 2.174041748046875, 2.46884822845459, 2.7636544704437256, 3.0584607124328613, 3.353267192840576, 3.648073673248291, 3.9428799152374268, 4.2376861572265625, 4.532492637634277, 4.827299118041992, 5.122105598449707, 5.416911602020264, 5.7117180824279785, 6.006524562835693, 6.30133056640625, 6.596137046813965, 6.89094352722168, 7.1857500076293945, 7.480556488037109, 7.775362491607666, 8.070169448852539, 8.364974975585938, 8.659781455993652, 8.954587936401367, 9.249394416809082]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 7.0, 8.0, 7.0, 21.0, 29.0, 47.0, 60.0, 83.0, 145.0, 219.0, 372.0, 520.0, 795.0, 1278.0, 1922.0, 3016.0, 4307.0, 6816.0, 10469.0, 16196.0, 24939.0, 39269.0, 60206.0, 92172.0, 140268.0, 214920.0, 320295.0, 456301.0, 578334.0, 602154.0, 508242.0, 371726.0, 254118.0, 168718.0, 111143.0, 72107.0, 46901.0, 30598.0, 19473.0, 12688.0, 8281.0, 5209.0, 3509.0, 2165.0, 1494.0, 977.0, 623.0, 407.0, 269.0, 167.0, 119.0, 62.0, 31.0, 43.0, 18.0, 9.0, 9.0, 7.0, 0.0, 4.0, 2.0], "bins": [-11.2421875, -10.89306640625, -10.5439453125, -10.19482421875, -9.845703125, -9.49658203125, -9.1474609375, -8.79833984375, -8.44921875, -8.10009765625, -7.7509765625, -7.40185546875, -7.052734375, -6.70361328125, -6.3544921875, -6.00537109375, -5.65625, -5.30712890625, -4.9580078125, -4.60888671875, -4.259765625, -3.91064453125, -3.5615234375, -3.21240234375, -2.86328125, -2.51416015625, -2.1650390625, -1.81591796875, -1.466796875, -1.11767578125, -0.7685546875, -0.41943359375, -0.0703125, 0.27880859375, 0.6279296875, 0.97705078125, 1.326171875, 1.67529296875, 2.0244140625, 2.37353515625, 2.72265625, 3.07177734375, 3.4208984375, 3.77001953125, 4.119140625, 4.46826171875, 4.8173828125, 5.16650390625, 5.515625, 5.86474609375, 6.2138671875, 6.56298828125, 6.912109375, 7.26123046875, 7.6103515625, 7.95947265625, 8.30859375, 8.65771484375, 9.0068359375, 9.35595703125, 9.705078125, 10.05419921875, 10.4033203125, 10.75244140625, 11.1015625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 14.0, 16.0, 19.0, 14.0, 18.0, 25.0, 23.0, 21.0, 28.0, 40.0, 21.0, 35.0, 45.0, 29.0, 37.0, 32.0, 33.0, 35.0, 39.0, 32.0, 37.0, 35.0, 30.0, 53.0, 33.0, 34.0, 29.0, 20.0, 16.0, 14.0, 14.0, 14.0, 18.0, 8.0, 12.0, 9.0, 1.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.7734375, -9.472412109375, -9.17138671875, -8.870361328125, -8.5693359375, -8.268310546875, -7.96728515625, -7.666259765625, -7.365234375, -7.064208984375, -6.76318359375, -6.462158203125, -6.1611328125, -5.860107421875, -5.55908203125, -5.258056640625, -4.95703125, -4.656005859375, -4.35498046875, -4.053955078125, -3.7529296875, -3.451904296875, -3.15087890625, -2.849853515625, -2.548828125, -2.247802734375, -1.94677734375, -1.645751953125, -1.3447265625, -1.043701171875, -0.74267578125, -0.441650390625, -0.140625, 0.160400390625, 0.46142578125, 0.762451171875, 1.0634765625, 1.364501953125, 1.66552734375, 1.966552734375, 2.267578125, 2.568603515625, 2.86962890625, 3.170654296875, 3.4716796875, 3.772705078125, 4.07373046875, 4.374755859375, 4.67578125, 4.976806640625, 5.27783203125, 5.578857421875, 5.8798828125, 6.180908203125, 6.48193359375, 6.782958984375, 7.083984375, 7.385009765625, 7.68603515625, 7.987060546875, 8.2880859375, 8.589111328125, 8.89013671875, 9.191162109375, 9.4921875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 10.0, 22.0, 28.0, 52.0, 75.0, 118.0, 190.0, 340.0, 522.0, 843.0, 1308.0, 2074.0, 3405.0, 5344.0, 8691.0, 14098.0, 22372.0, 36517.0, 58581.0, 93363.0, 146320.0, 224243.0, 332323.0, 463920.0, 583071.0, 604563.0, 506673.0, 373356.0, 255562.0, 168013.0, 108195.0, 68103.0, 42417.0, 26441.0, 16490.0, 10122.0, 6164.0, 3896.0, 2450.0, 1598.0, 886.0, 546.0, 346.0, 232.0, 143.0, 103.0, 42.0, 51.0, 24.0, 14.0, 8.0, 5.0, 1.0, 3.0, 3.0], "bins": [-11.921875, -11.5728759765625, -11.223876953125, -10.8748779296875, -10.52587890625, -10.1768798828125, -9.827880859375, -9.4788818359375, -9.1298828125, -8.7808837890625, -8.431884765625, -8.0828857421875, -7.73388671875, -7.3848876953125, -7.035888671875, -6.6868896484375, -6.337890625, -5.9888916015625, -5.639892578125, -5.2908935546875, -4.94189453125, -4.5928955078125, -4.243896484375, -3.8948974609375, -3.5458984375, -3.1968994140625, -2.847900390625, -2.4989013671875, -2.14990234375, -1.8009033203125, -1.451904296875, -1.1029052734375, -0.75390625, -0.4049072265625, -0.055908203125, 0.2930908203125, 0.64208984375, 0.9910888671875, 1.340087890625, 1.6890869140625, 2.0380859375, 2.3870849609375, 2.736083984375, 3.0850830078125, 3.43408203125, 3.7830810546875, 4.132080078125, 4.4810791015625, 4.830078125, 5.1790771484375, 5.528076171875, 5.8770751953125, 6.22607421875, 6.5750732421875, 6.924072265625, 7.2730712890625, 7.6220703125, 7.9710693359375, 8.320068359375, 8.6690673828125, 9.01806640625, 9.3670654296875, 9.716064453125, 10.0650634765625, 10.4140625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 8.0, 12.0, 15.0, 18.0, 23.0, 28.0, 54.0, 44.0, 66.0, 68.0, 72.0, 109.0, 157.0, 169.0, 215.0, 228.0, 238.0, 274.0, 247.0, 285.0, 274.0, 243.0, 211.0, 174.0, 147.0, 146.0, 103.0, 93.0, 78.0, 53.0, 51.0, 46.0, 17.0, 22.0, 27.0, 17.0, 8.0, 8.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.72607421875, -5.5498046875, -5.37353515625, -5.197265625, -5.02099609375, -4.8447265625, -4.66845703125, -4.4921875, -4.31591796875, -4.1396484375, -3.96337890625, -3.787109375, -3.61083984375, -3.4345703125, -3.25830078125, -3.08203125, -2.90576171875, -2.7294921875, -2.55322265625, -2.376953125, -2.20068359375, -2.0244140625, -1.84814453125, -1.671875, -1.49560546875, -1.3193359375, -1.14306640625, -0.966796875, -0.79052734375, -0.6142578125, -0.43798828125, -0.26171875, -0.08544921875, 0.0908203125, 0.26708984375, 0.443359375, 0.61962890625, 0.7958984375, 0.97216796875, 1.1484375, 1.32470703125, 1.5009765625, 1.67724609375, 1.853515625, 2.02978515625, 2.2060546875, 2.38232421875, 2.55859375, 2.73486328125, 2.9111328125, 3.08740234375, 3.263671875, 3.43994140625, 3.6162109375, 3.79248046875, 3.96875, 4.14501953125, 4.3212890625, 4.49755859375, 4.673828125, 4.85009765625, 5.0263671875, 5.20263671875, 5.37890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 4.0, 6.0, 2.0, 4.0, 5.0, 10.0, 16.0, 11.0, 18.0, 24.0, 30.0, 28.0, 29.0, 38.0, 31.0, 45.0, 42.0, 46.0, 42.0, 40.0, 49.0, 53.0, 43.0, 48.0, 35.0, 40.0, 33.0, 40.0, 24.0, 22.0, 28.0, 14.0, 22.0, 19.0, 17.0, 16.0, 12.0, 2.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.513638496398926, -13.121552467346191, -12.729466438293457, -12.337380409240723, -11.945294380187988, -11.553208351135254, -11.161123275756836, -10.769037246704102, -10.376951217651367, -9.984865188598633, -9.592779159545898, -9.200693130493164, -8.80860710144043, -8.416521072387695, -8.024435043334961, -7.632349491119385, -7.240262985229492, -6.848176956176758, -6.456090927124023, -6.064004898071289, -5.671918869018555, -5.27983283996582, -4.887747287750244, -4.49566125869751, -4.103575229644775, -3.711489200592041, -3.3194031715393066, -2.9273173809051514, -2.535231351852417, -2.1431453227996826, -1.7510595321655273, -1.358973503112793, -0.966888427734375, -0.5748024582862854, -0.1827164888381958, 0.20936942100524902, 0.6014554500579834, 0.9935414791107178, 1.385627269744873, 1.7777132987976074, 2.169799327850342, 2.561885356903076, 2.9539713859558105, 3.346057176589966, 3.7381432056427, 4.1302289962768555, 4.52231502532959, 4.914401054382324, 5.306487083435059, 5.698573112487793, 6.090659141540527, 6.482745170593262, 6.874831199645996, 7.2669172286987305, 7.659002780914307, 8.051088333129883, 8.443174362182617, 8.835260391235352, 9.227346420288086, 9.61943244934082, 10.011518478393555, 10.403604507446289, 10.795690536499023, 11.187776565551758, 11.579862594604492]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 3.0, 6.0, 6.0, 20.0, 20.0, 24.0, 13.0, 17.0, 20.0, 31.0, 19.0, 31.0, 28.0, 33.0, 31.0, 37.0, 43.0, 27.0, 39.0, 45.0, 39.0, 38.0, 51.0, 39.0, 36.0, 34.0, 35.0, 25.0, 24.0, 28.0, 21.0, 23.0, 19.0, 16.0, 13.0, 7.0, 7.0, 8.0, 5.0, 5.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.48029899597168, -11.11240291595459, -10.744505882263184, -10.376609802246094, -10.008712768554688, -9.640816688537598, -9.272920608520508, -8.905023574829102, -8.537127494812012, -8.169231414794922, -7.801334381103516, -7.433438301086426, -7.065541744232178, -6.69764518737793, -6.32974910736084, -5.961852550506592, -5.593955993652344, -5.226059436798096, -4.858162879943848, -4.490266799926758, -4.12237024307251, -3.7544736862182617, -3.3865773677825928, -3.018681049346924, -2.650784492492676, -2.2828879356384277, -1.9149916172027588, -1.5470951795578003, -1.1791987419128418, -0.8113023042678833, -0.4434058666229248, -0.07550954818725586, 0.2923870086669922, 0.6602834463119507, 1.0281798839569092, 1.3960763216018677, 1.7639727592468262, 2.131869316101074, 2.499765634536743, 2.867661952972412, 3.23555850982666, 3.603455066680908, 3.971351385116577, 4.339247703552246, 4.707144260406494, 5.075040817260742, 5.442936897277832, 5.81083345413208, 6.178730010986328, 6.546626567840576, 6.914523124694824, 7.282419204711914, 7.650315761566162, 8.01821231842041, 8.3861083984375, 8.754005432128906, 9.121901512145996, 9.489797592163086, 9.857694625854492, 10.225590705871582, 10.593486785888672, 10.961383819580078, 11.329279899597168, 11.697175979614258, 12.065073013305664]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 8.0, 3.0, 10.0, 15.0, 14.0, 24.0, 27.0, 48.0, 60.0, 83.0, 121.0, 206.0, 290.0, 474.0, 662.0, 971.0, 1453.0, 2292.0, 3578.0, 5762.0, 9238.0, 15306.0, 25022.0, 41442.0, 65389.0, 99706.0, 138315.0, 165104.0, 151970.0, 114336.0, 77675.0, 49384.0, 30472.0, 18662.0, 11390.0, 6843.0, 4274.0, 2729.0, 1711.0, 1158.0, 747.0, 495.0, 344.0, 230.0, 163.0, 105.0, 89.0, 58.0, 31.0, 21.0, 21.0, 13.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.63671875, -4.48565673828125, -4.3345947265625, -4.18353271484375, -4.032470703125, -3.88140869140625, -3.7303466796875, -3.57928466796875, -3.42822265625, -3.27716064453125, -3.1260986328125, -2.97503662109375, -2.823974609375, -2.67291259765625, -2.5218505859375, -2.37078857421875, -2.2197265625, -2.06866455078125, -1.9176025390625, -1.76654052734375, -1.615478515625, -1.46441650390625, -1.3133544921875, -1.16229248046875, -1.01123046875, -0.86016845703125, -0.7091064453125, -0.55804443359375, -0.406982421875, -0.25592041015625, -0.1048583984375, 0.04620361328125, 0.197265625, 0.34832763671875, 0.4993896484375, 0.65045166015625, 0.801513671875, 0.95257568359375, 1.1036376953125, 1.25469970703125, 1.40576171875, 1.55682373046875, 1.7078857421875, 1.85894775390625, 2.010009765625, 2.16107177734375, 2.3121337890625, 2.46319580078125, 2.6142578125, 2.76531982421875, 2.9163818359375, 3.06744384765625, 3.218505859375, 3.36956787109375, 3.5206298828125, 3.67169189453125, 3.82275390625, 3.97381591796875, 4.1248779296875, 4.27593994140625, 4.427001953125, 4.57806396484375, 4.7291259765625, 4.88018798828125, 5.03125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 7.0, 3.0, 10.0, 14.0, 9.0, 8.0, 19.0, 22.0, 21.0, 22.0, 27.0, 28.0, 31.0, 34.0, 35.0, 42.0, 47.0, 32.0, 26.0, 55.0, 43.0, 49.0, 44.0, 35.0, 45.0, 44.0, 36.0, 35.0, 31.0, 23.0, 17.0, 24.0, 19.0, 14.0, 7.0, 7.0, 12.0, 3.0, 5.0, 5.0, 1.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.60009765625, -12.1767578125, -11.75341796875, -11.330078125, -10.90673828125, -10.4833984375, -10.06005859375, -9.63671875, -9.21337890625, -8.7900390625, -8.36669921875, -7.943359375, -7.52001953125, -7.0966796875, -6.67333984375, -6.25, -5.82666015625, -5.4033203125, -4.97998046875, -4.556640625, -4.13330078125, -3.7099609375, -3.28662109375, -2.86328125, -2.43994140625, -2.0166015625, -1.59326171875, -1.169921875, -0.74658203125, -0.3232421875, 0.10009765625, 0.5234375, 0.94677734375, 1.3701171875, 1.79345703125, 2.216796875, 2.64013671875, 3.0634765625, 3.48681640625, 3.91015625, 4.33349609375, 4.7568359375, 5.18017578125, 5.603515625, 6.02685546875, 6.4501953125, 6.87353515625, 7.296875, 7.72021484375, 8.1435546875, 8.56689453125, 8.990234375, 9.41357421875, 9.8369140625, 10.26025390625, 10.68359375, 11.10693359375, 11.5302734375, 11.95361328125, 12.376953125, 12.80029296875, 13.2236328125, 13.64697265625, 14.0703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 10.0, 12.0, 14.0, 18.0, 26.0, 29.0, 44.0, 99.0, 146.0, 264.0, 688.0, 1872.0, 6283.0, 24898.0, 672361.0, 312133.0, 21219.0, 5468.0, 1689.0, 615.0, 274.0, 146.0, 74.0, 51.0, 43.0, 17.0, 18.0, 15.0, 14.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.9375, -21.250732421875, -20.56396484375, -19.877197265625, -19.1904296875, -18.503662109375, -17.81689453125, -17.130126953125, -16.443359375, -15.756591796875, -15.06982421875, -14.383056640625, -13.6962890625, -13.009521484375, -12.32275390625, -11.635986328125, -10.94921875, -10.262451171875, -9.57568359375, -8.888916015625, -8.2021484375, -7.515380859375, -6.82861328125, -6.141845703125, -5.455078125, -4.768310546875, -4.08154296875, -3.394775390625, -2.7080078125, -2.021240234375, -1.33447265625, -0.647705078125, 0.0390625, 0.725830078125, 1.41259765625, 2.099365234375, 2.7861328125, 3.472900390625, 4.15966796875, 4.846435546875, 5.533203125, 6.219970703125, 6.90673828125, 7.593505859375, 8.2802734375, 8.967041015625, 9.65380859375, 10.340576171875, 11.02734375, 11.714111328125, 12.40087890625, 13.087646484375, 13.7744140625, 14.461181640625, 15.14794921875, 15.834716796875, 16.521484375, 17.208251953125, 17.89501953125, 18.581787109375, 19.2685546875, 19.955322265625, 20.64208984375, 21.328857421875, 22.015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 15.0, 10.0, 16.0, 9.0, 14.0, 22.0, 24.0, 19.0, 24.0, 33.0, 36.0, 38.0, 35.0, 44.0, 29.0, 45.0, 51.0, 45.0, 46.0, 48.0, 50.0, 51.0, 30.0, 29.0, 35.0, 34.0, 29.0, 30.0, 15.0, 23.0, 15.0, 10.0, 9.0, 9.0, 5.0, 2.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.7421875, -12.3887939453125, -12.035400390625, -11.6820068359375, -11.32861328125, -10.9752197265625, -10.621826171875, -10.2684326171875, -9.9150390625, -9.5616455078125, -9.208251953125, -8.8548583984375, -8.50146484375, -8.1480712890625, -7.794677734375, -7.4412841796875, -7.087890625, -6.7344970703125, -6.381103515625, -6.0277099609375, -5.67431640625, -5.3209228515625, -4.967529296875, -4.6141357421875, -4.2607421875, -3.9073486328125, -3.553955078125, -3.2005615234375, -2.84716796875, -2.4937744140625, -2.140380859375, -1.7869873046875, -1.43359375, -1.0802001953125, -0.726806640625, -0.3734130859375, -0.02001953125, 0.3333740234375, 0.686767578125, 1.0401611328125, 1.3935546875, 1.7469482421875, 2.100341796875, 2.4537353515625, 2.80712890625, 3.1605224609375, 3.513916015625, 3.8673095703125, 4.220703125, 4.5740966796875, 4.927490234375, 5.2808837890625, 5.63427734375, 5.9876708984375, 6.341064453125, 6.6944580078125, 7.0478515625, 7.4012451171875, 7.754638671875, 8.1080322265625, 8.46142578125, 8.8148193359375, 9.168212890625, 9.5216064453125, 9.875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 7.0, 18.0, 12.0, 20.0, 26.0, 55.0, 67.0, 76.0, 156.0, 241.0, 460.0, 785.0, 1536.0, 3244.0, 7438.0, 22435.0, 290144.0, 679050.0, 26986.0, 8510.0, 3529.0, 1696.0, 856.0, 436.0, 274.0, 153.0, 94.0, 65.0, 37.0, 40.0, 34.0, 21.0, 9.0, 12.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.482421875, -3.366607666015625, -3.25079345703125, -3.134979248046875, -3.0191650390625, -2.903350830078125, -2.78753662109375, -2.671722412109375, -2.555908203125, -2.440093994140625, -2.32427978515625, -2.208465576171875, -2.0926513671875, -1.976837158203125, -1.86102294921875, -1.745208740234375, -1.62939453125, -1.513580322265625, -1.39776611328125, -1.281951904296875, -1.1661376953125, -1.050323486328125, -0.93450927734375, -0.818695068359375, -0.702880859375, -0.587066650390625, -0.47125244140625, -0.355438232421875, -0.2396240234375, -0.123809814453125, -0.00799560546875, 0.107818603515625, 0.2236328125, 0.339447021484375, 0.45526123046875, 0.571075439453125, 0.6868896484375, 0.802703857421875, 0.91851806640625, 1.034332275390625, 1.150146484375, 1.265960693359375, 1.38177490234375, 1.497589111328125, 1.6134033203125, 1.729217529296875, 1.84503173828125, 1.960845947265625, 2.07666015625, 2.192474365234375, 2.30828857421875, 2.424102783203125, 2.5399169921875, 2.655731201171875, 2.77154541015625, 2.887359619140625, 3.003173828125, 3.118988037109375, 3.23480224609375, 3.350616455078125, 3.4664306640625, 3.582244873046875, 3.69805908203125, 3.813873291015625, 3.9296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 4.0, 11.0, 18.0, 12.0, 21.0, 25.0, 35.0, 38.0, 46.0, 63.0, 66.0, 79.0, 82.0, 71.0, 87.0, 65.0, 54.0, 33.0, 32.0, 33.0, 28.0, 26.0, 14.0, 8.0, 6.0, 4.0, 4.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023829936981201172, -0.00023101456463336945, -0.00022372975945472717, -0.0002164449542760849, -0.00020916014909744263, -0.00020187534391880035, -0.00019459053874015808, -0.0001873057335615158, -0.00018002092838287354, -0.00017273612320423126, -0.000165451318025589, -0.00015816651284694672, -0.00015088170766830444, -0.00014359690248966217, -0.0001363120973110199, -0.00012902729213237762, -0.00012174248695373535, -0.00011445768177509308, -0.0001071728765964508, -9.988807141780853e-05, -9.260326623916626e-05, -8.531846106052399e-05, -7.803365588188171e-05, -7.074885070323944e-05, -6.346404552459717e-05, -5.6179240345954895e-05, -4.889443516731262e-05, -4.160962998867035e-05, -3.4324824810028076e-05, -2.7040019631385803e-05, -1.975521445274353e-05, -1.2470409274101257e-05, -5.185604095458984e-06, 2.0992010831832886e-06, 9.384006261825562e-06, 1.6668811440467834e-05, 2.3953616619110107e-05, 3.123842179775238e-05, 3.852322697639465e-05, 4.5808032155036926e-05, 5.30928373336792e-05, 6.037764251232147e-05, 6.766244769096375e-05, 7.494725286960602e-05, 8.223205804824829e-05, 8.951686322689056e-05, 9.680166840553284e-05, 0.00010408647358417511, 0.00011137127876281738, 0.00011865608394145966, 0.00012594088912010193, 0.0001332256942987442, 0.00014051049947738647, 0.00014779530465602875, 0.00015508010983467102, 0.0001623649150133133, 0.00016964972019195557, 0.00017693452537059784, 0.0001842193305492401, 0.00019150413572788239, 0.00019878894090652466, 0.00020607374608516693, 0.0002133585512638092, 0.00022064335644245148, 0.00022792816162109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 10.0, 14.0, 15.0, 32.0, 47.0, 69.0, 99.0, 131.0, 225.0, 344.0, 509.0, 749.0, 1067.0, 1563.0, 2370.0, 3712.0, 6072.0, 9899.0, 16800.0, 29805.0, 54783.0, 96989.0, 158531.0, 212669.0, 181089.0, 116705.0, 66030.0, 36179.0, 20347.0, 11623.0, 7167.0, 4323.0, 2822.0, 1945.0, 1261.0, 847.0, 575.0, 348.0, 288.0, 167.0, 111.0, 63.0, 52.0, 37.0, 33.0, 9.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9345703125, -1.8753509521484375, -1.816131591796875, -1.7569122314453125, -1.69769287109375, -1.6384735107421875, -1.579254150390625, -1.5200347900390625, -1.4608154296875, -1.4015960693359375, -1.342376708984375, -1.2831573486328125, -1.22393798828125, -1.1647186279296875, -1.105499267578125, -1.0462799072265625, -0.987060546875, -0.9278411865234375, -0.868621826171875, -0.8094024658203125, -0.75018310546875, -0.6909637451171875, -0.631744384765625, -0.5725250244140625, -0.5133056640625, -0.4540863037109375, -0.394866943359375, -0.3356475830078125, -0.27642822265625, -0.2172088623046875, -0.157989501953125, -0.0987701416015625, -0.03955078125, 0.0196685791015625, 0.078887939453125, 0.1381072998046875, 0.19732666015625, 0.2565460205078125, 0.315765380859375, 0.3749847412109375, 0.4342041015625, 0.4934234619140625, 0.552642822265625, 0.6118621826171875, 0.67108154296875, 0.7303009033203125, 0.789520263671875, 0.8487396240234375, 0.907958984375, 0.9671783447265625, 1.026397705078125, 1.0856170654296875, 1.14483642578125, 1.2040557861328125, 1.263275146484375, 1.3224945068359375, 1.3817138671875, 1.4409332275390625, 1.500152587890625, 1.5593719482421875, 1.61859130859375, 1.6778106689453125, 1.737030029296875, 1.7962493896484375, 1.85546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 6.0, 6.0, 5.0, 6.0, 9.0, 13.0, 20.0, 20.0, 19.0, 29.0, 30.0, 37.0, 52.0, 53.0, 59.0, 57.0, 56.0, 70.0, 71.0, 48.0, 68.0, 47.0, 25.0, 37.0, 23.0, 20.0, 15.0, 14.0, 9.0, 13.0, 4.0, 7.0, 8.0, 8.0, 5.0, 0.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.69091796875, -0.6704788208007812, -0.6500396728515625, -0.6296005249023438, -0.609161376953125, -0.5887222290039062, -0.5682830810546875, -0.5478439331054688, -0.52740478515625, -0.5069656372070312, -0.4865264892578125, -0.46608734130859375, -0.445648193359375, -0.42520904541015625, -0.4047698974609375, -0.38433074951171875, -0.3638916015625, -0.34345245361328125, -0.3230133056640625, -0.30257415771484375, -0.282135009765625, -0.26169586181640625, -0.2412567138671875, -0.22081756591796875, -0.20037841796875, -0.17993927001953125, -0.1595001220703125, -0.13906097412109375, -0.118621826171875, -0.09818267822265625, -0.0777435302734375, -0.05730438232421875, -0.036865234375, -0.01642608642578125, 0.0040130615234375, 0.02445220947265625, 0.044891357421875, 0.06533050537109375, 0.0857696533203125, 0.10620880126953125, 0.12664794921875, 0.14708709716796875, 0.1675262451171875, 0.18796539306640625, 0.208404541015625, 0.22884368896484375, 0.2492828369140625, 0.26972198486328125, 0.2901611328125, 0.31060028076171875, 0.3310394287109375, 0.35147857666015625, 0.371917724609375, 0.39235687255859375, 0.4127960205078125, 0.43323516845703125, 0.45367431640625, 0.47411346435546875, 0.4945526123046875, 0.5149917602539062, 0.535430908203125, 0.5558700561523438, 0.5763092041015625, 0.5967483520507812, 0.6171875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 2.0, 5.0, 2.0, 11.0, 8.0, 14.0, 16.0, 19.0, 22.0, 24.0, 29.0, 36.0, 29.0, 40.0, 48.0, 36.0, 50.0, 46.0, 38.0, 48.0, 49.0, 39.0, 52.0, 38.0, 33.0, 40.0, 31.0, 26.0, 29.0, 20.0, 23.0, 12.0, 18.0, 22.0, 11.0, 9.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-13.6079740524292, -13.222247123718262, -12.836519241333008, -12.45079231262207, -12.065064430236816, -11.679337501525879, -11.293609619140625, -10.907882690429688, -10.52215576171875, -10.136428833007812, -9.750700950622559, -9.364974021911621, -8.979246139526367, -8.59351921081543, -8.207792282104492, -7.822064399719238, -7.436336994171143, -7.050609588623047, -6.664882183074951, -6.2791547775268555, -5.893427848815918, -5.507700443267822, -5.121973037719727, -4.736246109008789, -4.350518226623535, -3.9647908210754395, -3.579063653945923, -3.193336248397827, -2.8076090812683105, -2.421881675720215, -2.036154270172119, -1.6504271030426025, -1.264699935913086, -0.8789726495742798, -0.49324530363082886, -0.10751795768737793, 0.2782093286514282, 0.6639366149902344, 1.04966402053833, 1.4353911876678467, 1.8211185932159424, 2.206845998764038, 2.5925731658935547, 2.9783005714416504, 3.364027976989746, 3.7497551441192627, 4.1354827880859375, 4.521209716796875, 4.906937122344971, 5.292664527893066, 5.678391933441162, 6.064119338989258, 6.449846267700195, 6.835573673248291, 7.221301078796387, 7.607028007507324, 7.992755889892578, 8.378482818603516, 8.76421070098877, 9.149937629699707, 9.535665512084961, 9.921392440795898, 10.307119369506836, 10.69284725189209, 11.078574180603027]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 8.0, 5.0, 11.0, 16.0, 24.0, 20.0, 21.0, 15.0, 28.0, 26.0, 29.0, 32.0, 28.0, 37.0, 36.0, 41.0, 36.0, 29.0, 51.0, 39.0, 38.0, 55.0, 48.0, 36.0, 32.0, 29.0, 29.0, 29.0, 22.0, 20.0, 25.0, 17.0, 13.0, 10.0, 13.0, 7.0, 4.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.223437309265137, -11.846229553222656, -11.469021797180176, -11.091814041137695, -10.714607238769531, -10.33739948272705, -9.96019172668457, -9.58298397064209, -9.20577621459961, -8.828568458557129, -8.451360702514648, -8.074152946472168, -7.696945667266846, -7.319737911224365, -6.942530632019043, -6.5653228759765625, -6.188115119934082, -5.810907363891602, -5.433699607849121, -5.056492328643799, -4.679284572601318, -4.302076816558838, -3.9248692989349365, -3.547661781311035, -3.1704540252685547, -2.793246269226074, -2.416038751602173, -2.0388312339782715, -1.661623477935791, -1.2844158411026, -0.9072082042694092, -0.5300006866455078, -0.15279388427734375, 0.22441375255584717, 0.6016213893890381, 0.978829026222229, 1.35603666305542, 1.7332442998886108, 2.1104519367218018, 2.487659454345703, 2.8648672103881836, 3.242074966430664, 3.6192824840545654, 3.996490001678467, 4.373697757720947, 4.750905513763428, 5.12811279296875, 5.5053205490112305, 5.882528305053711, 6.259736061096191, 6.636943817138672, 7.014151096343994, 7.391358852386475, 7.768566608428955, 8.145773887634277, 8.522981643676758, 8.900189399719238, 9.277397155761719, 9.6546049118042, 10.03181266784668, 10.409019470214844, 10.786227226257324, 11.163434982299805, 11.540642738342285, 11.917850494384766]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 11.0, 28.0, 30.0, 52.0, 91.0, 160.0, 215.0, 350.0, 561.0, 834.0, 1328.0, 1988.0, 2965.0, 4507.0, 6677.0, 9828.0, 13992.0, 19744.0, 27379.0, 36574.0, 47186.0, 59465.0, 70974.0, 81244.0, 88658.0, 91205.0, 88932.0, 82153.0, 71812.0, 60067.0, 48831.0, 37274.0, 28161.0, 20352.0, 14669.0, 9938.0, 6845.0, 4700.0, 2987.0, 2063.0, 1345.0, 870.0, 579.0, 392.0, 206.0, 114.0, 84.0, 56.0, 28.0, 23.0, 14.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.0234375, -7.76904296875, -7.5146484375, -7.26025390625, -7.005859375, -6.75146484375, -6.4970703125, -6.24267578125, -5.98828125, -5.73388671875, -5.4794921875, -5.22509765625, -4.970703125, -4.71630859375, -4.4619140625, -4.20751953125, -3.953125, -3.69873046875, -3.4443359375, -3.18994140625, -2.935546875, -2.68115234375, -2.4267578125, -2.17236328125, -1.91796875, -1.66357421875, -1.4091796875, -1.15478515625, -0.900390625, -0.64599609375, -0.3916015625, -0.13720703125, 0.1171875, 0.37158203125, 0.6259765625, 0.88037109375, 1.134765625, 1.38916015625, 1.6435546875, 1.89794921875, 2.15234375, 2.40673828125, 2.6611328125, 2.91552734375, 3.169921875, 3.42431640625, 3.6787109375, 3.93310546875, 4.1875, 4.44189453125, 4.6962890625, 4.95068359375, 5.205078125, 5.45947265625, 5.7138671875, 5.96826171875, 6.22265625, 6.47705078125, 6.7314453125, 6.98583984375, 7.240234375, 7.49462890625, 7.7490234375, 8.00341796875, 8.2578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 9.0, 8.0, 14.0, 9.0, 14.0, 25.0, 14.0, 13.0, 24.0, 20.0, 20.0, 23.0, 27.0, 31.0, 29.0, 31.0, 40.0, 31.0, 48.0, 38.0, 29.0, 39.0, 40.0, 37.0, 36.0, 34.0, 34.0, 32.0, 26.0, 25.0, 27.0, 24.0, 17.0, 16.0, 16.0, 9.0, 10.0, 12.0, 9.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0], "bins": [-11.46875, -11.1224365234375, -10.776123046875, -10.4298095703125, -10.08349609375, -9.7371826171875, -9.390869140625, -9.0445556640625, -8.6982421875, -8.3519287109375, -8.005615234375, -7.6593017578125, -7.31298828125, -6.9666748046875, -6.620361328125, -6.2740478515625, -5.927734375, -5.5814208984375, -5.235107421875, -4.8887939453125, -4.54248046875, -4.1961669921875, -3.849853515625, -3.5035400390625, -3.1572265625, -2.8109130859375, -2.464599609375, -2.1182861328125, -1.77197265625, -1.4256591796875, -1.079345703125, -0.7330322265625, -0.38671875, -0.0404052734375, 0.305908203125, 0.6522216796875, 0.99853515625, 1.3448486328125, 1.691162109375, 2.0374755859375, 2.3837890625, 2.7301025390625, 3.076416015625, 3.4227294921875, 3.76904296875, 4.1153564453125, 4.461669921875, 4.8079833984375, 5.154296875, 5.5006103515625, 5.846923828125, 6.1932373046875, 6.53955078125, 6.8858642578125, 7.232177734375, 7.5784912109375, 7.9248046875, 8.2711181640625, 8.617431640625, 8.9637451171875, 9.31005859375, 9.6563720703125, 10.002685546875, 10.3489990234375, 10.6953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 9.0, 4.0, 10.0, 26.0, 32.0, 49.0, 82.0, 118.0, 206.0, 263.0, 362.0, 575.0, 797.0, 1241.0, 1820.0, 2647.0, 3921.0, 5597.0, 8101.0, 11438.0, 16292.0, 22731.0, 30562.0, 40485.0, 52179.0, 64081.0, 76809.0, 85886.0, 91561.0, 91634.0, 87025.0, 77677.0, 66165.0, 53990.0, 42279.0, 31658.0, 23394.0, 17127.0, 12273.0, 8586.0, 6045.0, 4071.0, 2773.0, 1952.0, 1296.0, 917.0, 611.0, 405.0, 253.0, 189.0, 129.0, 89.0, 61.0, 25.0, 25.0, 14.0, 8.0, 7.0, 2.0, 4.0, 2.0], "bins": [-10.5234375, -10.1953125, -9.8671875, -9.5390625, -9.2109375, -8.8828125, -8.5546875, -8.2265625, -7.8984375, -7.5703125, -7.2421875, -6.9140625, -6.5859375, -6.2578125, -5.9296875, -5.6015625, -5.2734375, -4.9453125, -4.6171875, -4.2890625, -3.9609375, -3.6328125, -3.3046875, -2.9765625, -2.6484375, -2.3203125, -1.9921875, -1.6640625, -1.3359375, -1.0078125, -0.6796875, -0.3515625, -0.0234375, 0.3046875, 0.6328125, 0.9609375, 1.2890625, 1.6171875, 1.9453125, 2.2734375, 2.6015625, 2.9296875, 3.2578125, 3.5859375, 3.9140625, 4.2421875, 4.5703125, 4.8984375, 5.2265625, 5.5546875, 5.8828125, 6.2109375, 6.5390625, 6.8671875, 7.1953125, 7.5234375, 7.8515625, 8.1796875, 8.5078125, 8.8359375, 9.1640625, 9.4921875, 9.8203125, 10.1484375, 10.4765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 7.0, 4.0, 4.0, 2.0, 10.0, 14.0, 12.0, 13.0, 13.0, 22.0, 18.0, 20.0, 28.0, 22.0, 20.0, 43.0, 34.0, 36.0, 42.0, 34.0, 40.0, 39.0, 38.0, 29.0, 45.0, 43.0, 38.0, 32.0, 41.0, 28.0, 24.0, 25.0, 23.0, 22.0, 22.0, 20.0, 14.0, 9.0, 14.0, 14.0, 5.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-8.8359375, -8.5914306640625, -8.346923828125, -8.1024169921875, -7.85791015625, -7.6134033203125, -7.368896484375, -7.1243896484375, -6.8798828125, -6.6353759765625, -6.390869140625, -6.1463623046875, -5.90185546875, -5.6573486328125, -5.412841796875, -5.1683349609375, -4.923828125, -4.6793212890625, -4.434814453125, -4.1903076171875, -3.94580078125, -3.7012939453125, -3.456787109375, -3.2122802734375, -2.9677734375, -2.7232666015625, -2.478759765625, -2.2342529296875, -1.98974609375, -1.7452392578125, -1.500732421875, -1.2562255859375, -1.01171875, -0.7672119140625, -0.522705078125, -0.2781982421875, -0.03369140625, 0.2108154296875, 0.455322265625, 0.6998291015625, 0.9443359375, 1.1888427734375, 1.433349609375, 1.6778564453125, 1.92236328125, 2.1668701171875, 2.411376953125, 2.6558837890625, 2.900390625, 3.1448974609375, 3.389404296875, 3.6339111328125, 3.87841796875, 4.1229248046875, 4.367431640625, 4.6119384765625, 4.8564453125, 5.1009521484375, 5.345458984375, 5.5899658203125, 5.83447265625, 6.0789794921875, 6.323486328125, 6.5679931640625, 6.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 5.0, 18.0, 27.0, 41.0, 59.0, 82.0, 153.0, 203.0, 330.0, 533.0, 747.0, 1198.0, 1938.0, 3231.0, 5057.0, 8193.0, 13507.0, 21450.0, 33222.0, 49705.0, 70838.0, 94312.0, 115567.0, 126510.0, 124117.0, 108731.0, 86603.0, 62865.0, 42878.0, 28250.0, 18382.0, 11156.0, 7076.0, 4360.0, 2654.0, 1652.0, 1021.0, 679.0, 389.0, 265.0, 194.0, 119.0, 70.0, 60.0, 30.0, 28.0, 14.0, 9.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.4609375, -3.3521728515625, -3.243408203125, -3.1346435546875, -3.02587890625, -2.9171142578125, -2.808349609375, -2.6995849609375, -2.5908203125, -2.4820556640625, -2.373291015625, -2.2645263671875, -2.15576171875, -2.0469970703125, -1.938232421875, -1.8294677734375, -1.720703125, -1.6119384765625, -1.503173828125, -1.3944091796875, -1.28564453125, -1.1768798828125, -1.068115234375, -0.9593505859375, -0.8505859375, -0.7418212890625, -0.633056640625, -0.5242919921875, -0.41552734375, -0.3067626953125, -0.197998046875, -0.0892333984375, 0.01953125, 0.1282958984375, 0.237060546875, 0.3458251953125, 0.45458984375, 0.5633544921875, 0.672119140625, 0.7808837890625, 0.8896484375, 0.9984130859375, 1.107177734375, 1.2159423828125, 1.32470703125, 1.4334716796875, 1.542236328125, 1.6510009765625, 1.759765625, 1.8685302734375, 1.977294921875, 2.0860595703125, 2.19482421875, 2.3035888671875, 2.412353515625, 2.5211181640625, 2.6298828125, 2.7386474609375, 2.847412109375, 2.9561767578125, 3.06494140625, 3.1737060546875, 3.282470703125, 3.3912353515625, 3.5]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 11.0, 7.0, 11.0, 12.0, 18.0, 17.0, 18.0, 31.0, 37.0, 23.0, 39.0, 33.0, 40.0, 49.0, 52.0, 51.0, 56.0, 48.0, 50.0, 38.0, 32.0, 47.0, 38.0, 26.0, 35.0, 32.0, 25.0, 21.0, 13.0, 13.0, 21.0, 8.0, 4.0, 8.0, 7.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0003566741943359375, -0.0003433153033256531, -0.00032995641231536865, -0.00031659752130508423, -0.0003032386302947998, -0.0002898797392845154, -0.00027652084827423096, -0.00026316195726394653, -0.0002498030662536621, -0.00023644417524337769, -0.00022308528423309326, -0.00020972639322280884, -0.00019636750221252441, -0.00018300861120224, -0.00016964972019195557, -0.00015629082918167114, -0.00014293193817138672, -0.0001295730471611023, -0.00011621415615081787, -0.00010285526514053345, -8.949637413024902e-05, -7.61374831199646e-05, -6.277859210968018e-05, -4.941970109939575e-05, -3.606081008911133e-05, -2.2701919078826904e-05, -9.34302806854248e-06, 4.015862941741943e-06, 1.7374753952026367e-05, 3.073364496231079e-05, 4.4092535972595215e-05, 5.745142698287964e-05, 7.081031799316406e-05, 8.416920900344849e-05, 9.752810001373291e-05, 0.00011088699102401733, 0.00012424588203430176, 0.00013760477304458618, 0.0001509636640548706, 0.00016432255506515503, 0.00017768144607543945, 0.00019104033708572388, 0.0002043992280960083, 0.00021775811910629272, 0.00023111701011657715, 0.00024447590112686157, 0.000257834792137146, 0.0002711936831474304, 0.00028455257415771484, 0.00029791146516799927, 0.0003112703561782837, 0.0003246292471885681, 0.00033798813819885254, 0.00035134702920913696, 0.0003647059202194214, 0.0003780648112297058, 0.00039142370223999023, 0.00040478259325027466, 0.0004181414842605591, 0.0004315003752708435, 0.00044485926628112793, 0.00045821815729141235, 0.0004715770483016968, 0.0004849359393119812, 0.0004982948303222656]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 5.0, 8.0, 16.0, 32.0, 54.0, 69.0, 99.0, 172.0, 289.0, 452.0, 699.0, 1109.0, 1854.0, 3220.0, 5160.0, 8586.0, 14468.0, 23572.0, 36953.0, 56067.0, 79215.0, 103193.0, 123121.0, 130550.0, 123079.0, 103621.0, 79626.0, 56024.0, 37105.0, 23550.0, 14462.0, 8852.0, 5245.0, 3086.0, 1912.0, 1167.0, 679.0, 453.0, 273.0, 146.0, 108.0, 73.0, 48.0, 24.0, 24.0, 11.0, 7.0, 12.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.5859375, -3.475616455078125, -3.36529541015625, -3.254974365234375, -3.1446533203125, -3.034332275390625, -2.92401123046875, -2.813690185546875, -2.703369140625, -2.593048095703125, -2.48272705078125, -2.372406005859375, -2.2620849609375, -2.151763916015625, -2.04144287109375, -1.931121826171875, -1.82080078125, -1.710479736328125, -1.60015869140625, -1.489837646484375, -1.3795166015625, -1.269195556640625, -1.15887451171875, -1.048553466796875, -0.938232421875, -0.827911376953125, -0.71759033203125, -0.607269287109375, -0.4969482421875, -0.386627197265625, -0.27630615234375, -0.165985107421875, -0.0556640625, 0.054656982421875, 0.16497802734375, 0.275299072265625, 0.3856201171875, 0.495941162109375, 0.60626220703125, 0.716583251953125, 0.826904296875, 0.937225341796875, 1.04754638671875, 1.157867431640625, 1.2681884765625, 1.378509521484375, 1.48883056640625, 1.599151611328125, 1.70947265625, 1.819793701171875, 1.93011474609375, 2.040435791015625, 2.1507568359375, 2.261077880859375, 2.37139892578125, 2.481719970703125, 2.592041015625, 2.702362060546875, 2.81268310546875, 2.923004150390625, 3.0333251953125, 3.143646240234375, 3.25396728515625, 3.364288330078125, 3.474609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 3.0, 8.0, 14.0, 13.0, 20.0, 27.0, 21.0, 28.0, 26.0, 26.0, 34.0, 44.0, 48.0, 62.0, 52.0, 59.0, 42.0, 51.0, 51.0, 46.0, 53.0, 37.0, 35.0, 35.0, 31.0, 22.0, 14.0, 21.0, 10.0, 5.0, 11.0, 9.0, 9.0, 5.0, 7.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.689453125, -1.640045166015625, -1.59063720703125, -1.541229248046875, -1.4918212890625, -1.442413330078125, -1.39300537109375, -1.343597412109375, -1.294189453125, -1.244781494140625, -1.19537353515625, -1.145965576171875, -1.0965576171875, -1.047149658203125, -0.99774169921875, -0.948333740234375, -0.89892578125, -0.849517822265625, -0.80010986328125, -0.750701904296875, -0.7012939453125, -0.651885986328125, -0.60247802734375, -0.553070068359375, -0.503662109375, -0.454254150390625, -0.40484619140625, -0.355438232421875, -0.3060302734375, -0.256622314453125, -0.20721435546875, -0.157806396484375, -0.1083984375, -0.058990478515625, -0.00958251953125, 0.039825439453125, 0.0892333984375, 0.138641357421875, 0.18804931640625, 0.237457275390625, 0.286865234375, 0.336273193359375, 0.38568115234375, 0.435089111328125, 0.4844970703125, 0.533905029296875, 0.58331298828125, 0.632720947265625, 0.68212890625, 0.731536865234375, 0.78094482421875, 0.830352783203125, 0.8797607421875, 0.929168701171875, 0.97857666015625, 1.027984619140625, 1.077392578125, 1.126800537109375, 1.17620849609375, 1.225616455078125, 1.2750244140625, 1.324432373046875, 1.37384033203125, 1.423248291015625, 1.47265625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 5.0, 6.0, 8.0, 4.0, 14.0, 9.0, 16.0, 23.0, 26.0, 28.0, 38.0, 29.0, 45.0, 42.0, 56.0, 61.0, 58.0, 47.0, 54.0, 60.0, 46.0, 50.0, 46.0, 34.0, 31.0, 32.0, 28.0, 24.0, 15.0, 16.0, 14.0, 12.0, 10.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.573022842407227, -14.113362312316895, -13.653701782226562, -13.194040298461914, -12.734379768371582, -12.27471923828125, -11.815057754516602, -11.35539722442627, -10.895736694335938, -10.436076164245605, -9.976415634155273, -9.516754150390625, -9.057093620300293, -8.597433090209961, -8.137771606445312, -7.6781110763549805, -7.218450546264648, -6.758790016174316, -6.299129009246826, -5.839468002319336, -5.379807472229004, -4.920146942138672, -4.460485935211182, -4.000824928283691, -3.5411643981933594, -3.0815036296844482, -2.621842861175537, -2.162182092666626, -1.7025213241577148, -1.2428605556488037, -0.7831997871398926, -0.32353901863098145, 0.1361217498779297, 0.5957825183868408, 1.055443286895752, 1.515104055404663, 1.9747648239135742, 2.4344255924224854, 2.8940863609313965, 3.3537471294403076, 3.8134078979492188, 4.273068428039551, 4.732729434967041, 5.192390441894531, 5.652050971984863, 6.111711502075195, 6.5713725090026855, 7.031033515930176, 7.490694046020508, 7.95035457611084, 8.410015106201172, 8.86967658996582, 9.329337120056152, 9.788997650146484, 10.248659133911133, 10.708319664001465, 11.167980194091797, 11.627640724182129, 12.087301254272461, 12.54696273803711, 13.006623268127441, 13.466283798217773, 13.925945281982422, 14.385605812072754, 14.845266342163086]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 3.0, 8.0, 7.0, 9.0, 15.0, 14.0, 23.0, 18.0, 18.0, 29.0, 20.0, 35.0, 34.0, 40.0, 32.0, 33.0, 40.0, 34.0, 36.0, 47.0, 48.0, 39.0, 39.0, 38.0, 42.0, 41.0, 38.0, 32.0, 25.0, 25.0, 23.0, 23.0, 12.0, 14.0, 15.0, 16.0, 5.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.273531913757324, -12.853752136230469, -12.433971405029297, -12.014191627502441, -11.594411849975586, -11.174631118774414, -10.754851341247559, -10.335071563720703, -9.915290832519531, -9.495511054992676, -9.075730323791504, -8.655950546264648, -8.236169815063477, -7.816390037536621, -7.396610260009766, -6.976830005645752, -6.557049751281738, -6.137269496917725, -5.717489242553711, -5.2977094650268555, -4.877929210662842, -4.458148956298828, -4.038369178771973, -3.618588924407959, -3.1988086700439453, -2.7790284156799316, -2.359248399734497, -1.939468264579773, -1.5196881294250488, -1.0999078750610352, -0.6801278591156006, -0.260347843170166, 0.15943336486816406, 0.5792135000228882, 0.9989936351776123, 1.4187737703323364, 1.8385539054870605, 2.258334159851074, 2.678114175796509, 3.0978941917419434, 3.517674446105957, 3.9374547004699707, 4.357234954833984, 4.77701473236084, 5.1967949867248535, 5.616575241088867, 6.036355018615723, 6.456135272979736, 6.87591552734375, 7.295695781707764, 7.715476036071777, 8.135255813598633, 8.555036544799805, 8.97481632232666, 9.394596099853516, 9.814376831054688, 10.234156608581543, 10.653936386108398, 11.07371711730957, 11.493496894836426, 11.913276672363281, 12.333057403564453, 12.752837181091309, 13.172616958618164, 13.592397689819336]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 7.0, 3.0, 6.0, 14.0, 13.0, 37.0, 60.0, 86.0, 154.0, 213.0, 316.0, 545.0, 943.0, 1503.0, 2361.0, 3946.0, 6379.0, 10663.0, 17507.0, 29515.0, 49431.0, 83863.0, 139540.0, 232801.0, 376588.0, 556971.0, 684260.0, 659508.0, 504226.0, 330901.0, 202143.0, 120891.0, 71621.0, 42351.0, 25706.0, 15319.0, 9314.0, 5591.0, 3471.0, 1987.0, 1291.0, 824.0, 558.0, 336.0, 199.0, 111.0, 70.0, 54.0, 31.0, 23.0, 17.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0], "bins": [-11.3046875, -10.9498291015625, -10.594970703125, -10.2401123046875, -9.88525390625, -9.5303955078125, -9.175537109375, -8.8206787109375, -8.4658203125, -8.1109619140625, -7.756103515625, -7.4012451171875, -7.04638671875, -6.6915283203125, -6.336669921875, -5.9818115234375, -5.626953125, -5.2720947265625, -4.917236328125, -4.5623779296875, -4.20751953125, -3.8526611328125, -3.497802734375, -3.1429443359375, -2.7880859375, -2.4332275390625, -2.078369140625, -1.7235107421875, -1.36865234375, -1.0137939453125, -0.658935546875, -0.3040771484375, 0.05078125, 0.4056396484375, 0.760498046875, 1.1153564453125, 1.47021484375, 1.8250732421875, 2.179931640625, 2.5347900390625, 2.8896484375, 3.2445068359375, 3.599365234375, 3.9542236328125, 4.30908203125, 4.6639404296875, 5.018798828125, 5.3736572265625, 5.728515625, 6.0833740234375, 6.438232421875, 6.7930908203125, 7.14794921875, 7.5028076171875, 7.857666015625, 8.2125244140625, 8.5673828125, 8.9222412109375, 9.277099609375, 9.6319580078125, 9.98681640625, 10.3416748046875, 10.696533203125, 11.0513916015625, 11.40625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 11.0, 13.0, 17.0, 17.0, 18.0, 14.0, 31.0, 23.0, 30.0, 31.0, 34.0, 33.0, 37.0, 38.0, 40.0, 40.0, 43.0, 35.0, 43.0, 38.0, 32.0, 44.0, 36.0, 36.0, 26.0, 30.0, 27.0, 20.0, 26.0, 20.0, 16.0, 12.0, 13.0, 8.0, 13.0, 8.0, 9.0, 10.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-12.1953125, -11.8505859375, -11.505859375, -11.1611328125, -10.81640625, -10.4716796875, -10.126953125, -9.7822265625, -9.4375, -9.0927734375, -8.748046875, -8.4033203125, -8.05859375, -7.7138671875, -7.369140625, -7.0244140625, -6.6796875, -6.3349609375, -5.990234375, -5.6455078125, -5.30078125, -4.9560546875, -4.611328125, -4.2666015625, -3.921875, -3.5771484375, -3.232421875, -2.8876953125, -2.54296875, -2.1982421875, -1.853515625, -1.5087890625, -1.1640625, -0.8193359375, -0.474609375, -0.1298828125, 0.21484375, 0.5595703125, 0.904296875, 1.2490234375, 1.59375, 1.9384765625, 2.283203125, 2.6279296875, 2.97265625, 3.3173828125, 3.662109375, 4.0068359375, 4.3515625, 4.6962890625, 5.041015625, 5.3857421875, 5.73046875, 6.0751953125, 6.419921875, 6.7646484375, 7.109375, 7.4541015625, 7.798828125, 8.1435546875, 8.48828125, 8.8330078125, 9.177734375, 9.5224609375, 9.8671875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 13.0, 14.0, 35.0, 67.0, 110.0, 177.0, 293.0, 478.0, 818.0, 1292.0, 2208.0, 3800.0, 6294.0, 10558.0, 17777.0, 29857.0, 50294.0, 83717.0, 137411.0, 221864.0, 341418.0, 492383.0, 627509.0, 641891.0, 525516.0, 370960.0, 243622.0, 152883.0, 92756.0, 56237.0, 33578.0, 19579.0, 11604.0, 7020.0, 4162.0, 2484.0, 1419.0, 870.0, 525.0, 283.0, 198.0, 128.0, 68.0, 43.0, 21.0, 16.0, 9.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.84375, -10.4951171875, -10.146484375, -9.7978515625, -9.44921875, -9.1005859375, -8.751953125, -8.4033203125, -8.0546875, -7.7060546875, -7.357421875, -7.0087890625, -6.66015625, -6.3115234375, -5.962890625, -5.6142578125, -5.265625, -4.9169921875, -4.568359375, -4.2197265625, -3.87109375, -3.5224609375, -3.173828125, -2.8251953125, -2.4765625, -2.1279296875, -1.779296875, -1.4306640625, -1.08203125, -0.7333984375, -0.384765625, -0.0361328125, 0.3125, 0.6611328125, 1.009765625, 1.3583984375, 1.70703125, 2.0556640625, 2.404296875, 2.7529296875, 3.1015625, 3.4501953125, 3.798828125, 4.1474609375, 4.49609375, 4.8447265625, 5.193359375, 5.5419921875, 5.890625, 6.2392578125, 6.587890625, 6.9365234375, 7.28515625, 7.6337890625, 7.982421875, 8.3310546875, 8.6796875, 9.0283203125, 9.376953125, 9.7255859375, 10.07421875, 10.4228515625, 10.771484375, 11.1201171875, 11.46875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 10.0, 18.0, 32.0, 27.0, 45.0, 59.0, 67.0, 90.0, 99.0, 101.0, 141.0, 183.0, 221.0, 230.0, 246.0, 284.0, 249.0, 269.0, 251.0, 232.0, 197.0, 177.0, 159.0, 139.0, 128.0, 91.0, 61.0, 47.0, 48.0, 40.0, 28.0, 24.0, 15.0, 12.0, 5.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.31640625, -5.15411376953125, -4.9918212890625, -4.82952880859375, -4.667236328125, -4.50494384765625, -4.3426513671875, -4.18035888671875, -4.01806640625, -3.85577392578125, -3.6934814453125, -3.53118896484375, -3.368896484375, -3.20660400390625, -3.0443115234375, -2.88201904296875, -2.7197265625, -2.55743408203125, -2.3951416015625, -2.23284912109375, -2.070556640625, -1.90826416015625, -1.7459716796875, -1.58367919921875, -1.42138671875, -1.25909423828125, -1.0968017578125, -0.93450927734375, -0.772216796875, -0.60992431640625, -0.4476318359375, -0.28533935546875, -0.123046875, 0.03924560546875, 0.2015380859375, 0.36383056640625, 0.526123046875, 0.68841552734375, 0.8507080078125, 1.01300048828125, 1.17529296875, 1.33758544921875, 1.4998779296875, 1.66217041015625, 1.824462890625, 1.98675537109375, 2.1490478515625, 2.31134033203125, 2.4736328125, 2.63592529296875, 2.7982177734375, 2.96051025390625, 3.122802734375, 3.28509521484375, 3.4473876953125, 3.60968017578125, 3.77197265625, 3.93426513671875, 4.0965576171875, 4.25885009765625, 4.421142578125, 4.58343505859375, 4.7457275390625, 4.90802001953125, 5.0703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 9.0, 6.0, 6.0, 14.0, 11.0, 15.0, 22.0, 21.0, 32.0, 29.0, 45.0, 41.0, 46.0, 44.0, 32.0, 44.0, 50.0, 61.0, 56.0, 53.0, 53.0, 42.0, 46.0, 37.0, 24.0, 27.0, 22.0, 24.0, 13.0, 14.0, 11.0, 6.0, 13.0, 4.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.387712478637695, -12.963226318359375, -12.538741111755371, -12.11425495147705, -11.68976879119873, -11.265283584594727, -10.840797424316406, -10.416311264038086, -9.991826057434082, -9.567339897155762, -9.142854690551758, -8.718368530273438, -8.293882369995117, -7.869397163391113, -7.444911003112793, -7.020425319671631, -6.5959391593933105, -6.171453475952148, -5.746967315673828, -5.322481632232666, -4.897995948791504, -4.473509788513184, -4.0490241050720215, -3.6245384216308594, -3.200052499771118, -2.775566577911377, -2.351080894470215, -1.9265949726104736, -1.502109169960022, -1.0776233673095703, -0.6531374454498291, -0.228651762008667, 0.19583415985107422, 0.6203199625015259, 1.0448057651519775, 1.4692916870117188, 1.8937774896621704, 2.318263292312622, 2.7427492141723633, 3.1672348976135254, 3.5917208194732666, 4.016206741333008, 4.44069242477417, 4.865178108215332, 5.289664268493652, 5.7141499519348145, 6.138635635375977, 6.563121795654297, 6.987607479095459, 7.412093162536621, 7.836579322814941, 8.261064529418945, 8.685550689697266, 9.110036849975586, 9.534523010253906, 9.95900821685791, 10.38349437713623, 10.80798053741455, 11.232465744018555, 11.656951904296875, 12.081438064575195, 12.5059232711792, 12.93040943145752, 13.354894638061523, 13.779380798339844]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 6.0, 10.0, 14.0, 21.0, 17.0, 26.0, 23.0, 21.0, 32.0, 21.0, 43.0, 29.0, 41.0, 44.0, 44.0, 31.0, 49.0, 44.0, 45.0, 34.0, 30.0, 40.0, 42.0, 45.0, 23.0, 26.0, 27.0, 27.0, 16.0, 22.0, 16.0, 11.0, 11.0, 4.0, 5.0, 5.0, 7.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.65938663482666, -11.271221160888672, -10.883055686950684, -10.494890213012695, -10.106724739074707, -9.718559265136719, -9.330392837524414, -8.942228317260742, -8.554061889648438, -8.16589641571045, -7.777730941772461, -7.389565467834473, -7.001399993896484, -6.613234519958496, -6.22506856918335, -5.836903095245361, -5.448738098144531, -5.060572624206543, -4.672407150268555, -4.284241676330566, -3.896075963973999, -3.5079104900360107, -3.1197447776794434, -2.731579303741455, -2.343413829803467, -1.9552483558654785, -1.5670827627182007, -1.1789171695709229, -0.7907516956329346, -0.4025862216949463, -0.014420509338378906, 0.3737449645996094, 0.7619104385375977, 1.150075912475586, 1.5382415056228638, 1.9264070987701416, 2.31457257270813, 2.702738046646118, 3.0909037590026855, 3.479069232940674, 3.867234706878662, 4.25540018081665, 4.643565654754639, 5.031731605529785, 5.419897079467773, 5.808062553405762, 6.19622802734375, 6.584393501281738, 6.972558975219727, 7.360724449157715, 7.748889923095703, 8.137055397033691, 8.52522087097168, 8.913386344909668, 9.301551818847656, 9.689718246459961, 10.077882766723633, 10.466048240661621, 10.85421371459961, 11.242379188537598, 11.630544662475586, 12.018710136413574, 12.406875610351562, 12.795042037963867, 13.183207511901855]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 13.0, 25.0, 38.0, 63.0, 104.0, 191.0, 278.0, 465.0, 786.0, 1159.0, 1816.0, 2836.0, 4451.0, 6810.0, 10111.0, 14807.0, 21555.0, 29911.0, 40807.0, 53143.0, 66959.0, 80602.0, 91656.0, 97975.0, 97731.0, 91627.0, 80226.0, 66185.0, 52709.0, 40183.0, 29139.0, 21085.0, 14783.0, 9905.0, 6541.0, 4284.0, 2817.0, 1800.0, 1126.0, 687.0, 462.0, 287.0, 165.0, 98.0, 67.0, 39.0, 24.0, 12.0, 8.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.514404296875, -4.36865234375, -4.222900390625, -4.0771484375, -3.931396484375, -3.78564453125, -3.639892578125, -3.494140625, -3.348388671875, -3.20263671875, -3.056884765625, -2.9111328125, -2.765380859375, -2.61962890625, -2.473876953125, -2.328125, -2.182373046875, -2.03662109375, -1.890869140625, -1.7451171875, -1.599365234375, -1.45361328125, -1.307861328125, -1.162109375, -1.016357421875, -0.87060546875, -0.724853515625, -0.5791015625, -0.433349609375, -0.28759765625, -0.141845703125, 0.00390625, 0.149658203125, 0.29541015625, 0.441162109375, 0.5869140625, 0.732666015625, 0.87841796875, 1.024169921875, 1.169921875, 1.315673828125, 1.46142578125, 1.607177734375, 1.7529296875, 1.898681640625, 2.04443359375, 2.190185546875, 2.3359375, 2.481689453125, 2.62744140625, 2.773193359375, 2.9189453125, 3.064697265625, 3.21044921875, 3.356201171875, 3.501953125, 3.647705078125, 3.79345703125, 3.939208984375, 4.0849609375, 4.230712890625, 4.37646484375, 4.522216796875, 4.66796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 6.0, 8.0, 11.0, 16.0, 17.0, 12.0, 16.0, 18.0, 33.0, 28.0, 35.0, 32.0, 27.0, 41.0, 38.0, 41.0, 49.0, 50.0, 44.0, 47.0, 42.0, 42.0, 52.0, 42.0, 31.0, 32.0, 32.0, 20.0, 20.0, 26.0, 25.0, 9.0, 9.0, 13.0, 7.0, 7.0, 7.0, 5.0, 6.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.13818359375, -10.7607421875, -10.38330078125, -10.005859375, -9.62841796875, -9.2509765625, -8.87353515625, -8.49609375, -8.11865234375, -7.7412109375, -7.36376953125, -6.986328125, -6.60888671875, -6.2314453125, -5.85400390625, -5.4765625, -5.09912109375, -4.7216796875, -4.34423828125, -3.966796875, -3.58935546875, -3.2119140625, -2.83447265625, -2.45703125, -2.07958984375, -1.7021484375, -1.32470703125, -0.947265625, -0.56982421875, -0.1923828125, 0.18505859375, 0.5625, 0.93994140625, 1.3173828125, 1.69482421875, 2.072265625, 2.44970703125, 2.8271484375, 3.20458984375, 3.58203125, 3.95947265625, 4.3369140625, 4.71435546875, 5.091796875, 5.46923828125, 5.8466796875, 6.22412109375, 6.6015625, 6.97900390625, 7.3564453125, 7.73388671875, 8.111328125, 8.48876953125, 8.8662109375, 9.24365234375, 9.62109375, 9.99853515625, 10.3759765625, 10.75341796875, 11.130859375, 11.50830078125, 11.8857421875, 12.26318359375, 12.640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 2.0, 6.0, 13.0, 10.0, 16.0, 20.0, 32.0, 41.0, 68.0, 112.0, 198.0, 370.0, 636.0, 1291.0, 2499.0, 4746.0, 9567.0, 18999.0, 44089.0, 736861.0, 172399.0, 28165.0, 13903.0, 6970.0, 3482.0, 1826.0, 1043.0, 501.0, 264.0, 142.0, 93.0, 61.0, 33.0, 22.0, 20.0, 14.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.484375, -21.837646484375, -21.19091796875, -20.544189453125, -19.8974609375, -19.250732421875, -18.60400390625, -17.957275390625, -17.310546875, -16.663818359375, -16.01708984375, -15.370361328125, -14.7236328125, -14.076904296875, -13.43017578125, -12.783447265625, -12.13671875, -11.489990234375, -10.84326171875, -10.196533203125, -9.5498046875, -8.903076171875, -8.25634765625, -7.609619140625, -6.962890625, -6.316162109375, -5.66943359375, -5.022705078125, -4.3759765625, -3.729248046875, -3.08251953125, -2.435791015625, -1.7890625, -1.142333984375, -0.49560546875, 0.151123046875, 0.7978515625, 1.444580078125, 2.09130859375, 2.738037109375, 3.384765625, 4.031494140625, 4.67822265625, 5.324951171875, 5.9716796875, 6.618408203125, 7.26513671875, 7.911865234375, 8.55859375, 9.205322265625, 9.85205078125, 10.498779296875, 11.1455078125, 11.792236328125, 12.43896484375, 13.085693359375, 13.732421875, 14.379150390625, 15.02587890625, 15.672607421875, 16.3193359375, 16.966064453125, 17.61279296875, 18.259521484375, 18.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 10.0, 2.0, 9.0, 9.0, 9.0, 8.0, 11.0, 6.0, 11.0, 17.0, 25.0, 22.0, 31.0, 27.0, 34.0, 32.0, 27.0, 37.0, 36.0, 39.0, 51.0, 46.0, 47.0, 44.0, 54.0, 49.0, 39.0, 28.0, 35.0, 36.0, 21.0, 31.0, 23.0, 13.0, 11.0, 9.0, 14.0, 9.0, 8.0, 4.0, 4.0, 8.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.765625, -12.367431640625, -11.96923828125, -11.571044921875, -11.1728515625, -10.774658203125, -10.37646484375, -9.978271484375, -9.580078125, -9.181884765625, -8.78369140625, -8.385498046875, -7.9873046875, -7.589111328125, -7.19091796875, -6.792724609375, -6.39453125, -5.996337890625, -5.59814453125, -5.199951171875, -4.8017578125, -4.403564453125, -4.00537109375, -3.607177734375, -3.208984375, -2.810791015625, -2.41259765625, -2.014404296875, -1.6162109375, -1.218017578125, -0.81982421875, -0.421630859375, -0.0234375, 0.374755859375, 0.77294921875, 1.171142578125, 1.5693359375, 1.967529296875, 2.36572265625, 2.763916015625, 3.162109375, 3.560302734375, 3.95849609375, 4.356689453125, 4.7548828125, 5.153076171875, 5.55126953125, 5.949462890625, 6.34765625, 6.745849609375, 7.14404296875, 7.542236328125, 7.9404296875, 8.338623046875, 8.73681640625, 9.135009765625, 9.533203125, 9.931396484375, 10.32958984375, 10.727783203125, 11.1259765625, 11.524169921875, 11.92236328125, 12.320556640625, 12.71875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 8.0, 6.0, 9.0, 16.0, 17.0, 30.0, 40.0, 74.0, 100.0, 149.0, 203.0, 338.0, 524.0, 894.0, 1582.0, 3028.0, 5755.0, 11954.0, 27721.0, 168780.0, 740288.0, 51179.0, 17879.0, 8434.0, 4215.0, 2173.0, 1208.0, 707.0, 475.0, 272.0, 168.0, 108.0, 58.0, 49.0, 44.0, 23.0, 16.0, 12.0, 7.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.1015625, -3.97442626953125, -3.8472900390625, -3.72015380859375, -3.593017578125, -3.46588134765625, -3.3387451171875, -3.21160888671875, -3.08447265625, -2.95733642578125, -2.8302001953125, -2.70306396484375, -2.575927734375, -2.44879150390625, -2.3216552734375, -2.19451904296875, -2.0673828125, -1.94024658203125, -1.8131103515625, -1.68597412109375, -1.558837890625, -1.43170166015625, -1.3045654296875, -1.17742919921875, -1.05029296875, -0.92315673828125, -0.7960205078125, -0.66888427734375, -0.541748046875, -0.41461181640625, -0.2874755859375, -0.16033935546875, -0.033203125, 0.09393310546875, 0.2210693359375, 0.34820556640625, 0.475341796875, 0.60247802734375, 0.7296142578125, 0.85675048828125, 0.98388671875, 1.11102294921875, 1.2381591796875, 1.36529541015625, 1.492431640625, 1.61956787109375, 1.7467041015625, 1.87384033203125, 2.0009765625, 2.12811279296875, 2.2552490234375, 2.38238525390625, 2.509521484375, 2.63665771484375, 2.7637939453125, 2.89093017578125, 3.01806640625, 3.14520263671875, 3.2723388671875, 3.39947509765625, 3.526611328125, 3.65374755859375, 3.7808837890625, 3.90802001953125, 4.03515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 10.0, 3.0, 4.0, 11.0, 14.0, 12.0, 14.0, 15.0, 20.0, 27.0, 29.0, 40.0, 39.0, 42.0, 44.0, 51.0, 73.0, 86.0, 60.0, 53.0, 56.0, 51.0, 29.0, 35.0, 33.0, 24.0, 30.0, 16.0, 10.0, 11.0, 14.0, 7.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008635520935058594, -0.0008371397852897644, -0.0008107274770736694, -0.0007843151688575745, -0.0007579028606414795, -0.0007314905524253845, -0.0007050782442092896, -0.0006786659359931946, -0.0006522536277770996, -0.0006258413195610046, -0.0005994290113449097, -0.0005730167031288147, -0.0005466043949127197, -0.0005201920866966248, -0.0004937797784805298, -0.0004673674702644348, -0.00044095516204833984, -0.0004145428538322449, -0.0003881305456161499, -0.00036171823740005493, -0.00033530592918395996, -0.000308893620967865, -0.00028248131275177, -0.00025606900453567505, -0.00022965669631958008, -0.0002032443881034851, -0.00017683207988739014, -0.00015041977167129517, -0.0001240074634552002, -9.759515523910522e-05, -7.118284702301025e-05, -4.477053880691528e-05, -1.8358230590820312e-05, 8.054077625274658e-06, 3.446638584136963e-05, 6.08786940574646e-05, 8.729100227355957e-05, 0.00011370331048965454, 0.0001401156187057495, 0.00016652792692184448, 0.00019294023513793945, 0.00021935254335403442, 0.0002457648515701294, 0.00027217715978622437, 0.00029858946800231934, 0.0003250017762184143, 0.0003514140844345093, 0.00037782639265060425, 0.0004042387008666992, 0.0004306510090827942, 0.00045706331729888916, 0.00048347562551498413, 0.0005098879337310791, 0.0005363002419471741, 0.000562712550163269, 0.000589124858379364, 0.000615537166595459, 0.000641949474811554, 0.0006683617830276489, 0.0006947740912437439, 0.0007211863994598389, 0.0007475987076759338, 0.0007740110158920288, 0.0008004233241081238, 0.0008268356323242188]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 7.0, 14.0, 24.0, 27.0, 42.0, 46.0, 69.0, 128.0, 193.0, 355.0, 634.0, 1336.0, 2913.0, 6764.0, 16982.0, 47186.0, 140584.0, 336762.0, 309748.0, 119100.0, 39833.0, 14714.0, 5949.0, 2529.0, 1141.0, 643.0, 299.0, 160.0, 99.0, 75.0, 34.0, 36.0, 38.0, 15.0, 13.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.337890625, -3.229949951171875, -3.12200927734375, -3.014068603515625, -2.9061279296875, -2.798187255859375, -2.69024658203125, -2.582305908203125, -2.474365234375, -2.366424560546875, -2.25848388671875, -2.150543212890625, -2.0426025390625, -1.934661865234375, -1.82672119140625, -1.718780517578125, -1.61083984375, -1.502899169921875, -1.39495849609375, -1.287017822265625, -1.1790771484375, -1.071136474609375, -0.96319580078125, -0.855255126953125, -0.747314453125, -0.639373779296875, -0.53143310546875, -0.423492431640625, -0.3155517578125, -0.207611083984375, -0.09967041015625, 0.008270263671875, 0.1162109375, 0.224151611328125, 0.33209228515625, 0.440032958984375, 0.5479736328125, 0.655914306640625, 0.76385498046875, 0.871795654296875, 0.979736328125, 1.087677001953125, 1.19561767578125, 1.303558349609375, 1.4114990234375, 1.519439697265625, 1.62738037109375, 1.735321044921875, 1.84326171875, 1.951202392578125, 2.05914306640625, 2.167083740234375, 2.2750244140625, 2.382965087890625, 2.49090576171875, 2.598846435546875, 2.706787109375, 2.814727783203125, 2.92266845703125, 3.030609130859375, 3.1385498046875, 3.246490478515625, 3.35443115234375, 3.462371826171875, 3.5703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 5.0, 11.0, 7.0, 9.0, 12.0, 14.0, 33.0, 28.0, 41.0, 50.0, 66.0, 72.0, 85.0, 83.0, 79.0, 93.0, 62.0, 60.0, 41.0, 42.0, 25.0, 20.0, 12.0, 13.0, 10.0, 7.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6953125, -0.66748046875, -0.6396484375, -0.61181640625, -0.583984375, -0.55615234375, -0.5283203125, -0.50048828125, -0.47265625, -0.44482421875, -0.4169921875, -0.38916015625, -0.361328125, -0.33349609375, -0.3056640625, -0.27783203125, -0.25, -0.22216796875, -0.1943359375, -0.16650390625, -0.138671875, -0.11083984375, -0.0830078125, -0.05517578125, -0.02734375, 0.00048828125, 0.0283203125, 0.05615234375, 0.083984375, 0.11181640625, 0.1396484375, 0.16748046875, 0.1953125, 0.22314453125, 0.2509765625, 0.27880859375, 0.306640625, 0.33447265625, 0.3623046875, 0.39013671875, 0.41796875, 0.44580078125, 0.4736328125, 0.50146484375, 0.529296875, 0.55712890625, 0.5849609375, 0.61279296875, 0.640625, 0.66845703125, 0.6962890625, 0.72412109375, 0.751953125, 0.77978515625, 0.8076171875, 0.83544921875, 0.86328125, 0.89111328125, 0.9189453125, 0.94677734375, 0.974609375, 1.00244140625, 1.0302734375, 1.05810546875, 1.0859375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 5.0, 2.0, 2.0, 7.0, 6.0, 9.0, 10.0, 9.0, 13.0, 12.0, 19.0, 17.0, 19.0, 21.0, 33.0, 36.0, 30.0, 51.0, 42.0, 43.0, 31.0, 46.0, 44.0, 43.0, 39.0, 53.0, 37.0, 33.0, 41.0, 28.0, 47.0, 30.0, 21.0, 15.0, 23.0, 11.0, 11.0, 11.0, 11.0, 13.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-10.691387176513672, -10.367181777954102, -10.042975425720215, -9.718770027160645, -9.394564628601074, -9.070358276367188, -8.746152877807617, -8.421947479248047, -8.097742080688477, -7.773536205291748, -7.449330806732178, -7.125124931335449, -6.800919532775879, -6.47671365737915, -6.152507781982422, -5.828302383422852, -5.504096031188965, -5.179890155792236, -4.855684757232666, -4.5314788818359375, -4.207273483276367, -3.8830676078796387, -3.55886173248291, -3.2346560955047607, -2.9104504585266113, -2.586244821548462, -2.2620391845703125, -1.937833309173584, -1.6136276721954346, -1.2894220352172852, -0.9652162790298462, -0.6410105228424072, -0.3168058395385742, 0.007399857044219971, 0.33160555362701416, 0.6558112502098083, 0.9800169467926025, 1.304222583770752, 1.628428339958191, 1.9526340961456299, 2.2768397331237793, 2.6010453701019287, 2.925251007080078, 3.2494568824768066, 3.573662519454956, 3.8978681564331055, 4.222074031829834, 4.5462799072265625, 4.870485305786133, 5.194691181182861, 5.518896579742432, 5.84310245513916, 6.1673078536987305, 6.491513729095459, 6.8157196044921875, 7.139925003051758, 7.464130878448486, 7.788336753845215, 8.112542152404785, 8.436747550964355, 8.760953903198242, 9.085159301757812, 9.409364700317383, 9.73357105255127, 10.05777645111084]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 4.0, 6.0, 10.0, 12.0, 15.0, 15.0, 16.0, 25.0, 28.0, 27.0, 26.0, 29.0, 34.0, 36.0, 36.0, 36.0, 38.0, 52.0, 41.0, 35.0, 46.0, 34.0, 41.0, 47.0, 38.0, 28.0, 29.0, 29.0, 23.0, 20.0, 28.0, 21.0, 15.0, 13.0, 13.0, 13.0, 1.0, 10.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.928473472595215, -9.588860511779785, -9.249247550964355, -8.90963363647461, -8.57002067565918, -8.23040771484375, -7.89079475402832, -7.551181793212891, -7.211568355560303, -6.871955394744873, -6.532341957092285, -6.1927289962768555, -5.853116035461426, -5.513502597808838, -5.173889636993408, -4.83427619934082, -4.494663238525391, -4.155050277709961, -3.815436840057373, -3.4758238792419434, -3.1362106800079346, -2.796597480773926, -2.456984519958496, -2.1173713207244873, -1.7777581214904785, -1.4381449222564697, -1.0985318422317505, -0.7589187622070312, -0.41930556297302246, -0.07969236373901367, 0.259920597076416, 0.5995337963104248, 0.9391460418701172, 1.278759241104126, 1.6183723211288452, 1.9579854011535645, 2.2975986003875732, 2.637211799621582, 2.9768247604370117, 3.3164379596710205, 3.6560511589050293, 3.995664358139038, 4.335277557373047, 4.674890518188477, 5.014503479003906, 5.354116916656494, 5.693729877471924, 6.033343315124512, 6.372956275939941, 6.712569236755371, 7.052182674407959, 7.391795635223389, 7.731409072875977, 8.071022033691406, 8.410634994506836, 8.750247955322266, 9.089860916137695, 9.429473876953125, 9.769086837768555, 10.108699798583984, 10.44831371307373, 10.78792667388916, 11.12753963470459, 11.46715259552002, 11.806766510009766]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 14.0, 20.0, 17.0, 41.0, 55.0, 87.0, 129.0, 188.0, 304.0, 502.0, 753.0, 1195.0, 1898.0, 2861.0, 4535.0, 6922.0, 10352.0, 15700.0, 22830.0, 32469.0, 44832.0, 59630.0, 75372.0, 90274.0, 100268.0, 104336.0, 100836.0, 89992.0, 75899.0, 59464.0, 45411.0, 32588.0, 22780.0, 15787.0, 10513.0, 6991.0, 4550.0, 2947.0, 1906.0, 1135.0, 742.0, 514.0, 318.0, 193.0, 144.0, 85.0, 66.0, 53.0, 20.0, 13.0, 11.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0], "bins": [-7.36328125, -7.13677978515625, -6.9102783203125, -6.68377685546875, -6.457275390625, -6.23077392578125, -6.0042724609375, -5.77777099609375, -5.55126953125, -5.32476806640625, -5.0982666015625, -4.87176513671875, -4.645263671875, -4.41876220703125, -4.1922607421875, -3.96575927734375, -3.7392578125, -3.51275634765625, -3.2862548828125, -3.05975341796875, -2.833251953125, -2.60675048828125, -2.3802490234375, -2.15374755859375, -1.92724609375, -1.70074462890625, -1.4742431640625, -1.24774169921875, -1.021240234375, -0.79473876953125, -0.5682373046875, -0.34173583984375, -0.115234375, 0.11126708984375, 0.3377685546875, 0.56427001953125, 0.790771484375, 1.01727294921875, 1.2437744140625, 1.47027587890625, 1.69677734375, 1.92327880859375, 2.1497802734375, 2.37628173828125, 2.602783203125, 2.82928466796875, 3.0557861328125, 3.28228759765625, 3.5087890625, 3.73529052734375, 3.9617919921875, 4.18829345703125, 4.414794921875, 4.64129638671875, 4.8677978515625, 5.09429931640625, 5.32080078125, 5.54730224609375, 5.7738037109375, 6.00030517578125, 6.226806640625, 6.45330810546875, 6.6798095703125, 6.90631103515625, 7.1328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 10.0, 11.0, 7.0, 19.0, 18.0, 19.0, 20.0, 33.0, 41.0, 33.0, 42.0, 39.0, 37.0, 33.0, 39.0, 44.0, 40.0, 56.0, 51.0, 46.0, 41.0, 41.0, 37.0, 29.0, 31.0, 29.0, 22.0, 22.0, 17.0, 14.0, 15.0, 8.0, 10.0, 14.0, 4.0, 2.0, 1.0, 2.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.246826171875, -9.87646484375, -9.506103515625, -9.1357421875, -8.765380859375, -8.39501953125, -8.024658203125, -7.654296875, -7.283935546875, -6.91357421875, -6.543212890625, -6.1728515625, -5.802490234375, -5.43212890625, -5.061767578125, -4.69140625, -4.321044921875, -3.95068359375, -3.580322265625, -3.2099609375, -2.839599609375, -2.46923828125, -2.098876953125, -1.728515625, -1.358154296875, -0.98779296875, -0.617431640625, -0.2470703125, 0.123291015625, 0.49365234375, 0.864013671875, 1.234375, 1.604736328125, 1.97509765625, 2.345458984375, 2.7158203125, 3.086181640625, 3.45654296875, 3.826904296875, 4.197265625, 4.567626953125, 4.93798828125, 5.308349609375, 5.6787109375, 6.049072265625, 6.41943359375, 6.789794921875, 7.16015625, 7.530517578125, 7.90087890625, 8.271240234375, 8.6416015625, 9.011962890625, 9.38232421875, 9.752685546875, 10.123046875, 10.493408203125, 10.86376953125, 11.234130859375, 11.6044921875, 11.974853515625, 12.34521484375, 12.715576171875, 13.0859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 16.0, 10.0, 18.0, 36.0, 65.0, 85.0, 141.0, 196.0, 320.0, 519.0, 860.0, 1275.0, 2082.0, 3303.0, 5028.0, 7704.0, 11960.0, 17971.0, 26345.0, 37633.0, 52555.0, 69518.0, 87427.0, 101773.0, 110061.0, 108177.0, 99420.0, 83435.0, 65706.0, 48991.0, 34919.0, 24404.0, 16121.0, 10817.0, 6949.0, 4618.0, 2932.0, 1910.0, 1194.0, 786.0, 448.0, 315.0, 195.0, 122.0, 58.0, 51.0, 29.0, 28.0, 18.0, 3.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.7015380859375, -9.387451171875, -9.0733642578125, -8.75927734375, -8.4451904296875, -8.131103515625, -7.8170166015625, -7.5029296875, -7.1888427734375, -6.874755859375, -6.5606689453125, -6.24658203125, -5.9324951171875, -5.618408203125, -5.3043212890625, -4.990234375, -4.6761474609375, -4.362060546875, -4.0479736328125, -3.73388671875, -3.4197998046875, -3.105712890625, -2.7916259765625, -2.4775390625, -2.1634521484375, -1.849365234375, -1.5352783203125, -1.22119140625, -0.9071044921875, -0.593017578125, -0.2789306640625, 0.03515625, 0.3492431640625, 0.663330078125, 0.9774169921875, 1.29150390625, 1.6055908203125, 1.919677734375, 2.2337646484375, 2.5478515625, 2.8619384765625, 3.176025390625, 3.4901123046875, 3.80419921875, 4.1182861328125, 4.432373046875, 4.7464599609375, 5.060546875, 5.3746337890625, 5.688720703125, 6.0028076171875, 6.31689453125, 6.6309814453125, 6.945068359375, 7.2591552734375, 7.5732421875, 7.8873291015625, 8.201416015625, 8.5155029296875, 8.82958984375, 9.1436767578125, 9.457763671875, 9.7718505859375, 10.0859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 9.0, 9.0, 8.0, 19.0, 12.0, 15.0, 27.0, 23.0, 21.0, 26.0, 24.0, 27.0, 34.0, 37.0, 35.0, 33.0, 38.0, 54.0, 39.0, 37.0, 34.0, 37.0, 47.0, 41.0, 40.0, 33.0, 30.0, 39.0, 28.0, 29.0, 20.0, 19.0, 21.0, 13.0, 6.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.71875, -8.48150634765625, -8.2442626953125, -8.00701904296875, -7.769775390625, -7.53253173828125, -7.2952880859375, -7.05804443359375, -6.82080078125, -6.58355712890625, -6.3463134765625, -6.10906982421875, -5.871826171875, -5.63458251953125, -5.3973388671875, -5.16009521484375, -4.9228515625, -4.68560791015625, -4.4483642578125, -4.21112060546875, -3.973876953125, -3.73663330078125, -3.4993896484375, -3.26214599609375, -3.02490234375, -2.78765869140625, -2.5504150390625, -2.31317138671875, -2.075927734375, -1.83868408203125, -1.6014404296875, -1.36419677734375, -1.126953125, -0.88970947265625, -0.6524658203125, -0.41522216796875, -0.177978515625, 0.05926513671875, 0.2965087890625, 0.53375244140625, 0.77099609375, 1.00823974609375, 1.2454833984375, 1.48272705078125, 1.719970703125, 1.95721435546875, 2.1944580078125, 2.43170166015625, 2.6689453125, 2.90618896484375, 3.1434326171875, 3.38067626953125, 3.617919921875, 3.85516357421875, 4.0924072265625, 4.32965087890625, 4.56689453125, 4.80413818359375, 5.0413818359375, 5.27862548828125, 5.515869140625, 5.75311279296875, 5.9903564453125, 6.22760009765625, 6.46484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 7.0, 16.0, 24.0, 24.0, 32.0, 53.0, 75.0, 90.0, 125.0, 173.0, 241.0, 330.0, 455.0, 708.0, 1018.0, 1635.0, 2817.0, 4950.0, 9595.0, 18616.0, 37947.0, 73457.0, 129947.0, 189177.0, 204428.0, 161808.0, 100097.0, 53637.0, 26734.0, 13479.0, 6833.0, 3717.0, 2102.0, 1309.0, 898.0, 572.0, 402.0, 304.0, 183.0, 148.0, 112.0, 81.0, 59.0, 47.0, 35.0, 16.0, 13.0, 13.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.5174560546875, -4.363037109375, -4.2086181640625, -4.05419921875, -3.8997802734375, -3.745361328125, -3.5909423828125, -3.4365234375, -3.2821044921875, -3.127685546875, -2.9732666015625, -2.81884765625, -2.6644287109375, -2.510009765625, -2.3555908203125, -2.201171875, -2.0467529296875, -1.892333984375, -1.7379150390625, -1.58349609375, -1.4290771484375, -1.274658203125, -1.1202392578125, -0.9658203125, -0.8114013671875, -0.656982421875, -0.5025634765625, -0.34814453125, -0.1937255859375, -0.039306640625, 0.1151123046875, 0.26953125, 0.4239501953125, 0.578369140625, 0.7327880859375, 0.88720703125, 1.0416259765625, 1.196044921875, 1.3504638671875, 1.5048828125, 1.6593017578125, 1.813720703125, 1.9681396484375, 2.12255859375, 2.2769775390625, 2.431396484375, 2.5858154296875, 2.740234375, 2.8946533203125, 3.049072265625, 3.2034912109375, 3.35791015625, 3.5123291015625, 3.666748046875, 3.8211669921875, 3.9755859375, 4.1300048828125, 4.284423828125, 4.4388427734375, 4.59326171875, 4.7476806640625, 4.902099609375, 5.0565185546875, 5.2109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 14.0, 15.0, 16.0, 26.0, 39.0, 58.0, 64.0, 88.0, 88.0, 83.0, 111.0, 82.0, 73.0, 63.0, 54.0, 33.0, 21.0, 17.0, 7.0, 14.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0008411407470703125, -0.0008178353309631348, -0.000794529914855957, -0.0007712244987487793, -0.0007479190826416016, -0.0007246136665344238, -0.0007013082504272461, -0.0006780028343200684, -0.0006546974182128906, -0.0006313920021057129, -0.0006080865859985352, -0.0005847811698913574, -0.0005614757537841797, -0.000538170337677002, -0.0005148649215698242, -0.0004915595054626465, -0.00046825408935546875, -0.000444948673248291, -0.0004216432571411133, -0.00039833784103393555, -0.0003750324249267578, -0.0003517270088195801, -0.00032842159271240234, -0.0003051161766052246, -0.0002818107604980469, -0.00025850534439086914, -0.0002351999282836914, -0.00021189451217651367, -0.00018858909606933594, -0.0001652836799621582, -0.00014197826385498047, -0.00011867284774780273, -9.5367431640625e-05, -7.206201553344727e-05, -4.875659942626953e-05, -2.5451183319091797e-05, -2.1457672119140625e-06, 2.1159648895263672e-05, 4.4465065002441406e-05, 6.777048110961914e-05, 9.107589721679688e-05, 0.00011438131332397461, 0.00013768672943115234, 0.00016099214553833008, 0.0001842975616455078, 0.00020760297775268555, 0.00023090839385986328, 0.000254213809967041, 0.00027751922607421875, 0.0003008246421813965, 0.0003241300582885742, 0.00034743547439575195, 0.0003707408905029297, 0.0003940463066101074, 0.00041735172271728516, 0.0004406571388244629, 0.0004639625549316406, 0.00048726797103881836, 0.0005105733871459961, 0.0005338788032531738, 0.0005571842193603516, 0.0005804896354675293, 0.000603795051574707, 0.0006271004676818848, 0.0006504058837890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 7.0, 12.0, 15.0, 15.0, 39.0, 40.0, 58.0, 86.0, 134.0, 207.0, 288.0, 452.0, 617.0, 1049.0, 1720.0, 2877.0, 4904.0, 8276.0, 14565.0, 25895.0, 44007.0, 71926.0, 107370.0, 139598.0, 156553.0, 147393.0, 116728.0, 80923.0, 51160.0, 30375.0, 17234.0, 9765.0, 5623.0, 3299.0, 1939.0, 1202.0, 730.0, 445.0, 315.0, 210.0, 148.0, 112.0, 68.0, 59.0, 39.0, 32.0, 19.0, 13.0, 9.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.578521728515625, -3.46173095703125, -3.344940185546875, -3.2281494140625, -3.111358642578125, -2.99456787109375, -2.877777099609375, -2.760986328125, -2.644195556640625, -2.52740478515625, -2.410614013671875, -2.2938232421875, -2.177032470703125, -2.06024169921875, -1.943450927734375, -1.82666015625, -1.709869384765625, -1.59307861328125, -1.476287841796875, -1.3594970703125, -1.242706298828125, -1.12591552734375, -1.009124755859375, -0.892333984375, -0.775543212890625, -0.65875244140625, -0.541961669921875, -0.4251708984375, -0.308380126953125, -0.19158935546875, -0.074798583984375, 0.0419921875, 0.158782958984375, 0.27557373046875, 0.392364501953125, 0.5091552734375, 0.625946044921875, 0.74273681640625, 0.859527587890625, 0.976318359375, 1.093109130859375, 1.20989990234375, 1.326690673828125, 1.4434814453125, 1.560272216796875, 1.67706298828125, 1.793853759765625, 1.91064453125, 2.027435302734375, 2.14422607421875, 2.261016845703125, 2.3778076171875, 2.494598388671875, 2.61138916015625, 2.728179931640625, 2.844970703125, 2.961761474609375, 3.07855224609375, 3.195343017578125, 3.3121337890625, 3.428924560546875, 3.54571533203125, 3.662506103515625, 3.779296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 10.0, 6.0, 17.0, 10.0, 22.0, 27.0, 35.0, 34.0, 38.0, 59.0, 61.0, 58.0, 64.0, 75.0, 58.0, 80.0, 61.0, 45.0, 43.0, 49.0, 38.0, 22.0, 16.0, 12.0, 10.0, 9.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.2109375, -2.1529541015625, -2.094970703125, -2.0369873046875, -1.97900390625, -1.9210205078125, -1.863037109375, -1.8050537109375, -1.7470703125, -1.6890869140625, -1.631103515625, -1.5731201171875, -1.51513671875, -1.4571533203125, -1.399169921875, -1.3411865234375, -1.283203125, -1.2252197265625, -1.167236328125, -1.1092529296875, -1.05126953125, -0.9932861328125, -0.935302734375, -0.8773193359375, -0.8193359375, -0.7613525390625, -0.703369140625, -0.6453857421875, -0.58740234375, -0.5294189453125, -0.471435546875, -0.4134521484375, -0.35546875, -0.2974853515625, -0.239501953125, -0.1815185546875, -0.12353515625, -0.0655517578125, -0.007568359375, 0.0504150390625, 0.1083984375, 0.1663818359375, 0.224365234375, 0.2823486328125, 0.34033203125, 0.3983154296875, 0.456298828125, 0.5142822265625, 0.572265625, 0.6302490234375, 0.688232421875, 0.7462158203125, 0.80419921875, 0.8621826171875, 0.920166015625, 0.9781494140625, 1.0361328125, 1.0941162109375, 1.152099609375, 1.2100830078125, 1.26806640625, 1.3260498046875, 1.384033203125, 1.4420166015625, 1.5]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 8.0, 9.0, 11.0, 17.0, 16.0, 18.0, 17.0, 30.0, 29.0, 32.0, 34.0, 39.0, 39.0, 54.0, 53.0, 49.0, 42.0, 41.0, 49.0, 46.0, 45.0, 37.0, 48.0, 35.0, 35.0, 23.0, 34.0, 20.0, 13.0, 10.0, 16.0, 15.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.57734203338623, -11.213099479675293, -10.848855972290039, -10.484613418579102, -10.120369911193848, -9.75612735748291, -9.391883850097656, -9.027641296386719, -8.663398742675781, -8.299156188964844, -7.93491268157959, -7.570670127868652, -7.206426620483398, -6.842184066772461, -6.477941036224365, -6.1136980056762695, -5.749454498291016, -5.38521146774292, -5.020968437194824, -4.656725883483887, -4.292482376098633, -3.928239583969116, -3.5639967918395996, -3.199753761291504, -2.835510730743408, -2.4712677001953125, -2.107024669647217, -1.7427818775177002, -1.3785388469696045, -1.0142958164215088, -0.6500530242919922, -0.2858099937438965, 0.07843399047851562, 0.44267696142196655, 0.8069199323654175, 1.1711628437042236, 1.5354058742523193, 1.899648904800415, 2.2638916969299316, 2.6281347274780273, 2.992377758026123, 3.3566207885742188, 3.7208638191223145, 4.08510684967041, 4.449349403381348, 4.813592910766602, 5.177835464477539, 5.542078495025635, 5.9063215255737305, 6.270564556121826, 6.634807586669922, 6.999050140380859, 7.363293647766113, 7.727536201477051, 8.091779708862305, 8.456022262573242, 8.82026481628418, 9.184507369995117, 9.548750877380371, 9.912993431091309, 10.277236938476562, 10.6414794921875, 11.005722045898438, 11.369965553283691, 11.734209060668945]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 8.0, 9.0, 16.0, 19.0, 23.0, 11.0, 26.0, 33.0, 25.0, 32.0, 28.0, 32.0, 37.0, 35.0, 39.0, 35.0, 51.0, 36.0, 52.0, 46.0, 39.0, 31.0, 31.0, 35.0, 28.0, 22.0, 21.0, 28.0, 30.0, 15.0, 18.0, 18.0, 11.0, 16.0, 7.0, 11.0, 5.0, 6.0, 3.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.020426750183105, -11.677760124206543, -11.33509349822998, -10.992425918579102, -10.649759292602539, -10.307092666625977, -9.964426040649414, -9.621759414672852, -9.279092788696289, -8.936426162719727, -8.593759536743164, -8.251092910766602, -7.908425331115723, -7.56575870513916, -7.223092079162598, -6.880425453186035, -6.537757873535156, -6.195091247558594, -5.852424144744873, -5.5097575187683105, -5.16709041595459, -4.824423789978027, -4.481757164001465, -4.139090538024902, -3.7964234352111816, -3.45375657081604, -3.1110897064208984, -2.768423080444336, -2.4257562160491943, -2.0830893516540527, -1.7404227256774902, -1.3977558612823486, -1.0550899505615234, -0.7124231457710266, -0.3697563409805298, -0.027089595794677734, 0.31557726860046387, 0.6582441329956055, 1.000910758972168, 1.3435776233673096, 1.6862444877624512, 2.0289113521575928, 2.3715782165527344, 2.714244842529297, 3.0569117069244385, 3.39957857131958, 3.7422451972961426, 4.084912300109863, 4.427578926086426, 4.770245552062988, 5.112912654876709, 5.4555792808532715, 5.798246383666992, 6.140913009643555, 6.483579635620117, 6.82624626159668, 7.1689133644104, 7.511579990386963, 7.854247093200684, 8.196913719177246, 8.539580345153809, 8.882247924804688, 9.22491455078125, 9.567581176757812, 9.910247802734375]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 14.0, 14.0, 22.0, 30.0, 55.0, 96.0, 150.0, 232.0, 336.0, 548.0, 843.0, 1348.0, 2157.0, 3537.0, 5651.0, 9285.0, 15326.0, 24776.0, 41234.0, 67190.0, 110717.0, 179993.0, 281054.0, 408595.0, 531364.0, 594886.0, 565640.0, 459839.0, 329120.0, 215408.0, 135534.0, 81407.0, 49755.0, 30023.0, 18371.0, 11109.0, 6994.0, 4326.0, 2730.0, 1638.0, 1081.0, 637.0, 424.0, 268.0, 190.0, 118.0, 77.0, 60.0, 33.0, 26.0, 13.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.3515625, -7.11962890625, -6.8876953125, -6.65576171875, -6.423828125, -6.19189453125, -5.9599609375, -5.72802734375, -5.49609375, -5.26416015625, -5.0322265625, -4.80029296875, -4.568359375, -4.33642578125, -4.1044921875, -3.87255859375, -3.640625, -3.40869140625, -3.1767578125, -2.94482421875, -2.712890625, -2.48095703125, -2.2490234375, -2.01708984375, -1.78515625, -1.55322265625, -1.3212890625, -1.08935546875, -0.857421875, -0.62548828125, -0.3935546875, -0.16162109375, 0.0703125, 0.30224609375, 0.5341796875, 0.76611328125, 0.998046875, 1.22998046875, 1.4619140625, 1.69384765625, 1.92578125, 2.15771484375, 2.3896484375, 2.62158203125, 2.853515625, 3.08544921875, 3.3173828125, 3.54931640625, 3.78125, 4.01318359375, 4.2451171875, 4.47705078125, 4.708984375, 4.94091796875, 5.1728515625, 5.40478515625, 5.63671875, 5.86865234375, 6.1005859375, 6.33251953125, 6.564453125, 6.79638671875, 7.0283203125, 7.26025390625, 7.4921875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 0.0, 5.0, 4.0, 7.0, 7.0, 10.0, 10.0, 15.0, 19.0, 13.0, 22.0, 24.0, 23.0, 29.0, 27.0, 37.0, 41.0, 51.0, 36.0, 41.0, 37.0, 50.0, 43.0, 44.0, 39.0, 52.0, 35.0, 36.0, 35.0, 29.0, 19.0, 15.0, 26.0, 18.0, 17.0, 19.0, 19.0, 6.0, 11.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.6473388671875, -10.341552734375, -10.0357666015625, -9.72998046875, -9.4241943359375, -9.118408203125, -8.8126220703125, -8.5068359375, -8.2010498046875, -7.895263671875, -7.5894775390625, -7.28369140625, -6.9779052734375, -6.672119140625, -6.3663330078125, -6.060546875, -5.7547607421875, -5.448974609375, -5.1431884765625, -4.83740234375, -4.5316162109375, -4.225830078125, -3.9200439453125, -3.6142578125, -3.3084716796875, -3.002685546875, -2.6968994140625, -2.39111328125, -2.0853271484375, -1.779541015625, -1.4737548828125, -1.16796875, -0.8621826171875, -0.556396484375, -0.2506103515625, 0.05517578125, 0.3609619140625, 0.666748046875, 0.9725341796875, 1.2783203125, 1.5841064453125, 1.889892578125, 2.1956787109375, 2.50146484375, 2.8072509765625, 3.113037109375, 3.4188232421875, 3.724609375, 4.0303955078125, 4.336181640625, 4.6419677734375, 4.94775390625, 5.2535400390625, 5.559326171875, 5.8651123046875, 6.1708984375, 6.4766845703125, 6.782470703125, 7.0882568359375, 7.39404296875, 7.6998291015625, 8.005615234375, 8.3114013671875, 8.6171875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 3.0, 1.0, 12.0, 16.0, 25.0, 34.0, 52.0, 103.0, 149.0, 265.0, 455.0, 733.0, 1245.0, 1887.0, 3255.0, 5549.0, 9073.0, 15486.0, 26496.0, 44911.0, 74217.0, 123053.0, 198609.0, 307690.0, 442881.0, 572369.0, 620972.0, 556362.0, 425069.0, 290162.0, 186269.0, 115559.0, 69361.0, 41591.0, 24623.0, 14412.0, 8672.0, 5018.0, 2954.0, 1856.0, 1111.0, 713.0, 410.0, 237.0, 143.0, 81.0, 62.0, 39.0, 17.0, 16.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4140625, -8.128173828125, -7.84228515625, -7.556396484375, -7.2705078125, -6.984619140625, -6.69873046875, -6.412841796875, -6.126953125, -5.841064453125, -5.55517578125, -5.269287109375, -4.9833984375, -4.697509765625, -4.41162109375, -4.125732421875, -3.83984375, -3.553955078125, -3.26806640625, -2.982177734375, -2.6962890625, -2.410400390625, -2.12451171875, -1.838623046875, -1.552734375, -1.266845703125, -0.98095703125, -0.695068359375, -0.4091796875, -0.123291015625, 0.16259765625, 0.448486328125, 0.734375, 1.020263671875, 1.30615234375, 1.592041015625, 1.8779296875, 2.163818359375, 2.44970703125, 2.735595703125, 3.021484375, 3.307373046875, 3.59326171875, 3.879150390625, 4.1650390625, 4.450927734375, 4.73681640625, 5.022705078125, 5.30859375, 5.594482421875, 5.88037109375, 6.166259765625, 6.4521484375, 6.738037109375, 7.02392578125, 7.309814453125, 7.595703125, 7.881591796875, 8.16748046875, 8.453369140625, 8.7392578125, 9.025146484375, 9.31103515625, 9.596923828125, 9.8828125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 15.0, 18.0, 23.0, 28.0, 23.0, 40.0, 41.0, 63.0, 70.0, 93.0, 121.0, 147.0, 153.0, 213.0, 210.0, 262.0, 245.0, 278.0, 292.0, 256.0, 213.0, 184.0, 183.0, 155.0, 144.0, 116.0, 102.0, 66.0, 70.0, 62.0, 53.0, 31.0, 32.0, 21.0, 8.0, 9.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.00250244140625, -3.8643798828125, -3.72625732421875, -3.588134765625, -3.45001220703125, -3.3118896484375, -3.17376708984375, -3.03564453125, -2.89752197265625, -2.7593994140625, -2.62127685546875, -2.483154296875, -2.34503173828125, -2.2069091796875, -2.06878662109375, -1.9306640625, -1.79254150390625, -1.6544189453125, -1.51629638671875, -1.378173828125, -1.24005126953125, -1.1019287109375, -0.96380615234375, -0.82568359375, -0.68756103515625, -0.5494384765625, -0.41131591796875, -0.273193359375, -0.13507080078125, 0.0030517578125, 0.14117431640625, 0.279296875, 0.41741943359375, 0.5555419921875, 0.69366455078125, 0.831787109375, 0.96990966796875, 1.1080322265625, 1.24615478515625, 1.38427734375, 1.52239990234375, 1.6605224609375, 1.79864501953125, 1.936767578125, 2.07489013671875, 2.2130126953125, 2.35113525390625, 2.4892578125, 2.62738037109375, 2.7655029296875, 2.90362548828125, 3.041748046875, 3.17987060546875, 3.3179931640625, 3.45611572265625, 3.59423828125, 3.73236083984375, 3.8704833984375, 4.00860595703125, 4.146728515625, 4.28485107421875, 4.4229736328125, 4.56109619140625, 4.69921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 11.0, 9.0, 15.0, 17.0, 26.0, 24.0, 35.0, 29.0, 36.0, 36.0, 39.0, 47.0, 60.0, 51.0, 54.0, 57.0, 45.0, 39.0, 49.0, 47.0, 45.0, 41.0, 38.0, 25.0, 23.0, 24.0, 11.0, 13.0, 10.0, 9.0, 9.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.926458358764648, -8.541315078735352, -8.156170845031738, -7.771027565002441, -7.3858842849731445, -7.0007405281066895, -6.615596771240234, -6.2304534912109375, -5.845309734344482, -5.460165977478027, -5.0750226974487305, -4.689878940582275, -4.30473518371582, -3.9195919036865234, -3.5344481468200684, -3.1493046283721924, -2.7641611099243164, -2.3790175914764404, -1.993873953819275, -1.6087303161621094, -1.2235867977142334, -0.8384432792663574, -0.45329952239990234, -0.06815600395202637, 0.3169875144958496, 0.7021310925483704, 1.0872746706008911, 1.4724183082580566, 1.8575618267059326, 2.2427053451538086, 2.6278491020202637, 3.0129926204681396, 3.398135185241699, 3.783278703689575, 4.168422222137451, 4.553565979003906, 4.938709259033203, 5.323853015899658, 5.708996772766113, 6.09414005279541, 6.479283809661865, 6.86442756652832, 7.249570846557617, 7.634714603424072, 8.019858360290527, 8.405001640319824, 8.790145874023438, 9.175289154052734, 9.560432434082031, 9.945575714111328, 10.330719947814941, 10.715863227844238, 11.101006507873535, 11.486150741577148, 11.871294021606445, 12.256437301635742, 12.641580581665039, 13.026723861694336, 13.41186809539795, 13.797011375427246, 14.182154655456543, 14.567298889160156, 14.952442169189453, 15.33758544921875, 15.722729682922363]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 10.0, 13.0, 8.0, 17.0, 26.0, 26.0, 25.0, 32.0, 25.0, 24.0, 46.0, 39.0, 41.0, 34.0, 47.0, 52.0, 54.0, 41.0, 57.0, 40.0, 39.0, 40.0, 29.0, 34.0, 32.0, 22.0, 26.0, 27.0, 14.0, 11.0, 10.0, 12.0, 4.0, 6.0, 9.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.244256019592285, -11.874797821044922, -11.505339622497559, -11.135881423950195, -10.766423225402832, -10.396965026855469, -10.027507781982422, -9.658048629760742, -9.288591384887695, -8.919133186340332, -8.549674987792969, -8.180216789245605, -7.810758590698242, -7.441300392150879, -7.071842670440674, -6.7023844718933105, -6.332925796508789, -5.963467597961426, -5.5940093994140625, -5.224551200866699, -4.855093002319336, -4.485634803771973, -4.116177082061768, -3.7467188835144043, -3.377260684967041, -3.0078024864196777, -2.6383442878723145, -2.2688863277435303, -1.899428129196167, -1.5299699306488037, -1.1605119705200195, -0.7910537719726562, -0.42159557342529297, -0.05213743448257446, 0.31732070446014404, 0.6867787837982178, 1.056236982345581, 1.4256951808929443, 1.7951531410217285, 2.164611339569092, 2.534069538116455, 2.9035277366638184, 3.2729859352111816, 3.642443895339966, 4.01190185546875, 4.381360054016113, 4.750818252563477, 5.12027645111084, 5.489734649658203, 5.859192848205566, 6.22865104675293, 6.598109245300293, 6.967567443847656, 7.3370256423950195, 7.706483364105225, 8.07594108581543, 8.44540023803711, 8.814858436584473, 9.184316635131836, 9.5537748336792, 9.923233032226562, 10.292691230773926, 10.662149429321289, 11.031606674194336, 11.4010648727417]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 21.0, 38.0, 55.0, 62.0, 125.0, 188.0, 276.0, 442.0, 727.0, 1119.0, 1828.0, 2716.0, 4258.0, 6192.0, 9263.0, 13400.0, 19620.0, 27932.0, 37480.0, 48989.0, 62409.0, 75483.0, 85616.0, 93587.0, 95484.0, 91381.0, 83280.0, 71316.0, 57953.0, 45144.0, 34037.0, 24662.0, 17584.0, 12038.0, 8154.0, 5474.0, 3601.0, 2274.0, 1537.0, 978.0, 666.0, 420.0, 271.0, 174.0, 109.0, 69.0, 53.0, 22.0, 14.0, 5.0, 4.0, 6.0, 5.0, 0.0, 2.0, 2.0], "bins": [-4.1171875, -3.9898681640625, -3.862548828125, -3.7352294921875, -3.60791015625, -3.4805908203125, -3.353271484375, -3.2259521484375, -3.0986328125, -2.9713134765625, -2.843994140625, -2.7166748046875, -2.58935546875, -2.4620361328125, -2.334716796875, -2.2073974609375, -2.080078125, -1.9527587890625, -1.825439453125, -1.6981201171875, -1.57080078125, -1.4434814453125, -1.316162109375, -1.1888427734375, -1.0615234375, -0.9342041015625, -0.806884765625, -0.6795654296875, -0.55224609375, -0.4249267578125, -0.297607421875, -0.1702880859375, -0.04296875, 0.0843505859375, 0.211669921875, 0.3389892578125, 0.46630859375, 0.5936279296875, 0.720947265625, 0.8482666015625, 0.9755859375, 1.1029052734375, 1.230224609375, 1.3575439453125, 1.48486328125, 1.6121826171875, 1.739501953125, 1.8668212890625, 1.994140625, 2.1214599609375, 2.248779296875, 2.3760986328125, 2.50341796875, 2.6307373046875, 2.758056640625, 2.8853759765625, 3.0126953125, 3.1400146484375, 3.267333984375, 3.3946533203125, 3.52197265625, 3.6492919921875, 3.776611328125, 3.9039306640625, 4.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 9.0, 6.0, 10.0, 7.0, 13.0, 14.0, 25.0, 18.0, 27.0, 26.0, 25.0, 39.0, 35.0, 33.0, 42.0, 61.0, 46.0, 41.0, 45.0, 44.0, 44.0, 46.0, 44.0, 36.0, 22.0, 38.0, 34.0, 22.0, 24.0, 14.0, 17.0, 19.0, 20.0, 11.0, 10.0, 7.0, 8.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.4453125, -11.114013671875, -10.78271484375, -10.451416015625, -10.1201171875, -9.788818359375, -9.45751953125, -9.126220703125, -8.794921875, -8.463623046875, -8.13232421875, -7.801025390625, -7.4697265625, -7.138427734375, -6.80712890625, -6.475830078125, -6.14453125, -5.813232421875, -5.48193359375, -5.150634765625, -4.8193359375, -4.488037109375, -4.15673828125, -3.825439453125, -3.494140625, -3.162841796875, -2.83154296875, -2.500244140625, -2.1689453125, -1.837646484375, -1.50634765625, -1.175048828125, -0.84375, -0.512451171875, -0.18115234375, 0.150146484375, 0.4814453125, 0.812744140625, 1.14404296875, 1.475341796875, 1.806640625, 2.137939453125, 2.46923828125, 2.800537109375, 3.1318359375, 3.463134765625, 3.79443359375, 4.125732421875, 4.45703125, 4.788330078125, 5.11962890625, 5.450927734375, 5.7822265625, 6.113525390625, 6.44482421875, 6.776123046875, 7.107421875, 7.438720703125, 7.77001953125, 8.101318359375, 8.4326171875, 8.763916015625, 9.09521484375, 9.426513671875, 9.7578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 15.0, 4.0, 14.0, 12.0, 15.0, 31.0, 38.0, 53.0, 76.0, 117.0, 200.0, 329.0, 578.0, 1025.0, 1969.0, 3893.0, 7212.0, 14328.0, 28583.0, 169672.0, 735171.0, 43887.0, 20076.0, 10111.0, 5238.0, 2640.0, 1414.0, 718.0, 407.0, 245.0, 154.0, 90.0, 57.0, 46.0, 33.0, 24.0, 11.0, 18.0, 9.0, 13.0, 8.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.8125, -22.146240234375, -21.47998046875, -20.813720703125, -20.1474609375, -19.481201171875, -18.81494140625, -18.148681640625, -17.482421875, -16.816162109375, -16.14990234375, -15.483642578125, -14.8173828125, -14.151123046875, -13.48486328125, -12.818603515625, -12.15234375, -11.486083984375, -10.81982421875, -10.153564453125, -9.4873046875, -8.821044921875, -8.15478515625, -7.488525390625, -6.822265625, -6.156005859375, -5.48974609375, -4.823486328125, -4.1572265625, -3.490966796875, -2.82470703125, -2.158447265625, -1.4921875, -0.825927734375, -0.15966796875, 0.506591796875, 1.1728515625, 1.839111328125, 2.50537109375, 3.171630859375, 3.837890625, 4.504150390625, 5.17041015625, 5.836669921875, 6.5029296875, 7.169189453125, 7.83544921875, 8.501708984375, 9.16796875, 9.834228515625, 10.50048828125, 11.166748046875, 11.8330078125, 12.499267578125, 13.16552734375, 13.831787109375, 14.498046875, 15.164306640625, 15.83056640625, 16.496826171875, 17.1630859375, 17.829345703125, 18.49560546875, 19.161865234375, 19.828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 10.0, 5.0, 12.0, 16.0, 11.0, 10.0, 14.0, 26.0, 32.0, 40.0, 31.0, 32.0, 46.0, 47.0, 35.0, 32.0, 48.0, 51.0, 45.0, 50.0, 56.0, 41.0, 36.0, 35.0, 41.0, 36.0, 25.0, 21.0, 21.0, 15.0, 14.0, 17.0, 15.0, 7.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.625, -15.1866455078125, -14.748291015625, -14.3099365234375, -13.87158203125, -13.4332275390625, -12.994873046875, -12.5565185546875, -12.1181640625, -11.6798095703125, -11.241455078125, -10.8031005859375, -10.36474609375, -9.9263916015625, -9.488037109375, -9.0496826171875, -8.611328125, -8.1729736328125, -7.734619140625, -7.2962646484375, -6.85791015625, -6.4195556640625, -5.981201171875, -5.5428466796875, -5.1044921875, -4.6661376953125, -4.227783203125, -3.7894287109375, -3.35107421875, -2.9127197265625, -2.474365234375, -2.0360107421875, -1.59765625, -1.1593017578125, -0.720947265625, -0.2825927734375, 0.15576171875, 0.5941162109375, 1.032470703125, 1.4708251953125, 1.9091796875, 2.3475341796875, 2.785888671875, 3.2242431640625, 3.66259765625, 4.1009521484375, 4.539306640625, 4.9776611328125, 5.416015625, 5.8543701171875, 6.292724609375, 6.7310791015625, 7.16943359375, 7.6077880859375, 8.046142578125, 8.4844970703125, 8.9228515625, 9.3612060546875, 9.799560546875, 10.2379150390625, 10.67626953125, 11.1146240234375, 11.552978515625, 11.9913330078125, 12.4296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 3.0, 11.0, 18.0, 22.0, 26.0, 47.0, 80.0, 140.0, 205.0, 308.0, 532.0, 885.0, 1477.0, 2747.0, 4896.0, 9638.0, 19567.0, 50877.0, 669237.0, 225609.0, 31408.0, 14373.0, 7365.0, 3851.0, 2161.0, 1180.0, 742.0, 392.0, 258.0, 173.0, 97.0, 68.0, 43.0, 42.0, 24.0, 12.0, 10.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.17578125, -5.03118896484375, -4.8865966796875, -4.74200439453125, -4.597412109375, -4.45281982421875, -4.3082275390625, -4.16363525390625, -4.01904296875, -3.87445068359375, -3.7298583984375, -3.58526611328125, -3.440673828125, -3.29608154296875, -3.1514892578125, -3.00689697265625, -2.8623046875, -2.71771240234375, -2.5731201171875, -2.42852783203125, -2.283935546875, -2.13934326171875, -1.9947509765625, -1.85015869140625, -1.70556640625, -1.56097412109375, -1.4163818359375, -1.27178955078125, -1.127197265625, -0.98260498046875, -0.8380126953125, -0.69342041015625, -0.548828125, -0.40423583984375, -0.2596435546875, -0.11505126953125, 0.029541015625, 0.17413330078125, 0.3187255859375, 0.46331787109375, 0.60791015625, 0.75250244140625, 0.8970947265625, 1.04168701171875, 1.186279296875, 1.33087158203125, 1.4754638671875, 1.62005615234375, 1.7646484375, 1.90924072265625, 2.0538330078125, 2.19842529296875, 2.343017578125, 2.48760986328125, 2.6322021484375, 2.77679443359375, 2.92138671875, 3.06597900390625, 3.2105712890625, 3.35516357421875, 3.499755859375, 3.64434814453125, 3.7889404296875, 3.93353271484375, 4.078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 7.0, 10.0, 7.0, 21.0, 12.0, 20.0, 28.0, 33.0, 35.0, 50.0, 58.0, 49.0, 48.0, 58.0, 55.0, 55.0, 56.0, 62.0, 53.0, 37.0, 47.0, 37.0, 33.0, 22.0, 19.0, 15.0, 12.0, 9.0, 9.0, 5.0, 11.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013265609741210938, -0.0012861639261245728, -0.0012457668781280518, -0.0012053698301315308, -0.0011649727821350098, -0.0011245757341384888, -0.0010841786861419678, -0.0010437816381454468, -0.0010033845901489258, -0.0009629875421524048, -0.0009225904941558838, -0.0008821934461593628, -0.0008417963981628418, -0.0008013993501663208, -0.0007610023021697998, -0.0007206052541732788, -0.0006802082061767578, -0.0006398111581802368, -0.0005994141101837158, -0.0005590170621871948, -0.0005186200141906738, -0.00047822296619415283, -0.00043782591819763184, -0.00039742887020111084, -0.00035703182220458984, -0.00031663477420806885, -0.00027623772621154785, -0.00023584067821502686, -0.00019544363021850586, -0.00015504658222198486, -0.00011464953422546387, -7.425248622894287e-05, -3.3855438232421875e-05, 6.541609764099121e-06, 4.693865776062012e-05, 8.733570575714111e-05, 0.0001277327537536621, 0.0001681298017501831, 0.0002085268497467041, 0.0002489238977432251, 0.0002893209457397461, 0.0003297179937362671, 0.0003701150417327881, 0.0004105120897293091, 0.0004509091377258301, 0.0004913061857223511, 0.0005317032337188721, 0.0005721002817153931, 0.0006124973297119141, 0.0006528943777084351, 0.0006932914257049561, 0.000733688473701477, 0.000774085521697998, 0.000814482569694519, 0.00085487961769104, 0.000895276665687561, 0.000935673713684082, 0.000976070761680603, 0.001016467809677124, 0.001056864857673645, 0.001097261905670166, 0.001137658953666687, 0.001178056001663208, 0.001218453049659729, 0.00125885009765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 7.0, 11.0, 20.0, 23.0, 31.0, 63.0, 95.0, 116.0, 158.0, 297.0, 444.0, 729.0, 1105.0, 2043.0, 3719.0, 6855.0, 14122.0, 31127.0, 74916.0, 181959.0, 321357.0, 233111.0, 98959.0, 40164.0, 17865.0, 8608.0, 4462.0, 2535.0, 1372.0, 835.0, 499.0, 315.0, 205.0, 137.0, 86.0, 60.0, 49.0, 30.0, 15.0, 15.0, 10.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.96875, -2.877838134765625, -2.78692626953125, -2.696014404296875, -2.6051025390625, -2.514190673828125, -2.42327880859375, -2.332366943359375, -2.241455078125, -2.150543212890625, -2.05963134765625, -1.968719482421875, -1.8778076171875, -1.786895751953125, -1.69598388671875, -1.605072021484375, -1.51416015625, -1.423248291015625, -1.33233642578125, -1.241424560546875, -1.1505126953125, -1.059600830078125, -0.96868896484375, -0.877777099609375, -0.786865234375, -0.695953369140625, -0.60504150390625, -0.514129638671875, -0.4232177734375, -0.332305908203125, -0.24139404296875, -0.150482177734375, -0.0595703125, 0.031341552734375, 0.12225341796875, 0.213165283203125, 0.3040771484375, 0.394989013671875, 0.48590087890625, 0.576812744140625, 0.667724609375, 0.758636474609375, 0.84954833984375, 0.940460205078125, 1.0313720703125, 1.122283935546875, 1.21319580078125, 1.304107666015625, 1.39501953125, 1.485931396484375, 1.57684326171875, 1.667755126953125, 1.7586669921875, 1.849578857421875, 1.94049072265625, 2.031402587890625, 2.122314453125, 2.213226318359375, 2.30413818359375, 2.395050048828125, 2.4859619140625, 2.576873779296875, 2.66778564453125, 2.758697509765625, 2.849609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 10.0, 3.0, 9.0, 10.0, 17.0, 13.0, 17.0, 23.0, 37.0, 42.0, 49.0, 47.0, 64.0, 65.0, 72.0, 75.0, 51.0, 83.0, 60.0, 55.0, 46.0, 34.0, 22.0, 21.0, 15.0, 14.0, 12.0, 8.0, 6.0, 4.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70654296875, -0.6806640625, -0.65478515625, -0.62890625, -0.60302734375, -0.5771484375, -0.55126953125, -0.525390625, -0.49951171875, -0.4736328125, -0.44775390625, -0.421875, -0.39599609375, -0.3701171875, -0.34423828125, -0.318359375, -0.29248046875, -0.2666015625, -0.24072265625, -0.21484375, -0.18896484375, -0.1630859375, -0.13720703125, -0.111328125, -0.08544921875, -0.0595703125, -0.03369140625, -0.0078125, 0.01806640625, 0.0439453125, 0.06982421875, 0.095703125, 0.12158203125, 0.1474609375, 0.17333984375, 0.19921875, 0.22509765625, 0.2509765625, 0.27685546875, 0.302734375, 0.32861328125, 0.3544921875, 0.38037109375, 0.40625, 0.43212890625, 0.4580078125, 0.48388671875, 0.509765625, 0.53564453125, 0.5615234375, 0.58740234375, 0.61328125, 0.63916015625, 0.6650390625, 0.69091796875, 0.716796875, 0.74267578125, 0.7685546875, 0.79443359375, 0.8203125, 0.84619140625, 0.8720703125, 0.89794921875, 0.923828125, 0.94970703125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 9.0, 9.0, 6.0, 10.0, 15.0, 13.0, 14.0, 21.0, 27.0, 25.0, 37.0, 33.0, 51.0, 58.0, 67.0, 46.0, 52.0, 52.0, 52.0, 47.0, 51.0, 44.0, 41.0, 42.0, 31.0, 37.0, 29.0, 16.0, 13.0, 9.0, 19.0, 12.0, 10.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.789351463317871, -9.416946411132812, -9.04454231262207, -8.672137260437012, -8.29973316192627, -7.927328109741211, -7.5549235343933105, -7.18251895904541, -6.81011438369751, -6.437709808349609, -6.065305233001709, -5.692900657653809, -5.32049560546875, -4.948091506958008, -4.575686454772949, -4.203281879425049, -3.8308773040771484, -3.458472728729248, -3.0860681533813477, -2.713663339614868, -2.3412587642669678, -1.9688541889190674, -1.596449375152588, -1.2240447998046875, -0.8516402244567871, -0.47923558950424194, -0.10683095455169678, 0.26557374000549316, 0.6379783153533936, 1.010382890701294, 1.3827877044677734, 1.7551922798156738, 2.127596855163574, 2.5000014305114746, 2.872406005859375, 3.2448108196258545, 3.617215394973755, 3.9896199703216553, 4.362024784088135, 4.734429359436035, 5.1068339347839355, 5.479238510131836, 5.851643085479736, 6.224047660827637, 6.596452713012695, 6.9688568115234375, 7.341261863708496, 7.7136664390563965, 8.086071014404297, 8.458476066589355, 8.830880165100098, 9.203285217285156, 9.575689315795898, 9.948094367980957, 10.320499420166016, 10.692903518676758, 11.0653076171875, 11.437712669372559, 11.8101167678833, 12.18252182006836, 12.554925918579102, 12.92733097076416, 13.299736022949219, 13.672140121459961, 14.04454517364502]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 9.0, 16.0, 19.0, 20.0, 21.0, 28.0, 19.0, 27.0, 21.0, 28.0, 42.0, 38.0, 49.0, 43.0, 47.0, 51.0, 34.0, 46.0, 47.0, 38.0, 41.0, 31.0, 26.0, 31.0, 36.0, 34.0, 18.0, 26.0, 19.0, 8.0, 15.0, 11.0, 6.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.787904739379883, -10.463221549987793, -10.138538360595703, -9.813854217529297, -9.489171028137207, -9.164487838745117, -8.839804649353027, -8.515121459960938, -8.190437316894531, -7.865754127502441, -7.541070461273193, -7.2163872718811035, -6.8917036056518555, -6.567020416259766, -6.242337226867676, -5.917654037475586, -5.592970848083496, -5.268287658691406, -4.943603992462158, -4.618920803070068, -4.29423713684082, -3.9695539474487305, -3.6448707580566406, -3.3201873302459717, -2.9955039024353027, -2.670820474624634, -2.346137046813965, -2.021453857421875, -1.696770429611206, -1.372087001800537, -1.0474036931991577, -0.7227203845977783, -0.3980369567871094, -0.0733535885810852, 0.25132977962493896, 0.5760131478309631, 0.9006965160369873, 1.2253799438476562, 1.5500632524490356, 1.874746561050415, 2.199429988861084, 2.524113416671753, 2.848796844482422, 3.1734800338745117, 3.4981634616851807, 3.8228468894958496, 4.1475300788879395, 4.4722137451171875, 4.796896934509277, 5.121580123901367, 5.446263790130615, 5.770946979522705, 6.095630645751953, 6.420313835144043, 6.744997024536133, 7.069680213928223, 7.394363880157471, 7.7190470695495605, 8.043730735778809, 8.368413925170898, 8.693097114562988, 9.017780303955078, 9.342464447021484, 9.667147636413574, 9.991830825805664]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 13.0, 23.0, 38.0, 54.0, 76.0, 146.0, 182.0, 326.0, 466.0, 691.0, 1153.0, 1808.0, 2867.0, 4422.0, 6990.0, 10721.0, 16147.0, 24058.0, 35048.0, 49565.0, 65757.0, 84277.0, 99188.0, 109937.0, 110102.0, 102551.0, 87354.0, 69541.0, 52162.0, 37454.0, 25869.0, 17263.0, 11519.0, 7543.0, 4810.0, 3006.0, 1967.0, 1288.0, 742.0, 511.0, 336.0, 212.0, 126.0, 101.0, 59.0, 28.0, 25.0, 15.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.359375, -6.16717529296875, -5.9749755859375, -5.78277587890625, -5.590576171875, -5.39837646484375, -5.2061767578125, -5.01397705078125, -4.82177734375, -4.62957763671875, -4.4373779296875, -4.24517822265625, -4.052978515625, -3.86077880859375, -3.6685791015625, -3.47637939453125, -3.2841796875, -3.09197998046875, -2.8997802734375, -2.70758056640625, -2.515380859375, -2.32318115234375, -2.1309814453125, -1.93878173828125, -1.74658203125, -1.55438232421875, -1.3621826171875, -1.16998291015625, -0.977783203125, -0.78558349609375, -0.5933837890625, -0.40118408203125, -0.208984375, -0.01678466796875, 0.1754150390625, 0.36761474609375, 0.559814453125, 0.75201416015625, 0.9442138671875, 1.13641357421875, 1.32861328125, 1.52081298828125, 1.7130126953125, 1.90521240234375, 2.097412109375, 2.28961181640625, 2.4818115234375, 2.67401123046875, 2.8662109375, 3.05841064453125, 3.2506103515625, 3.44281005859375, 3.635009765625, 3.82720947265625, 4.0194091796875, 4.21160888671875, 4.40380859375, 4.59600830078125, 4.7882080078125, 4.98040771484375, 5.172607421875, 5.36480712890625, 5.5570068359375, 5.74920654296875, 5.94140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 5.0, 4.0, 9.0, 12.0, 12.0, 21.0, 9.0, 19.0, 32.0, 18.0, 30.0, 30.0, 38.0, 31.0, 48.0, 37.0, 46.0, 41.0, 46.0, 42.0, 39.0, 36.0, 38.0, 33.0, 30.0, 24.0, 25.0, 26.0, 28.0, 25.0, 29.0, 27.0, 15.0, 14.0, 12.0, 9.0, 6.0, 9.0, 4.0, 12.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.8515625, -9.5567626953125, -9.261962890625, -8.9671630859375, -8.67236328125, -8.3775634765625, -8.082763671875, -7.7879638671875, -7.4931640625, -7.1983642578125, -6.903564453125, -6.6087646484375, -6.31396484375, -6.0191650390625, -5.724365234375, -5.4295654296875, -5.134765625, -4.8399658203125, -4.545166015625, -4.2503662109375, -3.95556640625, -3.6607666015625, -3.365966796875, -3.0711669921875, -2.7763671875, -2.4815673828125, -2.186767578125, -1.8919677734375, -1.59716796875, -1.3023681640625, -1.007568359375, -0.7127685546875, -0.41796875, -0.1231689453125, 0.171630859375, 0.4664306640625, 0.76123046875, 1.0560302734375, 1.350830078125, 1.6456298828125, 1.9404296875, 2.2352294921875, 2.530029296875, 2.8248291015625, 3.11962890625, 3.4144287109375, 3.709228515625, 4.0040283203125, 4.298828125, 4.5936279296875, 4.888427734375, 5.1832275390625, 5.47802734375, 5.7728271484375, 6.067626953125, 6.3624267578125, 6.6572265625, 6.9520263671875, 7.246826171875, 7.5416259765625, 7.83642578125, 8.1312255859375, 8.426025390625, 8.7208251953125, 9.015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 8.0, 7.0, 10.0, 9.0, 23.0, 36.0, 52.0, 56.0, 96.0, 160.0, 250.0, 322.0, 531.0, 832.0, 1199.0, 1691.0, 2713.0, 4170.0, 6474.0, 9912.0, 15452.0, 23686.0, 36142.0, 53371.0, 74994.0, 99222.0, 119587.0, 129089.0, 121343.0, 103201.0, 78259.0, 55802.0, 38022.0, 25296.0, 16414.0, 10529.0, 6719.0, 4466.0, 2863.0, 1910.0, 1241.0, 800.0, 525.0, 329.0, 242.0, 144.0, 125.0, 71.0, 58.0, 38.0, 22.0, 17.0, 13.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9801025390625, -7.710205078125, -7.4403076171875, -7.17041015625, -6.9005126953125, -6.630615234375, -6.3607177734375, -6.0908203125, -5.8209228515625, -5.551025390625, -5.2811279296875, -5.01123046875, -4.7413330078125, -4.471435546875, -4.2015380859375, -3.931640625, -3.6617431640625, -3.391845703125, -3.1219482421875, -2.85205078125, -2.5821533203125, -2.312255859375, -2.0423583984375, -1.7724609375, -1.5025634765625, -1.232666015625, -0.9627685546875, -0.69287109375, -0.4229736328125, -0.153076171875, 0.1168212890625, 0.38671875, 0.6566162109375, 0.926513671875, 1.1964111328125, 1.46630859375, 1.7362060546875, 2.006103515625, 2.2760009765625, 2.5458984375, 2.8157958984375, 3.085693359375, 3.3555908203125, 3.62548828125, 3.8953857421875, 4.165283203125, 4.4351806640625, 4.705078125, 4.9749755859375, 5.244873046875, 5.5147705078125, 5.78466796875, 6.0545654296875, 6.324462890625, 6.5943603515625, 6.8642578125, 7.1341552734375, 7.404052734375, 7.6739501953125, 7.94384765625, 8.2137451171875, 8.483642578125, 8.7535400390625, 9.0234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 4.0, 8.0, 4.0, 14.0, 12.0, 19.0, 15.0, 21.0, 25.0, 27.0, 23.0, 35.0, 39.0, 37.0, 36.0, 40.0, 40.0, 48.0, 47.0, 48.0, 37.0, 37.0, 39.0, 29.0, 33.0, 31.0, 32.0, 23.0, 29.0, 28.0, 25.0, 13.0, 15.0, 15.0, 14.0, 8.0, 7.0, 3.0, 6.0, 3.0, 6.0, 2.0, 2.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.17578125, -6.95892333984375, -6.7420654296875, -6.52520751953125, -6.308349609375, -6.09149169921875, -5.8746337890625, -5.65777587890625, -5.44091796875, -5.22406005859375, -5.0072021484375, -4.79034423828125, -4.573486328125, -4.35662841796875, -4.1397705078125, -3.92291259765625, -3.7060546875, -3.48919677734375, -3.2723388671875, -3.05548095703125, -2.838623046875, -2.62176513671875, -2.4049072265625, -2.18804931640625, -1.97119140625, -1.75433349609375, -1.5374755859375, -1.32061767578125, -1.103759765625, -0.88690185546875, -0.6700439453125, -0.45318603515625, -0.236328125, -0.01947021484375, 0.1973876953125, 0.41424560546875, 0.631103515625, 0.84796142578125, 1.0648193359375, 1.28167724609375, 1.49853515625, 1.71539306640625, 1.9322509765625, 2.14910888671875, 2.365966796875, 2.58282470703125, 2.7996826171875, 3.01654052734375, 3.2333984375, 3.45025634765625, 3.6671142578125, 3.88397216796875, 4.100830078125, 4.31768798828125, 4.5345458984375, 4.75140380859375, 4.96826171875, 5.18511962890625, 5.4019775390625, 5.61883544921875, 5.835693359375, 6.05255126953125, 6.2694091796875, 6.48626708984375, 6.703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 9.0, 24.0, 18.0, 24.0, 45.0, 57.0, 104.0, 173.0, 263.0, 362.0, 633.0, 957.0, 1437.0, 2125.0, 3449.0, 5331.0, 8347.0, 12807.0, 19903.0, 31727.0, 49356.0, 77126.0, 112294.0, 145943.0, 156466.0, 136210.0, 99251.0, 66285.0, 42574.0, 26920.0, 17139.0, 11033.0, 7133.0, 4631.0, 2966.0, 1955.0, 1228.0, 798.0, 490.0, 342.0, 225.0, 140.0, 78.0, 66.0, 32.0, 34.0, 11.0, 13.0, 3.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-4.65625, -4.51654052734375, -4.3768310546875, -4.23712158203125, -4.097412109375, -3.95770263671875, -3.8179931640625, -3.67828369140625, -3.53857421875, -3.39886474609375, -3.2591552734375, -3.11944580078125, -2.979736328125, -2.84002685546875, -2.7003173828125, -2.56060791015625, -2.4208984375, -2.28118896484375, -2.1414794921875, -2.00177001953125, -1.862060546875, -1.72235107421875, -1.5826416015625, -1.44293212890625, -1.30322265625, -1.16351318359375, -1.0238037109375, -0.88409423828125, -0.744384765625, -0.60467529296875, -0.4649658203125, -0.32525634765625, -0.185546875, -0.04583740234375, 0.0938720703125, 0.23358154296875, 0.373291015625, 0.51300048828125, 0.6527099609375, 0.79241943359375, 0.93212890625, 1.07183837890625, 1.2115478515625, 1.35125732421875, 1.490966796875, 1.63067626953125, 1.7703857421875, 1.91009521484375, 2.0498046875, 2.18951416015625, 2.3292236328125, 2.46893310546875, 2.608642578125, 2.74835205078125, 2.8880615234375, 3.02777099609375, 3.16748046875, 3.30718994140625, 3.4468994140625, 3.58660888671875, 3.726318359375, 3.86602783203125, 4.0057373046875, 4.14544677734375, 4.28515625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 6.0, 5.0, 14.0, 15.0, 18.0, 20.0, 26.0, 42.0, 45.0, 80.0, 62.0, 68.0, 81.0, 97.0, 71.0, 60.0, 48.0, 36.0, 32.0, 31.0, 31.0, 18.0, 13.0, 12.0, 12.0, 15.0, 13.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005578994750976562, -0.0005384758114814758, -0.0005190521478652954, -0.000499628484249115, -0.00048020482063293457, -0.00046078115701675415, -0.00044135749340057373, -0.0004219338297843933, -0.0004025101661682129, -0.00038308650255203247, -0.00036366283893585205, -0.00034423917531967163, -0.0003248155117034912, -0.0003053918480873108, -0.00028596818447113037, -0.00026654452085494995, -0.00024712085723876953, -0.0002276971936225891, -0.0002082735300064087, -0.00018884986639022827, -0.00016942620277404785, -0.00015000253915786743, -0.000130578875541687, -0.00011115521192550659, -9.173154830932617e-05, -7.230788469314575e-05, -5.288422107696533e-05, -3.346055746078491e-05, -1.4036893844604492e-05, 5.386769771575928e-06, 2.4810433387756348e-05, 4.423409700393677e-05, 6.365776062011719e-05, 8.308142423629761e-05, 0.00010250508785247803, 0.00012192875146865845, 0.00014135241508483887, 0.0001607760787010193, 0.0001801997423171997, 0.00019962340593338013, 0.00021904706954956055, 0.00023847073316574097, 0.0002578943967819214, 0.0002773180603981018, 0.0002967417240142822, 0.00031616538763046265, 0.00033558905124664307, 0.0003550127148628235, 0.0003744363784790039, 0.0003938600420951843, 0.00041328370571136475, 0.00043270736932754517, 0.0004521310329437256, 0.000471554696559906, 0.0004909783601760864, 0.0005104020237922668, 0.0005298256874084473, 0.0005492493510246277, 0.0005686730146408081, 0.0005880966782569885, 0.0006075203418731689, 0.0006269440054893494, 0.0006463676691055298, 0.0006657913327217102, 0.0006852149963378906]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 15.0, 16.0, 17.0, 30.0, 36.0, 51.0, 88.0, 99.0, 190.0, 247.0, 353.0, 545.0, 760.0, 1162.0, 1751.0, 2716.0, 4096.0, 6329.0, 9998.0, 16070.0, 25856.0, 42648.0, 70061.0, 108371.0, 152258.0, 171997.0, 149897.0, 105622.0, 67408.0, 41385.0, 25118.0, 15770.0, 9772.0, 6159.0, 3894.0, 2598.0, 1612.0, 1098.0, 775.0, 532.0, 373.0, 240.0, 189.0, 104.0, 63.0, 59.0, 31.0, 43.0, 21.0, 9.0, 9.0, 9.0, 3.0, 3.0, 4.0], "bins": [-5.8125, -5.64385986328125, -5.4752197265625, -5.30657958984375, -5.137939453125, -4.96929931640625, -4.8006591796875, -4.63201904296875, -4.46337890625, -4.29473876953125, -4.1260986328125, -3.95745849609375, -3.788818359375, -3.62017822265625, -3.4515380859375, -3.28289794921875, -3.1142578125, -2.94561767578125, -2.7769775390625, -2.60833740234375, -2.439697265625, -2.27105712890625, -2.1024169921875, -1.93377685546875, -1.76513671875, -1.59649658203125, -1.4278564453125, -1.25921630859375, -1.090576171875, -0.92193603515625, -0.7532958984375, -0.58465576171875, -0.416015625, -0.24737548828125, -0.0787353515625, 0.08990478515625, 0.258544921875, 0.42718505859375, 0.5958251953125, 0.76446533203125, 0.93310546875, 1.10174560546875, 1.2703857421875, 1.43902587890625, 1.607666015625, 1.77630615234375, 1.9449462890625, 2.11358642578125, 2.2822265625, 2.45086669921875, 2.6195068359375, 2.78814697265625, 2.956787109375, 3.12542724609375, 3.2940673828125, 3.46270751953125, 3.63134765625, 3.79998779296875, 3.9686279296875, 4.13726806640625, 4.305908203125, 4.47454833984375, 4.6431884765625, 4.81182861328125, 4.98046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 6.0, 6.0, 14.0, 14.0, 11.0, 14.0, 7.0, 14.0, 28.0, 18.0, 23.0, 38.0, 52.0, 46.0, 46.0, 47.0, 50.0, 46.0, 51.0, 56.0, 54.0, 41.0, 39.0, 44.0, 41.0, 31.0, 23.0, 25.0, 23.0, 24.0, 11.0, 10.0, 6.0, 10.0, 3.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.76953125, -1.7042236328125, -1.638916015625, -1.5736083984375, -1.50830078125, -1.4429931640625, -1.377685546875, -1.3123779296875, -1.2470703125, -1.1817626953125, -1.116455078125, -1.0511474609375, -0.98583984375, -0.9205322265625, -0.855224609375, -0.7899169921875, -0.724609375, -0.6593017578125, -0.593994140625, -0.5286865234375, -0.46337890625, -0.3980712890625, -0.332763671875, -0.2674560546875, -0.2021484375, -0.1368408203125, -0.071533203125, -0.0062255859375, 0.05908203125, 0.1243896484375, 0.189697265625, 0.2550048828125, 0.3203125, 0.3856201171875, 0.450927734375, 0.5162353515625, 0.58154296875, 0.6468505859375, 0.712158203125, 0.7774658203125, 0.8427734375, 0.9080810546875, 0.973388671875, 1.0386962890625, 1.10400390625, 1.1693115234375, 1.234619140625, 1.2999267578125, 1.365234375, 1.4305419921875, 1.495849609375, 1.5611572265625, 1.62646484375, 1.6917724609375, 1.757080078125, 1.8223876953125, 1.8876953125, 1.9530029296875, 2.018310546875, 2.0836181640625, 2.14892578125, 2.2142333984375, 2.279541015625, 2.3448486328125, 2.41015625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 11.0, 12.0, 17.0, 25.0, 33.0, 34.0, 32.0, 42.0, 44.0, 56.0, 51.0, 49.0, 53.0, 64.0, 68.0, 57.0, 42.0, 44.0, 51.0, 36.0, 33.0, 27.0, 27.0, 20.0, 11.0, 10.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.38864517211914, -7.9964165687561035, -7.604187965393066, -7.211959362030029, -6.819730758666992, -6.427502155303955, -6.035273551940918, -5.643044471740723, -5.250816345214844, -4.858587741851807, -4.4663591384887695, -4.074130535125732, -3.6819019317626953, -3.289673328399658, -2.897444486618042, -2.505215883255005, -2.1129870414733887, -1.7207584381103516, -1.3285298347473145, -0.9363011121749878, -0.5440725088119507, -0.15184390544891357, 0.24038481712341309, 0.6326134204864502, 1.0248420238494873, 1.4170706272125244, 1.8092992305755615, 2.2015280723571777, 2.593756675720215, 2.985985279083252, 3.378213882446289, 3.770442485809326, 4.162671089172363, 4.5548996925354, 4.9471282958984375, 5.339356899261475, 5.731585502624512, 6.123814105987549, 6.516042709350586, 6.908271789550781, 7.30049991607666, 7.692728519439697, 8.084957122802734, 8.47718620300293, 8.869414329528809, 9.261643409729004, 9.653871536254883, 10.046100616455078, 10.438329696655273, 10.830558776855469, 11.222786903381348, 11.615015983581543, 12.007244110107422, 12.399473190307617, 12.791701316833496, 13.183930397033691, 13.57615852355957, 13.968387603759766, 14.360615730285645, 14.75284481048584, 15.145072937011719, 15.537302017211914, 15.929530143737793, 16.321758270263672, 16.713987350463867]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 14.0, 11.0, 16.0, 16.0, 28.0, 28.0, 21.0, 36.0, 26.0, 41.0, 38.0, 49.0, 39.0, 44.0, 47.0, 47.0, 55.0, 32.0, 49.0, 37.0, 40.0, 41.0, 36.0, 23.0, 29.0, 29.0, 22.0, 17.0, 13.0, 14.0, 10.0, 10.0, 5.0, 10.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.59898567199707, -11.231043815612793, -10.863101959228516, -10.495159149169922, -10.127217292785645, -9.759275436401367, -9.39133358001709, -9.023391723632812, -8.655449867248535, -8.287508010864258, -7.919565677642822, -7.551623821258545, -7.183681964874268, -6.815739631652832, -6.447797775268555, -6.079855918884277, -5.711913585662842, -5.3439717292785645, -4.976029396057129, -4.608087539672852, -4.240145683288574, -3.8722035884857178, -3.5042614936828613, -3.136319637298584, -2.7683775424957275, -2.400435447692871, -2.0324935913085938, -1.6645514965057373, -1.2966095209121704, -0.9286675453186035, -0.5607254505157471, -0.19278359413146973, 0.17515850067138672, 0.5431004762649536, 0.9110425114631653, 1.278984546661377, 1.6469265222549438, 2.0148684978485107, 2.382810592651367, 2.7507524490356445, 3.118694543838501, 3.4866366386413574, 3.8545784950256348, 4.22252082824707, 4.590462684631348, 4.958404541015625, 5.326346397399902, 5.69428825378418, 6.062230587005615, 6.430172443389893, 6.798114776611328, 7.1660566329956055, 7.533998489379883, 7.90194034576416, 8.269882202148438, 8.637825012207031, 9.005766868591309, 9.373708724975586, 9.741650581359863, 10.10959243774414, 10.477535247802734, 10.845477104187012, 11.213418960571289, 11.581360816955566, 11.949302673339844]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 13.0, 7.0, 14.0, 20.0, 30.0, 54.0, 89.0, 114.0, 165.0, 250.0, 384.0, 594.0, 1021.0, 1574.0, 2620.0, 4481.0, 7696.0, 13547.0, 25263.0, 48214.0, 92232.0, 178246.0, 330586.0, 536348.0, 723246.0, 755217.0, 609392.0, 394940.0, 220464.0, 115479.0, 60406.0, 31507.0, 16925.0, 9416.0, 5381.0, 3310.0, 1897.0, 1129.0, 709.0, 462.0, 296.0, 206.0, 125.0, 81.0, 54.0, 24.0, 22.0, 15.0, 9.0, 6.0, 5.0, 1.0, 0.0, 2.0], "bins": [-8.9765625, -8.7213134765625, -8.466064453125, -8.2108154296875, -7.95556640625, -7.7003173828125, -7.445068359375, -7.1898193359375, -6.9345703125, -6.6793212890625, -6.424072265625, -6.1688232421875, -5.91357421875, -5.6583251953125, -5.403076171875, -5.1478271484375, -4.892578125, -4.6373291015625, -4.382080078125, -4.1268310546875, -3.87158203125, -3.6163330078125, -3.361083984375, -3.1058349609375, -2.8505859375, -2.5953369140625, -2.340087890625, -2.0848388671875, -1.82958984375, -1.5743408203125, -1.319091796875, -1.0638427734375, -0.80859375, -0.5533447265625, -0.298095703125, -0.0428466796875, 0.21240234375, 0.4676513671875, 0.722900390625, 0.9781494140625, 1.2333984375, 1.4886474609375, 1.743896484375, 1.9991455078125, 2.25439453125, 2.5096435546875, 2.764892578125, 3.0201416015625, 3.275390625, 3.5306396484375, 3.785888671875, 4.0411376953125, 4.29638671875, 4.5516357421875, 4.806884765625, 5.0621337890625, 5.3173828125, 5.5726318359375, 5.827880859375, 6.0831298828125, 6.33837890625, 6.5936279296875, 6.848876953125, 7.1041259765625, 7.359375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 7.0, 7.0, 12.0, 13.0, 12.0, 18.0, 18.0, 20.0, 23.0, 21.0, 27.0, 30.0, 42.0, 38.0, 45.0, 39.0, 58.0, 42.0, 40.0, 36.0, 56.0, 36.0, 50.0, 35.0, 38.0, 30.0, 32.0, 29.0, 19.0, 14.0, 20.0, 21.0, 13.0, 12.0, 15.0, 7.0, 11.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8089599609375, -8.500732421875, -8.1925048828125, -7.88427734375, -7.5760498046875, -7.267822265625, -6.9595947265625, -6.6513671875, -6.3431396484375, -6.034912109375, -5.7266845703125, -5.41845703125, -5.1102294921875, -4.802001953125, -4.4937744140625, -4.185546875, -3.8773193359375, -3.569091796875, -3.2608642578125, -2.95263671875, -2.6444091796875, -2.336181640625, -2.0279541015625, -1.7197265625, -1.4114990234375, -1.103271484375, -0.7950439453125, -0.48681640625, -0.1785888671875, 0.129638671875, 0.4378662109375, 0.74609375, 1.0543212890625, 1.362548828125, 1.6707763671875, 1.97900390625, 2.2872314453125, 2.595458984375, 2.9036865234375, 3.2119140625, 3.5201416015625, 3.828369140625, 4.1365966796875, 4.44482421875, 4.7530517578125, 5.061279296875, 5.3695068359375, 5.677734375, 5.9859619140625, 6.294189453125, 6.6024169921875, 6.91064453125, 7.2188720703125, 7.527099609375, 7.8353271484375, 8.1435546875, 8.4517822265625, 8.760009765625, 9.0682373046875, 9.37646484375, 9.6846923828125, 9.992919921875, 10.3011474609375, 10.609375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 9.0, 13.0, 21.0, 28.0, 46.0, 80.0, 109.0, 136.0, 235.0, 335.0, 520.0, 877.0, 1376.0, 2082.0, 3232.0, 5265.0, 8706.0, 14135.0, 23544.0, 39171.0, 65566.0, 108370.0, 175605.0, 275672.0, 410085.0, 547963.0, 626124.0, 583722.0, 456263.0, 318524.0, 204244.0, 127337.0, 76996.0, 46396.0, 28045.0, 16766.0, 10086.0, 6180.0, 3781.0, 2389.0, 1472.0, 968.0, 597.0, 394.0, 314.0, 173.0, 113.0, 78.0, 58.0, 32.0, 17.0, 10.0, 6.0, 8.0, 8.0, 4.0, 2.0], "bins": [-8.6171875, -8.3612060546875, -8.105224609375, -7.8492431640625, -7.59326171875, -7.3372802734375, -7.081298828125, -6.8253173828125, -6.5693359375, -6.3133544921875, -6.057373046875, -5.8013916015625, -5.54541015625, -5.2894287109375, -5.033447265625, -4.7774658203125, -4.521484375, -4.2655029296875, -4.009521484375, -3.7535400390625, -3.49755859375, -3.2415771484375, -2.985595703125, -2.7296142578125, -2.4736328125, -2.2176513671875, -1.961669921875, -1.7056884765625, -1.44970703125, -1.1937255859375, -0.937744140625, -0.6817626953125, -0.42578125, -0.1697998046875, 0.086181640625, 0.3421630859375, 0.59814453125, 0.8541259765625, 1.110107421875, 1.3660888671875, 1.6220703125, 1.8780517578125, 2.134033203125, 2.3900146484375, 2.64599609375, 2.9019775390625, 3.157958984375, 3.4139404296875, 3.669921875, 3.9259033203125, 4.181884765625, 4.4378662109375, 4.69384765625, 4.9498291015625, 5.205810546875, 5.4617919921875, 5.7177734375, 5.9737548828125, 6.229736328125, 6.4857177734375, 6.74169921875, 6.9976806640625, 7.253662109375, 7.5096435546875, 7.765625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 12.0, 15.0, 12.0, 16.0, 25.0, 30.0, 38.0, 34.0, 59.0, 48.0, 75.0, 87.0, 105.0, 121.0, 142.0, 169.0, 186.0, 164.0, 220.0, 191.0, 235.0, 198.0, 222.0, 224.0, 211.0, 179.0, 177.0, 150.0, 128.0, 98.0, 105.0, 81.0, 57.0, 59.0, 38.0, 38.0, 27.0, 17.0, 21.0, 10.0, 12.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.650390625, -3.540435791015625, -3.43048095703125, -3.320526123046875, -3.2105712890625, -3.100616455078125, -2.99066162109375, -2.880706787109375, -2.770751953125, -2.660797119140625, -2.55084228515625, -2.440887451171875, -2.3309326171875, -2.220977783203125, -2.11102294921875, -2.001068115234375, -1.89111328125, -1.781158447265625, -1.67120361328125, -1.561248779296875, -1.4512939453125, -1.341339111328125, -1.23138427734375, -1.121429443359375, -1.011474609375, -0.901519775390625, -0.79156494140625, -0.681610107421875, -0.5716552734375, -0.461700439453125, -0.35174560546875, -0.241790771484375, -0.1318359375, -0.021881103515625, 0.08807373046875, 0.198028564453125, 0.3079833984375, 0.417938232421875, 0.52789306640625, 0.637847900390625, 0.747802734375, 0.857757568359375, 0.96771240234375, 1.077667236328125, 1.1876220703125, 1.297576904296875, 1.40753173828125, 1.517486572265625, 1.62744140625, 1.737396240234375, 1.84735107421875, 1.957305908203125, 2.0672607421875, 2.177215576171875, 2.28717041015625, 2.397125244140625, 2.507080078125, 2.617034912109375, 2.72698974609375, 2.836944580078125, 2.9468994140625, 3.056854248046875, 3.16680908203125, 3.276763916015625, 3.38671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 3.0, 8.0, 15.0, 12.0, 19.0, 27.0, 18.0, 41.0, 31.0, 39.0, 31.0, 44.0, 53.0, 54.0, 49.0, 39.0, 44.0, 53.0, 44.0, 45.0, 42.0, 42.0, 39.0, 30.0, 33.0, 21.0, 19.0, 23.0, 10.0, 12.0, 14.0, 6.0, 8.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.66849422454834, -10.346779823303223, -10.025064468383789, -9.703350067138672, -9.381634712219238, -9.059920310974121, -8.738204956054688, -8.41649055480957, -8.094776153564453, -7.773061275482178, -7.451346397399902, -7.129631519317627, -6.807916641235352, -6.486202239990234, -6.164487361907959, -5.842772483825684, -5.52105712890625, -5.199342250823975, -4.877627372741699, -4.555912494659424, -4.234197616577148, -3.912482976913452, -3.590768337249756, -3.2690534591674805, -2.947338581085205, -2.6256237030029297, -2.3039088249206543, -1.982194185256958, -1.6604793071746826, -1.3387644290924072, -1.0170496702194214, -0.6953349113464355, -0.37362003326416016, -0.05190521478652954, 0.2698096036911011, 0.5915244221687317, 0.9132392406463623, 1.2349541187286377, 1.5566688776016235, 1.8783836364746094, 2.2000985145568848, 2.52181339263916, 2.8435282707214355, 3.165242910385132, 3.4869577884674072, 3.8086726665496826, 4.130387306213379, 4.452102184295654, 4.77381706237793, 5.095531940460205, 5.4172468185424805, 5.738961696624756, 6.060676574707031, 6.382390975952148, 6.704105854034424, 7.025820732116699, 7.347535610198975, 7.66925048828125, 7.990965366363525, 8.3126802444458, 8.634394645690918, 8.956110000610352, 9.277824401855469, 9.599538803100586, 9.92125415802002]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 11.0, 11.0, 8.0, 11.0, 8.0, 18.0, 12.0, 17.0, 22.0, 34.0, 26.0, 33.0, 33.0, 30.0, 39.0, 45.0, 45.0, 39.0, 49.0, 51.0, 50.0, 44.0, 44.0, 32.0, 43.0, 31.0, 20.0, 28.0, 24.0, 22.0, 26.0, 20.0, 17.0, 9.0, 14.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.460762977600098, -9.125123977661133, -8.789485931396484, -8.45384693145752, -8.118207931518555, -7.782569408416748, -7.446930885314941, -7.111291885375977, -6.77565336227417, -6.440014839172363, -6.104375839233398, -5.768737316131592, -5.433098793029785, -5.09745979309082, -4.761821269989014, -4.426182746887207, -4.090543746948242, -3.7549049854278564, -3.4192662239074707, -3.083627700805664, -2.7479889392852783, -2.4123501777648926, -2.076711654663086, -1.7410728931427002, -1.4054341316223145, -1.0697953701019287, -0.7341567277908325, -0.39851808547973633, -0.06287932395935059, 0.27275943756103516, 0.6083979606628418, 0.9440367221832275, 1.2796764373779297, 1.6153151988983154, 1.9509538412094116, 2.286592483520508, 2.6222312450408936, 2.9578700065612793, 3.293508529663086, 3.6291472911834717, 3.9647860527038574, 4.300424575805664, 4.636063575744629, 4.9717020988464355, 5.307340621948242, 5.642979621887207, 5.978618144989014, 6.31425666809082, 6.649895668029785, 6.985534191131592, 7.321173191070557, 7.656811714172363, 7.992450714111328, 8.328088760375977, 8.663727760314941, 8.999366760253906, 9.335004806518555, 9.67064380645752, 10.006281852722168, 10.341920852661133, 10.677559852600098, 11.013198852539062, 11.348836898803711, 11.684475898742676, 12.02011489868164]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 12.0, 8.0, 13.0, 20.0, 40.0, 56.0, 67.0, 138.0, 216.0, 317.0, 534.0, 844.0, 1358.0, 2291.0, 3998.0, 6882.0, 12203.0, 20733.0, 35510.0, 58529.0, 91497.0, 129459.0, 155841.0, 156909.0, 130666.0, 92870.0, 60119.0, 36589.0, 21319.0, 12128.0, 7078.0, 4230.0, 2333.0, 1389.0, 879.0, 552.0, 328.0, 212.0, 144.0, 75.0, 61.0, 43.0, 24.0, 8.0, 14.0, 6.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.484375, -5.29541015625, -5.1064453125, -4.91748046875, -4.728515625, -4.53955078125, -4.3505859375, -4.16162109375, -3.97265625, -3.78369140625, -3.5947265625, -3.40576171875, -3.216796875, -3.02783203125, -2.8388671875, -2.64990234375, -2.4609375, -2.27197265625, -2.0830078125, -1.89404296875, -1.705078125, -1.51611328125, -1.3271484375, -1.13818359375, -0.94921875, -0.76025390625, -0.5712890625, -0.38232421875, -0.193359375, -0.00439453125, 0.1845703125, 0.37353515625, 0.5625, 0.75146484375, 0.9404296875, 1.12939453125, 1.318359375, 1.50732421875, 1.6962890625, 1.88525390625, 2.07421875, 2.26318359375, 2.4521484375, 2.64111328125, 2.830078125, 3.01904296875, 3.2080078125, 3.39697265625, 3.5859375, 3.77490234375, 3.9638671875, 4.15283203125, 4.341796875, 4.53076171875, 4.7197265625, 4.90869140625, 5.09765625, 5.28662109375, 5.4755859375, 5.66455078125, 5.853515625, 6.04248046875, 6.2314453125, 6.42041015625, 6.609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 11.0, 6.0, 7.0, 12.0, 12.0, 11.0, 14.0, 19.0, 21.0, 23.0, 33.0, 27.0, 29.0, 28.0, 29.0, 41.0, 37.0, 39.0, 39.0, 38.0, 55.0, 43.0, 26.0, 43.0, 35.0, 36.0, 38.0, 28.0, 20.0, 20.0, 20.0, 20.0, 18.0, 20.0, 24.0, 16.0, 14.0, 6.0, 10.0, 9.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.2425537109375, -6.938232421875, -6.6339111328125, -6.32958984375, -6.0252685546875, -5.720947265625, -5.4166259765625, -5.1123046875, -4.8079833984375, -4.503662109375, -4.1993408203125, -3.89501953125, -3.5906982421875, -3.286376953125, -2.9820556640625, -2.677734375, -2.3734130859375, -2.069091796875, -1.7647705078125, -1.46044921875, -1.1561279296875, -0.851806640625, -0.5474853515625, -0.2431640625, 0.0611572265625, 0.365478515625, 0.6697998046875, 0.97412109375, 1.2784423828125, 1.582763671875, 1.8870849609375, 2.19140625, 2.4957275390625, 2.800048828125, 3.1043701171875, 3.40869140625, 3.7130126953125, 4.017333984375, 4.3216552734375, 4.6259765625, 4.9302978515625, 5.234619140625, 5.5389404296875, 5.84326171875, 6.1475830078125, 6.451904296875, 6.7562255859375, 7.060546875, 7.3648681640625, 7.669189453125, 7.9735107421875, 8.27783203125, 8.5821533203125, 8.886474609375, 9.1907958984375, 9.4951171875, 9.7994384765625, 10.103759765625, 10.4080810546875, 10.71240234375, 11.0167236328125, 11.321044921875, 11.6253662109375, 11.9296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 7.0, 12.0, 12.0, 20.0, 21.0, 43.0, 51.0, 87.0, 141.0, 255.0, 432.0, 790.0, 1483.0, 2777.0, 5493.0, 10489.0, 20041.0, 44070.0, 705992.0, 194440.0, 29982.0, 15254.0, 7847.0, 4014.0, 2220.0, 1124.0, 601.0, 321.0, 186.0, 102.0, 84.0, 45.0, 22.0, 22.0, 14.0, 16.0, 12.0, 4.0, 9.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.875, -13.42431640625, -12.9736328125, -12.52294921875, -12.072265625, -11.62158203125, -11.1708984375, -10.72021484375, -10.26953125, -9.81884765625, -9.3681640625, -8.91748046875, -8.466796875, -8.01611328125, -7.5654296875, -7.11474609375, -6.6640625, -6.21337890625, -5.7626953125, -5.31201171875, -4.861328125, -4.41064453125, -3.9599609375, -3.50927734375, -3.05859375, -2.60791015625, -2.1572265625, -1.70654296875, -1.255859375, -0.80517578125, -0.3544921875, 0.09619140625, 0.546875, 0.99755859375, 1.4482421875, 1.89892578125, 2.349609375, 2.80029296875, 3.2509765625, 3.70166015625, 4.15234375, 4.60302734375, 5.0537109375, 5.50439453125, 5.955078125, 6.40576171875, 6.8564453125, 7.30712890625, 7.7578125, 8.20849609375, 8.6591796875, 9.10986328125, 9.560546875, 10.01123046875, 10.4619140625, 10.91259765625, 11.36328125, 11.81396484375, 12.2646484375, 12.71533203125, 13.166015625, 13.61669921875, 14.0673828125, 14.51806640625, 14.96875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 5.0, 13.0, 10.0, 16.0, 14.0, 22.0, 27.0, 26.0, 33.0, 32.0, 32.0, 34.0, 26.0, 36.0, 47.0, 61.0, 47.0, 47.0, 43.0, 43.0, 30.0, 41.0, 43.0, 40.0, 28.0, 30.0, 20.0, 26.0, 18.0, 19.0, 18.0, 13.0, 10.0, 11.0, 3.0, 11.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-11.34375, -11.0345458984375, -10.725341796875, -10.4161376953125, -10.10693359375, -9.7977294921875, -9.488525390625, -9.1793212890625, -8.8701171875, -8.5609130859375, -8.251708984375, -7.9425048828125, -7.63330078125, -7.3240966796875, -7.014892578125, -6.7056884765625, -6.396484375, -6.0872802734375, -5.778076171875, -5.4688720703125, -5.15966796875, -4.8504638671875, -4.541259765625, -4.2320556640625, -3.9228515625, -3.6136474609375, -3.304443359375, -2.9952392578125, -2.68603515625, -2.3768310546875, -2.067626953125, -1.7584228515625, -1.44921875, -1.1400146484375, -0.830810546875, -0.5216064453125, -0.21240234375, 0.0968017578125, 0.406005859375, 0.7152099609375, 1.0244140625, 1.3336181640625, 1.642822265625, 1.9520263671875, 2.26123046875, 2.5704345703125, 2.879638671875, 3.1888427734375, 3.498046875, 3.8072509765625, 4.116455078125, 4.4256591796875, 4.73486328125, 5.0440673828125, 5.353271484375, 5.6624755859375, 5.9716796875, 6.2808837890625, 6.590087890625, 6.8992919921875, 7.20849609375, 7.5177001953125, 7.826904296875, 8.1361083984375, 8.4453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 11.0, 3.0, 15.0, 11.0, 21.0, 32.0, 23.0, 42.0, 54.0, 74.0, 97.0, 126.0, 161.0, 261.0, 318.0, 528.0, 847.0, 1409.0, 2414.0, 4162.0, 7783.0, 15849.0, 41118.0, 583907.0, 324797.0, 33507.0, 14118.0, 7060.0, 3807.0, 2202.0, 1234.0, 820.0, 515.0, 358.0, 228.0, 158.0, 116.0, 90.0, 55.0, 51.0, 44.0, 34.0, 22.0, 15.0, 17.0, 12.0, 6.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.431640625, -2.357757568359375, -2.28387451171875, -2.209991455078125, -2.1361083984375, -2.062225341796875, -1.98834228515625, -1.914459228515625, -1.840576171875, -1.766693115234375, -1.69281005859375, -1.618927001953125, -1.5450439453125, -1.471160888671875, -1.39727783203125, -1.323394775390625, -1.24951171875, -1.175628662109375, -1.10174560546875, -1.027862548828125, -0.9539794921875, -0.880096435546875, -0.80621337890625, -0.732330322265625, -0.658447265625, -0.584564208984375, -0.51068115234375, -0.436798095703125, -0.3629150390625, -0.289031982421875, -0.21514892578125, -0.141265869140625, -0.0673828125, 0.006500244140625, 0.08038330078125, 0.154266357421875, 0.2281494140625, 0.302032470703125, 0.37591552734375, 0.449798583984375, 0.523681640625, 0.597564697265625, 0.67144775390625, 0.745330810546875, 0.8192138671875, 0.893096923828125, 0.96697998046875, 1.040863037109375, 1.11474609375, 1.188629150390625, 1.26251220703125, 1.336395263671875, 1.4102783203125, 1.484161376953125, 1.55804443359375, 1.631927490234375, 1.705810546875, 1.779693603515625, 1.85357666015625, 1.927459716796875, 2.0013427734375, 2.075225830078125, 2.14910888671875, 2.222991943359375, 2.296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 15.0, 19.0, 25.0, 42.0, 65.0, 84.0, 124.0, 136.0, 136.0, 111.0, 63.0, 49.0, 37.0, 29.0, 11.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0012292861938476562, -0.0011974573135375977, -0.001165628433227539, -0.0011337995529174805, -0.0011019706726074219, -0.0010701417922973633, -0.0010383129119873047, -0.001006484031677246, -0.0009746551513671875, -0.0009428262710571289, -0.0009109973907470703, -0.0008791685104370117, -0.0008473396301269531, -0.0008155107498168945, -0.0007836818695068359, -0.0007518529891967773, -0.0007200241088867188, -0.0006881952285766602, -0.0006563663482666016, -0.000624537467956543, -0.0005927085876464844, -0.0005608797073364258, -0.0005290508270263672, -0.0004972219467163086, -0.00046539306640625, -0.0004335641860961914, -0.0004017353057861328, -0.0003699064254760742, -0.0003380775451660156, -0.00030624866485595703, -0.00027441978454589844, -0.00024259090423583984, -0.00021076202392578125, -0.00017893314361572266, -0.00014710426330566406, -0.00011527538299560547, -8.344650268554688e-05, -5.161762237548828e-05, -1.9788742065429688e-05, 1.2040138244628906e-05, 4.38690185546875e-05, 7.56978988647461e-05, 0.00010752677917480469, 0.00013935565948486328, 0.00017118453979492188, 0.00020301342010498047, 0.00023484230041503906, 0.00026667118072509766, 0.00029850006103515625, 0.00033032894134521484, 0.00036215782165527344, 0.00039398670196533203, 0.0004258155822753906, 0.0004576444625854492, 0.0004894733428955078, 0.0005213022232055664, 0.000553131103515625, 0.0005849599838256836, 0.0006167888641357422, 0.0006486177444458008, 0.0006804466247558594, 0.000712275505065918, 0.0007441043853759766, 0.0007759332656860352, 0.0008077621459960938]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 9.0, 8.0, 16.0, 10.0, 43.0, 46.0, 82.0, 120.0, 185.0, 284.0, 407.0, 615.0, 949.0, 1410.0, 2323.0, 3734.0, 6040.0, 10165.0, 18615.0, 35453.0, 73795.0, 158079.0, 283462.0, 229231.0, 110312.0, 51857.0, 25891.0, 14004.0, 8068.0, 4941.0, 3010.0, 1974.0, 1170.0, 754.0, 502.0, 336.0, 234.0, 144.0, 97.0, 53.0, 31.0, 38.0, 21.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.78125, -1.7328033447265625, -1.684356689453125, -1.6359100341796875, -1.58746337890625, -1.5390167236328125, -1.490570068359375, -1.4421234130859375, -1.3936767578125, -1.3452301025390625, -1.296783447265625, -1.2483367919921875, -1.19989013671875, -1.1514434814453125, -1.102996826171875, -1.0545501708984375, -1.006103515625, -0.9576568603515625, -0.909210205078125, -0.8607635498046875, -0.81231689453125, -0.7638702392578125, -0.715423583984375, -0.6669769287109375, -0.6185302734375, -0.5700836181640625, -0.521636962890625, -0.4731903076171875, -0.42474365234375, -0.3762969970703125, -0.327850341796875, -0.2794036865234375, -0.23095703125, -0.1825103759765625, -0.134063720703125, -0.0856170654296875, -0.03717041015625, 0.0112762451171875, 0.059722900390625, 0.1081695556640625, 0.1566162109375, 0.2050628662109375, 0.253509521484375, 0.3019561767578125, 0.35040283203125, 0.3988494873046875, 0.447296142578125, 0.4957427978515625, 0.544189453125, 0.5926361083984375, 0.641082763671875, 0.6895294189453125, 0.73797607421875, 0.7864227294921875, 0.834869384765625, 0.8833160400390625, 0.9317626953125, 0.9802093505859375, 1.028656005859375, 1.0771026611328125, 1.12554931640625, 1.1739959716796875, 1.222442626953125, 1.2708892822265625, 1.3193359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 8.0, 14.0, 7.0, 14.0, 18.0, 22.0, 24.0, 37.0, 55.0, 74.0, 78.0, 76.0, 101.0, 101.0, 83.0, 54.0, 42.0, 42.0, 38.0, 11.0, 23.0, 10.0, 13.0, 10.0, 9.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4384040832519531, -0.42197418212890625, -0.4055442810058594, -0.3891143798828125, -0.3726844787597656, -0.35625457763671875, -0.3398246765136719, -0.323394775390625, -0.3069648742675781, -0.29053497314453125, -0.2741050720214844, -0.2576751708984375, -0.24124526977539062, -0.22481536865234375, -0.20838546752929688, -0.19195556640625, -0.17552566528320312, -0.15909576416015625, -0.14266586303710938, -0.1262359619140625, -0.10980606079101562, -0.09337615966796875, -0.07694625854492188, -0.060516357421875, -0.044086456298828125, -0.02765655517578125, -0.011226654052734375, 0.0052032470703125, 0.021633148193359375, 0.03806304931640625, 0.054492950439453125, 0.0709228515625, 0.08735275268554688, 0.10378265380859375, 0.12021255493164062, 0.1366424560546875, 0.15307235717773438, 0.16950225830078125, 0.18593215942382812, 0.202362060546875, 0.21879196166992188, 0.23522186279296875, 0.2516517639160156, 0.2680816650390625, 0.2845115661621094, 0.30094146728515625, 0.3173713684082031, 0.33380126953125, 0.3502311706542969, 0.36666107177734375, 0.3830909729003906, 0.3995208740234375, 0.4159507751464844, 0.43238067626953125, 0.4488105773925781, 0.465240478515625, 0.4816703796386719, 0.49810028076171875, 0.5145301818847656, 0.5309600830078125, 0.5473899841308594, 0.5638198852539062, 0.5802497863769531, 0.5966796875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 16.0, 13.0, 18.0, 26.0, 29.0, 22.0, 28.0, 26.0, 43.0, 32.0, 42.0, 50.0, 45.0, 51.0, 56.0, 56.0, 41.0, 40.0, 36.0, 46.0, 32.0, 42.0, 26.0, 31.0, 32.0, 18.0, 16.0, 14.0, 10.0, 10.0, 6.0, 8.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.765376091003418, -9.456389427185059, -9.147403717041016, -8.838417053222656, -8.529430389404297, -8.220443725585938, -7.9114580154418945, -7.602471351623535, -7.293485164642334, -6.984498977661133, -6.675512313842773, -6.366526126861572, -6.057539939880371, -5.748553276062012, -5.4395670890808105, -5.130580902099609, -4.82159423828125, -4.512608051300049, -4.2036213874816895, -3.8946352005004883, -3.585648775100708, -3.2766623497009277, -2.9676761627197266, -2.6586897373199463, -2.349703311920166, -2.0407168865203857, -1.731730580329895, -1.4227442741394043, -1.113757848739624, -0.8047714233398438, -0.495785117149353, -0.1867988109588623, 0.12218666076660156, 0.43117302656173706, 0.7401593923568726, 1.0491456985473633, 1.3581321239471436, 1.6671185493469238, 1.9761048555374146, 2.2850911617279053, 2.5940775871276855, 2.903064012527466, 3.212050437927246, 3.5210366249084473, 3.8300230503082275, 4.139009475708008, 4.447995662689209, 4.75698184967041, 5.0659685134887695, 5.374954700469971, 5.68394136428833, 5.992927551269531, 6.301914215087891, 6.610900402069092, 6.919886589050293, 7.228873252868652, 7.5378594398498535, 7.846845626831055, 8.155832290649414, 8.464818954467773, 8.773804664611816, 9.082791328430176, 9.391777992248535, 9.700763702392578, 10.009750366210938]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 8.0, 9.0, 10.0, 8.0, 15.0, 10.0, 19.0, 16.0, 25.0, 26.0, 37.0, 26.0, 31.0, 34.0, 34.0, 42.0, 47.0, 45.0, 47.0, 52.0, 55.0, 37.0, 48.0, 36.0, 37.0, 23.0, 34.0, 18.0, 29.0, 20.0, 30.0, 15.0, 17.0, 8.0, 11.0, 6.0, 11.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.11067008972168, -8.7871675491333, -8.463665008544922, -8.140162467956543, -7.816660404205322, -7.493157863616943, -7.169655799865723, -6.846153259277344, -6.522650718688965, -6.199148178100586, -5.875645637512207, -5.552143573760986, -5.228641033172607, -4.9051384925842285, -4.581636428833008, -4.258133888244629, -3.93463134765625, -3.611128807067871, -3.2876265048980713, -2.9641242027282715, -2.6406216621398926, -2.3171191215515137, -1.9936168193817139, -1.670114517211914, -1.3466119766235352, -1.0231095552444458, -0.6996071338653564, -0.3761047124862671, -0.052602291107177734, 0.2709001302719116, 0.594402551651001, 0.9179048538208008, 1.2414064407348633, 1.5649088621139526, 1.888411283493042, 2.211913585662842, 2.5354161262512207, 2.8589186668395996, 3.1824209690093994, 3.505923271179199, 3.829425811767578, 4.152928352355957, 4.476430892944336, 4.799932956695557, 5.1234354972839355, 5.4469380378723145, 5.770440101623535, 6.093942642211914, 6.417445182800293, 6.740947723388672, 7.064450263977051, 7.3879523277282715, 7.71145486831665, 8.034956932067871, 8.35845947265625, 8.681962013244629, 9.005464553833008, 9.328967094421387, 9.652469635009766, 9.975972175598145, 10.299474716186523, 10.622976303100586, 10.946478843688965, 11.269981384277344, 11.593483924865723]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 11.0, 7.0, 18.0, 32.0, 34.0, 51.0, 91.0, 124.0, 204.0, 283.0, 501.0, 725.0, 1128.0, 1863.0, 3018.0, 4804.0, 7514.0, 12081.0, 18705.0, 27831.0, 40865.0, 57199.0, 75565.0, 94663.0, 108623.0, 114529.0, 110344.0, 97607.0, 79824.0, 60764.0, 43768.0, 30084.0, 20105.0, 13119.0, 8292.0, 5140.0, 3384.0, 2022.0, 1355.0, 807.0, 530.0, 329.0, 197.0, 147.0, 81.0, 52.0, 34.0, 37.0, 29.0, 8.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.15625, -5.96142578125, -5.7666015625, -5.57177734375, -5.376953125, -5.18212890625, -4.9873046875, -4.79248046875, -4.59765625, -4.40283203125, -4.2080078125, -4.01318359375, -3.818359375, -3.62353515625, -3.4287109375, -3.23388671875, -3.0390625, -2.84423828125, -2.6494140625, -2.45458984375, -2.259765625, -2.06494140625, -1.8701171875, -1.67529296875, -1.48046875, -1.28564453125, -1.0908203125, -0.89599609375, -0.701171875, -0.50634765625, -0.3115234375, -0.11669921875, 0.078125, 0.27294921875, 0.4677734375, 0.66259765625, 0.857421875, 1.05224609375, 1.2470703125, 1.44189453125, 1.63671875, 1.83154296875, 2.0263671875, 2.22119140625, 2.416015625, 2.61083984375, 2.8056640625, 3.00048828125, 3.1953125, 3.39013671875, 3.5849609375, 3.77978515625, 3.974609375, 4.16943359375, 4.3642578125, 4.55908203125, 4.75390625, 4.94873046875, 5.1435546875, 5.33837890625, 5.533203125, 5.72802734375, 5.9228515625, 6.11767578125, 6.3125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 11.0, 7.0, 12.0, 18.0, 11.0, 16.0, 16.0, 29.0, 24.0, 27.0, 24.0, 36.0, 42.0, 37.0, 44.0, 46.0, 55.0, 35.0, 63.0, 35.0, 46.0, 42.0, 46.0, 44.0, 31.0, 31.0, 27.0, 24.0, 21.0, 23.0, 11.0, 16.0, 12.0, 10.0, 5.0, 7.0, 5.0, 7.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.68212890625, -8.3486328125, -8.01513671875, -7.681640625, -7.34814453125, -7.0146484375, -6.68115234375, -6.34765625, -6.01416015625, -5.6806640625, -5.34716796875, -5.013671875, -4.68017578125, -4.3466796875, -4.01318359375, -3.6796875, -3.34619140625, -3.0126953125, -2.67919921875, -2.345703125, -2.01220703125, -1.6787109375, -1.34521484375, -1.01171875, -0.67822265625, -0.3447265625, -0.01123046875, 0.322265625, 0.65576171875, 0.9892578125, 1.32275390625, 1.65625, 1.98974609375, 2.3232421875, 2.65673828125, 2.990234375, 3.32373046875, 3.6572265625, 3.99072265625, 4.32421875, 4.65771484375, 4.9912109375, 5.32470703125, 5.658203125, 5.99169921875, 6.3251953125, 6.65869140625, 6.9921875, 7.32568359375, 7.6591796875, 7.99267578125, 8.326171875, 8.65966796875, 8.9931640625, 9.32666015625, 9.66015625, 9.99365234375, 10.3271484375, 10.66064453125, 10.994140625, 11.32763671875, 11.6611328125, 11.99462890625, 12.328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 5.0, 24.0, 25.0, 27.0, 53.0, 90.0, 142.0, 227.0, 376.0, 592.0, 978.0, 1625.0, 2700.0, 4515.0, 7343.0, 11994.0, 19814.0, 31234.0, 48909.0, 71440.0, 97767.0, 122183.0, 134179.0, 130521.0, 111403.0, 85157.0, 60519.0, 39725.0, 25366.0, 15653.0, 9532.0, 5747.0, 3411.0, 2080.0, 1245.0, 771.0, 446.0, 262.0, 152.0, 127.0, 74.0, 41.0, 34.0, 21.0, 10.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.072509765625, -7.80126953125, -7.530029296875, -7.2587890625, -6.987548828125, -6.71630859375, -6.445068359375, -6.173828125, -5.902587890625, -5.63134765625, -5.360107421875, -5.0888671875, -4.817626953125, -4.54638671875, -4.275146484375, -4.00390625, -3.732666015625, -3.46142578125, -3.190185546875, -2.9189453125, -2.647705078125, -2.37646484375, -2.105224609375, -1.833984375, -1.562744140625, -1.29150390625, -1.020263671875, -0.7490234375, -0.477783203125, -0.20654296875, 0.064697265625, 0.3359375, 0.607177734375, 0.87841796875, 1.149658203125, 1.4208984375, 1.692138671875, 1.96337890625, 2.234619140625, 2.505859375, 2.777099609375, 3.04833984375, 3.319580078125, 3.5908203125, 3.862060546875, 4.13330078125, 4.404541015625, 4.67578125, 4.947021484375, 5.21826171875, 5.489501953125, 5.7607421875, 6.031982421875, 6.30322265625, 6.574462890625, 6.845703125, 7.116943359375, 7.38818359375, 7.659423828125, 7.9306640625, 8.201904296875, 8.47314453125, 8.744384765625, 9.015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 12.0, 9.0, 13.0, 15.0, 24.0, 17.0, 23.0, 24.0, 22.0, 28.0, 28.0, 30.0, 41.0, 33.0, 39.0, 44.0, 36.0, 54.0, 50.0, 42.0, 48.0, 48.0, 34.0, 21.0, 27.0, 38.0, 27.0, 18.0, 21.0, 18.0, 18.0, 11.0, 13.0, 15.0, 6.0, 8.0, 5.0, 7.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.28125, -6.0911865234375, -5.901123046875, -5.7110595703125, -5.52099609375, -5.3309326171875, -5.140869140625, -4.9508056640625, -4.7607421875, -4.5706787109375, -4.380615234375, -4.1905517578125, -4.00048828125, -3.8104248046875, -3.620361328125, -3.4302978515625, -3.240234375, -3.0501708984375, -2.860107421875, -2.6700439453125, -2.47998046875, -2.2899169921875, -2.099853515625, -1.9097900390625, -1.7197265625, -1.5296630859375, -1.339599609375, -1.1495361328125, -0.95947265625, -0.7694091796875, -0.579345703125, -0.3892822265625, -0.19921875, -0.0091552734375, 0.180908203125, 0.3709716796875, 0.56103515625, 0.7510986328125, 0.941162109375, 1.1312255859375, 1.3212890625, 1.5113525390625, 1.701416015625, 1.8914794921875, 2.08154296875, 2.2716064453125, 2.461669921875, 2.6517333984375, 2.841796875, 3.0318603515625, 3.221923828125, 3.4119873046875, 3.60205078125, 3.7921142578125, 3.982177734375, 4.1722412109375, 4.3623046875, 4.5523681640625, 4.742431640625, 4.9324951171875, 5.12255859375, 5.3126220703125, 5.502685546875, 5.6927490234375, 5.8828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 16.0, 10.0, 17.0, 20.0, 24.0, 54.0, 72.0, 137.0, 204.0, 301.0, 499.0, 757.0, 1171.0, 1964.0, 3186.0, 5223.0, 8647.0, 14656.0, 25384.0, 43207.0, 73097.0, 117050.0, 166296.0, 183543.0, 151109.0, 101671.0, 61719.0, 36077.0, 21053.0, 12404.0, 7380.0, 4325.0, 2708.0, 1644.0, 1074.0, 671.0, 428.0, 261.0, 190.0, 111.0, 81.0, 34.0, 35.0, 18.0, 9.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.36328125, -5.202392578125, -5.04150390625, -4.880615234375, -4.7197265625, -4.558837890625, -4.39794921875, -4.237060546875, -4.076171875, -3.915283203125, -3.75439453125, -3.593505859375, -3.4326171875, -3.271728515625, -3.11083984375, -2.949951171875, -2.7890625, -2.628173828125, -2.46728515625, -2.306396484375, -2.1455078125, -1.984619140625, -1.82373046875, -1.662841796875, -1.501953125, -1.341064453125, -1.18017578125, -1.019287109375, -0.8583984375, -0.697509765625, -0.53662109375, -0.375732421875, -0.21484375, -0.053955078125, 0.10693359375, 0.267822265625, 0.4287109375, 0.589599609375, 0.75048828125, 0.911376953125, 1.072265625, 1.233154296875, 1.39404296875, 1.554931640625, 1.7158203125, 1.876708984375, 2.03759765625, 2.198486328125, 2.359375, 2.520263671875, 2.68115234375, 2.842041015625, 3.0029296875, 3.163818359375, 3.32470703125, 3.485595703125, 3.646484375, 3.807373046875, 3.96826171875, 4.129150390625, 4.2900390625, 4.450927734375, 4.61181640625, 4.772705078125, 4.93359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 3.0, 11.0, 13.0, 10.0, 23.0, 28.0, 38.0, 58.0, 64.0, 91.0, 78.0, 91.0, 110.0, 75.0, 62.0, 56.0, 42.0, 28.0, 32.0, 18.0, 12.0, 13.0, 12.0, 6.0, 2.0, 5.0, 6.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008406639099121094, -0.0008154734969139099, -0.0007902830839157104, -0.000765092670917511, -0.0007399022579193115, -0.0007147118449211121, -0.0006895214319229126, -0.0006643310189247131, -0.0006391406059265137, -0.0006139501929283142, -0.0005887597799301147, -0.0005635693669319153, -0.0005383789539337158, -0.0005131885409355164, -0.0004879981279373169, -0.00046280771493911743, -0.00043761730194091797, -0.0004124268889427185, -0.00038723647594451904, -0.0003620460629463196, -0.0003368556499481201, -0.00031166523694992065, -0.0002864748239517212, -0.00026128441095352173, -0.00023609399795532227, -0.0002109035849571228, -0.00018571317195892334, -0.00016052275896072388, -0.00013533234596252441, -0.00011014193296432495, -8.495151996612549e-05, -5.9761106967926025e-05, -3.457069396972656e-05, -9.3802809715271e-06, 1.5810132026672363e-05, 4.1000545024871826e-05, 6.619095802307129e-05, 9.138137102127075e-05, 0.00011657178401947021, 0.00014176219701766968, 0.00016695261001586914, 0.0001921430230140686, 0.00021733343601226807, 0.00024252384901046753, 0.000267714262008667, 0.00029290467500686646, 0.0003180950880050659, 0.0003432855010032654, 0.00036847591400146484, 0.0003936663269996643, 0.00041885673999786377, 0.00044404715299606323, 0.0004692375659942627, 0.0004944279789924622, 0.0005196183919906616, 0.0005448088049888611, 0.0005699992179870605, 0.00059518963098526, 0.0006203800439834595, 0.0006455704569816589, 0.0006707608699798584, 0.0006959512829780579, 0.0007211416959762573, 0.0007463321089744568, 0.0007715225219726562]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 2.0, 13.0, 21.0, 20.0, 28.0, 46.0, 82.0, 98.0, 150.0, 260.0, 367.0, 533.0, 802.0, 1265.0, 2011.0, 3149.0, 5010.0, 8028.0, 13156.0, 21599.0, 35436.0, 58087.0, 91181.0, 132495.0, 162709.0, 161477.0, 126699.0, 85381.0, 53526.0, 32841.0, 19876.0, 11986.0, 7453.0, 4616.0, 2857.0, 1775.0, 1200.0, 761.0, 520.0, 346.0, 214.0, 154.0, 81.0, 73.0, 54.0, 34.0, 19.0, 23.0, 8.0, 8.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.6484375, -4.5028076171875, -4.357177734375, -4.2115478515625, -4.06591796875, -3.9202880859375, -3.774658203125, -3.6290283203125, -3.4833984375, -3.3377685546875, -3.192138671875, -3.0465087890625, -2.90087890625, -2.7552490234375, -2.609619140625, -2.4639892578125, -2.318359375, -2.1727294921875, -2.027099609375, -1.8814697265625, -1.73583984375, -1.5902099609375, -1.444580078125, -1.2989501953125, -1.1533203125, -1.0076904296875, -0.862060546875, -0.7164306640625, -0.57080078125, -0.4251708984375, -0.279541015625, -0.1339111328125, 0.01171875, 0.1573486328125, 0.302978515625, 0.4486083984375, 0.59423828125, 0.7398681640625, 0.885498046875, 1.0311279296875, 1.1767578125, 1.3223876953125, 1.468017578125, 1.6136474609375, 1.75927734375, 1.9049072265625, 2.050537109375, 2.1961669921875, 2.341796875, 2.4874267578125, 2.633056640625, 2.7786865234375, 2.92431640625, 3.0699462890625, 3.215576171875, 3.3612060546875, 3.5068359375, 3.6524658203125, 3.798095703125, 3.9437255859375, 4.08935546875, 4.2349853515625, 4.380615234375, 4.5262451171875, 4.671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 8.0, 9.0, 14.0, 11.0, 13.0, 18.0, 22.0, 20.0, 18.0, 23.0, 36.0, 36.0, 47.0, 43.0, 42.0, 45.0, 41.0, 47.0, 58.0, 50.0, 45.0, 42.0, 45.0, 34.0, 22.0, 28.0, 21.0, 28.0, 26.0, 19.0, 12.0, 12.0, 8.0, 8.0, 10.0, 7.0, 6.0, 1.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55859375, -1.506011962890625, -1.45343017578125, -1.400848388671875, -1.3482666015625, -1.295684814453125, -1.24310302734375, -1.190521240234375, -1.137939453125, -1.085357666015625, -1.03277587890625, -0.980194091796875, -0.9276123046875, -0.875030517578125, -0.82244873046875, -0.769866943359375, -0.71728515625, -0.664703369140625, -0.61212158203125, -0.559539794921875, -0.5069580078125, -0.454376220703125, -0.40179443359375, -0.349212646484375, -0.296630859375, -0.244049072265625, -0.19146728515625, -0.138885498046875, -0.0863037109375, -0.033721923828125, 0.01885986328125, 0.071441650390625, 0.1240234375, 0.176605224609375, 0.22918701171875, 0.281768798828125, 0.3343505859375, 0.386932373046875, 0.43951416015625, 0.492095947265625, 0.544677734375, 0.597259521484375, 0.64984130859375, 0.702423095703125, 0.7550048828125, 0.807586669921875, 0.86016845703125, 0.912750244140625, 0.96533203125, 1.017913818359375, 1.07049560546875, 1.123077392578125, 1.1756591796875, 1.228240966796875, 1.28082275390625, 1.333404541015625, 1.385986328125, 1.438568115234375, 1.49114990234375, 1.543731689453125, 1.5963134765625, 1.648895263671875, 1.70147705078125, 1.754058837890625, 1.806640625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 11.0, 11.0, 11.0, 11.0, 23.0, 19.0, 22.0, 16.0, 35.0, 39.0, 27.0, 39.0, 38.0, 47.0, 46.0, 36.0, 51.0, 53.0, 58.0, 49.0, 43.0, 46.0, 43.0, 33.0, 32.0, 28.0, 15.0, 25.0, 28.0, 17.0, 7.0, 9.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.27790355682373, -8.96689510345459, -8.65588665008545, -8.344878196716309, -8.033868789672852, -7.722860813140869, -7.41185188293457, -7.10084342956543, -6.789834976196289, -6.478826522827148, -6.167818069458008, -5.856809139251709, -5.545800685882568, -5.234792232513428, -4.923783302307129, -4.612774848937988, -4.301766395568848, -3.990757942199707, -3.6797492504119873, -3.3687405586242676, -3.057732105255127, -2.7467236518859863, -2.4357149600982666, -2.124706268310547, -1.8136978149414062, -1.502689242362976, -1.191680669784546, -0.8806720972061157, -0.5696635246276855, -0.25865495204925537, 0.052353620529174805, 0.36336231231689453, 0.6743717193603516, 0.9853802919387817, 1.296388864517212, 1.607397437095642, 1.9184060096740723, 2.229414463043213, 2.5404231548309326, 2.8514318466186523, 3.162440299987793, 3.4734487533569336, 3.7844574451446533, 4.095466136932373, 4.406474590301514, 4.717483043670654, 5.028491973876953, 5.339500427246094, 5.650508880615234, 5.961517333984375, 6.272525787353516, 6.5835347175598145, 6.894543170928955, 7.205551624298096, 7.5165605545043945, 7.827569007873535, 8.138577461242676, 8.449585914611816, 8.760594367980957, 9.071602821350098, 9.382612228393555, 9.693620681762695, 10.004629135131836, 10.315637588500977, 10.626646041870117]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 11.0, 14.0, 15.0, 18.0, 24.0, 19.0, 21.0, 30.0, 34.0, 36.0, 41.0, 56.0, 42.0, 45.0, 39.0, 43.0, 47.0, 52.0, 47.0, 50.0, 47.0, 44.0, 34.0, 20.0, 22.0, 30.0, 20.0, 16.0, 15.0, 10.0, 13.0, 9.0, 4.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.097450256347656, -9.748549461364746, -9.39964771270752, -9.05074691772461, -8.701845169067383, -8.352944374084473, -8.004042625427246, -7.655141830444336, -7.306240081787109, -6.957338809967041, -6.608437538146973, -6.259536266326904, -5.910634994506836, -5.561733722686768, -5.212832450866699, -4.863931655883789, -4.515030384063721, -4.166129112243652, -3.817227840423584, -3.4683265686035156, -3.1194252967834473, -2.770524024963379, -2.4216229915618896, -2.0727217197418213, -1.723820447921753, -1.3749191761016846, -1.0260179042816162, -0.6771167516708374, -0.32821547985076904, 0.020685791969299316, 0.3695869445800781, 0.7184882164001465, 1.0673894882202148, 1.4162907600402832, 1.7651920318603516, 2.11409330368042, 2.4629945755004883, 2.8118958473205566, 3.160796880722046, 3.5096981525421143, 3.8585994243621826, 4.207500457763672, 4.55640172958374, 4.905303001403809, 5.254204273223877, 5.603105545043945, 5.952006816864014, 6.300908088684082, 6.64980936050415, 6.998710632324219, 7.347611904144287, 7.6965131759643555, 8.045413970947266, 8.394315719604492, 8.743216514587402, 9.092118263244629, 9.441019058227539, 9.78991985321045, 10.138821601867676, 10.487722396850586, 10.836624145507812, 11.185524940490723, 11.53442668914795, 11.88332748413086, 12.232229232788086]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 14.0, 10.0, 13.0, 37.0, 47.0, 76.0, 103.0, 149.0, 243.0, 338.0, 588.0, 894.0, 1486.0, 2493.0, 4211.0, 7396.0, 13933.0, 25752.0, 49362.0, 98365.0, 194832.0, 363116.0, 588607.0, 763790.0, 759061.0, 576449.0, 354084.0, 189097.0, 96304.0, 48164.0, 24979.0, 13237.0, 7147.0, 3988.0, 2323.0, 1365.0, 852.0, 494.0, 297.0, 185.0, 133.0, 79.0, 58.0, 36.0, 34.0, 17.0, 15.0, 13.0, 4.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6640625, -7.4166259765625, -7.169189453125, -6.9217529296875, -6.67431640625, -6.4268798828125, -6.179443359375, -5.9320068359375, -5.6845703125, -5.4371337890625, -5.189697265625, -4.9422607421875, -4.69482421875, -4.4473876953125, -4.199951171875, -3.9525146484375, -3.705078125, -3.4576416015625, -3.210205078125, -2.9627685546875, -2.71533203125, -2.4678955078125, -2.220458984375, -1.9730224609375, -1.7255859375, -1.4781494140625, -1.230712890625, -0.9832763671875, -0.73583984375, -0.4884033203125, -0.240966796875, 0.0064697265625, 0.25390625, 0.5013427734375, 0.748779296875, 0.9962158203125, 1.24365234375, 1.4910888671875, 1.738525390625, 1.9859619140625, 2.2333984375, 2.4808349609375, 2.728271484375, 2.9757080078125, 3.22314453125, 3.4705810546875, 3.718017578125, 3.9654541015625, 4.212890625, 4.4603271484375, 4.707763671875, 4.9552001953125, 5.20263671875, 5.4500732421875, 5.697509765625, 5.9449462890625, 6.1923828125, 6.4398193359375, 6.687255859375, 6.9346923828125, 7.18212890625, 7.4295654296875, 7.677001953125, 7.9244384765625, 8.171875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 14.0, 13.0, 12.0, 17.0, 13.0, 24.0, 25.0, 23.0, 25.0, 36.0, 39.0, 36.0, 31.0, 44.0, 35.0, 41.0, 47.0, 43.0, 46.0, 46.0, 44.0, 34.0, 39.0, 32.0, 47.0, 25.0, 27.0, 18.0, 21.0, 15.0, 13.0, 19.0, 8.0, 4.0, 11.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.1015625, -8.8270263671875, -8.552490234375, -8.2779541015625, -8.00341796875, -7.7288818359375, -7.454345703125, -7.1798095703125, -6.9052734375, -6.6307373046875, -6.356201171875, -6.0816650390625, -5.80712890625, -5.5325927734375, -5.258056640625, -4.9835205078125, -4.708984375, -4.4344482421875, -4.159912109375, -3.8853759765625, -3.61083984375, -3.3363037109375, -3.061767578125, -2.7872314453125, -2.5126953125, -2.2381591796875, -1.963623046875, -1.6890869140625, -1.41455078125, -1.1400146484375, -0.865478515625, -0.5909423828125, -0.31640625, -0.0418701171875, 0.232666015625, 0.5072021484375, 0.78173828125, 1.0562744140625, 1.330810546875, 1.6053466796875, 1.8798828125, 2.1544189453125, 2.428955078125, 2.7034912109375, 2.97802734375, 3.2525634765625, 3.527099609375, 3.8016357421875, 4.076171875, 4.3507080078125, 4.625244140625, 4.8997802734375, 5.17431640625, 5.4488525390625, 5.723388671875, 5.9979248046875, 6.2724609375, 6.5469970703125, 6.821533203125, 7.0960693359375, 7.37060546875, 7.6451416015625, 7.919677734375, 8.1942138671875, 8.46875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 12.0, 9.0, 23.0, 29.0, 53.0, 71.0, 116.0, 147.0, 233.0, 426.0, 619.0, 1122.0, 1697.0, 2952.0, 4877.0, 8300.0, 14787.0, 25636.0, 45226.0, 81142.0, 142383.0, 244217.0, 396193.0, 577449.0, 698817.0, 663513.0, 501140.0, 327129.0, 195860.0, 112430.0, 63388.0, 35937.0, 20233.0, 11656.0, 6768.0, 3798.0, 2256.0, 1357.0, 809.0, 507.0, 315.0, 218.0, 152.0, 81.0, 69.0, 39.0, 32.0, 12.0, 18.0, 11.0, 6.0, 7.0, 2.0, 2.0, 2.0], "bins": [-9.0703125, -8.8018798828125, -8.533447265625, -8.2650146484375, -7.99658203125, -7.7281494140625, -7.459716796875, -7.1912841796875, -6.9228515625, -6.6544189453125, -6.385986328125, -6.1175537109375, -5.84912109375, -5.5806884765625, -5.312255859375, -5.0438232421875, -4.775390625, -4.5069580078125, -4.238525390625, -3.9700927734375, -3.70166015625, -3.4332275390625, -3.164794921875, -2.8963623046875, -2.6279296875, -2.3594970703125, -2.091064453125, -1.8226318359375, -1.55419921875, -1.2857666015625, -1.017333984375, -0.7489013671875, -0.48046875, -0.2120361328125, 0.056396484375, 0.3248291015625, 0.59326171875, 0.8616943359375, 1.130126953125, 1.3985595703125, 1.6669921875, 1.9354248046875, 2.203857421875, 2.4722900390625, 2.74072265625, 3.0091552734375, 3.277587890625, 3.5460205078125, 3.814453125, 4.0828857421875, 4.351318359375, 4.6197509765625, 4.88818359375, 5.1566162109375, 5.425048828125, 5.6934814453125, 5.9619140625, 6.2303466796875, 6.498779296875, 6.7672119140625, 7.03564453125, 7.3040771484375, 7.572509765625, 7.8409423828125, 8.109375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 11.0, 6.0, 12.0, 15.0, 21.0, 51.0, 47.0, 48.0, 60.0, 78.0, 109.0, 127.0, 112.0, 143.0, 191.0, 203.0, 210.0, 239.0, 225.0, 253.0, 235.0, 226.0, 211.0, 179.0, 167.0, 149.0, 147.0, 109.0, 94.0, 75.0, 60.0, 59.0, 40.0, 30.0, 33.0, 23.0, 20.0, 19.0, 7.0, 10.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.765625, -3.65985107421875, -3.5540771484375, -3.44830322265625, -3.342529296875, -3.23675537109375, -3.1309814453125, -3.02520751953125, -2.91943359375, -2.81365966796875, -2.7078857421875, -2.60211181640625, -2.496337890625, -2.39056396484375, -2.2847900390625, -2.17901611328125, -2.0732421875, -1.96746826171875, -1.8616943359375, -1.75592041015625, -1.650146484375, -1.54437255859375, -1.4385986328125, -1.33282470703125, -1.22705078125, -1.12127685546875, -1.0155029296875, -0.90972900390625, -0.803955078125, -0.69818115234375, -0.5924072265625, -0.48663330078125, -0.380859375, -0.27508544921875, -0.1693115234375, -0.06353759765625, 0.042236328125, 0.14801025390625, 0.2537841796875, 0.35955810546875, 0.46533203125, 0.57110595703125, 0.6768798828125, 0.78265380859375, 0.888427734375, 0.99420166015625, 1.0999755859375, 1.20574951171875, 1.3115234375, 1.41729736328125, 1.5230712890625, 1.62884521484375, 1.734619140625, 1.84039306640625, 1.9461669921875, 2.05194091796875, 2.15771484375, 2.26348876953125, 2.3692626953125, 2.47503662109375, 2.580810546875, 2.68658447265625, 2.7923583984375, 2.89813232421875, 3.00390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 11.0, 11.0, 8.0, 11.0, 24.0, 21.0, 17.0, 23.0, 32.0, 39.0, 43.0, 40.0, 44.0, 54.0, 54.0, 56.0, 48.0, 54.0, 52.0, 54.0, 43.0, 48.0, 36.0, 28.0, 27.0, 22.0, 24.0, 18.0, 14.0, 12.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.274394989013672, -10.94471549987793, -10.615036964416504, -10.285357475280762, -9.95567798614502, -9.625999450683594, -9.296319961547852, -8.96664047241211, -8.636961936950684, -8.307282447814941, -7.977603435516357, -7.647924423217773, -7.3182454109191895, -6.9885663986206055, -6.658886909484863, -6.329207897186279, -5.999528408050537, -5.669849395751953, -5.340169906616211, -5.010490894317627, -4.680811882019043, -4.351132392883301, -4.021453380584717, -3.691774368286133, -3.3620951175689697, -3.0324158668518066, -2.7027368545532227, -2.3730576038360596, -2.0433783531188965, -1.7136993408203125, -1.3840200901031494, -1.0543410778045654, -0.7246618270874023, -0.3949826657772064, -0.0653035044670105, 0.2643756866455078, 0.5940548181533813, 0.9237339496612549, 1.253413200378418, 1.583092212677002, 1.912771463394165, 2.242450714111328, 2.572129726409912, 2.901808977127075, 3.2314882278442383, 3.5611672401428223, 3.8908464908599854, 4.220525741577148, 4.550204753875732, 4.879883766174316, 5.209563255310059, 5.539242267608643, 5.868921279907227, 6.198600769042969, 6.528279781341553, 6.857958793640137, 7.187638282775879, 7.517317295074463, 7.846996784210205, 8.176675796508789, 8.506355285644531, 8.836033821105957, 9.1657133102417, 9.495391845703125, 9.825071334838867]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 13.0, 6.0, 9.0, 13.0, 18.0, 14.0, 20.0, 18.0, 19.0, 26.0, 23.0, 41.0, 35.0, 37.0, 51.0, 38.0, 36.0, 45.0, 39.0, 32.0, 33.0, 35.0, 46.0, 31.0, 30.0, 28.0, 23.0, 33.0, 29.0, 29.0, 26.0, 15.0, 12.0, 18.0, 8.0, 13.0, 5.0, 9.0, 4.0, 4.0, 7.0, 9.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.519075393676758, -8.245855331420898, -7.972634792327881, -7.6994147300720215, -7.426194667816162, -7.1529741287231445, -6.879754066467285, -6.606534004211426, -6.333313941955566, -6.060093879699707, -5.7868733406066895, -5.51365327835083, -5.240433216094971, -4.967212677001953, -4.693992614746094, -4.420772552490234, -4.147552013397217, -3.8743317127227783, -3.601111650466919, -3.3278913497924805, -3.054671287536621, -2.7814509868621826, -2.508230686187744, -2.2350106239318848, -1.9617903232574463, -1.6885701417922974, -1.4153499603271484, -1.14212965965271, -0.868909478187561, -0.5956892967224121, -0.32246899604797363, -0.04924881458282471, 0.22397136688232422, 0.49719157814979553, 0.7704117894172668, 1.0436320304870605, 1.3168522119522095, 1.5900723934173584, 1.8632926940917969, 2.1365127563476562, 2.4097330570220947, 2.682953357696533, 2.9561734199523926, 3.229393720626831, 3.5026140213012695, 3.775834083557129, 4.049054145812988, 4.322274684906006, 4.595494747161865, 4.868714809417725, 5.141935348510742, 5.415155410766602, 5.688375473022461, 5.96159553527832, 6.234816074371338, 6.508036136627197, 6.781256675720215, 7.054476737976074, 7.327697277069092, 7.600917339324951, 7.8741374015808105, 8.147357940673828, 8.420578002929688, 8.693798065185547, 8.967018127441406]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 7.0, 9.0, 12.0, 24.0, 33.0, 57.0, 86.0, 109.0, 163.0, 259.0, 345.0, 553.0, 796.0, 1219.0, 1863.0, 2922.0, 4543.0, 6886.0, 10815.0, 17037.0, 26730.0, 42234.0, 64316.0, 93335.0, 123734.0, 143799.0, 140598.0, 116842.0, 86229.0, 58407.0, 37467.0, 24087.0, 15301.0, 9670.0, 6234.0, 4057.0, 2671.0, 1679.0, 1113.0, 822.0, 474.0, 336.0, 213.0, 152.0, 95.0, 72.0, 51.0, 33.0, 24.0, 20.0, 6.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03125, -3.89166259765625, -3.7520751953125, -3.61248779296875, -3.472900390625, -3.33331298828125, -3.1937255859375, -3.05413818359375, -2.91455078125, -2.77496337890625, -2.6353759765625, -2.49578857421875, -2.356201171875, -2.21661376953125, -2.0770263671875, -1.93743896484375, -1.7978515625, -1.65826416015625, -1.5186767578125, -1.37908935546875, -1.239501953125, -1.09991455078125, -0.9603271484375, -0.82073974609375, -0.68115234375, -0.54156494140625, -0.4019775390625, -0.26239013671875, -0.122802734375, 0.01678466796875, 0.1563720703125, 0.29595947265625, 0.435546875, 0.57513427734375, 0.7147216796875, 0.85430908203125, 0.993896484375, 1.13348388671875, 1.2730712890625, 1.41265869140625, 1.55224609375, 1.69183349609375, 1.8314208984375, 1.97100830078125, 2.110595703125, 2.25018310546875, 2.3897705078125, 2.52935791015625, 2.6689453125, 2.80853271484375, 2.9481201171875, 3.08770751953125, 3.227294921875, 3.36688232421875, 3.5064697265625, 3.64605712890625, 3.78564453125, 3.92523193359375, 4.0648193359375, 4.20440673828125, 4.343994140625, 4.48358154296875, 4.6231689453125, 4.76275634765625, 4.90234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 9.0, 13.0, 9.0, 15.0, 15.0, 16.0, 25.0, 24.0, 19.0, 42.0, 26.0, 38.0, 43.0, 41.0, 57.0, 40.0, 41.0, 45.0, 49.0, 45.0, 34.0, 32.0, 38.0, 27.0, 39.0, 29.0, 29.0, 34.0, 14.0, 19.0, 12.0, 8.0, 16.0, 7.0, 12.0, 5.0, 6.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.703125, -9.396484375, -9.08984375, -8.783203125, -8.4765625, -8.169921875, -7.86328125, -7.556640625, -7.25, -6.943359375, -6.63671875, -6.330078125, -6.0234375, -5.716796875, -5.41015625, -5.103515625, -4.796875, -4.490234375, -4.18359375, -3.876953125, -3.5703125, -3.263671875, -2.95703125, -2.650390625, -2.34375, -2.037109375, -1.73046875, -1.423828125, -1.1171875, -0.810546875, -0.50390625, -0.197265625, 0.109375, 0.416015625, 0.72265625, 1.029296875, 1.3359375, 1.642578125, 1.94921875, 2.255859375, 2.5625, 2.869140625, 3.17578125, 3.482421875, 3.7890625, 4.095703125, 4.40234375, 4.708984375, 5.015625, 5.322265625, 5.62890625, 5.935546875, 6.2421875, 6.548828125, 6.85546875, 7.162109375, 7.46875, 7.775390625, 8.08203125, 8.388671875, 8.6953125, 9.001953125, 9.30859375, 9.615234375, 9.921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 15.0, 10.0, 25.0, 25.0, 39.0, 69.0, 126.0, 193.0, 368.0, 763.0, 1795.0, 4379.0, 10522.0, 26167.0, 128200.0, 806495.0, 41494.0, 16039.0, 6673.0, 2716.0, 1240.0, 532.0, 283.0, 145.0, 76.0, 43.0, 41.0, 32.0, 13.0, 12.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.637939453125, -14.11962890625, -13.601318359375, -13.0830078125, -12.564697265625, -12.04638671875, -11.528076171875, -11.009765625, -10.491455078125, -9.97314453125, -9.454833984375, -8.9365234375, -8.418212890625, -7.89990234375, -7.381591796875, -6.86328125, -6.344970703125, -5.82666015625, -5.308349609375, -4.7900390625, -4.271728515625, -3.75341796875, -3.235107421875, -2.716796875, -2.198486328125, -1.68017578125, -1.161865234375, -0.6435546875, -0.125244140625, 0.39306640625, 0.911376953125, 1.4296875, 1.947998046875, 2.46630859375, 2.984619140625, 3.5029296875, 4.021240234375, 4.53955078125, 5.057861328125, 5.576171875, 6.094482421875, 6.61279296875, 7.131103515625, 7.6494140625, 8.167724609375, 8.68603515625, 9.204345703125, 9.72265625, 10.240966796875, 10.75927734375, 11.277587890625, 11.7958984375, 12.314208984375, 12.83251953125, 13.350830078125, 13.869140625, 14.387451171875, 14.90576171875, 15.424072265625, 15.9423828125, 16.460693359375, 16.97900390625, 17.497314453125, 18.015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 7.0, 1.0, 6.0, 4.0, 5.0, 9.0, 11.0, 15.0, 17.0, 20.0, 21.0, 20.0, 23.0, 20.0, 28.0, 25.0, 40.0, 25.0, 36.0, 29.0, 22.0, 44.0, 33.0, 42.0, 32.0, 36.0, 45.0, 36.0, 28.0, 29.0, 37.0, 35.0, 22.0, 34.0, 13.0, 16.0, 30.0, 9.0, 14.0, 12.0, 12.0, 9.0, 11.0, 10.0, 6.0, 3.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.421875, -7.20330810546875, -6.9847412109375, -6.76617431640625, -6.547607421875, -6.32904052734375, -6.1104736328125, -5.89190673828125, -5.67333984375, -5.45477294921875, -5.2362060546875, -5.01763916015625, -4.799072265625, -4.58050537109375, -4.3619384765625, -4.14337158203125, -3.9248046875, -3.70623779296875, -3.4876708984375, -3.26910400390625, -3.050537109375, -2.83197021484375, -2.6134033203125, -2.39483642578125, -2.17626953125, -1.95770263671875, -1.7391357421875, -1.52056884765625, -1.302001953125, -1.08343505859375, -0.8648681640625, -0.64630126953125, -0.427734375, -0.20916748046875, 0.0093994140625, 0.22796630859375, 0.446533203125, 0.66510009765625, 0.8836669921875, 1.10223388671875, 1.32080078125, 1.53936767578125, 1.7579345703125, 1.97650146484375, 2.195068359375, 2.41363525390625, 2.6322021484375, 2.85076904296875, 3.0693359375, 3.28790283203125, 3.5064697265625, 3.72503662109375, 3.943603515625, 4.16217041015625, 4.3807373046875, 4.59930419921875, 4.81787109375, 5.03643798828125, 5.2550048828125, 5.47357177734375, 5.692138671875, 5.91070556640625, 6.1292724609375, 6.34783935546875, 6.56640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 6.0, 3.0, 13.0, 14.0, 19.0, 18.0, 39.0, 55.0, 59.0, 106.0, 126.0, 206.0, 272.0, 375.0, 611.0, 934.0, 1539.0, 2706.0, 4817.0, 9435.0, 21186.0, 85181.0, 813789.0, 67401.0, 19445.0, 8848.0, 4463.0, 2525.0, 1561.0, 933.0, 543.0, 380.0, 301.0, 179.0, 119.0, 88.0, 62.0, 47.0, 47.0, 26.0, 21.0, 16.0, 12.0, 9.0, 8.0, 6.0, 1.0, 2.0, 5.0, 2.0, 2.0], "bins": [-1.8623046875, -1.8097686767578125, -1.757232666015625, -1.7046966552734375, -1.65216064453125, -1.5996246337890625, -1.547088623046875, -1.4945526123046875, -1.4420166015625, -1.3894805908203125, -1.336944580078125, -1.2844085693359375, -1.23187255859375, -1.1793365478515625, -1.126800537109375, -1.0742645263671875, -1.021728515625, -0.9691925048828125, -0.916656494140625, -0.8641204833984375, -0.81158447265625, -0.7590484619140625, -0.706512451171875, -0.6539764404296875, -0.6014404296875, -0.5489044189453125, -0.496368408203125, -0.4438323974609375, -0.39129638671875, -0.3387603759765625, -0.286224365234375, -0.2336883544921875, -0.18115234375, -0.1286163330078125, -0.076080322265625, -0.0235443115234375, 0.02899169921875, 0.0815277099609375, 0.134063720703125, 0.1865997314453125, 0.2391357421875, 0.2916717529296875, 0.344207763671875, 0.3967437744140625, 0.44927978515625, 0.5018157958984375, 0.554351806640625, 0.6068878173828125, 0.659423828125, 0.7119598388671875, 0.764495849609375, 0.8170318603515625, 0.86956787109375, 0.9221038818359375, 0.974639892578125, 1.0271759033203125, 1.0797119140625, 1.1322479248046875, 1.184783935546875, 1.2373199462890625, 1.28985595703125, 1.3423919677734375, 1.394927978515625, 1.4474639892578125, 1.5]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 10.0, 26.0, 25.0, 57.0, 90.0, 146.0, 214.0, 156.0, 87.0, 61.0, 31.0, 26.0, 15.0, 15.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00064849853515625, -0.0006230771541595459, -0.0005976557731628418, -0.0005722343921661377, -0.0005468130111694336, -0.0005213916301727295, -0.0004959702491760254, -0.0004705488681793213, -0.0004451274871826172, -0.0004197061061859131, -0.000394284725189209, -0.0003688633441925049, -0.0003434419631958008, -0.0003180205821990967, -0.0002925992012023926, -0.0002671778202056885, -0.00024175643920898438, -0.00021633505821228027, -0.00019091367721557617, -0.00016549229621887207, -0.00014007091522216797, -0.00011464953422546387, -8.922815322875977e-05, -6.380677223205566e-05, -3.838539123535156e-05, -1.2964010238647461e-05, 1.245737075805664e-05, 3.787875175476074e-05, 6.330013275146484e-05, 8.872151374816895e-05, 0.00011414289474487305, 0.00013956427574157715, 0.00016498565673828125, 0.00019040703773498535, 0.00021582841873168945, 0.00024124979972839355, 0.00026667118072509766, 0.00029209256172180176, 0.00031751394271850586, 0.00034293532371520996, 0.00036835670471191406, 0.00039377808570861816, 0.00041919946670532227, 0.00044462084770202637, 0.00047004222869873047, 0.0004954636096954346, 0.0005208849906921387, 0.0005463063716888428, 0.0005717277526855469, 0.000597149133682251, 0.0006225705146789551, 0.0006479918956756592, 0.0006734132766723633, 0.0006988346576690674, 0.0007242560386657715, 0.0007496774196624756, 0.0007750988006591797, 0.0008005201816558838, 0.0008259415626525879, 0.000851362943649292, 0.0008767843246459961, 0.0009022057056427002, 0.0009276270866394043, 0.0009530484676361084, 0.0009784698486328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 3.0, 2.0, 9.0, 15.0, 13.0, 24.0, 23.0, 39.0, 68.0, 83.0, 131.0, 214.0, 297.0, 450.0, 597.0, 948.0, 1371.0, 2001.0, 2999.0, 4585.0, 6828.0, 11232.0, 18064.0, 31926.0, 60388.0, 120268.0, 213828.0, 239790.0, 153783.0, 78668.0, 40399.0, 22224.0, 13077.0, 8067.0, 5345.0, 3469.0, 2374.0, 1570.0, 1068.0, 700.0, 517.0, 334.0, 253.0, 153.0, 102.0, 82.0, 57.0, 48.0, 20.0, 16.0, 16.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9088058471679688, -0.8776702880859375, -0.8465347290039062, -0.815399169921875, -0.7842636108398438, -0.7531280517578125, -0.7219924926757812, -0.69085693359375, -0.6597213745117188, -0.6285858154296875, -0.5974502563476562, -0.566314697265625, -0.5351791381835938, -0.5040435791015625, -0.47290802001953125, -0.4417724609375, -0.41063690185546875, -0.3795013427734375, -0.34836578369140625, -0.317230224609375, -0.28609466552734375, -0.2549591064453125, -0.22382354736328125, -0.19268798828125, -0.16155242919921875, -0.1304168701171875, -0.09928131103515625, -0.068145751953125, -0.03701019287109375, -0.0058746337890625, 0.02526092529296875, 0.056396484375, 0.08753204345703125, 0.1186676025390625, 0.14980316162109375, 0.180938720703125, 0.21207427978515625, 0.2432098388671875, 0.27434539794921875, 0.30548095703125, 0.33661651611328125, 0.3677520751953125, 0.39888763427734375, 0.430023193359375, 0.46115875244140625, 0.4922943115234375, 0.5234298706054688, 0.5545654296875, 0.5857009887695312, 0.6168365478515625, 0.6479721069335938, 0.679107666015625, 0.7102432250976562, 0.7413787841796875, 0.7725143432617188, 0.80364990234375, 0.8347854614257812, 0.8659210205078125, 0.8970565795898438, 0.928192138671875, 0.9593276977539062, 0.9904632568359375, 1.0215988159179688, 1.052734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 9.0, 5.0, 7.0, 8.0, 6.0, 3.0, 11.0, 9.0, 18.0, 19.0, 16.0, 31.0, 40.0, 38.0, 46.0, 52.0, 75.0, 77.0, 74.0, 67.0, 78.0, 55.0, 57.0, 26.0, 23.0, 22.0, 15.0, 12.0, 10.0, 6.0, 11.0, 10.0, 6.0, 9.0, 5.0, 5.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.38134765625, -0.37052154541015625, -0.3596954345703125, -0.34886932373046875, -0.338043212890625, -0.32721710205078125, -0.3163909912109375, -0.30556488037109375, -0.29473876953125, -0.28391265869140625, -0.2730865478515625, -0.26226043701171875, -0.251434326171875, -0.24060821533203125, -0.2297821044921875, -0.21895599365234375, -0.2081298828125, -0.19730377197265625, -0.1864776611328125, -0.17565155029296875, -0.164825439453125, -0.15399932861328125, -0.1431732177734375, -0.13234710693359375, -0.12152099609375, -0.11069488525390625, -0.0998687744140625, -0.08904266357421875, -0.078216552734375, -0.06739044189453125, -0.0565643310546875, -0.04573822021484375, -0.034912109375, -0.02408599853515625, -0.0132598876953125, -0.00243377685546875, 0.008392333984375, 0.01921844482421875, 0.0300445556640625, 0.04087066650390625, 0.05169677734375, 0.06252288818359375, 0.0733489990234375, 0.08417510986328125, 0.095001220703125, 0.10582733154296875, 0.1166534423828125, 0.12747955322265625, 0.1383056640625, 0.14913177490234375, 0.1599578857421875, 0.17078399658203125, 0.181610107421875, 0.19243621826171875, 0.2032623291015625, 0.21408843994140625, 0.22491455078125, 0.23574066162109375, 0.2465667724609375, 0.25739288330078125, 0.268218994140625, 0.27904510498046875, 0.2898712158203125, 0.30069732666015625, 0.3115234375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 7.0, 7.0, 8.0, 12.0, 15.0, 27.0, 28.0, 27.0, 29.0, 32.0, 38.0, 44.0, 34.0, 49.0, 56.0, 59.0, 47.0, 51.0, 38.0, 45.0, 63.0, 30.0, 40.0, 42.0, 37.0, 22.0, 25.0, 19.0, 22.0, 10.0, 8.0, 7.0, 7.0, 5.0, 1.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.250198364257812, -10.93216323852539, -10.614128112792969, -10.296093940734863, -9.978058815002441, -9.66002368927002, -9.341988563537598, -9.023953437805176, -8.70591926574707, -8.387884140014648, -8.069849014282227, -7.751814365386963, -7.433779716491699, -7.115744590759277, -6.7977094650268555, -6.479674339294434, -6.161639213562012, -5.84360408782959, -5.525569438934326, -5.207534313201904, -4.889499664306641, -4.571464538574219, -4.253429412841797, -3.935394525527954, -3.6173596382141113, -3.2993247509002686, -2.981289863586426, -2.663254737854004, -2.345219850540161, -2.0271849632263184, -1.709149956703186, -1.3911149501800537, -1.0730791091918945, -0.755044162273407, -0.43700921535491943, -0.11897426843643188, 0.19906067848205566, 0.5170955657958984, 0.8351305723190308, 1.153165578842163, 1.4712004661560059, 1.7892353534698486, 2.1072702407836914, 2.4253053665161133, 2.743340253829956, 3.061375141143799, 3.3794102668762207, 3.6974451541900635, 4.015480041503906, 4.333515167236328, 4.651549816131592, 4.969584941864014, 5.287619590759277, 5.605654716491699, 5.923689842224121, 6.241724967956543, 6.559759616851807, 6.8777947425842285, 7.195829391479492, 7.513864517211914, 7.831899642944336, 8.149934768676758, 8.467968940734863, 8.786004066467285, 9.104039192199707]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 10.0, 11.0, 8.0, 15.0, 10.0, 19.0, 20.0, 17.0, 17.0, 23.0, 34.0, 28.0, 40.0, 47.0, 36.0, 43.0, 54.0, 33.0, 32.0, 33.0, 38.0, 42.0, 41.0, 28.0, 33.0, 30.0, 24.0, 37.0, 20.0, 26.0, 30.0, 12.0, 15.0, 18.0, 15.0, 5.0, 7.0, 6.0, 5.0, 4.0, 9.0, 7.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.481182098388672, -8.208797454833984, -7.936413288116455, -7.664029121398926, -7.391644477844238, -7.119260311126709, -6.84687614440918, -6.574491500854492, -6.302107334136963, -6.029723167419434, -5.757338523864746, -5.484954357147217, -5.2125701904296875, -4.940185546875, -4.667801380157471, -4.395417213439941, -4.123032569885254, -3.8506481647491455, -3.578263759613037, -3.305879592895508, -3.0334951877593994, -2.761110782623291, -2.4887266159057617, -2.2163422107696533, -1.943957805633545, -1.6715734004974365, -1.3991891145706177, -1.1268048286437988, -0.8544204235076904, -0.582036018371582, -0.3096517324447632, -0.037267446517944336, 0.23511791229248047, 0.5075022578239441, 0.7798866033554077, 1.0522708892822266, 1.324655294418335, 1.5970396995544434, 1.8694239854812622, 2.141808271408081, 2.4141926765441895, 2.686577081680298, 2.9589614868164062, 3.2313456535339355, 3.503730058670044, 3.7761144638061523, 4.048498630523682, 4.320882797241211, 4.593267440795898, 4.865651607513428, 5.138036251068115, 5.4104204177856445, 5.682805061340332, 5.955189228057861, 6.227573394775391, 6.499958038330078, 6.772342205047607, 7.044726371765137, 7.317111015319824, 7.5894951820373535, 7.861879348754883, 8.13426399230957, 8.406648635864258, 8.679032325744629, 8.951416969299316]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 10.0, 10.0, 8.0, 19.0, 33.0, 27.0, 58.0, 90.0, 160.0, 292.0, 387.0, 674.0, 1013.0, 1533.0, 2482.0, 3864.0, 5978.0, 9289.0, 13983.0, 21022.0, 30272.0, 42071.0, 56611.0, 72199.0, 87091.0, 98887.0, 103776.0, 101620.0, 93180.0, 79233.0, 63589.0, 49227.0, 35605.0, 25164.0, 17087.0, 11435.0, 7506.0, 4782.0, 2999.0, 1976.0, 1183.0, 778.0, 490.0, 339.0, 203.0, 127.0, 83.0, 48.0, 22.0, 19.0, 14.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.69140625, -5.5120849609375, -5.332763671875, -5.1534423828125, -4.97412109375, -4.7947998046875, -4.615478515625, -4.4361572265625, -4.2568359375, -4.0775146484375, -3.898193359375, -3.7188720703125, -3.53955078125, -3.3602294921875, -3.180908203125, -3.0015869140625, -2.822265625, -2.6429443359375, -2.463623046875, -2.2843017578125, -2.10498046875, -1.9256591796875, -1.746337890625, -1.5670166015625, -1.3876953125, -1.2083740234375, -1.029052734375, -0.8497314453125, -0.67041015625, -0.4910888671875, -0.311767578125, -0.1324462890625, 0.046875, 0.2261962890625, 0.405517578125, 0.5848388671875, 0.76416015625, 0.9434814453125, 1.122802734375, 1.3021240234375, 1.4814453125, 1.6607666015625, 1.840087890625, 2.0194091796875, 2.19873046875, 2.3780517578125, 2.557373046875, 2.7366943359375, 2.916015625, 3.0953369140625, 3.274658203125, 3.4539794921875, 3.63330078125, 3.8126220703125, 3.991943359375, 4.1712646484375, 4.3505859375, 4.5299072265625, 4.709228515625, 4.8885498046875, 5.06787109375, 5.2471923828125, 5.426513671875, 5.6058349609375, 5.78515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 5.0, 7.0, 9.0, 10.0, 11.0, 13.0, 14.0, 20.0, 23.0, 24.0, 21.0, 30.0, 36.0, 26.0, 41.0, 46.0, 37.0, 34.0, 38.0, 51.0, 37.0, 43.0, 28.0, 37.0, 37.0, 33.0, 39.0, 32.0, 21.0, 35.0, 20.0, 18.0, 16.0, 11.0, 15.0, 16.0, 12.0, 8.0, 9.0, 7.0, 11.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.94140625, -7.66888427734375, -7.3963623046875, -7.12384033203125, -6.851318359375, -6.57879638671875, -6.3062744140625, -6.03375244140625, -5.76123046875, -5.48870849609375, -5.2161865234375, -4.94366455078125, -4.671142578125, -4.39862060546875, -4.1260986328125, -3.85357666015625, -3.5810546875, -3.30853271484375, -3.0360107421875, -2.76348876953125, -2.490966796875, -2.21844482421875, -1.9459228515625, -1.67340087890625, -1.40087890625, -1.12835693359375, -0.8558349609375, -0.58331298828125, -0.310791015625, -0.03826904296875, 0.2342529296875, 0.50677490234375, 0.779296875, 1.05181884765625, 1.3243408203125, 1.59686279296875, 1.869384765625, 2.14190673828125, 2.4144287109375, 2.68695068359375, 2.95947265625, 3.23199462890625, 3.5045166015625, 3.77703857421875, 4.049560546875, 4.32208251953125, 4.5946044921875, 4.86712646484375, 5.1396484375, 5.41217041015625, 5.6846923828125, 5.95721435546875, 6.229736328125, 6.50225830078125, 6.7747802734375, 7.04730224609375, 7.31982421875, 7.59234619140625, 7.8648681640625, 8.13739013671875, 8.409912109375, 8.68243408203125, 8.9549560546875, 9.22747802734375, 9.5]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 2.0, 6.0, 7.0, 14.0, 13.0, 11.0, 24.0, 47.0, 62.0, 93.0, 163.0, 237.0, 389.0, 590.0, 945.0, 1352.0, 2270.0, 3551.0, 5654.0, 8669.0, 13880.0, 21277.0, 31914.0, 47059.0, 65105.0, 85776.0, 104407.0, 117573.0, 118386.0, 108550.0, 90340.0, 69836.0, 50495.0, 35048.0, 23183.0, 15116.0, 9537.0, 6063.0, 3982.0, 2485.0, 1575.0, 1054.0, 649.0, 391.0, 256.0, 155.0, 122.0, 88.0, 62.0, 32.0, 17.0, 19.0, 6.0, 11.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.5, -7.26641845703125, -7.0328369140625, -6.79925537109375, -6.565673828125, -6.33209228515625, -6.0985107421875, -5.86492919921875, -5.63134765625, -5.39776611328125, -5.1641845703125, -4.93060302734375, -4.697021484375, -4.46343994140625, -4.2298583984375, -3.99627685546875, -3.7626953125, -3.52911376953125, -3.2955322265625, -3.06195068359375, -2.828369140625, -2.59478759765625, -2.3612060546875, -2.12762451171875, -1.89404296875, -1.66046142578125, -1.4268798828125, -1.19329833984375, -0.959716796875, -0.72613525390625, -0.4925537109375, -0.25897216796875, -0.025390625, 0.20819091796875, 0.4417724609375, 0.67535400390625, 0.908935546875, 1.14251708984375, 1.3760986328125, 1.60968017578125, 1.84326171875, 2.07684326171875, 2.3104248046875, 2.54400634765625, 2.777587890625, 3.01116943359375, 3.2447509765625, 3.47833251953125, 3.7119140625, 3.94549560546875, 4.1790771484375, 4.41265869140625, 4.646240234375, 4.87982177734375, 5.1134033203125, 5.34698486328125, 5.58056640625, 5.81414794921875, 6.0477294921875, 6.28131103515625, 6.514892578125, 6.74847412109375, 6.9820556640625, 7.21563720703125, 7.44921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 10.0, 7.0, 6.0, 5.0, 15.0, 13.0, 17.0, 22.0, 20.0, 25.0, 34.0, 35.0, 23.0, 32.0, 39.0, 43.0, 46.0, 41.0, 38.0, 47.0, 43.0, 44.0, 38.0, 40.0, 46.0, 40.0, 26.0, 23.0, 28.0, 22.0, 26.0, 24.0, 17.0, 8.0, 12.0, 13.0, 7.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.66796875, -6.47869873046875, -6.2894287109375, -6.10015869140625, -5.910888671875, -5.72161865234375, -5.5323486328125, -5.34307861328125, -5.15380859375, -4.96453857421875, -4.7752685546875, -4.58599853515625, -4.396728515625, -4.20745849609375, -4.0181884765625, -3.82891845703125, -3.6396484375, -3.45037841796875, -3.2611083984375, -3.07183837890625, -2.882568359375, -2.69329833984375, -2.5040283203125, -2.31475830078125, -2.12548828125, -1.93621826171875, -1.7469482421875, -1.55767822265625, -1.368408203125, -1.17913818359375, -0.9898681640625, -0.80059814453125, -0.611328125, -0.42205810546875, -0.2327880859375, -0.04351806640625, 0.145751953125, 0.33502197265625, 0.5242919921875, 0.71356201171875, 0.90283203125, 1.09210205078125, 1.2813720703125, 1.47064208984375, 1.659912109375, 1.84918212890625, 2.0384521484375, 2.22772216796875, 2.4169921875, 2.60626220703125, 2.7955322265625, 2.98480224609375, 3.174072265625, 3.36334228515625, 3.5526123046875, 3.74188232421875, 3.93115234375, 4.12042236328125, 4.3096923828125, 4.49896240234375, 4.688232421875, 4.87750244140625, 5.0667724609375, 5.25604248046875, 5.4453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 6.0, 12.0, 17.0, 34.0, 45.0, 85.0, 110.0, 182.0, 238.0, 424.0, 742.0, 1311.0, 2504.0, 5236.0, 11836.0, 27301.0, 64546.0, 147091.0, 256436.0, 259241.0, 151662.0, 67680.0, 28141.0, 12269.0, 5642.0, 2563.0, 1349.0, 743.0, 426.0, 259.0, 142.0, 98.0, 50.0, 40.0, 33.0, 20.0, 12.0, 7.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.396728515625, -6.16845703125, -5.940185546875, -5.7119140625, -5.483642578125, -5.25537109375, -5.027099609375, -4.798828125, -4.570556640625, -4.34228515625, -4.114013671875, -3.8857421875, -3.657470703125, -3.42919921875, -3.200927734375, -2.97265625, -2.744384765625, -2.51611328125, -2.287841796875, -2.0595703125, -1.831298828125, -1.60302734375, -1.374755859375, -1.146484375, -0.918212890625, -0.68994140625, -0.461669921875, -0.2333984375, -0.005126953125, 0.22314453125, 0.451416015625, 0.6796875, 0.907958984375, 1.13623046875, 1.364501953125, 1.5927734375, 1.821044921875, 2.04931640625, 2.277587890625, 2.505859375, 2.734130859375, 2.96240234375, 3.190673828125, 3.4189453125, 3.647216796875, 3.87548828125, 4.103759765625, 4.33203125, 4.560302734375, 4.78857421875, 5.016845703125, 5.2451171875, 5.473388671875, 5.70166015625, 5.929931640625, 6.158203125, 6.386474609375, 6.61474609375, 6.843017578125, 7.0712890625, 7.299560546875, 7.52783203125, 7.756103515625, 7.984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 7.0, 6.0, 5.0, 9.0, 10.0, 18.0, 10.0, 18.0, 30.0, 38.0, 37.0, 53.0, 72.0, 71.0, 66.0, 58.0, 92.0, 71.0, 63.0, 49.0, 51.0, 35.0, 33.0, 17.0, 21.0, 15.0, 12.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007166862487792969, -0.0006987117230892181, -0.0006807371973991394, -0.0006627626717090607, -0.0006447881460189819, -0.0006268136203289032, -0.0006088390946388245, -0.0005908645689487457, -0.000572890043258667, -0.0005549155175685883, -0.0005369409918785095, -0.0005189664661884308, -0.000500991940498352, -0.0004830174148082733, -0.0004650428891181946, -0.00044706836342811584, -0.0004290938377380371, -0.0004111193120479584, -0.00039314478635787964, -0.0003751702606678009, -0.00035719573497772217, -0.00033922120928764343, -0.0003212466835975647, -0.00030327215790748596, -0.0002852976322174072, -0.0002673231065273285, -0.00024934858083724976, -0.00023137405514717102, -0.00021339952945709229, -0.00019542500376701355, -0.00017745047807693481, -0.00015947595238685608, -0.00014150142669677734, -0.0001235269010066986, -0.00010555237531661987, -8.757784962654114e-05, -6.96033239364624e-05, -5.162879824638367e-05, -3.365427255630493e-05, -1.5679746866226196e-05, 2.294778823852539e-06, 2.0269304513931274e-05, 3.824383020401001e-05, 5.6218355894088745e-05, 7.419288158416748e-05, 9.216740727424622e-05, 0.00011014193296432495, 0.0001281164586544037, 0.00014609098434448242, 0.00016406551003456116, 0.0001820400357246399, 0.00020001456141471863, 0.00021798908710479736, 0.0002359636127948761, 0.00025393813848495483, 0.00027191266417503357, 0.0002898871898651123, 0.00030786171555519104, 0.0003258362412452698, 0.0003438107669353485, 0.00036178529262542725, 0.000379759818315506, 0.0003977343440055847, 0.00041570886969566345, 0.0004336833953857422]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 5.0, 7.0, 9.0, 13.0, 17.0, 24.0, 32.0, 59.0, 67.0, 95.0, 173.0, 245.0, 387.0, 624.0, 982.0, 1586.0, 2682.0, 4510.0, 7642.0, 12870.0, 21683.0, 36499.0, 59142.0, 89637.0, 123755.0, 148936.0, 150822.0, 128993.0, 95706.0, 63218.0, 39258.0, 23831.0, 14085.0, 8367.0, 5037.0, 2923.0, 1764.0, 1057.0, 605.0, 432.0, 259.0, 158.0, 115.0, 78.0, 44.0, 45.0, 26.0, 15.0, 17.0, 9.0, 6.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.61328125, -3.4931640625, -3.373046875, -3.2529296875, -3.1328125, -3.0126953125, -2.892578125, -2.7724609375, -2.65234375, -2.5322265625, -2.412109375, -2.2919921875, -2.171875, -2.0517578125, -1.931640625, -1.8115234375, -1.69140625, -1.5712890625, -1.451171875, -1.3310546875, -1.2109375, -1.0908203125, -0.970703125, -0.8505859375, -0.73046875, -0.6103515625, -0.490234375, -0.3701171875, -0.25, -0.1298828125, -0.009765625, 0.1103515625, 0.23046875, 0.3505859375, 0.470703125, 0.5908203125, 0.7109375, 0.8310546875, 0.951171875, 1.0712890625, 1.19140625, 1.3115234375, 1.431640625, 1.5517578125, 1.671875, 1.7919921875, 1.912109375, 2.0322265625, 2.15234375, 2.2724609375, 2.392578125, 2.5126953125, 2.6328125, 2.7529296875, 2.873046875, 2.9931640625, 3.11328125, 3.2333984375, 3.353515625, 3.4736328125, 3.59375, 3.7138671875, 3.833984375, 3.9541015625, 4.07421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 5.0, 3.0, 6.0, 8.0, 6.0, 6.0, 7.0, 9.0, 13.0, 11.0, 22.0, 25.0, 36.0, 30.0, 36.0, 49.0, 41.0, 33.0, 43.0, 50.0, 54.0, 55.0, 43.0, 59.0, 35.0, 44.0, 42.0, 29.0, 33.0, 36.0, 19.0, 14.0, 26.0, 13.0, 17.0, 14.0, 14.0, 5.0, 7.0, 2.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5087890625, -1.46331787109375, -1.4178466796875, -1.37237548828125, -1.326904296875, -1.28143310546875, -1.2359619140625, -1.19049072265625, -1.14501953125, -1.09954833984375, -1.0540771484375, -1.00860595703125, -0.963134765625, -0.91766357421875, -0.8721923828125, -0.82672119140625, -0.78125, -0.73577880859375, -0.6903076171875, -0.64483642578125, -0.599365234375, -0.55389404296875, -0.5084228515625, -0.46295166015625, -0.41748046875, -0.37200927734375, -0.3265380859375, -0.28106689453125, -0.235595703125, -0.19012451171875, -0.1446533203125, -0.09918212890625, -0.0537109375, -0.00823974609375, 0.0372314453125, 0.08270263671875, 0.128173828125, 0.17364501953125, 0.2191162109375, 0.26458740234375, 0.31005859375, 0.35552978515625, 0.4010009765625, 0.44647216796875, 0.491943359375, 0.53741455078125, 0.5828857421875, 0.62835693359375, 0.673828125, 0.71929931640625, 0.7647705078125, 0.81024169921875, 0.855712890625, 0.90118408203125, 0.9466552734375, 0.99212646484375, 1.03759765625, 1.08306884765625, 1.1285400390625, 1.17401123046875, 1.219482421875, 1.26495361328125, 1.3104248046875, 1.35589599609375, 1.4013671875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 2.0, 7.0, 7.0, 11.0, 13.0, 14.0, 23.0, 24.0, 39.0, 29.0, 28.0, 39.0, 29.0, 41.0, 37.0, 55.0, 43.0, 39.0, 47.0, 48.0, 51.0, 46.0, 49.0, 34.0, 31.0, 24.0, 37.0, 35.0, 24.0, 23.0, 17.0, 18.0, 10.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9841890335083, -9.684004783630371, -9.383820533752441, -9.083636283874512, -8.783452033996582, -8.483267784118652, -8.183083534240723, -7.882899284362793, -7.582715034484863, -7.282530784606934, -6.982346534729004, -6.682162284851074, -6.3819780349731445, -6.081793785095215, -5.781609535217285, -5.4814252853393555, -5.181241035461426, -4.881056785583496, -4.580872535705566, -4.280688285827637, -3.980504035949707, -3.6803197860717773, -3.3801355361938477, -3.079951286315918, -2.7797670364379883, -2.4795827865600586, -2.179398536682129, -1.8792142868041992, -1.5790300369262695, -1.2788457870483398, -0.9786615371704102, -0.6784772872924805, -0.3782920837402344, -0.07810783386230469, 0.222076416015625, 0.5222606658935547, 0.8224449157714844, 1.122629165649414, 1.4228134155273438, 1.7229976654052734, 2.023181915283203, 2.323366165161133, 2.6235504150390625, 2.923734664916992, 3.223918914794922, 3.5241031646728516, 3.8242874145507812, 4.124471664428711, 4.424655914306641, 4.72484016418457, 5.0250244140625, 5.32520866394043, 5.625392913818359, 5.925577163696289, 6.225761413574219, 6.525945663452148, 6.826129913330078, 7.126314163208008, 7.4264984130859375, 7.726682662963867, 8.026866912841797, 8.327051162719727, 8.627235412597656, 8.927419662475586, 9.227603912353516]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 6.0, 8.0, 2.0, 11.0, 9.0, 12.0, 19.0, 16.0, 20.0, 24.0, 24.0, 22.0, 17.0, 30.0, 37.0, 33.0, 47.0, 42.0, 46.0, 44.0, 60.0, 47.0, 37.0, 43.0, 43.0, 33.0, 33.0, 28.0, 34.0, 24.0, 16.0, 21.0, 14.0, 27.0, 14.0, 13.0, 4.0, 11.0, 3.0, 9.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-10.024230003356934, -9.72581672668457, -9.427403450012207, -9.128990173339844, -8.830577850341797, -8.532164573669434, -8.23375129699707, -7.935338020324707, -7.636924743652344, -7.3385114669799805, -7.040098190307617, -6.741685390472412, -6.443272113800049, -6.1448588371276855, -5.8464460372924805, -5.548032760620117, -5.249619483947754, -4.951206207275391, -4.652792930603027, -4.354380130767822, -4.055966854095459, -3.7575535774230957, -3.4591405391693115, -3.1607275009155273, -2.862314224243164, -2.563900947570801, -2.2654879093170166, -1.9670747518539429, -1.6686615943908691, -1.3702484369277954, -1.0718352794647217, -0.7734222412109375, -0.4750089645385742, -0.1765958070755005, 0.12181735038757324, 0.420230507850647, 0.7186436653137207, 1.0170568227767944, 1.3154699802398682, 1.6138830184936523, 1.9122962951660156, 2.210709571838379, 2.509122610092163, 2.8075356483459473, 3.1059489250183105, 3.404362201690674, 3.702775239944458, 4.001188278198242, 4.2996015548706055, 4.598014831542969, 4.896428108215332, 5.194840908050537, 5.4932541847229, 5.791667461395264, 6.090080261230469, 6.388493537902832, 6.686906814575195, 6.985320091247559, 7.283733367919922, 7.582146167755127, 7.88055944442749, 8.178972244262695, 8.477385520935059, 8.775798797607422, 9.074212074279785]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 5.0, 10.0, 9.0, 24.0, 32.0, 45.0, 69.0, 108.0, 175.0, 240.0, 361.0, 588.0, 929.0, 1488.0, 2551.0, 4214.0, 7203.0, 12558.0, 23039.0, 42249.0, 81253.0, 158347.0, 296042.0, 500579.0, 706730.0, 777540.0, 646604.0, 425265.0, 239672.0, 124185.0, 63907.0, 33719.0, 18304.0, 10355.0, 6051.0, 3538.0, 2251.0, 1428.0, 920.0, 578.0, 373.0, 250.0, 164.0, 117.0, 64.0, 52.0, 42.0, 26.0, 7.0, 11.0, 9.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.8984375, -6.6632080078125, -6.427978515625, -6.1927490234375, -5.95751953125, -5.7222900390625, -5.487060546875, -5.2518310546875, -5.0166015625, -4.7813720703125, -4.546142578125, -4.3109130859375, -4.07568359375, -3.8404541015625, -3.605224609375, -3.3699951171875, -3.134765625, -2.8995361328125, -2.664306640625, -2.4290771484375, -2.19384765625, -1.9586181640625, -1.723388671875, -1.4881591796875, -1.2529296875, -1.0177001953125, -0.782470703125, -0.5472412109375, -0.31201171875, -0.0767822265625, 0.158447265625, 0.3936767578125, 0.62890625, 0.8641357421875, 1.099365234375, 1.3345947265625, 1.56982421875, 1.8050537109375, 2.040283203125, 2.2755126953125, 2.5107421875, 2.7459716796875, 2.981201171875, 3.2164306640625, 3.45166015625, 3.6868896484375, 3.922119140625, 4.1573486328125, 4.392578125, 4.6278076171875, 4.863037109375, 5.0982666015625, 5.33349609375, 5.5687255859375, 5.803955078125, 6.0391845703125, 6.2744140625, 6.5096435546875, 6.744873046875, 6.9801025390625, 7.21533203125, 7.4505615234375, 7.685791015625, 7.9210205078125, 8.15625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 11.0, 8.0, 8.0, 10.0, 17.0, 12.0, 17.0, 26.0, 28.0, 25.0, 24.0, 45.0, 23.0, 26.0, 43.0, 39.0, 49.0, 34.0, 53.0, 48.0, 44.0, 37.0, 30.0, 36.0, 32.0, 28.0, 25.0, 24.0, 20.0, 28.0, 13.0, 22.0, 13.0, 14.0, 12.0, 14.0, 10.0, 6.0, 8.0, 4.0, 8.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.30859375, -7.07366943359375, -6.8387451171875, -6.60382080078125, -6.368896484375, -6.13397216796875, -5.8990478515625, -5.66412353515625, -5.42919921875, -5.19427490234375, -4.9593505859375, -4.72442626953125, -4.489501953125, -4.25457763671875, -4.0196533203125, -3.78472900390625, -3.5498046875, -3.31488037109375, -3.0799560546875, -2.84503173828125, -2.610107421875, -2.37518310546875, -2.1402587890625, -1.90533447265625, -1.67041015625, -1.43548583984375, -1.2005615234375, -0.96563720703125, -0.730712890625, -0.49578857421875, -0.2608642578125, -0.02593994140625, 0.208984375, 0.44390869140625, 0.6788330078125, 0.91375732421875, 1.148681640625, 1.38360595703125, 1.6185302734375, 1.85345458984375, 2.08837890625, 2.32330322265625, 2.5582275390625, 2.79315185546875, 3.028076171875, 3.26300048828125, 3.4979248046875, 3.73284912109375, 3.9677734375, 4.20269775390625, 4.4376220703125, 4.67254638671875, 4.907470703125, 5.14239501953125, 5.3773193359375, 5.61224365234375, 5.84716796875, 6.08209228515625, 6.3170166015625, 6.55194091796875, 6.786865234375, 7.02178955078125, 7.2567138671875, 7.49163818359375, 7.7265625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 7.0, 9.0, 7.0, 14.0, 21.0, 44.0, 73.0, 109.0, 205.0, 378.0, 706.0, 1263.0, 2483.0, 5185.0, 10495.0, 22134.0, 47528.0, 105777.0, 228428.0, 466077.0, 796516.0, 964696.0, 745532.0, 419802.0, 203208.0, 93204.0, 42129.0, 19512.0, 9340.0, 4539.0, 2326.0, 1151.0, 636.0, 297.0, 188.0, 96.0, 62.0, 39.0, 14.0, 16.0, 9.0, 9.0, 4.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.1640625, -11.8106689453125, -11.457275390625, -11.1038818359375, -10.75048828125, -10.3970947265625, -10.043701171875, -9.6903076171875, -9.3369140625, -8.9835205078125, -8.630126953125, -8.2767333984375, -7.92333984375, -7.5699462890625, -7.216552734375, -6.8631591796875, -6.509765625, -6.1563720703125, -5.802978515625, -5.4495849609375, -5.09619140625, -4.7427978515625, -4.389404296875, -4.0360107421875, -3.6826171875, -3.3292236328125, -2.975830078125, -2.6224365234375, -2.26904296875, -1.9156494140625, -1.562255859375, -1.2088623046875, -0.85546875, -0.5020751953125, -0.148681640625, 0.2047119140625, 0.55810546875, 0.9114990234375, 1.264892578125, 1.6182861328125, 1.9716796875, 2.3250732421875, 2.678466796875, 3.0318603515625, 3.38525390625, 3.7386474609375, 4.092041015625, 4.4454345703125, 4.798828125, 5.1522216796875, 5.505615234375, 5.8590087890625, 6.21240234375, 6.5657958984375, 6.919189453125, 7.2725830078125, 7.6259765625, 7.9793701171875, 8.332763671875, 8.6861572265625, 9.03955078125, 9.3929443359375, 9.746337890625, 10.0997314453125, 10.453125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 9.0, 11.0, 22.0, 21.0, 38.0, 61.0, 63.0, 73.0, 122.0, 141.0, 195.0, 215.0, 246.0, 241.0, 273.0, 309.0, 294.0, 282.0, 253.0, 231.0, 212.0, 157.0, 134.0, 116.0, 100.0, 65.0, 49.0, 36.0, 27.0, 25.0, 17.0, 8.0, 10.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.275390625, -3.145111083984375, -3.01483154296875, -2.884552001953125, -2.7542724609375, -2.623992919921875, -2.49371337890625, -2.363433837890625, -2.233154296875, -2.102874755859375, -1.97259521484375, -1.842315673828125, -1.7120361328125, -1.581756591796875, -1.45147705078125, -1.321197509765625, -1.19091796875, -1.060638427734375, -0.93035888671875, -0.800079345703125, -0.6697998046875, -0.539520263671875, -0.40924072265625, -0.278961181640625, -0.148681640625, -0.018402099609375, 0.11187744140625, 0.242156982421875, 0.3724365234375, 0.502716064453125, 0.63299560546875, 0.763275146484375, 0.8935546875, 1.023834228515625, 1.15411376953125, 1.284393310546875, 1.4146728515625, 1.544952392578125, 1.67523193359375, 1.805511474609375, 1.935791015625, 2.066070556640625, 2.19635009765625, 2.326629638671875, 2.4569091796875, 2.587188720703125, 2.71746826171875, 2.847747802734375, 2.97802734375, 3.108306884765625, 3.23858642578125, 3.368865966796875, 3.4991455078125, 3.629425048828125, 3.75970458984375, 3.889984130859375, 4.020263671875, 4.150543212890625, 4.28082275390625, 4.411102294921875, 4.5413818359375, 4.671661376953125, 4.80194091796875, 4.932220458984375, 5.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 4.0, 5.0, 4.0, 9.0, 8.0, 10.0, 16.0, 17.0, 23.0, 19.0, 35.0, 29.0, 36.0, 29.0, 53.0, 48.0, 41.0, 48.0, 49.0, 60.0, 37.0, 50.0, 49.0, 33.0, 43.0, 41.0, 30.0, 25.0, 27.0, 30.0, 23.0, 15.0, 11.0, 13.0, 6.0, 8.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.987895011901855, -10.695504188537598, -10.40311336517334, -10.110722541809082, -9.818330764770508, -9.52593994140625, -9.233549118041992, -8.941158294677734, -8.648767471313477, -8.356376647949219, -8.063985824584961, -7.771594524383545, -7.479203701019287, -7.186812877655029, -6.894421577453613, -6.6020307540893555, -6.309639930725098, -6.01724910736084, -5.724858283996582, -5.432466983795166, -5.140076160430908, -4.84768533706665, -4.555294036865234, -4.262903213500977, -3.9705123901367188, -3.678121566772461, -3.385730504989624, -3.093339443206787, -2.8009486198425293, -2.5085577964782715, -2.2161667346954346, -1.9237756729125977, -1.6313858032226562, -1.3389948606491089, -1.0466039180755615, -0.7542129755020142, -0.4618220329284668, -0.16943109035491943, 0.12295985221862793, 0.41535091400146484, 0.7077417373657227, 1.00013267993927, 1.2925236225128174, 1.5849145650863647, 1.877305507659912, 2.16969633102417, 2.462087392807007, 2.7544784545898438, 3.0468692779541016, 3.3392601013183594, 3.6316511631011963, 3.924042224884033, 4.216433048248291, 4.508823871612549, 4.801215171813965, 5.093605995178223, 5.3859968185424805, 5.678387641906738, 5.970778465270996, 6.263169765472412, 6.55556058883667, 6.847951412200928, 7.140342712402344, 7.432733535766602, 7.725124359130859]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 5.0, 15.0, 15.0, 11.0, 14.0, 18.0, 17.0, 13.0, 31.0, 36.0, 29.0, 27.0, 34.0, 42.0, 36.0, 34.0, 48.0, 43.0, 39.0, 45.0, 42.0, 35.0, 35.0, 40.0, 33.0, 28.0, 33.0, 23.0, 26.0, 18.0, 23.0, 23.0, 7.0, 7.0, 13.0, 11.0, 6.0, 5.0, 8.0, 2.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.461244583129883, -8.19428539276123, -7.927326679229736, -7.660367488861084, -7.39340877532959, -7.1264495849609375, -6.859490394592285, -6.592531204223633, -6.325572490692139, -6.058613300323486, -5.791654586791992, -5.52469539642334, -5.2577362060546875, -4.990777492523193, -4.723818302154541, -4.456859588623047, -4.1899003982543945, -3.9229414463043213, -3.655982494354248, -3.3890233039855957, -3.1220643520355225, -2.855105400085449, -2.588146209716797, -2.3211872577667236, -2.0542283058166504, -1.7872693538665771, -1.5203102827072144, -1.2533512115478516, -0.9863922595977783, -0.7194333076477051, -0.4524742364883423, -0.1855151653289795, 0.08144283294677734, 0.34840184450149536, 0.6153608560562134, 0.8823198676109314, 1.1492788791656494, 1.4162378311157227, 1.6831969022750854, 1.9501559734344482, 2.2171149253845215, 2.4840738773345947, 2.751032829284668, 3.0179920196533203, 3.2849509716033936, 3.551909923553467, 3.818869113922119, 4.085827827453613, 4.352787017822266, 4.619746208190918, 4.886704921722412, 5.1536641120910645, 5.420622825622559, 5.687582015991211, 5.954541206359863, 6.221500396728516, 6.48845911026001, 6.755418300628662, 7.022377014160156, 7.289336204528809, 7.556295394897461, 7.823254108428955, 8.09021282196045, 8.357172012329102, 8.624131202697754]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 16.0, 16.0, 19.0, 38.0, 43.0, 78.0, 109.0, 133.0, 211.0, 361.0, 512.0, 860.0, 1316.0, 2132.0, 3688.0, 6490.0, 11284.0, 19561.0, 35628.0, 61382.0, 100475.0, 146257.0, 175593.0, 165949.0, 125395.0, 80267.0, 47519.0, 26952.0, 15135.0, 8614.0, 4849.0, 2961.0, 1691.0, 1030.0, 670.0, 438.0, 281.0, 184.0, 146.0, 78.0, 53.0, 38.0, 31.0, 22.0, 4.0, 12.0, 11.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0], "bins": [-3.666015625, -3.55743408203125, -3.4488525390625, -3.34027099609375, -3.231689453125, -3.12310791015625, -3.0145263671875, -2.90594482421875, -2.79736328125, -2.68878173828125, -2.5802001953125, -2.47161865234375, -2.363037109375, -2.25445556640625, -2.1458740234375, -2.03729248046875, -1.9287109375, -1.82012939453125, -1.7115478515625, -1.60296630859375, -1.494384765625, -1.38580322265625, -1.2772216796875, -1.16864013671875, -1.06005859375, -0.95147705078125, -0.8428955078125, -0.73431396484375, -0.625732421875, -0.51715087890625, -0.4085693359375, -0.29998779296875, -0.19140625, -0.08282470703125, 0.0257568359375, 0.13433837890625, 0.242919921875, 0.35150146484375, 0.4600830078125, 0.56866455078125, 0.67724609375, 0.78582763671875, 0.8944091796875, 1.00299072265625, 1.111572265625, 1.22015380859375, 1.3287353515625, 1.43731689453125, 1.5458984375, 1.65447998046875, 1.7630615234375, 1.87164306640625, 1.980224609375, 2.08880615234375, 2.1973876953125, 2.30596923828125, 2.41455078125, 2.52313232421875, 2.6317138671875, 2.74029541015625, 2.848876953125, 2.95745849609375, 3.0660400390625, 3.17462158203125, 3.283203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 12.0, 10.0, 8.0, 14.0, 12.0, 21.0, 18.0, 23.0, 28.0, 20.0, 30.0, 22.0, 33.0, 35.0, 40.0, 41.0, 37.0, 44.0, 51.0, 50.0, 43.0, 43.0, 37.0, 32.0, 35.0, 33.0, 23.0, 31.0, 23.0, 26.0, 21.0, 12.0, 10.0, 20.0, 8.0, 10.0, 5.0, 9.0, 4.0, 6.0, 4.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8984375, -8.620361328125, -8.34228515625, -8.064208984375, -7.7861328125, -7.508056640625, -7.22998046875, -6.951904296875, -6.673828125, -6.395751953125, -6.11767578125, -5.839599609375, -5.5615234375, -5.283447265625, -5.00537109375, -4.727294921875, -4.44921875, -4.171142578125, -3.89306640625, -3.614990234375, -3.3369140625, -3.058837890625, -2.78076171875, -2.502685546875, -2.224609375, -1.946533203125, -1.66845703125, -1.390380859375, -1.1123046875, -0.834228515625, -0.55615234375, -0.278076171875, 0.0, 0.278076171875, 0.55615234375, 0.834228515625, 1.1123046875, 1.390380859375, 1.66845703125, 1.946533203125, 2.224609375, 2.502685546875, 2.78076171875, 3.058837890625, 3.3369140625, 3.614990234375, 3.89306640625, 4.171142578125, 4.44921875, 4.727294921875, 5.00537109375, 5.283447265625, 5.5615234375, 5.839599609375, 6.11767578125, 6.395751953125, 6.673828125, 6.951904296875, 7.22998046875, 7.508056640625, 7.7861328125, 8.064208984375, 8.34228515625, 8.620361328125, 8.8984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 6.0, 7.0, 12.0, 17.0, 24.0, 39.0, 47.0, 43.0, 71.0, 94.0, 140.0, 251.0, 450.0, 775.0, 1450.0, 2885.0, 6081.0, 13409.0, 29158.0, 205434.0, 716878.0, 38554.0, 16865.0, 7928.0, 3691.0, 1829.0, 965.0, 518.0, 284.0, 191.0, 122.0, 94.0, 61.0, 51.0, 38.0, 27.0, 22.0, 15.0, 11.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0, -10.63525390625, -10.2705078125, -9.90576171875, -9.541015625, -9.17626953125, -8.8115234375, -8.44677734375, -8.08203125, -7.71728515625, -7.3525390625, -6.98779296875, -6.623046875, -6.25830078125, -5.8935546875, -5.52880859375, -5.1640625, -4.79931640625, -4.4345703125, -4.06982421875, -3.705078125, -3.34033203125, -2.9755859375, -2.61083984375, -2.24609375, -1.88134765625, -1.5166015625, -1.15185546875, -0.787109375, -0.42236328125, -0.0576171875, 0.30712890625, 0.671875, 1.03662109375, 1.4013671875, 1.76611328125, 2.130859375, 2.49560546875, 2.8603515625, 3.22509765625, 3.58984375, 3.95458984375, 4.3193359375, 4.68408203125, 5.048828125, 5.41357421875, 5.7783203125, 6.14306640625, 6.5078125, 6.87255859375, 7.2373046875, 7.60205078125, 7.966796875, 8.33154296875, 8.6962890625, 9.06103515625, 9.42578125, 9.79052734375, 10.1552734375, 10.52001953125, 10.884765625, 11.24951171875, 11.6142578125, 11.97900390625, 12.34375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 17.0, 10.0, 10.0, 15.0, 17.0, 17.0, 19.0, 18.0, 27.0, 36.0, 26.0, 38.0, 28.0, 40.0, 41.0, 36.0, 40.0, 33.0, 46.0, 42.0, 37.0, 37.0, 32.0, 32.0, 43.0, 36.0, 33.0, 26.0, 34.0, 16.0, 15.0, 17.0, 11.0, 16.0, 15.0, 7.0, 3.0, 9.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.80078125, -6.5823974609375, -6.364013671875, -6.1456298828125, -5.92724609375, -5.7088623046875, -5.490478515625, -5.2720947265625, -5.0537109375, -4.8353271484375, -4.616943359375, -4.3985595703125, -4.18017578125, -3.9617919921875, -3.743408203125, -3.5250244140625, -3.306640625, -3.0882568359375, -2.869873046875, -2.6514892578125, -2.43310546875, -2.2147216796875, -1.996337890625, -1.7779541015625, -1.5595703125, -1.3411865234375, -1.122802734375, -0.9044189453125, -0.68603515625, -0.4676513671875, -0.249267578125, -0.0308837890625, 0.1875, 0.4058837890625, 0.624267578125, 0.8426513671875, 1.06103515625, 1.2794189453125, 1.497802734375, 1.7161865234375, 1.9345703125, 2.1529541015625, 2.371337890625, 2.5897216796875, 2.80810546875, 3.0264892578125, 3.244873046875, 3.4632568359375, 3.681640625, 3.9000244140625, 4.118408203125, 4.3367919921875, 4.55517578125, 4.7735595703125, 4.991943359375, 5.2103271484375, 5.4287109375, 5.6470947265625, 5.865478515625, 6.0838623046875, 6.30224609375, 6.5206298828125, 6.739013671875, 6.9573974609375, 7.17578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 14.0, 11.0, 23.0, 17.0, 37.0, 64.0, 79.0, 81.0, 150.0, 271.0, 389.0, 538.0, 880.0, 1457.0, 2578.0, 4372.0, 8506.0, 17109.0, 44655.0, 678726.0, 228852.0, 30268.0, 13432.0, 6729.0, 3696.0, 2050.0, 1213.0, 764.0, 486.0, 322.0, 250.0, 160.0, 102.0, 86.0, 54.0, 37.0, 23.0, 15.0, 8.0, 11.0, 12.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.10546875, -1.0727920532226562, -1.0401153564453125, -1.0074386596679688, -0.974761962890625, -0.9420852661132812, -0.9094085693359375, -0.8767318725585938, -0.84405517578125, -0.8113784790039062, -0.7787017822265625, -0.7460250854492188, -0.713348388671875, -0.6806716918945312, -0.6479949951171875, -0.6153182983398438, -0.5826416015625, -0.5499649047851562, -0.5172882080078125, -0.48461151123046875, -0.451934814453125, -0.41925811767578125, -0.3865814208984375, -0.35390472412109375, -0.32122802734375, -0.28855133056640625, -0.2558746337890625, -0.22319793701171875, -0.190521240234375, -0.15784454345703125, -0.1251678466796875, -0.09249114990234375, -0.059814453125, -0.02713775634765625, 0.0055389404296875, 0.03821563720703125, 0.070892333984375, 0.10356903076171875, 0.1362457275390625, 0.16892242431640625, 0.20159912109375, 0.23427581787109375, 0.2669525146484375, 0.29962921142578125, 0.332305908203125, 0.36498260498046875, 0.3976593017578125, 0.43033599853515625, 0.4630126953125, 0.49568939208984375, 0.5283660888671875, 0.5610427856445312, 0.593719482421875, 0.6263961791992188, 0.6590728759765625, 0.6917495727539062, 0.72442626953125, 0.7571029663085938, 0.7897796630859375, 0.8224563598632812, 0.855133056640625, 0.8878097534179688, 0.9204864501953125, 0.9531631469726562, 0.98583984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 3.0, 7.0, 11.0, 11.0, 25.0, 41.0, 55.0, 81.0, 129.0, 158.0, 140.0, 98.0, 71.0, 57.0, 31.0, 20.0, 14.0, 13.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029015541076660156, -0.0002822764217853546, -0.00027439743280410767, -0.0002665184438228607, -0.00025863945484161377, -0.0002507604658603668, -0.00024288147687911987, -0.00023500248789787292, -0.00022712349891662598, -0.00021924450993537903, -0.00021136552095413208, -0.00020348653197288513, -0.00019560754299163818, -0.00018772855401039124, -0.0001798495650291443, -0.00017197057604789734, -0.0001640915870666504, -0.00015621259808540344, -0.0001483336091041565, -0.00014045462012290955, -0.0001325756311416626, -0.00012469664216041565, -0.0001168176531791687, -0.00010893866419792175, -0.0001010596752166748, -9.318068623542786e-05, -8.530169725418091e-05, -7.742270827293396e-05, -6.954371929168701e-05, -6.166473031044006e-05, -5.3785741329193115e-05, -4.590675234794617e-05, -3.802776336669922e-05, -3.014877438545227e-05, -2.2269785404205322e-05, -1.4390796422958374e-05, -6.511807441711426e-06, 1.3671815395355225e-06, 9.24617052078247e-06, 1.712515950202942e-05, 2.5004148483276367e-05, 3.2883137464523315e-05, 4.0762126445770264e-05, 4.864111542701721e-05, 5.652010440826416e-05, 6.439909338951111e-05, 7.227808237075806e-05, 8.0157071352005e-05, 8.803606033325195e-05, 9.59150493144989e-05, 0.00010379403829574585, 0.0001116730272769928, 0.00011955201625823975, 0.0001274310052394867, 0.00013530999422073364, 0.0001431889832019806, 0.00015106797218322754, 0.0001589469611644745, 0.00016682595014572144, 0.00017470493912696838, 0.00018258392810821533, 0.00019046291708946228, 0.00019834190607070923, 0.00020622089505195618, 0.00021409988403320312]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 10.0, 14.0, 20.0, 45.0, 46.0, 98.0, 129.0, 190.0, 354.0, 518.0, 845.0, 1379.0, 2347.0, 4068.0, 7952.0, 16053.0, 33382.0, 71175.0, 140073.0, 220540.0, 230999.0, 156861.0, 83012.0, 39404.0, 18652.0, 9136.0, 4634.0, 2607.0, 1521.0, 875.0, 559.0, 383.0, 247.0, 146.0, 112.0, 66.0, 41.0, 19.0, 15.0, 16.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7622756958007812, -0.7369537353515625, -0.7116317749023438, -0.686309814453125, -0.6609878540039062, -0.6356658935546875, -0.6103439331054688, -0.58502197265625, -0.5597000122070312, -0.5343780517578125, -0.5090560913085938, -0.483734130859375, -0.45841217041015625, -0.4330902099609375, -0.40776824951171875, -0.3824462890625, -0.35712432861328125, -0.3318023681640625, -0.30648040771484375, -0.281158447265625, -0.25583648681640625, -0.2305145263671875, -0.20519256591796875, -0.17987060546875, -0.15454864501953125, -0.1292266845703125, -0.10390472412109375, -0.078582763671875, -0.05326080322265625, -0.0279388427734375, -0.00261688232421875, 0.022705078125, 0.04802703857421875, 0.0733489990234375, 0.09867095947265625, 0.123992919921875, 0.14931488037109375, 0.1746368408203125, 0.19995880126953125, 0.22528076171875, 0.25060272216796875, 0.2759246826171875, 0.30124664306640625, 0.326568603515625, 0.35189056396484375, 0.3772125244140625, 0.40253448486328125, 0.4278564453125, 0.45317840576171875, 0.4785003662109375, 0.5038223266601562, 0.529144287109375, 0.5544662475585938, 0.5797882080078125, 0.6051101684570312, 0.63043212890625, 0.6557540893554688, 0.6810760498046875, 0.7063980102539062, 0.731719970703125, 0.7570419311523438, 0.7823638916015625, 0.8076858520507812, 0.8330078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 2.0, 9.0, 12.0, 7.0, 8.0, 15.0, 31.0, 41.0, 60.0, 49.0, 71.0, 64.0, 70.0, 72.0, 79.0, 87.0, 72.0, 50.0, 50.0, 33.0, 31.0, 22.0, 15.0, 8.0, 12.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.293212890625, -0.28441619873046875, -0.2756195068359375, -0.26682281494140625, -0.258026123046875, -0.24922943115234375, -0.2404327392578125, -0.23163604736328125, -0.22283935546875, -0.21404266357421875, -0.2052459716796875, -0.19644927978515625, -0.187652587890625, -0.17885589599609375, -0.1700592041015625, -0.16126251220703125, -0.1524658203125, -0.14366912841796875, -0.1348724365234375, -0.12607574462890625, -0.117279052734375, -0.10848236083984375, -0.0996856689453125, -0.09088897705078125, -0.08209228515625, -0.07329559326171875, -0.0644989013671875, -0.05570220947265625, -0.046905517578125, -0.03810882568359375, -0.0293121337890625, -0.02051544189453125, -0.01171875, -0.00292205810546875, 0.0058746337890625, 0.01467132568359375, 0.023468017578125, 0.03226470947265625, 0.0410614013671875, 0.04985809326171875, 0.05865478515625, 0.06745147705078125, 0.0762481689453125, 0.08504486083984375, 0.093841552734375, 0.10263824462890625, 0.1114349365234375, 0.12023162841796875, 0.1290283203125, 0.13782501220703125, 0.1466217041015625, 0.15541839599609375, 0.164215087890625, 0.17301177978515625, 0.1818084716796875, 0.19060516357421875, 0.19940185546875, 0.20819854736328125, 0.2169952392578125, 0.22579193115234375, 0.234588623046875, 0.24338531494140625, 0.2521820068359375, 0.26097869873046875, 0.269775390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 13.0, 15.0, 20.0, 20.0, 35.0, 28.0, 44.0, 45.0, 50.0, 47.0, 42.0, 54.0, 60.0, 37.0, 55.0, 51.0, 44.0, 41.0, 32.0, 38.0, 35.0, 30.0, 26.0, 24.0, 13.0, 20.0, 11.0, 6.0, 7.0, 6.0, 11.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.46593189239502, -11.16418743133545, -10.862442016601562, -10.560697555541992, -10.258952140808105, -9.957207679748535, -9.655462265014648, -9.353717803955078, -9.051973342895508, -8.750228881835938, -8.44848346710205, -8.14673900604248, -7.844994068145752, -7.543249130249023, -7.241504192352295, -6.939759254455566, -6.638014316558838, -6.336269378662109, -6.034524440765381, -5.732779502868652, -5.431035041809082, -5.1292901039123535, -4.827545166015625, -4.525800704956055, -4.224055290222168, -3.9223103523254395, -3.62056565284729, -3.3188207149505615, -3.017076015472412, -2.7153310775756836, -2.413586139678955, -2.1118414402008057, -1.810096263885498, -1.508351445198059, -1.2066066265106201, -0.9048616886138916, -0.6031168699264526, -0.30137205123901367, 0.00037288665771484375, 0.30211758613586426, 0.6038625240325928, 0.9056073427200317, 1.2073521614074707, 1.5090970993041992, 1.8108419179916382, 2.112586736679077, 2.4143316745758057, 2.716076374053955, 3.0178213119506836, 3.319566249847412, 3.6213109493255615, 3.92305588722229, 4.2248005867004395, 4.526545524597168, 4.8282904624938965, 5.130035400390625, 5.431779861450195, 5.733524799346924, 6.035269737243652, 6.337014198303223, 6.638759136199951, 6.94050407409668, 7.242249011993408, 7.543993949890137, 7.845738887786865]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 10.0, 15.0, 12.0, 10.0, 8.0, 24.0, 15.0, 16.0, 26.0, 32.0, 32.0, 29.0, 36.0, 40.0, 32.0, 39.0, 42.0, 48.0, 40.0, 39.0, 42.0, 38.0, 39.0, 41.0, 31.0, 30.0, 30.0, 27.0, 24.0, 25.0, 19.0, 16.0, 15.0, 6.0, 11.0, 13.0, 9.0, 4.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.40929889678955, -8.14473819732666, -7.8801774978637695, -7.615616798400879, -7.351056098937988, -7.086495399475098, -6.821934223175049, -6.557373523712158, -6.292812824249268, -6.028252124786377, -5.763691425323486, -5.499130725860596, -5.234569549560547, -4.970008850097656, -4.705448150634766, -4.440887451171875, -4.176326751708984, -3.9117660522460938, -3.647205352783203, -3.3826444149017334, -3.1180837154388428, -2.853523015975952, -2.5889620780944824, -2.324401378631592, -2.059840679168701, -1.7952799797058105, -1.5307191610336304, -1.2661583423614502, -1.0015976428985596, -0.737036943435669, -0.47247612476348877, -0.2079153060913086, 0.05664539337158203, 0.32120615243911743, 0.5857669115066528, 0.8503276705741882, 1.1148884296417236, 1.3794491291046143, 1.6440099477767944, 1.9085707664489746, 2.1731314659118652, 2.437692165374756, 2.7022528648376465, 2.966813802719116, 3.231374502182007, 3.4959352016448975, 3.760496139526367, 4.025056838989258, 4.289617538452148, 4.554178237915039, 4.81873893737793, 5.08329963684082, 5.347860336303711, 5.612421035766602, 5.87698221206665, 6.141542911529541, 6.406103610992432, 6.670664310455322, 6.935225009918213, 7.1997857093811035, 7.464346885681152, 7.728907585144043, 7.993468284606934, 8.258028984069824, 8.522589683532715]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 28.0, 40.0, 69.0, 101.0, 145.0, 231.0, 377.0, 603.0, 843.0, 1414.0, 2308.0, 3413.0, 5341.0, 8445.0, 12309.0, 18563.0, 26764.0, 37280.0, 50458.0, 65258.0, 79462.0, 92290.0, 100010.0, 101206.0, 96084.0, 84781.0, 70590.0, 55465.0, 41480.0, 30210.0, 21134.0, 14572.0, 9747.0, 6271.0, 4090.0, 2662.0, 1691.0, 973.0, 659.0, 409.0, 270.0, 180.0, 124.0, 80.0, 49.0, 19.0, 16.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.62890625, -4.47552490234375, -4.3221435546875, -4.16876220703125, -4.015380859375, -3.86199951171875, -3.7086181640625, -3.55523681640625, -3.40185546875, -3.24847412109375, -3.0950927734375, -2.94171142578125, -2.788330078125, -2.63494873046875, -2.4815673828125, -2.32818603515625, -2.1748046875, -2.02142333984375, -1.8680419921875, -1.71466064453125, -1.561279296875, -1.40789794921875, -1.2545166015625, -1.10113525390625, -0.94775390625, -0.79437255859375, -0.6409912109375, -0.48760986328125, -0.334228515625, -0.18084716796875, -0.0274658203125, 0.12591552734375, 0.279296875, 0.43267822265625, 0.5860595703125, 0.73944091796875, 0.892822265625, 1.04620361328125, 1.1995849609375, 1.35296630859375, 1.50634765625, 1.65972900390625, 1.8131103515625, 1.96649169921875, 2.119873046875, 2.27325439453125, 2.4266357421875, 2.58001708984375, 2.7333984375, 2.88677978515625, 3.0401611328125, 3.19354248046875, 3.346923828125, 3.50030517578125, 3.6536865234375, 3.80706787109375, 3.96044921875, 4.11383056640625, 4.2672119140625, 4.42059326171875, 4.573974609375, 4.72735595703125, 4.8807373046875, 5.03411865234375, 5.1875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 9.0, 12.0, 11.0, 16.0, 16.0, 16.0, 20.0, 22.0, 27.0, 31.0, 37.0, 44.0, 41.0, 40.0, 45.0, 55.0, 41.0, 42.0, 40.0, 40.0, 43.0, 44.0, 33.0, 24.0, 37.0, 34.0, 22.0, 18.0, 16.0, 16.0, 19.0, 18.0, 11.0, 10.0, 13.0, 2.0, 10.0, 1.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.8046875, -8.52392578125, -8.2431640625, -7.96240234375, -7.681640625, -7.40087890625, -7.1201171875, -6.83935546875, -6.55859375, -6.27783203125, -5.9970703125, -5.71630859375, -5.435546875, -5.15478515625, -4.8740234375, -4.59326171875, -4.3125, -4.03173828125, -3.7509765625, -3.47021484375, -3.189453125, -2.90869140625, -2.6279296875, -2.34716796875, -2.06640625, -1.78564453125, -1.5048828125, -1.22412109375, -0.943359375, -0.66259765625, -0.3818359375, -0.10107421875, 0.1796875, 0.46044921875, 0.7412109375, 1.02197265625, 1.302734375, 1.58349609375, 1.8642578125, 2.14501953125, 2.42578125, 2.70654296875, 2.9873046875, 3.26806640625, 3.548828125, 3.82958984375, 4.1103515625, 4.39111328125, 4.671875, 4.95263671875, 5.2333984375, 5.51416015625, 5.794921875, 6.07568359375, 6.3564453125, 6.63720703125, 6.91796875, 7.19873046875, 7.4794921875, 7.76025390625, 8.041015625, 8.32177734375, 8.6025390625, 8.88330078125, 9.1640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 14.0, 22.0, 37.0, 62.0, 93.0, 152.0, 241.0, 332.0, 602.0, 986.0, 1497.0, 2487.0, 4049.0, 6441.0, 10207.0, 16022.0, 24922.0, 37389.0, 53881.0, 73949.0, 95811.0, 112441.0, 120792.0, 117677.0, 102592.0, 82189.0, 61067.0, 42966.0, 28771.0, 18719.0, 11936.0, 7658.0, 4841.0, 2850.0, 1862.0, 1135.0, 690.0, 458.0, 278.0, 174.0, 88.0, 62.0, 43.0, 24.0, 9.0, 15.0, 4.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.39453125, -6.19268798828125, -5.9908447265625, -5.78900146484375, -5.587158203125, -5.38531494140625, -5.1834716796875, -4.98162841796875, -4.77978515625, -4.57794189453125, -4.3760986328125, -4.17425537109375, -3.972412109375, -3.77056884765625, -3.5687255859375, -3.36688232421875, -3.1650390625, -2.96319580078125, -2.7613525390625, -2.55950927734375, -2.357666015625, -2.15582275390625, -1.9539794921875, -1.75213623046875, -1.55029296875, -1.34844970703125, -1.1466064453125, -0.94476318359375, -0.742919921875, -0.54107666015625, -0.3392333984375, -0.13739013671875, 0.064453125, 0.26629638671875, 0.4681396484375, 0.66998291015625, 0.871826171875, 1.07366943359375, 1.2755126953125, 1.47735595703125, 1.67919921875, 1.88104248046875, 2.0828857421875, 2.28472900390625, 2.486572265625, 2.68841552734375, 2.8902587890625, 3.09210205078125, 3.2939453125, 3.49578857421875, 3.6976318359375, 3.89947509765625, 4.101318359375, 4.30316162109375, 4.5050048828125, 4.70684814453125, 4.90869140625, 5.11053466796875, 5.3123779296875, 5.51422119140625, 5.716064453125, 5.91790771484375, 6.1197509765625, 6.32159423828125, 6.5234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 6.0, 6.0, 7.0, 15.0, 18.0, 18.0, 19.0, 31.0, 23.0, 37.0, 36.0, 39.0, 34.0, 32.0, 45.0, 48.0, 46.0, 42.0, 47.0, 45.0, 36.0, 37.0, 50.0, 30.0, 39.0, 28.0, 29.0, 27.0, 15.0, 16.0, 15.0, 11.0, 11.0, 14.0, 17.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.2421875, -6.0635986328125, -5.885009765625, -5.7064208984375, -5.52783203125, -5.3492431640625, -5.170654296875, -4.9920654296875, -4.8134765625, -4.6348876953125, -4.456298828125, -4.2777099609375, -4.09912109375, -3.9205322265625, -3.741943359375, -3.5633544921875, -3.384765625, -3.2061767578125, -3.027587890625, -2.8489990234375, -2.67041015625, -2.4918212890625, -2.313232421875, -2.1346435546875, -1.9560546875, -1.7774658203125, -1.598876953125, -1.4202880859375, -1.24169921875, -1.0631103515625, -0.884521484375, -0.7059326171875, -0.52734375, -0.3487548828125, -0.170166015625, 0.0084228515625, 0.18701171875, 0.3656005859375, 0.544189453125, 0.7227783203125, 0.9013671875, 1.0799560546875, 1.258544921875, 1.4371337890625, 1.61572265625, 1.7943115234375, 1.972900390625, 2.1514892578125, 2.330078125, 2.5086669921875, 2.687255859375, 2.8658447265625, 3.04443359375, 3.2230224609375, 3.401611328125, 3.5802001953125, 3.7587890625, 3.9373779296875, 4.115966796875, 4.2945556640625, 4.47314453125, 4.6517333984375, 4.830322265625, 5.0089111328125, 5.1875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 8.0, 6.0, 9.0, 8.0, 14.0, 29.0, 17.0, 49.0, 59.0, 104.0, 116.0, 248.0, 384.0, 658.0, 1142.0, 2139.0, 4181.0, 8500.0, 17115.0, 35773.0, 74480.0, 137945.0, 206657.0, 219908.0, 160614.0, 90448.0, 44977.0, 21368.0, 10443.0, 5128.0, 2611.0, 1405.0, 779.0, 428.0, 316.0, 159.0, 96.0, 74.0, 63.0, 26.0, 18.0, 16.0, 15.0, 6.0, 7.0, 5.0, 3.0, 0.0, 3.0, 3.0, 2.0], "bins": [-6.27734375, -6.10369873046875, -5.9300537109375, -5.75640869140625, -5.582763671875, -5.40911865234375, -5.2354736328125, -5.06182861328125, -4.88818359375, -4.71453857421875, -4.5408935546875, -4.36724853515625, -4.193603515625, -4.01995849609375, -3.8463134765625, -3.67266845703125, -3.4990234375, -3.32537841796875, -3.1517333984375, -2.97808837890625, -2.804443359375, -2.63079833984375, -2.4571533203125, -2.28350830078125, -2.10986328125, -1.93621826171875, -1.7625732421875, -1.58892822265625, -1.415283203125, -1.24163818359375, -1.0679931640625, -0.89434814453125, -0.720703125, -0.54705810546875, -0.3734130859375, -0.19976806640625, -0.026123046875, 0.14752197265625, 0.3211669921875, 0.49481201171875, 0.66845703125, 0.84210205078125, 1.0157470703125, 1.18939208984375, 1.363037109375, 1.53668212890625, 1.7103271484375, 1.88397216796875, 2.0576171875, 2.23126220703125, 2.4049072265625, 2.57855224609375, 2.752197265625, 2.92584228515625, 3.0994873046875, 3.27313232421875, 3.44677734375, 3.62042236328125, 3.7940673828125, 3.96771240234375, 4.141357421875, 4.31500244140625, 4.4886474609375, 4.66229248046875, 4.8359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 8.0, 7.0, 5.0, 13.0, 17.0, 13.0, 18.0, 28.0, 37.0, 36.0, 53.0, 46.0, 53.0, 75.0, 84.0, 77.0, 68.0, 74.0, 51.0, 52.0, 50.0, 40.0, 30.0, 20.0, 9.0, 12.0, 6.0, 5.0, 10.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007238388061523438, -0.0007066130638122559, -0.000689387321472168, -0.0006721615791320801, -0.0006549358367919922, -0.0006377100944519043, -0.0006204843521118164, -0.0006032586097717285, -0.0005860328674316406, -0.0005688071250915527, -0.0005515813827514648, -0.000534355640411377, -0.0005171298980712891, -0.0004999041557312012, -0.0004826784133911133, -0.0004654526710510254, -0.0004482269287109375, -0.0004310011863708496, -0.0004137754440307617, -0.00039654970169067383, -0.00037932395935058594, -0.00036209821701049805, -0.00034487247467041016, -0.00032764673233032227, -0.0003104209899902344, -0.0002931952476501465, -0.0002759695053100586, -0.0002587437629699707, -0.0002415180206298828, -0.00022429227828979492, -0.00020706653594970703, -0.00018984079360961914, -0.00017261505126953125, -0.00015538930892944336, -0.00013816356658935547, -0.00012093782424926758, -0.00010371208190917969, -8.64863395690918e-05, -6.92605972290039e-05, -5.2034854888916016e-05, -3.4809112548828125e-05, -1.7583370208740234e-05, -3.5762786865234375e-07, 1.6868114471435547e-05, 3.409385681152344e-05, 5.131959915161133e-05, 6.854534149169922e-05, 8.577108383178711e-05, 0.000102996826171875, 0.00012022256851196289, 0.00013744831085205078, 0.00015467405319213867, 0.00017189979553222656, 0.00018912553787231445, 0.00020635128021240234, 0.00022357702255249023, 0.00024080276489257812, 0.000258028507232666, 0.0002752542495727539, 0.0002924799919128418, 0.0003097057342529297, 0.0003269314765930176, 0.00034415721893310547, 0.00036138296127319336, 0.00037860870361328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 5.0, 9.0, 7.0, 14.0, 16.0, 24.0, 38.0, 61.0, 76.0, 118.0, 151.0, 217.0, 311.0, 514.0, 720.0, 1090.0, 1583.0, 2502.0, 3984.0, 6062.0, 9422.0, 14558.0, 22306.0, 32995.0, 47651.0, 66762.0, 87748.0, 108196.0, 119970.0, 118941.0, 107290.0, 87329.0, 65638.0, 47531.0, 32381.0, 21645.0, 14086.0, 9263.0, 5948.0, 3973.0, 2477.0, 1641.0, 1154.0, 700.0, 439.0, 336.0, 210.0, 148.0, 104.0, 69.0, 54.0, 34.0, 22.0, 19.0, 12.0, 3.0, 6.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.85699462890625, -2.7647705078125, -2.67254638671875, -2.580322265625, -2.48809814453125, -2.3958740234375, -2.30364990234375, -2.21142578125, -2.11920166015625, -2.0269775390625, -1.93475341796875, -1.842529296875, -1.75030517578125, -1.6580810546875, -1.56585693359375, -1.4736328125, -1.38140869140625, -1.2891845703125, -1.19696044921875, -1.104736328125, -1.01251220703125, -0.9202880859375, -0.82806396484375, -0.73583984375, -0.64361572265625, -0.5513916015625, -0.45916748046875, -0.366943359375, -0.27471923828125, -0.1824951171875, -0.09027099609375, 0.001953125, 0.09417724609375, 0.1864013671875, 0.27862548828125, 0.370849609375, 0.46307373046875, 0.5552978515625, 0.64752197265625, 0.73974609375, 0.83197021484375, 0.9241943359375, 1.01641845703125, 1.108642578125, 1.20086669921875, 1.2930908203125, 1.38531494140625, 1.4775390625, 1.56976318359375, 1.6619873046875, 1.75421142578125, 1.846435546875, 1.93865966796875, 2.0308837890625, 2.12310791015625, 2.21533203125, 2.30755615234375, 2.3997802734375, 2.49200439453125, 2.584228515625, 2.67645263671875, 2.7686767578125, 2.86090087890625, 2.953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 8.0, 10.0, 14.0, 11.0, 12.0, 20.0, 15.0, 23.0, 10.0, 33.0, 41.0, 29.0, 30.0, 36.0, 37.0, 46.0, 53.0, 37.0, 48.0, 53.0, 52.0, 32.0, 33.0, 48.0, 37.0, 22.0, 30.0, 33.0, 24.0, 16.0, 18.0, 12.0, 9.0, 7.0, 12.0, 9.0, 9.0, 5.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2499542236328125, -1.211822509765625, -1.1736907958984375, -1.13555908203125, -1.0974273681640625, -1.059295654296875, -1.0211639404296875, -0.9830322265625, -0.9449005126953125, -0.906768798828125, -0.8686370849609375, -0.83050537109375, -0.7923736572265625, -0.754241943359375, -0.7161102294921875, -0.677978515625, -0.6398468017578125, -0.601715087890625, -0.5635833740234375, -0.52545166015625, -0.4873199462890625, -0.449188232421875, -0.4110565185546875, -0.3729248046875, -0.3347930908203125, -0.296661376953125, -0.2585296630859375, -0.22039794921875, -0.1822662353515625, -0.144134521484375, -0.1060028076171875, -0.06787109375, -0.0297393798828125, 0.008392333984375, 0.0465240478515625, 0.08465576171875, 0.1227874755859375, 0.160919189453125, 0.1990509033203125, 0.2371826171875, 0.2753143310546875, 0.313446044921875, 0.3515777587890625, 0.38970947265625, 0.4278411865234375, 0.465972900390625, 0.5041046142578125, 0.542236328125, 0.5803680419921875, 0.618499755859375, 0.6566314697265625, 0.69476318359375, 0.7328948974609375, 0.771026611328125, 0.8091583251953125, 0.8472900390625, 0.8854217529296875, 0.923553466796875, 0.9616851806640625, 0.99981689453125, 1.0379486083984375, 1.076080322265625, 1.1142120361328125, 1.15234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 7.0, 8.0, 17.0, 7.0, 18.0, 15.0, 21.0, 25.0, 36.0, 33.0, 31.0, 35.0, 40.0, 57.0, 56.0, 48.0, 43.0, 59.0, 47.0, 47.0, 29.0, 38.0, 49.0, 30.0, 37.0, 22.0, 25.0, 18.0, 23.0, 13.0, 8.0, 16.0, 10.0, 6.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-10.756875991821289, -10.48032283782959, -10.20376968383789, -9.927217483520508, -9.650664329528809, -9.37411117553711, -9.09755802154541, -8.821004867553711, -8.544452667236328, -8.267899513244629, -7.991346836090088, -7.714793682098389, -7.438241004943848, -7.161687850952148, -6.885134696960449, -6.60858154296875, -6.332028388977051, -6.055475234985352, -5.7789225578308105, -5.502369403839111, -5.22581672668457, -4.949263572692871, -4.672710418701172, -4.396157264709473, -4.119604587554932, -3.8430516719818115, -3.5664987564086914, -3.289945602416992, -3.013392686843872, -2.736839771270752, -2.4602866172790527, -2.1837337017059326, -1.907179832458496, -1.630626916885376, -1.3540738821029663, -1.0775208473205566, -0.8009679317474365, -0.5244150161743164, -0.24786198139190674, 0.02869105339050293, 0.30524396896362305, 0.5817969441413879, 0.8583499193191528, 1.1349029541015625, 1.4114558696746826, 1.6880087852478027, 1.9645618200302124, 2.241114854812622, 2.517667770385742, 2.7942206859588623, 3.0707736015319824, 3.3473267555236816, 3.6238796710968018, 3.900432586669922, 4.176985740661621, 4.45353889465332, 4.730091571807861, 5.0066447257995605, 5.283197402954102, 5.559750556945801, 5.8363037109375, 6.112856388092041, 6.38940954208374, 6.665962219238281, 6.9425153732299805]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 8.0, 5.0, 5.0, 8.0, 10.0, 8.0, 18.0, 12.0, 22.0, 19.0, 23.0, 20.0, 33.0, 31.0, 27.0, 42.0, 31.0, 44.0, 42.0, 40.0, 37.0, 39.0, 38.0, 33.0, 43.0, 36.0, 31.0, 42.0, 36.0, 31.0, 20.0, 28.0, 23.0, 19.0, 13.0, 14.0, 10.0, 10.0, 9.0, 7.0, 6.0, 12.0, 4.0, 9.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.217131614685059, -7.957611560821533, -7.69809103012085, -7.438570976257324, -7.179050445556641, -6.919530391693115, -6.66001033782959, -6.400489807128906, -6.140969276428223, -5.881449222564697, -5.621928691864014, -5.362408638000488, -5.102888107299805, -4.843368053436279, -4.583847999572754, -4.32432746887207, -4.064807415008545, -3.8052871227264404, -3.545766830444336, -3.2862467765808105, -3.026726245880127, -2.7672061920166016, -2.507685899734497, -2.2481656074523926, -1.988645315170288, -1.7291250228881836, -1.469604730606079, -1.2100845575332642, -0.9505642652511597, -0.6910439729690552, -0.43152379989624023, -0.17200350761413574, 0.08751678466796875, 0.34703704714775085, 0.606557309627533, 0.8660775423049927, 1.1255978345870972, 1.3851181268692017, 1.6446382999420166, 1.904158592224121, 2.1636788845062256, 2.42319917678833, 2.6827194690704346, 2.942239761352539, 3.2017598152160645, 3.461280345916748, 3.7208003997802734, 3.980320692062378, 4.239840984344482, 4.499361038208008, 4.758881568908691, 5.018401622772217, 5.2779221534729, 5.537442207336426, 5.796962738037109, 6.056482791900635, 6.31600284576416, 6.5755228996276855, 6.835043430328369, 7.0945634841918945, 7.354084014892578, 7.6136040687561035, 7.873124122619629, 8.132644653320312, 8.392165184020996]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 7.0, 11.0, 17.0, 26.0, 44.0, 49.0, 90.0, 126.0, 234.0, 374.0, 620.0, 1054.0, 1798.0, 3172.0, 5567.0, 10353.0, 19875.0, 39080.0, 80195.0, 167215.0, 330723.0, 573629.0, 796777.0, 817123.0, 614709.0, 362496.0, 185838.0, 89946.0, 43757.0, 22056.0, 11736.0, 6439.0, 3646.0, 2109.0, 1316.0, 798.0, 439.0, 277.0, 212.0, 117.0, 89.0, 47.0, 40.0, 22.0, 9.0, 9.0, 11.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37109375, -7.12603759765625, -6.8809814453125, -6.63592529296875, -6.390869140625, -6.14581298828125, -5.9007568359375, -5.65570068359375, -5.41064453125, -5.16558837890625, -4.9205322265625, -4.67547607421875, -4.430419921875, -4.18536376953125, -3.9403076171875, -3.69525146484375, -3.4501953125, -3.20513916015625, -2.9600830078125, -2.71502685546875, -2.469970703125, -2.22491455078125, -1.9798583984375, -1.73480224609375, -1.48974609375, -1.24468994140625, -0.9996337890625, -0.75457763671875, -0.509521484375, -0.26446533203125, -0.0194091796875, 0.22564697265625, 0.470703125, 0.71575927734375, 0.9608154296875, 1.20587158203125, 1.450927734375, 1.69598388671875, 1.9410400390625, 2.18609619140625, 2.43115234375, 2.67620849609375, 2.9212646484375, 3.16632080078125, 3.411376953125, 3.65643310546875, 3.9014892578125, 4.14654541015625, 4.3916015625, 4.63665771484375, 4.8817138671875, 5.12677001953125, 5.371826171875, 5.61688232421875, 5.8619384765625, 6.10699462890625, 6.35205078125, 6.59710693359375, 6.8421630859375, 7.08721923828125, 7.332275390625, 7.57733154296875, 7.8223876953125, 8.06744384765625, 8.3125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 11.0, 8.0, 8.0, 16.0, 17.0, 14.0, 8.0, 20.0, 24.0, 26.0, 34.0, 19.0, 42.0, 36.0, 30.0, 47.0, 47.0, 41.0, 46.0, 38.0, 39.0, 38.0, 33.0, 40.0, 29.0, 37.0, 31.0, 29.0, 26.0, 21.0, 20.0, 22.0, 15.0, 12.0, 9.0, 11.0, 8.0, 10.0, 13.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.77734375, -6.55377197265625, -6.3302001953125, -6.10662841796875, -5.883056640625, -5.65948486328125, -5.4359130859375, -5.21234130859375, -4.98876953125, -4.76519775390625, -4.5416259765625, -4.31805419921875, -4.094482421875, -3.87091064453125, -3.6473388671875, -3.42376708984375, -3.2001953125, -2.97662353515625, -2.7530517578125, -2.52947998046875, -2.305908203125, -2.08233642578125, -1.8587646484375, -1.63519287109375, -1.41162109375, -1.18804931640625, -0.9644775390625, -0.74090576171875, -0.517333984375, -0.29376220703125, -0.0701904296875, 0.15338134765625, 0.376953125, 0.60052490234375, 0.8240966796875, 1.04766845703125, 1.271240234375, 1.49481201171875, 1.7183837890625, 1.94195556640625, 2.16552734375, 2.38909912109375, 2.6126708984375, 2.83624267578125, 3.059814453125, 3.28338623046875, 3.5069580078125, 3.73052978515625, 3.9541015625, 4.17767333984375, 4.4012451171875, 4.62481689453125, 4.848388671875, 5.07196044921875, 5.2955322265625, 5.51910400390625, 5.74267578125, 5.96624755859375, 6.1898193359375, 6.41339111328125, 6.636962890625, 6.86053466796875, 7.0841064453125, 7.30767822265625, 7.53125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 4.0, 21.0, 15.0, 14.0, 32.0, 34.0, 65.0, 87.0, 120.0, 182.0, 279.0, 393.0, 601.0, 859.0, 1357.0, 2041.0, 3122.0, 4978.0, 8133.0, 13314.0, 22692.0, 38268.0, 64385.0, 110050.0, 183790.0, 297986.0, 445533.0, 590960.0, 649056.0, 583435.0, 437807.0, 290696.0, 179821.0, 107192.0, 63234.0, 37043.0, 21936.0, 13105.0, 7969.0, 4854.0, 3030.0, 1938.0, 1255.0, 842.0, 542.0, 397.0, 269.0, 149.0, 127.0, 82.0, 61.0, 50.0, 33.0, 26.0, 12.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.1328125, -6.90618896484375, -6.6795654296875, -6.45294189453125, -6.226318359375, -5.99969482421875, -5.7730712890625, -5.54644775390625, -5.31982421875, -5.09320068359375, -4.8665771484375, -4.63995361328125, -4.413330078125, -4.18670654296875, -3.9600830078125, -3.73345947265625, -3.5068359375, -3.28021240234375, -3.0535888671875, -2.82696533203125, -2.600341796875, -2.37371826171875, -2.1470947265625, -1.92047119140625, -1.69384765625, -1.46722412109375, -1.2406005859375, -1.01397705078125, -0.787353515625, -0.56072998046875, -0.3341064453125, -0.10748291015625, 0.119140625, 0.34576416015625, 0.5723876953125, 0.79901123046875, 1.025634765625, 1.25225830078125, 1.4788818359375, 1.70550537109375, 1.93212890625, 2.15875244140625, 2.3853759765625, 2.61199951171875, 2.838623046875, 3.06524658203125, 3.2918701171875, 3.51849365234375, 3.7451171875, 3.97174072265625, 4.1983642578125, 4.42498779296875, 4.651611328125, 4.87823486328125, 5.1048583984375, 5.33148193359375, 5.55810546875, 5.78472900390625, 6.0113525390625, 6.23797607421875, 6.464599609375, 6.69122314453125, 6.9178466796875, 7.14447021484375, 7.37109375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 5.0, 8.0, 13.0, 9.0, 14.0, 22.0, 24.0, 34.0, 51.0, 52.0, 67.0, 88.0, 105.0, 111.0, 149.0, 147.0, 217.0, 219.0, 214.0, 233.0, 247.0, 240.0, 211.0, 243.0, 212.0, 195.0, 149.0, 130.0, 136.0, 109.0, 101.0, 65.0, 49.0, 54.0, 37.0, 28.0, 19.0, 16.0, 15.0, 5.0, 9.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-3.4765625, -3.377685546875, -3.27880859375, -3.179931640625, -3.0810546875, -2.982177734375, -2.88330078125, -2.784423828125, -2.685546875, -2.586669921875, -2.48779296875, -2.388916015625, -2.2900390625, -2.191162109375, -2.09228515625, -1.993408203125, -1.89453125, -1.795654296875, -1.69677734375, -1.597900390625, -1.4990234375, -1.400146484375, -1.30126953125, -1.202392578125, -1.103515625, -1.004638671875, -0.90576171875, -0.806884765625, -0.7080078125, -0.609130859375, -0.51025390625, -0.411376953125, -0.3125, -0.213623046875, -0.11474609375, -0.015869140625, 0.0830078125, 0.181884765625, 0.28076171875, 0.379638671875, 0.478515625, 0.577392578125, 0.67626953125, 0.775146484375, 0.8740234375, 0.972900390625, 1.07177734375, 1.170654296875, 1.26953125, 1.368408203125, 1.46728515625, 1.566162109375, 1.6650390625, 1.763916015625, 1.86279296875, 1.961669921875, 2.060546875, 2.159423828125, 2.25830078125, 2.357177734375, 2.4560546875, 2.554931640625, 2.65380859375, 2.752685546875, 2.8515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 16.0, 14.0, 11.0, 19.0, 22.0, 13.0, 21.0, 26.0, 28.0, 31.0, 48.0, 40.0, 49.0, 43.0, 42.0, 42.0, 45.0, 38.0, 41.0, 35.0, 39.0, 36.0, 41.0, 31.0, 19.0, 35.0, 28.0, 22.0, 20.0, 16.0, 7.0, 9.0, 6.0, 10.0, 4.0, 6.0, 9.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.978044033050537, -7.740965843200684, -7.503887176513672, -7.266808986663818, -7.029730796813965, -6.792652606964111, -6.555574417114258, -6.318495750427246, -6.081417560577393, -5.844339370727539, -5.607260704040527, -5.370182514190674, -5.13310432434082, -4.896026134490967, -4.658947944641113, -4.421869277954102, -4.184791088104248, -3.9477128982543945, -3.710634469985962, -3.4735560417175293, -3.236477851867676, -2.9993996620178223, -2.7623212337493896, -2.525242805480957, -2.2881646156311035, -2.05108642578125, -1.8140079975128174, -1.5769296884536743, -1.3398513793945312, -1.1027730703353882, -0.8656947612762451, -0.628616452217102, -0.391538143157959, -0.15445983409881592, 0.08261847496032715, 0.3196967840194702, 0.5567750930786133, 0.7938534021377563, 1.0309317111968994, 1.2680100202560425, 1.5050883293151855, 1.7421666383743286, 1.9792449474334717, 2.2163233757019043, 2.453401565551758, 2.6904797554016113, 2.927558183670044, 3.1646366119384766, 3.40171480178833, 3.6387929916381836, 3.875871419906616, 4.112949848175049, 4.350028038024902, 4.587106227874756, 4.824184417724609, 5.061263084411621, 5.298341274261475, 5.535419464111328, 5.77249813079834, 6.009576320648193, 6.246654510498047, 6.4837327003479, 6.720810890197754, 6.957889556884766, 7.194967746734619]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 10.0, 10.0, 10.0, 10.0, 9.0, 19.0, 19.0, 18.0, 22.0, 22.0, 17.0, 27.0, 27.0, 28.0, 31.0, 36.0, 42.0, 31.0, 32.0, 30.0, 28.0, 36.0, 52.0, 37.0, 41.0, 28.0, 31.0, 28.0, 31.0, 30.0, 26.0, 21.0, 20.0, 19.0, 15.0, 16.0, 20.0, 12.0, 11.0, 4.0, 4.0, 5.0, 6.0, 8.0, 1.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.260483264923096, -7.033613681793213, -6.80674409866333, -6.579874515533447, -6.3530049324035645, -6.126135349273682, -5.899266242980957, -5.672396659851074, -5.445527076721191, -5.218657493591309, -4.991787910461426, -4.764918327331543, -4.53804874420166, -4.311179161071777, -4.0843095779418945, -3.857440233230591, -3.630570411682129, -3.403700828552246, -3.1768312454223633, -2.9499616622924805, -2.7230920791625977, -2.496222496032715, -2.269353151321411, -2.0424835681915283, -1.8156139850616455, -1.5887444019317627, -1.3618748188018799, -1.1350053548812866, -0.9081357717514038, -0.681266188621521, -0.45439672470092773, -0.22752714157104492, -0.0006575584411621094, 0.22621199488639832, 0.45308154821395874, 0.6799510717391968, 0.9068206548690796, 1.1336902379989624, 1.3605597019195557, 1.5874292850494385, 1.8142988681793213, 2.041168451309204, 2.268038034439087, 2.4949073791503906, 2.7217769622802734, 2.9486465454101562, 3.175516128540039, 3.402385711669922, 3.6292552947998047, 3.8561248779296875, 4.08299446105957, 4.309864044189453, 4.536733627319336, 4.763603210449219, 4.990472793579102, 5.217342376708984, 5.444211959838867, 5.67108154296875, 5.897951126098633, 6.124820709228516, 6.351690292358398, 6.578559875488281, 6.805429458618164, 7.032299041748047, 7.2591681480407715]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 10.0, 16.0, 12.0, 27.0, 40.0, 62.0, 109.0, 151.0, 262.0, 398.0, 626.0, 968.0, 1580.0, 2562.0, 4186.0, 7173.0, 12293.0, 21088.0, 35976.0, 59527.0, 92517.0, 130247.0, 158569.0, 156578.0, 128638.0, 91125.0, 57870.0, 35293.0, 20805.0, 12237.0, 6987.0, 4119.0, 2492.0, 1541.0, 925.0, 550.0, 361.0, 219.0, 135.0, 99.0, 66.0, 46.0, 25.0, 20.0, 16.0, 4.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.5220947265625, -2.440673828125, -2.3592529296875, -2.27783203125, -2.1964111328125, -2.114990234375, -2.0335693359375, -1.9521484375, -1.8707275390625, -1.789306640625, -1.7078857421875, -1.62646484375, -1.5450439453125, -1.463623046875, -1.3822021484375, -1.30078125, -1.2193603515625, -1.137939453125, -1.0565185546875, -0.97509765625, -0.8936767578125, -0.812255859375, -0.7308349609375, -0.6494140625, -0.5679931640625, -0.486572265625, -0.4051513671875, -0.32373046875, -0.2423095703125, -0.160888671875, -0.0794677734375, 0.001953125, 0.0833740234375, 0.164794921875, 0.2462158203125, 0.32763671875, 0.4090576171875, 0.490478515625, 0.5718994140625, 0.6533203125, 0.7347412109375, 0.816162109375, 0.8975830078125, 0.97900390625, 1.0604248046875, 1.141845703125, 1.2232666015625, 1.3046875, 1.3861083984375, 1.467529296875, 1.5489501953125, 1.63037109375, 1.7117919921875, 1.793212890625, 1.8746337890625, 1.9560546875, 2.0374755859375, 2.118896484375, 2.2003173828125, 2.28173828125, 2.3631591796875, 2.444580078125, 2.5260009765625, 2.607421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 8.0, 11.0, 17.0, 16.0, 17.0, 18.0, 19.0, 24.0, 21.0, 22.0, 19.0, 25.0, 23.0, 25.0, 34.0, 39.0, 31.0, 33.0, 41.0, 29.0, 33.0, 37.0, 40.0, 35.0, 31.0, 34.0, 28.0, 29.0, 28.0, 19.0, 23.0, 24.0, 14.0, 18.0, 18.0, 20.0, 17.0, 11.0, 7.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 7.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-7.00390625, -6.7799072265625, -6.555908203125, -6.3319091796875, -6.10791015625, -5.8839111328125, -5.659912109375, -5.4359130859375, -5.2119140625, -4.9879150390625, -4.763916015625, -4.5399169921875, -4.31591796875, -4.0919189453125, -3.867919921875, -3.6439208984375, -3.419921875, -3.1959228515625, -2.971923828125, -2.7479248046875, -2.52392578125, -2.2999267578125, -2.075927734375, -1.8519287109375, -1.6279296875, -1.4039306640625, -1.179931640625, -0.9559326171875, -0.73193359375, -0.5079345703125, -0.283935546875, -0.0599365234375, 0.1640625, 0.3880615234375, 0.612060546875, 0.8360595703125, 1.06005859375, 1.2840576171875, 1.508056640625, 1.7320556640625, 1.9560546875, 2.1800537109375, 2.404052734375, 2.6280517578125, 2.85205078125, 3.0760498046875, 3.300048828125, 3.5240478515625, 3.748046875, 3.9720458984375, 4.196044921875, 4.4200439453125, 4.64404296875, 4.8680419921875, 5.092041015625, 5.3160400390625, 5.5400390625, 5.7640380859375, 5.988037109375, 6.2120361328125, 6.43603515625, 6.6600341796875, 6.884033203125, 7.1080322265625, 7.33203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 11.0, 20.0, 14.0, 25.0, 19.0, 29.0, 38.0, 44.0, 62.0, 75.0, 86.0, 174.0, 218.0, 344.0, 502.0, 990.0, 1700.0, 3312.0, 6617.0, 13679.0, 29828.0, 251100.0, 668896.0, 36949.0, 16527.0, 8088.0, 4072.0, 2111.0, 1120.0, 651.0, 355.0, 253.0, 164.0, 100.0, 72.0, 58.0, 60.0, 42.0, 23.0, 33.0, 19.0, 14.0, 16.0, 8.0, 7.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.0703125, -8.7879638671875, -8.505615234375, -8.2232666015625, -7.94091796875, -7.6585693359375, -7.376220703125, -7.0938720703125, -6.8115234375, -6.5291748046875, -6.246826171875, -5.9644775390625, -5.68212890625, -5.3997802734375, -5.117431640625, -4.8350830078125, -4.552734375, -4.2703857421875, -3.988037109375, -3.7056884765625, -3.42333984375, -3.1409912109375, -2.858642578125, -2.5762939453125, -2.2939453125, -2.0115966796875, -1.729248046875, -1.4468994140625, -1.16455078125, -0.8822021484375, -0.599853515625, -0.3175048828125, -0.03515625, 0.2471923828125, 0.529541015625, 0.8118896484375, 1.09423828125, 1.3765869140625, 1.658935546875, 1.9412841796875, 2.2236328125, 2.5059814453125, 2.788330078125, 3.0706787109375, 3.35302734375, 3.6353759765625, 3.917724609375, 4.2000732421875, 4.482421875, 4.7647705078125, 5.047119140625, 5.3294677734375, 5.61181640625, 5.8941650390625, 6.176513671875, 6.4588623046875, 6.7412109375, 7.0235595703125, 7.305908203125, 7.5882568359375, 7.87060546875, 8.1529541015625, 8.435302734375, 8.7176513671875, 9.0]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 7.0, 7.0, 6.0, 8.0, 14.0, 7.0, 16.0, 28.0, 14.0, 25.0, 20.0, 25.0, 27.0, 23.0, 21.0, 36.0, 33.0, 47.0, 42.0, 47.0, 45.0, 38.0, 34.0, 35.0, 41.0, 41.0, 43.0, 27.0, 38.0, 32.0, 27.0, 25.0, 18.0, 18.0, 17.0, 17.0, 7.0, 13.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75390625, -5.5699462890625, -5.385986328125, -5.2020263671875, -5.01806640625, -4.8341064453125, -4.650146484375, -4.4661865234375, -4.2822265625, -4.0982666015625, -3.914306640625, -3.7303466796875, -3.54638671875, -3.3624267578125, -3.178466796875, -2.9945068359375, -2.810546875, -2.6265869140625, -2.442626953125, -2.2586669921875, -2.07470703125, -1.8907470703125, -1.706787109375, -1.5228271484375, -1.3388671875, -1.1549072265625, -0.970947265625, -0.7869873046875, -0.60302734375, -0.4190673828125, -0.235107421875, -0.0511474609375, 0.1328125, 0.3167724609375, 0.500732421875, 0.6846923828125, 0.86865234375, 1.0526123046875, 1.236572265625, 1.4205322265625, 1.6044921875, 1.7884521484375, 1.972412109375, 2.1563720703125, 2.34033203125, 2.5242919921875, 2.708251953125, 2.8922119140625, 3.076171875, 3.2601318359375, 3.444091796875, 3.6280517578125, 3.81201171875, 3.9959716796875, 4.179931640625, 4.3638916015625, 4.5478515625, 4.7318115234375, 4.915771484375, 5.0997314453125, 5.28369140625, 5.4676513671875, 5.651611328125, 5.8355712890625, 6.01953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 11.0, 5.0, 12.0, 24.0, 14.0, 24.0, 45.0, 57.0, 89.0, 89.0, 130.0, 178.0, 325.0, 451.0, 739.0, 1252.0, 2136.0, 4081.0, 7845.0, 16337.0, 40170.0, 605853.0, 306349.0, 32697.0, 14049.0, 6890.0, 3593.0, 1997.0, 1139.0, 647.0, 424.0, 255.0, 207.0, 125.0, 70.0, 61.0, 43.0, 28.0, 17.0, 22.0, 10.0, 14.0, 9.0, 10.0, 4.0, 3.0, 6.0, 3.0, 0.0, 5.0, 0.0, 2.0, 3.0], "bins": [-0.87255859375, -0.846038818359375, -0.81951904296875, -0.792999267578125, -0.7664794921875, -0.739959716796875, -0.71343994140625, -0.686920166015625, -0.660400390625, -0.633880615234375, -0.60736083984375, -0.580841064453125, -0.5543212890625, -0.527801513671875, -0.50128173828125, -0.474761962890625, -0.4482421875, -0.421722412109375, -0.39520263671875, -0.368682861328125, -0.3421630859375, -0.315643310546875, -0.28912353515625, -0.262603759765625, -0.236083984375, -0.209564208984375, -0.18304443359375, -0.156524658203125, -0.1300048828125, -0.103485107421875, -0.07696533203125, -0.050445556640625, -0.02392578125, 0.002593994140625, 0.02911376953125, 0.055633544921875, 0.0821533203125, 0.108673095703125, 0.13519287109375, 0.161712646484375, 0.188232421875, 0.214752197265625, 0.24127197265625, 0.267791748046875, 0.2943115234375, 0.320831298828125, 0.34735107421875, 0.373870849609375, 0.400390625, 0.426910400390625, 0.45343017578125, 0.479949951171875, 0.5064697265625, 0.532989501953125, 0.55950927734375, 0.586029052734375, 0.612548828125, 0.639068603515625, 0.66558837890625, 0.692108154296875, 0.7186279296875, 0.745147705078125, 0.77166748046875, 0.798187255859375, 0.82470703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 7.0, 9.0, 13.0, 6.0, 20.0, 26.0, 50.0, 39.0, 49.0, 59.0, 62.0, 79.0, 74.0, 82.0, 55.0, 65.0, 63.0, 52.0, 37.0, 17.0, 25.0, 14.0, 21.0, 18.0, 8.0, 10.0, 11.0, 6.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.423494338989258e-05, -9.127426892518997e-05, -8.831359446048737e-05, -8.535291999578476e-05, -8.239224553108215e-05, -7.943157106637955e-05, -7.647089660167694e-05, -7.351022213697433e-05, -7.054954767227173e-05, -6.758887320756912e-05, -6.462819874286652e-05, -6.166752427816391e-05, -5.8706849813461304e-05, -5.57461753487587e-05, -5.278550088405609e-05, -4.9824826419353485e-05, -4.686415195465088e-05, -4.390347748994827e-05, -4.0942803025245667e-05, -3.798212856054306e-05, -3.5021454095840454e-05, -3.206077963113785e-05, -2.9100105166435242e-05, -2.6139430701732635e-05, -2.317875623703003e-05, -2.0218081772327423e-05, -1.7257407307624817e-05, -1.429673284292221e-05, -1.1336058378219604e-05, -8.375383913516998e-06, -5.414709448814392e-06, -2.454034984111786e-06, 5.066394805908203e-07, 3.4673139452934265e-06, 6.427988409996033e-06, 9.388662874698639e-06, 1.2349337339401245e-05, 1.531001180410385e-05, 1.8270686268806458e-05, 2.1231360733509064e-05, 2.419203519821167e-05, 2.7152709662914276e-05, 3.0113384127616882e-05, 3.307405859231949e-05, 3.6034733057022095e-05, 3.89954075217247e-05, 4.195608198642731e-05, 4.491675645112991e-05, 4.787743091583252e-05, 5.0838105380535126e-05, 5.379877984523773e-05, 5.675945430994034e-05, 5.9720128774642944e-05, 6.268080323934555e-05, 6.564147770404816e-05, 6.860215216875076e-05, 7.156282663345337e-05, 7.452350109815598e-05, 7.748417556285858e-05, 8.044485002756119e-05, 8.34055244922638e-05, 8.63661989569664e-05, 8.9326873421669e-05, 9.228754788637161e-05, 9.524822235107422e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 8.0, 16.0, 23.0, 28.0, 33.0, 49.0, 59.0, 74.0, 129.0, 183.0, 241.0, 344.0, 470.0, 652.0, 948.0, 1382.0, 2068.0, 3182.0, 5021.0, 8234.0, 13950.0, 24313.0, 43057.0, 74367.0, 121136.0, 167534.0, 182417.0, 151531.0, 101742.0, 60738.0, 34444.0, 19461.0, 11285.0, 6752.0, 4238.0, 2713.0, 1796.0, 1165.0, 831.0, 511.0, 408.0, 294.0, 190.0, 159.0, 99.0, 82.0, 74.0, 33.0, 39.0, 15.0, 20.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.47607421875, -0.46036529541015625, -0.4446563720703125, -0.42894744873046875, -0.413238525390625, -0.39752960205078125, -0.3818206787109375, -0.36611175537109375, -0.35040283203125, -0.33469390869140625, -0.3189849853515625, -0.30327606201171875, -0.287567138671875, -0.27185821533203125, -0.2561492919921875, -0.24044036865234375, -0.2247314453125, -0.20902252197265625, -0.1933135986328125, -0.17760467529296875, -0.161895751953125, -0.14618682861328125, -0.1304779052734375, -0.11476898193359375, -0.09906005859375, -0.08335113525390625, -0.0676422119140625, -0.05193328857421875, -0.036224365234375, -0.02051544189453125, -0.0048065185546875, 0.01090240478515625, 0.026611328125, 0.04232025146484375, 0.0580291748046875, 0.07373809814453125, 0.089447021484375, 0.10515594482421875, 0.1208648681640625, 0.13657379150390625, 0.15228271484375, 0.16799163818359375, 0.1837005615234375, 0.19940948486328125, 0.215118408203125, 0.23082733154296875, 0.2465362548828125, 0.26224517822265625, 0.2779541015625, 0.29366302490234375, 0.3093719482421875, 0.32508087158203125, 0.340789794921875, 0.35649871826171875, 0.3722076416015625, 0.38791656494140625, 0.40362548828125, 0.41933441162109375, 0.4350433349609375, 0.45075225830078125, 0.466461181640625, 0.48217010498046875, 0.4978790283203125, 0.5135879516601562, 0.529296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 8.0, 6.0, 14.0, 13.0, 19.0, 24.0, 20.0, 45.0, 47.0, 56.0, 57.0, 71.0, 74.0, 77.0, 68.0, 65.0, 55.0, 61.0, 44.0, 35.0, 27.0, 16.0, 21.0, 17.0, 14.0, 7.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.224853515625, -0.2177143096923828, -0.21057510375976562, -0.20343589782714844, -0.19629669189453125, -0.18915748596191406, -0.18201828002929688, -0.1748790740966797, -0.1677398681640625, -0.1606006622314453, -0.15346145629882812, -0.14632225036621094, -0.13918304443359375, -0.13204383850097656, -0.12490463256835938, -0.11776542663574219, -0.110626220703125, -0.10348701477050781, -0.09634780883789062, -0.08920860290527344, -0.08206939697265625, -0.07493019104003906, -0.06779098510742188, -0.06065177917480469, -0.0535125732421875, -0.04637336730957031, -0.039234161376953125, -0.03209495544433594, -0.02495574951171875, -0.017816543579101562, -0.010677337646484375, -0.0035381317138671875, 0.00360107421875, 0.010740280151367188, 0.017879486083984375, 0.025018692016601562, 0.03215789794921875, 0.03929710388183594, 0.046436309814453125, 0.05357551574707031, 0.0607147216796875, 0.06785392761230469, 0.07499313354492188, 0.08213233947753906, 0.08927154541015625, 0.09641075134277344, 0.10354995727539062, 0.11068916320800781, 0.117828369140625, 0.12496757507324219, 0.13210678100585938, 0.13924598693847656, 0.14638519287109375, 0.15352439880371094, 0.16066360473632812, 0.1678028106689453, 0.1749420166015625, 0.1820812225341797, 0.18922042846679688, 0.19635963439941406, 0.20349884033203125, 0.21063804626464844, 0.21777725219726562, 0.2249164581298828, 0.2320556640625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 6.0, 14.0, 17.0, 9.0, 13.0, 16.0, 20.0, 16.0, 25.0, 27.0, 39.0, 27.0, 38.0, 46.0, 39.0, 46.0, 35.0, 49.0, 40.0, 39.0, 33.0, 37.0, 37.0, 41.0, 35.0, 26.0, 22.0, 37.0, 29.0, 18.0, 18.0, 17.0, 12.0, 11.0, 3.0, 10.0, 10.0, 5.0, 5.0, 4.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0], "bins": [-7.763863563537598, -7.538478374481201, -7.313093185424805, -7.087707996368408, -6.862322807312012, -6.636937618255615, -6.411552429199219, -6.186167240142822, -5.960782051086426, -5.735396862030029, -5.510011672973633, -5.284626483917236, -5.05924129486084, -4.833856105804443, -4.608470916748047, -4.38308572769165, -4.157700538635254, -3.9323153495788574, -3.706930160522461, -3.4815449714660645, -3.256159782409668, -3.0307745933532715, -2.805389404296875, -2.5800042152404785, -2.354619026184082, -2.1292338371276855, -1.903848648071289, -1.6784634590148926, -1.453078269958496, -1.2276930809020996, -1.0023078918457031, -0.7769227027893066, -0.5515379905700684, -0.3261528015136719, -0.10076761245727539, 0.1246175765991211, 0.3500027656555176, 0.5753879547119141, 0.8007731437683105, 1.026158332824707, 1.2515435218811035, 1.4769287109375, 1.7023138999938965, 1.927699089050293, 2.1530842781066895, 2.378469467163086, 2.6038546562194824, 2.829239845275879, 3.0546250343322754, 3.280010223388672, 3.5053954124450684, 3.730780601501465, 3.9561657905578613, 4.181550979614258, 4.406936168670654, 4.632321357727051, 4.857706546783447, 5.083091735839844, 5.30847692489624, 5.533862113952637, 5.759247303009033, 5.98463249206543, 6.210017681121826, 6.435402870178223, 6.660788059234619]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 10.0, 11.0, 9.0, 10.0, 10.0, 19.0, 16.0, 21.0, 25.0, 21.0, 16.0, 27.0, 27.0, 32.0, 31.0, 40.0, 35.0, 32.0, 25.0, 36.0, 30.0, 36.0, 55.0, 36.0, 39.0, 24.0, 34.0, 30.0, 30.0, 29.0, 26.0, 17.0, 24.0, 22.0, 10.0, 19.0, 16.0, 15.0, 7.0, 5.0, 5.0, 3.0, 8.0, 6.0, 1.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.143939018249512, -6.92017126083374, -6.696403503417969, -6.472635746002197, -6.248867988586426, -6.025099754333496, -5.801331996917725, -5.577564239501953, -5.353796482086182, -5.13002872467041, -4.906260967254639, -4.682493209838867, -4.4587249755859375, -4.234957695007324, -4.0111894607543945, -3.787421703338623, -3.5636539459228516, -3.33988618850708, -3.1161184310913086, -2.892350435256958, -2.6685826778411865, -2.444814920425415, -2.2210469245910645, -1.997279167175293, -1.7735114097595215, -1.54974365234375, -1.325975775718689, -1.102207899093628, -0.8784401416778564, -0.654672384262085, -0.4309045076370239, -0.2071366310119629, 0.01663064956665039, 0.24039846658706665, 0.4641662836074829, 0.6879341006278992, 0.9117019176483154, 1.135469675064087, 1.359237551689148, 1.583005428314209, 1.8067731857299805, 2.030540943145752, 2.2543087005615234, 2.478076696395874, 2.7018444538116455, 2.925612211227417, 3.1493802070617676, 3.373147964477539, 3.5969157218933105, 3.820683479309082, 4.0444512367248535, 4.268218994140625, 4.491987228393555, 4.715754508972168, 4.939522743225098, 5.163290500640869, 5.387058258056641, 5.610826015472412, 5.834593772888184, 6.058361530303955, 6.282129287719727, 6.505897521972656, 6.729665279388428, 6.953433036804199, 7.177200794219971]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 10.0, 28.0, 40.0, 58.0, 97.0, 176.0, 238.0, 386.0, 588.0, 988.0, 1637.0, 2504.0, 3992.0, 6090.0, 9279.0, 14219.0, 20280.0, 28881.0, 40909.0, 54556.0, 70326.0, 84641.0, 97100.0, 103374.0, 102278.0, 93847.0, 80545.0, 65109.0, 50027.0, 37100.0, 25892.0, 18344.0, 12170.0, 8354.0, 5288.0, 3371.0, 2120.0, 1378.0, 840.0, 533.0, 353.0, 224.0, 148.0, 81.0, 56.0, 46.0, 19.0, 9.0, 12.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4765625, -4.3314208984375, -4.186279296875, -4.0411376953125, -3.89599609375, -3.7508544921875, -3.605712890625, -3.4605712890625, -3.3154296875, -3.1702880859375, -3.025146484375, -2.8800048828125, -2.73486328125, -2.5897216796875, -2.444580078125, -2.2994384765625, -2.154296875, -2.0091552734375, -1.864013671875, -1.7188720703125, -1.57373046875, -1.4285888671875, -1.283447265625, -1.1383056640625, -0.9931640625, -0.8480224609375, -0.702880859375, -0.5577392578125, -0.41259765625, -0.2674560546875, -0.122314453125, 0.0228271484375, 0.16796875, 0.3131103515625, 0.458251953125, 0.6033935546875, 0.74853515625, 0.8936767578125, 1.038818359375, 1.1839599609375, 1.3291015625, 1.4742431640625, 1.619384765625, 1.7645263671875, 1.90966796875, 2.0548095703125, 2.199951171875, 2.3450927734375, 2.490234375, 2.6353759765625, 2.780517578125, 2.9256591796875, 3.07080078125, 3.2159423828125, 3.361083984375, 3.5062255859375, 3.6513671875, 3.7965087890625, 3.941650390625, 4.0867919921875, 4.23193359375, 4.3770751953125, 4.522216796875, 4.6673583984375, 4.8125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 6.0, 8.0, 7.0, 17.0, 9.0, 14.0, 19.0, 11.0, 10.0, 29.0, 26.0, 16.0, 28.0, 23.0, 23.0, 18.0, 34.0, 35.0, 39.0, 32.0, 34.0, 24.0, 34.0, 43.0, 40.0, 41.0, 35.0, 32.0, 32.0, 28.0, 31.0, 21.0, 26.0, 17.0, 25.0, 16.0, 19.0, 16.0, 9.0, 10.0, 12.0, 6.0, 9.0, 3.0, 5.0, 5.0, 6.0, 3.0, 0.0, 2.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-6.37109375, -6.15533447265625, -5.9395751953125, -5.72381591796875, -5.508056640625, -5.29229736328125, -5.0765380859375, -4.86077880859375, -4.64501953125, -4.42926025390625, -4.2135009765625, -3.99774169921875, -3.781982421875, -3.56622314453125, -3.3504638671875, -3.13470458984375, -2.9189453125, -2.70318603515625, -2.4874267578125, -2.27166748046875, -2.055908203125, -1.84014892578125, -1.6243896484375, -1.40863037109375, -1.19287109375, -0.97711181640625, -0.7613525390625, -0.54559326171875, -0.329833984375, -0.11407470703125, 0.1016845703125, 0.31744384765625, 0.533203125, 0.74896240234375, 0.9647216796875, 1.18048095703125, 1.396240234375, 1.61199951171875, 1.8277587890625, 2.04351806640625, 2.25927734375, 2.47503662109375, 2.6907958984375, 2.90655517578125, 3.122314453125, 3.33807373046875, 3.5538330078125, 3.76959228515625, 3.9853515625, 4.20111083984375, 4.4168701171875, 4.63262939453125, 4.848388671875, 5.06414794921875, 5.2799072265625, 5.49566650390625, 5.71142578125, 5.92718505859375, 6.1429443359375, 6.35870361328125, 6.574462890625, 6.79022216796875, 7.0059814453125, 7.22174072265625, 7.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 15.0, 15.0, 19.0, 42.0, 68.0, 99.0, 130.0, 219.0, 362.0, 567.0, 849.0, 1349.0, 2239.0, 3464.0, 5418.0, 8782.0, 13387.0, 20517.0, 30504.0, 43977.0, 61339.0, 80705.0, 98750.0, 112103.0, 115332.0, 108651.0, 93534.0, 74524.0, 55375.0, 39378.0, 26889.0, 17798.0, 11705.0, 7451.0, 4762.0, 3013.0, 1929.0, 1207.0, 755.0, 504.0, 275.0, 188.0, 147.0, 78.0, 53.0, 38.0, 21.0, 17.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.3887939453125, -5.211181640625, -5.0335693359375, -4.85595703125, -4.6783447265625, -4.500732421875, -4.3231201171875, -4.1455078125, -3.9678955078125, -3.790283203125, -3.6126708984375, -3.43505859375, -3.2574462890625, -3.079833984375, -2.9022216796875, -2.724609375, -2.5469970703125, -2.369384765625, -2.1917724609375, -2.01416015625, -1.8365478515625, -1.658935546875, -1.4813232421875, -1.3037109375, -1.1260986328125, -0.948486328125, -0.7708740234375, -0.59326171875, -0.4156494140625, -0.238037109375, -0.0604248046875, 0.1171875, 0.2947998046875, 0.472412109375, 0.6500244140625, 0.82763671875, 1.0052490234375, 1.182861328125, 1.3604736328125, 1.5380859375, 1.7156982421875, 1.893310546875, 2.0709228515625, 2.24853515625, 2.4261474609375, 2.603759765625, 2.7813720703125, 2.958984375, 3.1365966796875, 3.314208984375, 3.4918212890625, 3.66943359375, 3.8470458984375, 4.024658203125, 4.2022705078125, 4.3798828125, 4.5574951171875, 4.735107421875, 4.9127197265625, 5.09033203125, 5.2679443359375, 5.445556640625, 5.6231689453125, 5.80078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 11.0, 4.0, 10.0, 14.0, 12.0, 22.0, 21.0, 29.0, 19.0, 20.0, 26.0, 26.0, 35.0, 32.0, 36.0, 41.0, 42.0, 37.0, 39.0, 35.0, 33.0, 34.0, 30.0, 40.0, 27.0, 35.0, 34.0, 29.0, 21.0, 26.0, 24.0, 30.0, 22.0, 12.0, 15.0, 17.0, 9.0, 5.0, 6.0, 8.0, 4.0, 7.0, 5.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.6875, -4.53875732421875, -4.3900146484375, -4.24127197265625, -4.092529296875, -3.94378662109375, -3.7950439453125, -3.64630126953125, -3.49755859375, -3.34881591796875, -3.2000732421875, -3.05133056640625, -2.902587890625, -2.75384521484375, -2.6051025390625, -2.45635986328125, -2.3076171875, -2.15887451171875, -2.0101318359375, -1.86138916015625, -1.712646484375, -1.56390380859375, -1.4151611328125, -1.26641845703125, -1.11767578125, -0.96893310546875, -0.8201904296875, -0.67144775390625, -0.522705078125, -0.37396240234375, -0.2252197265625, -0.07647705078125, 0.072265625, 0.22100830078125, 0.3697509765625, 0.51849365234375, 0.667236328125, 0.81597900390625, 0.9647216796875, 1.11346435546875, 1.26220703125, 1.41094970703125, 1.5596923828125, 1.70843505859375, 1.857177734375, 2.00592041015625, 2.1546630859375, 2.30340576171875, 2.4521484375, 2.60089111328125, 2.7496337890625, 2.89837646484375, 3.047119140625, 3.19586181640625, 3.3446044921875, 3.49334716796875, 3.64208984375, 3.79083251953125, 3.9395751953125, 4.08831787109375, 4.237060546875, 4.38580322265625, 4.5345458984375, 4.68328857421875, 4.83203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 19.0, 34.0, 30.0, 59.0, 72.0, 112.0, 162.0, 271.0, 422.0, 631.0, 1042.0, 1583.0, 2306.0, 3600.0, 5774.0, 8792.0, 13583.0, 20780.0, 31268.0, 46347.0, 65278.0, 87915.0, 108858.0, 122112.0, 122318.0, 109837.0, 89110.0, 66466.0, 46608.0, 32059.0, 21519.0, 14029.0, 9076.0, 5879.0, 3729.0, 2434.0, 1572.0, 1007.0, 654.0, 410.0, 271.0, 183.0, 109.0, 82.0, 42.0, 35.0, 23.0, 18.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.490234375, -2.40997314453125, -2.3297119140625, -2.24945068359375, -2.169189453125, -2.08892822265625, -2.0086669921875, -1.92840576171875, -1.84814453125, -1.76788330078125, -1.6876220703125, -1.60736083984375, -1.527099609375, -1.44683837890625, -1.3665771484375, -1.28631591796875, -1.2060546875, -1.12579345703125, -1.0455322265625, -0.96527099609375, -0.885009765625, -0.80474853515625, -0.7244873046875, -0.64422607421875, -0.56396484375, -0.48370361328125, -0.4034423828125, -0.32318115234375, -0.242919921875, -0.16265869140625, -0.0823974609375, -0.00213623046875, 0.078125, 0.15838623046875, 0.2386474609375, 0.31890869140625, 0.399169921875, 0.47943115234375, 0.5596923828125, 0.63995361328125, 0.72021484375, 0.80047607421875, 0.8807373046875, 0.96099853515625, 1.041259765625, 1.12152099609375, 1.2017822265625, 1.28204345703125, 1.3623046875, 1.44256591796875, 1.5228271484375, 1.60308837890625, 1.683349609375, 1.76361083984375, 1.8438720703125, 1.92413330078125, 2.00439453125, 2.08465576171875, 2.1649169921875, 2.24517822265625, 2.325439453125, 2.40570068359375, 2.4859619140625, 2.56622314453125, 2.646484375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 14.0, 13.0, 10.0, 24.0, 18.0, 25.0, 36.0, 33.0, 43.0, 71.0, 64.0, 73.0, 67.0, 68.0, 66.0, 64.0, 58.0, 52.0, 40.0, 26.0, 31.0, 27.0, 13.0, 8.0, 9.0, 10.0, 7.0, 5.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004277229309082031, -0.0004148930311203003, -0.00040206313133239746, -0.00038923323154449463, -0.0003764033317565918, -0.00036357343196868896, -0.00035074353218078613, -0.0003379136323928833, -0.00032508373260498047, -0.00031225383281707764, -0.0002994239330291748, -0.00028659403324127197, -0.00027376413345336914, -0.0002609342336654663, -0.0002481043338775635, -0.00023527443408966064, -0.0002224445343017578, -0.00020961463451385498, -0.00019678473472595215, -0.00018395483493804932, -0.00017112493515014648, -0.00015829503536224365, -0.00014546513557434082, -0.000132635235786438, -0.00011980533599853516, -0.00010697543621063232, -9.414553642272949e-05, -8.131563663482666e-05, -6.848573684692383e-05, -5.5655837059020996e-05, -4.2825937271118164e-05, -2.9996037483215332e-05, -1.71661376953125e-05, -4.336237907409668e-06, 8.493661880493164e-06, 2.1323561668395996e-05, 3.415346145629883e-05, 4.698336124420166e-05, 5.981326103210449e-05, 7.264316082000732e-05, 8.547306060791016e-05, 9.830296039581299e-05, 0.00011113286018371582, 0.00012396275997161865, 0.00013679265975952148, 0.00014962255954742432, 0.00016245245933532715, 0.00017528235912322998, 0.0001881122589111328, 0.00020094215869903564, 0.00021377205848693848, 0.0002266019582748413, 0.00023943185806274414, 0.00025226175785064697, 0.0002650916576385498, 0.00027792155742645264, 0.00029075145721435547, 0.0003035813570022583, 0.00031641125679016113, 0.00032924115657806396, 0.0003420710563659668, 0.00035490095615386963, 0.00036773085594177246, 0.0003805607557296753, 0.0003933906555175781]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 19.0, 27.0, 48.0, 81.0, 126.0, 168.0, 291.0, 422.0, 701.0, 1098.0, 1838.0, 3187.0, 5205.0, 9052.0, 15156.0, 25461.0, 41157.0, 65382.0, 94662.0, 124059.0, 143737.0, 142201.0, 121308.0, 91857.0, 62063.0, 39387.0, 24290.0, 14561.0, 8533.0, 4989.0, 2884.0, 1717.0, 1110.0, 645.0, 402.0, 245.0, 174.0, 98.0, 69.0, 47.0, 30.0, 10.0, 14.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.01953125, -2.925018310546875, -2.83050537109375, -2.735992431640625, -2.6414794921875, -2.546966552734375, -2.45245361328125, -2.357940673828125, -2.263427734375, -2.168914794921875, -2.07440185546875, -1.979888916015625, -1.8853759765625, -1.790863037109375, -1.69635009765625, -1.601837158203125, -1.50732421875, -1.412811279296875, -1.31829833984375, -1.223785400390625, -1.1292724609375, -1.034759521484375, -0.94024658203125, -0.845733642578125, -0.751220703125, -0.656707763671875, -0.56219482421875, -0.467681884765625, -0.3731689453125, -0.278656005859375, -0.18414306640625, -0.089630126953125, 0.0048828125, 0.099395751953125, 0.19390869140625, 0.288421630859375, 0.3829345703125, 0.477447509765625, 0.57196044921875, 0.666473388671875, 0.760986328125, 0.855499267578125, 0.95001220703125, 1.044525146484375, 1.1390380859375, 1.233551025390625, 1.32806396484375, 1.422576904296875, 1.51708984375, 1.611602783203125, 1.70611572265625, 1.800628662109375, 1.8951416015625, 1.989654541015625, 2.08416748046875, 2.178680419921875, 2.273193359375, 2.367706298828125, 2.46221923828125, 2.556732177734375, 2.6512451171875, 2.745758056640625, 2.84027099609375, 2.934783935546875, 3.029296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 3.0, 10.0, 15.0, 20.0, 17.0, 20.0, 18.0, 22.0, 28.0, 32.0, 26.0, 42.0, 36.0, 40.0, 41.0, 38.0, 44.0, 41.0, 46.0, 36.0, 43.0, 42.0, 40.0, 30.0, 34.0, 27.0, 22.0, 23.0, 27.0, 20.0, 19.0, 17.0, 15.0, 14.0, 12.0, 5.0, 5.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0439453125, -1.0102691650390625, -0.976593017578125, -0.9429168701171875, -0.90924072265625, -0.8755645751953125, -0.841888427734375, -0.8082122802734375, -0.7745361328125, -0.7408599853515625, -0.707183837890625, -0.6735076904296875, -0.63983154296875, -0.6061553955078125, -0.572479248046875, -0.5388031005859375, -0.505126953125, -0.4714508056640625, -0.437774658203125, -0.4040985107421875, -0.37042236328125, -0.3367462158203125, -0.303070068359375, -0.2693939208984375, -0.2357177734375, -0.2020416259765625, -0.168365478515625, -0.1346893310546875, -0.10101318359375, -0.0673370361328125, -0.033660888671875, 1.52587890625e-05, 0.03369140625, 0.0673675537109375, 0.101043701171875, 0.1347198486328125, 0.16839599609375, 0.2020721435546875, 0.235748291015625, 0.2694244384765625, 0.3031005859375, 0.3367767333984375, 0.370452880859375, 0.4041290283203125, 0.43780517578125, 0.4714813232421875, 0.505157470703125, 0.5388336181640625, 0.572509765625, 0.6061859130859375, 0.639862060546875, 0.6735382080078125, 0.70721435546875, 0.7408905029296875, 0.774566650390625, 0.8082427978515625, 0.8419189453125, 0.8755950927734375, 0.909271240234375, 0.9429473876953125, 0.97662353515625, 1.0102996826171875, 1.043975830078125, 1.0776519775390625, 1.111328125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 13.0, 8.0, 16.0, 12.0, 18.0, 19.0, 36.0, 31.0, 26.0, 43.0, 43.0, 50.0, 41.0, 45.0, 50.0, 44.0, 36.0, 53.0, 39.0, 23.0, 41.0, 32.0, 32.0, 32.0, 35.0, 31.0, 31.0, 17.0, 17.0, 9.0, 10.0, 6.0, 5.0, 7.0, 8.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.035961151123047, -7.7931227684021, -7.550284385681152, -7.307446002960205, -7.064607620239258, -6.8217692375183105, -6.578930854797363, -6.336092472076416, -6.093254089355469, -5.8504157066345215, -5.607577323913574, -5.364738941192627, -5.12190055847168, -4.879062175750732, -4.636223793029785, -4.393385410308838, -4.150547027587891, -3.9077086448669434, -3.664870262145996, -3.422031879425049, -3.1791934967041016, -2.9363551139831543, -2.693516731262207, -2.4506783485412598, -2.2078399658203125, -1.9650015830993652, -1.722163200378418, -1.4793248176574707, -1.2364864349365234, -0.9936480522155762, -0.7508096694946289, -0.5079712867736816, -0.2651333808898926, -0.022294998168945312, 0.22054338455200195, 0.4633817672729492, 0.7062201499938965, 0.9490585327148438, 1.191896915435791, 1.4347352981567383, 1.6775736808776855, 1.9204120635986328, 2.16325044631958, 2.4060888290405273, 2.6489272117614746, 2.891765594482422, 3.134603977203369, 3.3774423599243164, 3.6202807426452637, 3.863119125366211, 4.105957508087158, 4.3487958908081055, 4.591634273529053, 4.83447265625, 5.077311038970947, 5.3201494216918945, 5.562987804412842, 5.805826187133789, 6.048664569854736, 6.291502952575684, 6.534341335296631, 6.777179718017578, 7.020018100738525, 7.262856483459473, 7.50569486618042]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 1.0, 6.0, 9.0, 6.0, 12.0, 11.0, 16.0, 18.0, 15.0, 19.0, 15.0, 22.0, 20.0, 27.0, 28.0, 33.0, 38.0, 40.0, 37.0, 30.0, 32.0, 44.0, 38.0, 32.0, 37.0, 35.0, 28.0, 37.0, 37.0, 26.0, 35.0, 24.0, 25.0, 24.0, 18.0, 17.0, 16.0, 12.0, 13.0, 9.0, 11.0, 10.0, 4.0, 6.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.184974193572998, -6.951821327209473, -6.718667984008789, -6.485515117645264, -6.252362251281738, -6.019208908081055, -5.786056041717529, -5.552903175354004, -5.31974983215332, -5.086596965789795, -4.853443622589111, -4.620290756225586, -4.3871378898620605, -4.153985023498535, -3.9208316802978516, -3.687678813934326, -3.454525947570801, -3.2213728427886963, -2.988219976425171, -2.7550668716430664, -2.521914005279541, -2.2887609004974365, -2.055607795715332, -1.822454810142517, -1.5893018245697021, -1.3561488389968872, -1.1229958534240723, -0.8898427486419678, -0.6566897630691528, -0.4235367774963379, -0.1903836727142334, 0.04276931285858154, 0.2759218215942383, 0.5090748071670532, 0.7422278523445129, 0.9753808975219727, 1.2085338830947876, 1.4416868686676025, 1.674839973449707, 1.907992959022522, 2.141145944595337, 2.3742990493774414, 2.607451915740967, 2.8406050205230713, 3.073758125305176, 3.306910991668701, 3.5400640964508057, 3.77321720123291, 4.0063700675964355, 4.239522933959961, 4.4726762771606445, 4.70582914352417, 4.938982009887695, 5.172135353088379, 5.405288219451904, 5.63844108581543, 5.871594429016113, 6.104747295379639, 6.337900638580322, 6.571053504943848, 6.804206371307373, 7.037359237670898, 7.270512580871582, 7.503665447235107, 7.736818313598633]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 5.0, 5.0, 7.0, 15.0, 20.0, 35.0, 60.0, 84.0, 107.0, 146.0, 227.0, 375.0, 634.0, 988.0, 1559.0, 2613.0, 4270.0, 7512.0, 13272.0, 23435.0, 44120.0, 85202.0, 160745.0, 294711.0, 479686.0, 665688.0, 738224.0, 641751.0, 449586.0, 266217.0, 143803.0, 76025.0, 40258.0, 21845.0, 12453.0, 7044.0, 4180.0, 2640.0, 1628.0, 1016.0, 686.0, 457.0, 314.0, 188.0, 148.0, 102.0, 54.0, 61.0, 31.0, 27.0, 13.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.16015625, -5.9508056640625, -5.741455078125, -5.5321044921875, -5.32275390625, -5.1134033203125, -4.904052734375, -4.6947021484375, -4.4853515625, -4.2760009765625, -4.066650390625, -3.8572998046875, -3.64794921875, -3.4385986328125, -3.229248046875, -3.0198974609375, -2.810546875, -2.6011962890625, -2.391845703125, -2.1824951171875, -1.97314453125, -1.7637939453125, -1.554443359375, -1.3450927734375, -1.1357421875, -0.9263916015625, -0.717041015625, -0.5076904296875, -0.29833984375, -0.0889892578125, 0.120361328125, 0.3297119140625, 0.5390625, 0.7484130859375, 0.957763671875, 1.1671142578125, 1.37646484375, 1.5858154296875, 1.795166015625, 2.0045166015625, 2.2138671875, 2.4232177734375, 2.632568359375, 2.8419189453125, 3.05126953125, 3.2606201171875, 3.469970703125, 3.6793212890625, 3.888671875, 4.0980224609375, 4.307373046875, 4.5167236328125, 4.72607421875, 4.9354248046875, 5.144775390625, 5.3541259765625, 5.5634765625, 5.7728271484375, 5.982177734375, 6.1915283203125, 6.40087890625, 6.6102294921875, 6.819580078125, 7.0289306640625, 7.23828125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 2.0, 4.0, 13.0, 15.0, 10.0, 12.0, 10.0, 13.0, 19.0, 19.0, 18.0, 22.0, 17.0, 30.0, 32.0, 33.0, 25.0, 33.0, 43.0, 43.0, 33.0, 35.0, 29.0, 32.0, 37.0, 39.0, 42.0, 34.0, 27.0, 32.0, 34.0, 29.0, 19.0, 25.0, 19.0, 17.0, 9.0, 13.0, 12.0, 13.0, 4.0, 6.0, 5.0, 7.0, 8.0, 4.0, 3.0, 6.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.81640625, -5.617919921875, -5.41943359375, -5.220947265625, -5.0224609375, -4.823974609375, -4.62548828125, -4.427001953125, -4.228515625, -4.030029296875, -3.83154296875, -3.633056640625, -3.4345703125, -3.236083984375, -3.03759765625, -2.839111328125, -2.640625, -2.442138671875, -2.24365234375, -2.045166015625, -1.8466796875, -1.648193359375, -1.44970703125, -1.251220703125, -1.052734375, -0.854248046875, -0.65576171875, -0.457275390625, -0.2587890625, -0.060302734375, 0.13818359375, 0.336669921875, 0.53515625, 0.733642578125, 0.93212890625, 1.130615234375, 1.3291015625, 1.527587890625, 1.72607421875, 1.924560546875, 2.123046875, 2.321533203125, 2.52001953125, 2.718505859375, 2.9169921875, 3.115478515625, 3.31396484375, 3.512451171875, 3.7109375, 3.909423828125, 4.10791015625, 4.306396484375, 4.5048828125, 4.703369140625, 4.90185546875, 5.100341796875, 5.298828125, 5.497314453125, 5.69580078125, 5.894287109375, 6.0927734375, 6.291259765625, 6.48974609375, 6.688232421875, 6.88671875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 11.0, 16.0, 25.0, 45.0, 61.0, 93.0, 165.0, 286.0, 401.0, 669.0, 1185.0, 1917.0, 3424.0, 5941.0, 10523.0, 19146.0, 34528.0, 64167.0, 117526.0, 211096.0, 360474.0, 552209.0, 707303.0, 709822.0, 554332.0, 363229.0, 213311.0, 118547.0, 64542.0, 35447.0, 19067.0, 10715.0, 5893.0, 3361.0, 1879.0, 1128.0, 683.0, 419.0, 279.0, 161.0, 79.0, 71.0, 34.0, 24.0, 10.0, 15.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.55859375, -7.30670166015625, -7.0548095703125, -6.80291748046875, -6.551025390625, -6.29913330078125, -6.0472412109375, -5.79534912109375, -5.54345703125, -5.29156494140625, -5.0396728515625, -4.78778076171875, -4.535888671875, -4.28399658203125, -4.0321044921875, -3.78021240234375, -3.5283203125, -3.27642822265625, -3.0245361328125, -2.77264404296875, -2.520751953125, -2.26885986328125, -2.0169677734375, -1.76507568359375, -1.51318359375, -1.26129150390625, -1.0093994140625, -0.75750732421875, -0.505615234375, -0.25372314453125, -0.0018310546875, 0.25006103515625, 0.501953125, 0.75384521484375, 1.0057373046875, 1.25762939453125, 1.509521484375, 1.76141357421875, 2.0133056640625, 2.26519775390625, 2.51708984375, 2.76898193359375, 3.0208740234375, 3.27276611328125, 3.524658203125, 3.77655029296875, 4.0284423828125, 4.28033447265625, 4.5322265625, 4.78411865234375, 5.0360107421875, 5.28790283203125, 5.539794921875, 5.79168701171875, 6.0435791015625, 6.29547119140625, 6.54736328125, 6.79925537109375, 7.0511474609375, 7.30303955078125, 7.554931640625, 7.80682373046875, 8.0587158203125, 8.31060791015625, 8.5625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 11.0, 9.0, 12.0, 25.0, 25.0, 27.0, 41.0, 55.0, 96.0, 87.0, 106.0, 125.0, 161.0, 204.0, 222.0, 244.0, 239.0, 273.0, 270.0, 297.0, 224.0, 236.0, 175.0, 166.0, 154.0, 121.0, 102.0, 97.0, 53.0, 49.0, 42.0, 33.0, 31.0, 25.0, 8.0, 9.0, 8.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.967864990234375, -2.85955810546875, -2.751251220703125, -2.6429443359375, -2.534637451171875, -2.42633056640625, -2.318023681640625, -2.209716796875, -2.101409912109375, -1.99310302734375, -1.884796142578125, -1.7764892578125, -1.668182373046875, -1.55987548828125, -1.451568603515625, -1.34326171875, -1.234954833984375, -1.12664794921875, -1.018341064453125, -0.9100341796875, -0.801727294921875, -0.69342041015625, -0.585113525390625, -0.476806640625, -0.368499755859375, -0.26019287109375, -0.151885986328125, -0.0435791015625, 0.064727783203125, 0.17303466796875, 0.281341552734375, 0.3896484375, 0.497955322265625, 0.60626220703125, 0.714569091796875, 0.8228759765625, 0.931182861328125, 1.03948974609375, 1.147796630859375, 1.256103515625, 1.364410400390625, 1.47271728515625, 1.581024169921875, 1.6893310546875, 1.797637939453125, 1.90594482421875, 2.014251708984375, 2.12255859375, 2.230865478515625, 2.33917236328125, 2.447479248046875, 2.5557861328125, 2.664093017578125, 2.77239990234375, 2.880706787109375, 2.989013671875, 3.097320556640625, 3.20562744140625, 3.313934326171875, 3.4222412109375, 3.530548095703125, 3.63885498046875, 3.747161865234375, 3.85546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 9.0, 15.0, 9.0, 10.0, 15.0, 16.0, 28.0, 18.0, 26.0, 27.0, 25.0, 41.0, 45.0, 40.0, 49.0, 33.0, 35.0, 43.0, 43.0, 41.0, 38.0, 33.0, 40.0, 33.0, 35.0, 31.0, 26.0, 24.0, 20.0, 23.0, 10.0, 15.0, 16.0, 16.0, 14.0, 12.0, 7.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-7.646332740783691, -7.423660755157471, -7.200988292694092, -6.978316307067871, -6.75564432144165, -6.53297233581543, -6.310299873352051, -6.08762788772583, -5.864955902099609, -5.642283916473389, -5.41961145401001, -5.196939468383789, -4.974267482757568, -4.751595497131348, -4.528923034667969, -4.306251049041748, -4.083579063415527, -3.8609068393707275, -3.638234853744507, -3.415562629699707, -3.1928906440734863, -2.9702184200286865, -2.7475461959838867, -2.524874210357666, -2.302201747894287, -2.0795295238494873, -1.8568575382232666, -1.6341853141784668, -1.411513328552246, -1.1888411045074463, -0.966168999671936, -0.7434968948364258, -0.5208249092102051, -0.2981528043746948, -0.07548066973686218, 0.14719146490097046, 0.3698635697364807, 0.5925357341766357, 0.815207839012146, 1.0378799438476562, 1.2605520486831665, 1.4832241535186768, 1.705896258354187, 1.9285683631896973, 2.151240587234497, 2.373912811279297, 2.5965847969055176, 2.8192567825317383, 3.041929006576538, 3.264601230621338, 3.4872732162475586, 3.7099454402923584, 3.932617425918579, 4.155289649963379, 4.3779616355896, 4.60063362121582, 4.823306083679199, 5.04597806930542, 5.268650531768799, 5.4913225173950195, 5.71399450302124, 5.936666488647461, 6.15933895111084, 6.3820109367370605, 6.604682922363281]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 1.0, 7.0, 8.0, 11.0, 10.0, 13.0, 16.0, 12.0, 19.0, 24.0, 30.0, 33.0, 41.0, 26.0, 27.0, 30.0, 33.0, 34.0, 31.0, 31.0, 38.0, 36.0, 46.0, 44.0, 38.0, 32.0, 36.0, 35.0, 35.0, 28.0, 26.0, 28.0, 18.0, 14.0, 16.0, 17.0, 9.0, 18.0, 8.0, 10.0, 5.0, 7.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953693389892578, -6.71685791015625, -6.480022430419922, -6.2431864738464355, -6.006350994110107, -5.769515514373779, -5.532679557800293, -5.295844078063965, -5.059008598327637, -4.822173118591309, -4.5853376388549805, -4.348501682281494, -4.111666202545166, -3.874830722808838, -3.6379950046539307, -3.4011592864990234, -3.1643238067626953, -2.927488327026367, -2.69065260887146, -2.4538168907165527, -2.2169814109802246, -1.980145812034607, -1.7433102130889893, -1.5064746141433716, -1.269639015197754, -1.0328034162521362, -0.7959678173065186, -0.5591322183609009, -0.3222966194152832, -0.08546102046966553, 0.15137457847595215, 0.3882101774215698, 0.6250457763671875, 0.8618813753128052, 1.0987169742584229, 1.3355525732040405, 1.5723881721496582, 1.8092237710952759, 2.0460593700408936, 2.282895088195801, 2.519730567932129, 2.756566047668457, 2.9934017658233643, 3.2302374839782715, 3.4670729637145996, 3.7039084434509277, 3.940744161605835, 4.177579879760742, 4.41441535949707, 4.651250839233398, 4.888086318969727, 5.124922275543213, 5.361757755279541, 5.598593235015869, 5.8354291915893555, 6.072264671325684, 6.309100151062012, 6.54593563079834, 6.782771110534668, 7.019607067108154, 7.256442546844482, 7.4932780265808105, 7.730113983154297, 7.966949462890625, 8.203784942626953]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 6.0, 4.0, 15.0, 18.0, 35.0, 44.0, 65.0, 86.0, 120.0, 172.0, 277.0, 410.0, 664.0, 900.0, 1418.0, 2213.0, 3491.0, 5489.0, 8697.0, 13901.0, 21847.0, 33608.0, 50166.0, 71454.0, 95968.0, 117708.0, 129796.0, 125285.0, 107242.0, 82861.0, 59863.0, 40755.0, 26740.0, 17101.0, 10952.0, 6952.0, 4245.0, 2787.0, 1805.0, 1170.0, 733.0, 486.0, 328.0, 201.0, 147.0, 103.0, 66.0, 48.0, 37.0, 32.0, 19.0, 9.0, 10.0, 3.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.65234375, -1.5985870361328125, -1.544830322265625, -1.4910736083984375, -1.43731689453125, -1.3835601806640625, -1.329803466796875, -1.2760467529296875, -1.2222900390625, -1.1685333251953125, -1.114776611328125, -1.0610198974609375, -1.00726318359375, -0.9535064697265625, -0.899749755859375, -0.8459930419921875, -0.792236328125, -0.7384796142578125, -0.684722900390625, -0.6309661865234375, -0.57720947265625, -0.5234527587890625, -0.469696044921875, -0.4159393310546875, -0.3621826171875, -0.3084259033203125, -0.254669189453125, -0.2009124755859375, -0.14715576171875, -0.0933990478515625, -0.039642333984375, 0.0141143798828125, 0.06787109375, 0.1216278076171875, 0.175384521484375, 0.2291412353515625, 0.28289794921875, 0.3366546630859375, 0.390411376953125, 0.4441680908203125, 0.4979248046875, 0.5516815185546875, 0.605438232421875, 0.6591949462890625, 0.71295166015625, 0.7667083740234375, 0.820465087890625, 0.8742218017578125, 0.927978515625, 0.9817352294921875, 1.035491943359375, 1.0892486572265625, 1.14300537109375, 1.1967620849609375, 1.250518798828125, 1.3042755126953125, 1.3580322265625, 1.4117889404296875, 1.465545654296875, 1.5193023681640625, 1.57305908203125, 1.6268157958984375, 1.680572509765625, 1.7343292236328125, 1.7880859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 9.0, 3.0, 6.0, 6.0, 8.0, 14.0, 15.0, 18.0, 13.0, 18.0, 22.0, 25.0, 24.0, 23.0, 23.0, 31.0, 28.0, 28.0, 30.0, 32.0, 31.0, 28.0, 29.0, 27.0, 42.0, 43.0, 34.0, 29.0, 38.0, 36.0, 22.0, 22.0, 24.0, 24.0, 28.0, 18.0, 18.0, 16.0, 14.0, 18.0, 17.0, 15.0, 6.0, 7.0, 9.0, 6.0, 4.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-6.79296875, -6.57806396484375, -6.3631591796875, -6.14825439453125, -5.933349609375, -5.71844482421875, -5.5035400390625, -5.28863525390625, -5.07373046875, -4.85882568359375, -4.6439208984375, -4.42901611328125, -4.214111328125, -3.99920654296875, -3.7843017578125, -3.56939697265625, -3.3544921875, -3.13958740234375, -2.9246826171875, -2.70977783203125, -2.494873046875, -2.27996826171875, -2.0650634765625, -1.85015869140625, -1.63525390625, -1.42034912109375, -1.2054443359375, -0.99053955078125, -0.775634765625, -0.56072998046875, -0.3458251953125, -0.13092041015625, 0.083984375, 0.29888916015625, 0.5137939453125, 0.72869873046875, 0.943603515625, 1.15850830078125, 1.3734130859375, 1.58831787109375, 1.80322265625, 2.01812744140625, 2.2330322265625, 2.44793701171875, 2.662841796875, 2.87774658203125, 3.0926513671875, 3.30755615234375, 3.5224609375, 3.73736572265625, 3.9522705078125, 4.16717529296875, 4.382080078125, 4.59698486328125, 4.8118896484375, 5.02679443359375, 5.24169921875, 5.45660400390625, 5.6715087890625, 5.88641357421875, 6.101318359375, 6.31622314453125, 6.5311279296875, 6.74603271484375, 6.9609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 6.0, 11.0, 8.0, 14.0, 14.0, 28.0, 36.0, 50.0, 66.0, 105.0, 161.0, 218.0, 409.0, 686.0, 1415.0, 3002.0, 6710.0, 15813.0, 39750.0, 790388.0, 142932.0, 26444.0, 10976.0, 4693.0, 2111.0, 1007.0, 526.0, 306.0, 226.0, 126.0, 83.0, 50.0, 42.0, 31.0, 24.0, 15.0, 15.0, 11.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.703125, -8.42041015625, -8.1376953125, -7.85498046875, -7.572265625, -7.28955078125, -7.0068359375, -6.72412109375, -6.44140625, -6.15869140625, -5.8759765625, -5.59326171875, -5.310546875, -5.02783203125, -4.7451171875, -4.46240234375, -4.1796875, -3.89697265625, -3.6142578125, -3.33154296875, -3.048828125, -2.76611328125, -2.4833984375, -2.20068359375, -1.91796875, -1.63525390625, -1.3525390625, -1.06982421875, -0.787109375, -0.50439453125, -0.2216796875, 0.06103515625, 0.34375, 0.62646484375, 0.9091796875, 1.19189453125, 1.474609375, 1.75732421875, 2.0400390625, 2.32275390625, 2.60546875, 2.88818359375, 3.1708984375, 3.45361328125, 3.736328125, 4.01904296875, 4.3017578125, 4.58447265625, 4.8671875, 5.14990234375, 5.4326171875, 5.71533203125, 5.998046875, 6.28076171875, 6.5634765625, 6.84619140625, 7.12890625, 7.41162109375, 7.6943359375, 7.97705078125, 8.259765625, 8.54248046875, 8.8251953125, 9.10791015625, 9.390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 7.0, 12.0, 7.0, 11.0, 18.0, 23.0, 28.0, 15.0, 33.0, 14.0, 36.0, 38.0, 45.0, 36.0, 40.0, 35.0, 49.0, 46.0, 46.0, 38.0, 40.0, 37.0, 43.0, 34.0, 44.0, 38.0, 25.0, 24.0, 18.0, 17.0, 20.0, 14.0, 11.0, 11.0, 13.0, 11.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.642333984375, -5.44873046875, -5.255126953125, -5.0615234375, -4.867919921875, -4.67431640625, -4.480712890625, -4.287109375, -4.093505859375, -3.89990234375, -3.706298828125, -3.5126953125, -3.319091796875, -3.12548828125, -2.931884765625, -2.73828125, -2.544677734375, -2.35107421875, -2.157470703125, -1.9638671875, -1.770263671875, -1.57666015625, -1.383056640625, -1.189453125, -0.995849609375, -0.80224609375, -0.608642578125, -0.4150390625, -0.221435546875, -0.02783203125, 0.165771484375, 0.359375, 0.552978515625, 0.74658203125, 0.940185546875, 1.1337890625, 1.327392578125, 1.52099609375, 1.714599609375, 1.908203125, 2.101806640625, 2.29541015625, 2.489013671875, 2.6826171875, 2.876220703125, 3.06982421875, 3.263427734375, 3.45703125, 3.650634765625, 3.84423828125, 4.037841796875, 4.2314453125, 4.425048828125, 4.61865234375, 4.812255859375, 5.005859375, 5.199462890625, 5.39306640625, 5.586669921875, 5.7802734375, 5.973876953125, 6.16748046875, 6.361083984375, 6.5546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 6.0, 4.0, 5.0, 5.0, 4.0, 9.0, 9.0, 14.0, 12.0, 22.0, 31.0, 49.0, 51.0, 51.0, 90.0, 122.0, 164.0, 220.0, 295.0, 462.0, 713.0, 1238.0, 2238.0, 4647.0, 11105.0, 30694.0, 455305.0, 488157.0, 31213.0, 11177.0, 4701.0, 2253.0, 1206.0, 675.0, 469.0, 302.0, 197.0, 168.0, 103.0, 88.0, 60.0, 46.0, 40.0, 33.0, 25.0, 22.0, 13.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.8916015625, -0.8628463745117188, -0.8340911865234375, -0.8053359985351562, -0.776580810546875, -0.7478256225585938, -0.7190704345703125, -0.6903152465820312, -0.66156005859375, -0.6328048706054688, -0.6040496826171875, -0.5752944946289062, -0.546539306640625, -0.5177841186523438, -0.4890289306640625, -0.46027374267578125, -0.4315185546875, -0.40276336669921875, -0.3740081787109375, -0.34525299072265625, -0.316497802734375, -0.28774261474609375, -0.2589874267578125, -0.23023223876953125, -0.20147705078125, -0.17272186279296875, -0.1439666748046875, -0.11521148681640625, -0.086456298828125, -0.05770111083984375, -0.0289459228515625, -0.00019073486328125, 0.028564453125, 0.05731964111328125, 0.0860748291015625, 0.11483001708984375, 0.143585205078125, 0.17234039306640625, 0.2010955810546875, 0.22985076904296875, 0.25860595703125, 0.28736114501953125, 0.3161163330078125, 0.34487152099609375, 0.373626708984375, 0.40238189697265625, 0.4311370849609375, 0.45989227294921875, 0.4886474609375, 0.5174026489257812, 0.5461578369140625, 0.5749130249023438, 0.603668212890625, 0.6324234008789062, 0.6611785888671875, 0.6899337768554688, 0.71868896484375, 0.7474441528320312, 0.7761993408203125, 0.8049545288085938, 0.833709716796875, 0.8624649047851562, 0.8912200927734375, 0.9199752807617188, 0.94873046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 8.0, 8.0, 15.0, 14.0, 25.0, 24.0, 34.0, 64.0, 80.0, 92.0, 102.0, 98.0, 73.0, 84.0, 54.0, 62.0, 42.0, 27.0, 20.0, 15.0, 14.0, 11.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.878376007080078e-05, -6.657745689153671e-05, -6.437115371227264e-05, -6.216485053300858e-05, -5.995854735374451e-05, -5.775224417448044e-05, -5.554594099521637e-05, -5.33396378159523e-05, -5.113333463668823e-05, -4.8927031457424164e-05, -4.6720728278160095e-05, -4.4514425098896027e-05, -4.230812191963196e-05, -4.010181874036789e-05, -3.789551556110382e-05, -3.568921238183975e-05, -3.3482909202575684e-05, -3.1276606023311615e-05, -2.9070302844047546e-05, -2.6863999664783478e-05, -2.465769648551941e-05, -2.245139330625534e-05, -2.0245090126991272e-05, -1.8038786947727203e-05, -1.5832483768463135e-05, -1.3626180589199066e-05, -1.1419877409934998e-05, -9.213574230670929e-06, -7.00727105140686e-06, -4.800967872142792e-06, -2.594664692878723e-06, -3.8836151361465454e-07, 1.817941665649414e-06, 4.024244844913483e-06, 6.230548024177551e-06, 8.43685120344162e-06, 1.0643154382705688e-05, 1.2849457561969757e-05, 1.5055760741233826e-05, 1.7262063920497894e-05, 1.9468367099761963e-05, 2.167467027902603e-05, 2.38809734582901e-05, 2.608727663755417e-05, 2.8293579816818237e-05, 3.0499882996082306e-05, 3.2706186175346375e-05, 3.491248935461044e-05, 3.711879253387451e-05, 3.932509571313858e-05, 4.153139889240265e-05, 4.373770207166672e-05, 4.5944005250930786e-05, 4.8150308430194855e-05, 5.035661160945892e-05, 5.256291478872299e-05, 5.476921796798706e-05, 5.697552114725113e-05, 5.91818243265152e-05, 6.138812750577927e-05, 6.359443068504333e-05, 6.58007338643074e-05, 6.800703704357147e-05, 7.021334022283554e-05, 7.241964340209961e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 1.0, 6.0, 12.0, 18.0, 12.0, 43.0, 43.0, 75.0, 101.0, 157.0, 242.0, 445.0, 647.0, 1083.0, 2010.0, 3753.0, 6618.0, 13351.0, 28009.0, 66473.0, 164302.0, 291104.0, 254937.0, 121810.0, 48502.0, 21605.0, 10553.0, 5517.0, 2845.0, 1760.0, 968.0, 587.0, 350.0, 222.0, 137.0, 78.0, 64.0, 45.0, 18.0, 17.0, 15.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89013671875, -0.8630218505859375, -0.835906982421875, -0.8087921142578125, -0.78167724609375, -0.7545623779296875, -0.727447509765625, -0.7003326416015625, -0.6732177734375, -0.6461029052734375, -0.618988037109375, -0.5918731689453125, -0.56475830078125, -0.5376434326171875, -0.510528564453125, -0.4834136962890625, -0.456298828125, -0.4291839599609375, -0.402069091796875, -0.3749542236328125, -0.34783935546875, -0.3207244873046875, -0.293609619140625, -0.2664947509765625, -0.2393798828125, -0.2122650146484375, -0.185150146484375, -0.1580352783203125, -0.13092041015625, -0.1038055419921875, -0.076690673828125, -0.0495758056640625, -0.0224609375, 0.0046539306640625, 0.031768798828125, 0.0588836669921875, 0.08599853515625, 0.1131134033203125, 0.140228271484375, 0.1673431396484375, 0.1944580078125, 0.2215728759765625, 0.248687744140625, 0.2758026123046875, 0.30291748046875, 0.3300323486328125, 0.357147216796875, 0.3842620849609375, 0.411376953125, 0.4384918212890625, 0.465606689453125, 0.4927215576171875, 0.51983642578125, 0.5469512939453125, 0.574066162109375, 0.6011810302734375, 0.6282958984375, 0.6554107666015625, 0.682525634765625, 0.7096405029296875, 0.73675537109375, 0.7638702392578125, 0.790985107421875, 0.8180999755859375, 0.84521484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 6.0, 9.0, 10.0, 15.0, 9.0, 25.0, 27.0, 27.0, 50.0, 55.0, 59.0, 59.0, 70.0, 67.0, 66.0, 75.0, 64.0, 57.0, 42.0, 32.0, 30.0, 21.0, 20.0, 17.0, 14.0, 9.0, 10.0, 7.0, 8.0, 3.0, 4.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.2509765625, -0.24374008178710938, -0.23650360107421875, -0.22926712036132812, -0.2220306396484375, -0.21479415893554688, -0.20755767822265625, -0.20032119750976562, -0.193084716796875, -0.18584823608398438, -0.17861175537109375, -0.17137527465820312, -0.1641387939453125, -0.15690231323242188, -0.14966583251953125, -0.14242935180664062, -0.13519287109375, -0.12795639038085938, -0.12071990966796875, -0.11348342895507812, -0.1062469482421875, -0.09901046752929688, -0.09177398681640625, -0.08453750610351562, -0.077301025390625, -0.07006454467773438, -0.06282806396484375, -0.055591583251953125, -0.0483551025390625, -0.041118621826171875, -0.03388214111328125, -0.026645660400390625, -0.0194091796875, -0.012172698974609375, -0.00493621826171875, 0.002300262451171875, 0.0095367431640625, 0.016773223876953125, 0.02400970458984375, 0.031246185302734375, 0.038482666015625, 0.045719146728515625, 0.05295562744140625, 0.060192108154296875, 0.0674285888671875, 0.07466506958007812, 0.08190155029296875, 0.08913803100585938, 0.09637451171875, 0.10361099243164062, 0.11084747314453125, 0.11808395385742188, 0.1253204345703125, 0.13255691528320312, 0.13979339599609375, 0.14702987670898438, 0.154266357421875, 0.16150283813476562, 0.16873931884765625, 0.17597579956054688, 0.1832122802734375, 0.19044876098632812, 0.19768524169921875, 0.20492172241210938, 0.212158203125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 11.0, 10.0, 17.0, 10.0, 15.0, 18.0, 25.0, 26.0, 36.0, 23.0, 30.0, 39.0, 43.0, 48.0, 44.0, 34.0, 32.0, 53.0, 37.0, 37.0, 46.0, 30.0, 36.0, 36.0, 36.0, 22.0, 24.0, 28.0, 18.0, 13.0, 17.0, 9.0, 15.0, 11.0, 13.0, 9.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.196216583251953, -6.9747314453125, -6.753246307373047, -6.5317606925964355, -6.310275554656982, -6.088790416717529, -5.867305278778076, -5.645819664001465, -5.424334526062012, -5.202849388122559, -4.9813642501831055, -4.759878635406494, -4.538393497467041, -4.316908359527588, -4.095423221588135, -3.8739378452301025, -3.6524527072906494, -3.4309675693511963, -3.209482192993164, -2.987997055053711, -2.7665116786956787, -2.5450265407562256, -2.3235411643981934, -2.1020560264587402, -1.8805707693099976, -1.6590855121612549, -1.4376002550125122, -1.2161149978637695, -0.9946298003196716, -0.7731446027755737, -0.551659345626831, -0.3301740884780884, -0.1086888313293457, 0.11279641091823578, 0.33428165316581726, 0.5557668805122375, 0.7772521376609802, 0.9987373352050781, 1.2202225923538208, 1.4417078495025635, 1.6631931066513062, 1.8846783638000488, 2.106163501739502, 2.327648878097534, 2.5491340160369873, 2.7706193923950195, 2.9921045303344727, 3.213589668273926, 3.435075044631958, 3.656560182571411, 3.8780455589294434, 4.0995306968688965, 4.32101583480835, 4.542501449584961, 4.763986587524414, 4.985471725463867, 5.20695686340332, 5.428442001342773, 5.649927139282227, 5.871412754058838, 6.092897891998291, 6.314383029937744, 6.535868167877197, 6.757353782653809, 6.978838920593262]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 1.0, 7.0, 8.0, 10.0, 11.0, 10.0, 15.0, 14.0, 13.0, 25.0, 29.0, 31.0, 34.0, 36.0, 24.0, 30.0, 34.0, 29.0, 38.0, 28.0, 37.0, 34.0, 39.0, 49.0, 41.0, 35.0, 38.0, 31.0, 37.0, 27.0, 29.0, 24.0, 27.0, 14.0, 14.0, 16.0, 11.0, 18.0, 9.0, 8.0, 8.0, 6.0, 9.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.714550971984863, -6.48015832901001, -6.245765686035156, -6.011373519897461, -5.776980876922607, -5.542588233947754, -5.3081955909729, -5.073802947998047, -4.839410305023193, -4.60501766204834, -4.370625019073486, -4.136232376098633, -3.9018399715423584, -3.667447566986084, -3.4330549240112305, -3.198662281036377, -2.9642698764801025, -2.729877233505249, -2.4954848289489746, -2.261092185974121, -2.0266995429992676, -1.7923070192337036, -1.5579144954681396, -1.3235218524932861, -1.0891293287277222, -0.8547367453575134, -0.6203441619873047, -0.3859516382217407, -0.15155905485153198, 0.08283352851867676, 0.3172260522842407, 0.5516186952590942, 0.7860112190246582, 1.0204037427902222, 1.2547963857650757, 1.4891889095306396, 1.7235815525054932, 1.9579740762710571, 2.192366600036621, 2.4267592430114746, 2.661151885986328, 2.8955445289611816, 3.129936933517456, 3.3643295764923096, 3.598722219467163, 3.8331146240234375, 4.067507266998291, 4.3018999099731445, 4.53629207611084, 4.770684719085693, 5.005077362060547, 5.239469528198242, 5.473862171173096, 5.708254814147949, 5.942647457122803, 6.177040100097656, 6.41143274307251, 6.645825386047363, 6.880218029022217, 7.11461067199707, 7.349002838134766, 7.583395481109619, 7.817788124084473, 8.052181243896484, 8.28657341003418]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 6.0, 9.0, 17.0, 31.0, 42.0, 79.0, 128.0, 163.0, 305.0, 480.0, 748.0, 1164.0, 1820.0, 2809.0, 4593.0, 6810.0, 10596.0, 16040.0, 23027.0, 33527.0, 46568.0, 60431.0, 77105.0, 91145.0, 100724.0, 103937.0, 100424.0, 89551.0, 74964.0, 59055.0, 44399.0, 31889.0, 22511.0, 15263.0, 10008.0, 6445.0, 4203.0, 2771.0, 1799.0, 1065.0, 700.0, 435.0, 285.0, 181.0, 113.0, 68.0, 41.0, 31.0, 22.0, 11.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-4.625, -4.4866943359375, -4.348388671875, -4.2100830078125, -4.07177734375, -3.9334716796875, -3.795166015625, -3.6568603515625, -3.5185546875, -3.3802490234375, -3.241943359375, -3.1036376953125, -2.96533203125, -2.8270263671875, -2.688720703125, -2.5504150390625, -2.412109375, -2.2738037109375, -2.135498046875, -1.9971923828125, -1.85888671875, -1.7205810546875, -1.582275390625, -1.4439697265625, -1.3056640625, -1.1673583984375, -1.029052734375, -0.8907470703125, -0.75244140625, -0.6141357421875, -0.475830078125, -0.3375244140625, -0.19921875, -0.0609130859375, 0.077392578125, 0.2156982421875, 0.35400390625, 0.4923095703125, 0.630615234375, 0.7689208984375, 0.9072265625, 1.0455322265625, 1.183837890625, 1.3221435546875, 1.46044921875, 1.5987548828125, 1.737060546875, 1.8753662109375, 2.013671875, 2.1519775390625, 2.290283203125, 2.4285888671875, 2.56689453125, 2.7052001953125, 2.843505859375, 2.9818115234375, 3.1201171875, 3.2584228515625, 3.396728515625, 3.5350341796875, 3.67333984375, 3.8116455078125, 3.949951171875, 4.0882568359375, 4.2265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 6.0, 4.0, 11.0, 10.0, 10.0, 11.0, 15.0, 16.0, 15.0, 23.0, 34.0, 30.0, 30.0, 26.0, 34.0, 38.0, 34.0, 13.0, 36.0, 28.0, 34.0, 40.0, 29.0, 33.0, 47.0, 31.0, 24.0, 42.0, 33.0, 25.0, 34.0, 21.0, 25.0, 25.0, 26.0, 15.0, 8.0, 10.0, 9.0, 9.0, 10.0, 9.0, 4.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-6.9765625, -6.7568359375, -6.537109375, -6.3173828125, -6.09765625, -5.8779296875, -5.658203125, -5.4384765625, -5.21875, -4.9990234375, -4.779296875, -4.5595703125, -4.33984375, -4.1201171875, -3.900390625, -3.6806640625, -3.4609375, -3.2412109375, -3.021484375, -2.8017578125, -2.58203125, -2.3623046875, -2.142578125, -1.9228515625, -1.703125, -1.4833984375, -1.263671875, -1.0439453125, -0.82421875, -0.6044921875, -0.384765625, -0.1650390625, 0.0546875, 0.2744140625, 0.494140625, 0.7138671875, 0.93359375, 1.1533203125, 1.373046875, 1.5927734375, 1.8125, 2.0322265625, 2.251953125, 2.4716796875, 2.69140625, 2.9111328125, 3.130859375, 3.3505859375, 3.5703125, 3.7900390625, 4.009765625, 4.2294921875, 4.44921875, 4.6689453125, 4.888671875, 5.1083984375, 5.328125, 5.5478515625, 5.767578125, 5.9873046875, 6.20703125, 6.4267578125, 6.646484375, 6.8662109375, 7.0859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 9.0, 6.0, 16.0, 26.0, 30.0, 52.0, 101.0, 146.0, 202.0, 330.0, 557.0, 850.0, 1363.0, 2145.0, 3468.0, 5385.0, 8375.0, 13291.0, 19857.0, 29211.0, 42120.0, 57659.0, 76319.0, 93482.0, 106261.0, 112017.0, 107777.0, 95421.0, 78304.0, 60064.0, 44047.0, 30704.0, 20873.0, 13751.0, 8773.0, 5711.0, 3667.0, 2223.0, 1461.0, 896.0, 542.0, 362.0, 259.0, 149.0, 102.0, 65.0, 39.0, 31.0, 18.0, 19.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.640625, -4.483642578125, -4.32666015625, -4.169677734375, -4.0126953125, -3.855712890625, -3.69873046875, -3.541748046875, -3.384765625, -3.227783203125, -3.07080078125, -2.913818359375, -2.7568359375, -2.599853515625, -2.44287109375, -2.285888671875, -2.12890625, -1.971923828125, -1.81494140625, -1.657958984375, -1.5009765625, -1.343994140625, -1.18701171875, -1.030029296875, -0.873046875, -0.716064453125, -0.55908203125, -0.402099609375, -0.2451171875, -0.088134765625, 0.06884765625, 0.225830078125, 0.3828125, 0.539794921875, 0.69677734375, 0.853759765625, 1.0107421875, 1.167724609375, 1.32470703125, 1.481689453125, 1.638671875, 1.795654296875, 1.95263671875, 2.109619140625, 2.2666015625, 2.423583984375, 2.58056640625, 2.737548828125, 2.89453125, 3.051513671875, 3.20849609375, 3.365478515625, 3.5224609375, 3.679443359375, 3.83642578125, 3.993408203125, 4.150390625, 4.307373046875, 4.46435546875, 4.621337890625, 4.7783203125, 4.935302734375, 5.09228515625, 5.249267578125, 5.40625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 13.0, 13.0, 18.0, 14.0, 23.0, 27.0, 33.0, 30.0, 26.0, 41.0, 29.0, 45.0, 42.0, 48.0, 43.0, 48.0, 40.0, 42.0, 37.0, 30.0, 30.0, 41.0, 33.0, 28.0, 30.0, 28.0, 22.0, 26.0, 15.0, 23.0, 6.0, 9.0, 8.0, 10.0, 13.0, 3.0, 4.0, 3.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4140625, -4.2503662109375, -4.086669921875, -3.9229736328125, -3.75927734375, -3.5955810546875, -3.431884765625, -3.2681884765625, -3.1044921875, -2.9407958984375, -2.777099609375, -2.6134033203125, -2.44970703125, -2.2860107421875, -2.122314453125, -1.9586181640625, -1.794921875, -1.6312255859375, -1.467529296875, -1.3038330078125, -1.14013671875, -0.9764404296875, -0.812744140625, -0.6490478515625, -0.4853515625, -0.3216552734375, -0.157958984375, 0.0057373046875, 0.16943359375, 0.3331298828125, 0.496826171875, 0.6605224609375, 0.82421875, 0.9879150390625, 1.151611328125, 1.3153076171875, 1.47900390625, 1.6427001953125, 1.806396484375, 1.9700927734375, 2.1337890625, 2.2974853515625, 2.461181640625, 2.6248779296875, 2.78857421875, 2.9522705078125, 3.115966796875, 3.2796630859375, 3.443359375, 3.6070556640625, 3.770751953125, 3.9344482421875, 4.09814453125, 4.2618408203125, 4.425537109375, 4.5892333984375, 4.7529296875, 4.9166259765625, 5.080322265625, 5.2440185546875, 5.40771484375, 5.5714111328125, 5.735107421875, 5.8988037109375, 6.0625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 12.0, 22.0, 31.0, 52.0, 76.0, 108.0, 147.0, 221.0, 424.0, 604.0, 1024.0, 1638.0, 2569.0, 4500.0, 7468.0, 12293.0, 20373.0, 33204.0, 52239.0, 77744.0, 106263.0, 131436.0, 140898.0, 131637.0, 107315.0, 78399.0, 52452.0, 33485.0, 20368.0, 12440.0, 7417.0, 4441.0, 2710.0, 1674.0, 1047.0, 679.0, 411.0, 254.0, 169.0, 104.0, 70.0, 43.0, 40.0, 24.0, 14.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3203125, -2.246673583984375, -2.17303466796875, -2.099395751953125, -2.0257568359375, -1.952117919921875, -1.87847900390625, -1.804840087890625, -1.731201171875, -1.657562255859375, -1.58392333984375, -1.510284423828125, -1.4366455078125, -1.363006591796875, -1.28936767578125, -1.215728759765625, -1.14208984375, -1.068450927734375, -0.99481201171875, -0.921173095703125, -0.8475341796875, -0.773895263671875, -0.70025634765625, -0.626617431640625, -0.552978515625, -0.479339599609375, -0.40570068359375, -0.332061767578125, -0.2584228515625, -0.184783935546875, -0.11114501953125, -0.037506103515625, 0.0361328125, 0.109771728515625, 0.18341064453125, 0.257049560546875, 0.3306884765625, 0.404327392578125, 0.47796630859375, 0.551605224609375, 0.625244140625, 0.698883056640625, 0.77252197265625, 0.846160888671875, 0.9197998046875, 0.993438720703125, 1.06707763671875, 1.140716552734375, 1.21435546875, 1.287994384765625, 1.36163330078125, 1.435272216796875, 1.5089111328125, 1.582550048828125, 1.65618896484375, 1.729827880859375, 1.803466796875, 1.877105712890625, 1.95074462890625, 2.024383544921875, 2.0980224609375, 2.171661376953125, 2.24530029296875, 2.318939208984375, 2.392578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 0.0, 4.0, 7.0, 6.0, 8.0, 13.0, 17.0, 17.0, 15.0, 23.0, 17.0, 31.0, 43.0, 49.0, 38.0, 55.0, 52.0, 58.0, 52.0, 51.0, 49.0, 60.0, 51.0, 43.0, 32.0, 37.0, 29.0, 19.0, 24.0, 19.0, 15.0, 19.0, 6.0, 5.0, 7.0, 5.0, 5.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00028896331787109375, -0.0002809111028909683, -0.0002728588879108429, -0.00026480667293071747, -0.00025675445795059204, -0.0002487022429704666, -0.0002406500279903412, -0.00023259781301021576, -0.00022454559803009033, -0.0002164933830499649, -0.00020844116806983948, -0.00020038895308971405, -0.00019233673810958862, -0.0001842845231294632, -0.00017623230814933777, -0.00016818009316921234, -0.00016012787818908691, -0.0001520756632089615, -0.00014402344822883606, -0.00013597123324871063, -0.0001279190182685852, -0.00011986680328845978, -0.00011181458830833435, -0.00010376237332820892, -9.57101583480835e-05, -8.765794336795807e-05, -7.960572838783264e-05, -7.155351340770721e-05, -6.350129842758179e-05, -5.544908344745636e-05, -4.739686846733093e-05, -3.9344653487205505e-05, -3.129243850708008e-05, -2.324022352695465e-05, -1.5188008546829224e-05, -7.135793566703796e-06, 9.164214134216309e-07, 8.968636393547058e-06, 1.7020851373672485e-05, 2.5073066353797913e-05, 3.312528133392334e-05, 4.117749631404877e-05, 4.9229711294174194e-05, 5.728192627429962e-05, 6.533414125442505e-05, 7.338635623455048e-05, 8.14385712146759e-05, 8.949078619480133e-05, 9.754300117492676e-05, 0.00010559521615505219, 0.00011364743113517761, 0.00012169964611530304, 0.00012975186109542847, 0.0001378040760755539, 0.00014585629105567932, 0.00015390850603580475, 0.00016196072101593018, 0.0001700129359960556, 0.00017806515097618103, 0.00018611736595630646, 0.00019416958093643188, 0.0002022217959165573, 0.00021027401089668274, 0.00021832622587680817, 0.0002263784408569336]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 8.0, 7.0, 13.0, 20.0, 27.0, 32.0, 52.0, 122.0, 159.0, 294.0, 493.0, 747.0, 1344.0, 2491.0, 4545.0, 8875.0, 17066.0, 32258.0, 59591.0, 100759.0, 148457.0, 180638.0, 172080.0, 131677.0, 84037.0, 48319.0, 25759.0, 13268.0, 6947.0, 3715.0, 2032.0, 1116.0, 686.0, 343.0, 232.0, 117.0, 93.0, 51.0, 30.0, 21.0, 14.0, 9.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.296051025390625, -3.19561767578125, -3.095184326171875, -2.9947509765625, -2.894317626953125, -2.79388427734375, -2.693450927734375, -2.593017578125, -2.492584228515625, -2.39215087890625, -2.291717529296875, -2.1912841796875, -2.090850830078125, -1.99041748046875, -1.889984130859375, -1.78955078125, -1.689117431640625, -1.58868408203125, -1.488250732421875, -1.3878173828125, -1.287384033203125, -1.18695068359375, -1.086517333984375, -0.986083984375, -0.885650634765625, -0.78521728515625, -0.684783935546875, -0.5843505859375, -0.483917236328125, -0.38348388671875, -0.283050537109375, -0.1826171875, -0.082183837890625, 0.01824951171875, 0.118682861328125, 0.2191162109375, 0.319549560546875, 0.41998291015625, 0.520416259765625, 0.620849609375, 0.721282958984375, 0.82171630859375, 0.922149658203125, 1.0225830078125, 1.123016357421875, 1.22344970703125, 1.323883056640625, 1.42431640625, 1.524749755859375, 1.62518310546875, 1.725616455078125, 1.8260498046875, 1.926483154296875, 2.02691650390625, 2.127349853515625, 2.227783203125, 2.328216552734375, 2.42864990234375, 2.529083251953125, 2.6295166015625, 2.729949951171875, 2.83038330078125, 2.930816650390625, 3.03125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 14.0, 23.0, 12.0, 18.0, 30.0, 30.0, 47.0, 43.0, 45.0, 68.0, 60.0, 57.0, 63.0, 57.0, 59.0, 56.0, 55.0, 54.0, 35.0, 26.0, 33.0, 16.0, 20.0, 14.0, 12.0, 6.0, 10.0, 6.0, 3.0, 8.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.3660430908203125, -1.327789306640625, -1.2895355224609375, -1.25128173828125, -1.2130279541015625, -1.174774169921875, -1.1365203857421875, -1.0982666015625, -1.0600128173828125, -1.021759033203125, -0.9835052490234375, -0.94525146484375, -0.9069976806640625, -0.868743896484375, -0.8304901123046875, -0.792236328125, -0.7539825439453125, -0.715728759765625, -0.6774749755859375, -0.63922119140625, -0.6009674072265625, -0.562713623046875, -0.5244598388671875, -0.4862060546875, -0.4479522705078125, -0.409698486328125, -0.3714447021484375, -0.33319091796875, -0.2949371337890625, -0.256683349609375, -0.2184295654296875, -0.18017578125, -0.1419219970703125, -0.103668212890625, -0.0654144287109375, -0.02716064453125, 0.0110931396484375, 0.049346923828125, 0.0876007080078125, 0.1258544921875, 0.1641082763671875, 0.202362060546875, 0.2406158447265625, 0.27886962890625, 0.3171234130859375, 0.355377197265625, 0.3936309814453125, 0.431884765625, 0.4701385498046875, 0.508392333984375, 0.5466461181640625, 0.58489990234375, 0.6231536865234375, 0.661407470703125, 0.6996612548828125, 0.7379150390625, 0.7761688232421875, 0.814422607421875, 0.8526763916015625, 0.89093017578125, 0.9291839599609375, 0.967437744140625, 1.0056915283203125, 1.0439453125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 4.0, 9.0, 6.0, 18.0, 16.0, 30.0, 23.0, 21.0, 29.0, 36.0, 43.0, 38.0, 33.0, 38.0, 45.0, 44.0, 45.0, 43.0, 42.0, 44.0, 44.0, 17.0, 29.0, 34.0, 37.0, 26.0, 39.0, 13.0, 20.0, 20.0, 15.0, 11.0, 6.0, 10.0, 13.0, 7.0, 5.0, 4.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0], "bins": [-7.390832424163818, -7.167598247528076, -6.944364547729492, -6.72113037109375, -6.497896194458008, -6.274662017822266, -6.051428318023682, -5.8281941413879395, -5.6049604415893555, -5.381726264953613, -5.158492565155029, -4.935258388519287, -4.712024211883545, -4.488790512084961, -4.265556335449219, -4.042322158813477, -3.8190879821777344, -3.5958540439605713, -3.372619867324829, -3.149385929107666, -2.926151752471924, -2.7029178142547607, -2.4796838760375977, -2.2564496994018555, -2.0332157611846924, -1.8099817037582397, -1.586747646331787, -1.363513708114624, -1.1402796506881714, -0.9170455932617188, -0.6938116550445557, -0.470577597618103, -0.2473435401916504, -0.02410951256752014, 0.1991245150566101, 0.42235851287841797, 0.6455925703048706, 0.8688266277313232, 1.0920605659484863, 1.315294623374939, 1.5385286808013916, 1.7617627382278442, 1.9849967956542969, 2.20823073387146, 2.431464672088623, 2.6546988487243652, 2.8779327869415283, 3.1011667251586914, 3.3244009017944336, 3.5476348400115967, 3.770869016647339, 3.994102954864502, 4.217337131500244, 4.440570831298828, 4.66380500793457, 4.8870391845703125, 5.110273361206055, 5.333507537841797, 5.556741237640381, 5.779975414276123, 6.003209590911865, 6.226443290710449, 6.449677467346191, 6.672911643981934, 6.896145343780518]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 11.0, 12.0, 9.0, 20.0, 9.0, 21.0, 20.0, 27.0, 21.0, 29.0, 22.0, 19.0, 30.0, 30.0, 40.0, 54.0, 38.0, 54.0, 48.0, 32.0, 37.0, 38.0, 39.0, 33.0, 44.0, 33.0, 31.0, 27.0, 23.0, 27.0, 17.0, 17.0, 24.0, 15.0, 9.0, 8.0, 6.0, 4.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.792431354522705, -7.530953407287598, -7.26947546005249, -7.007997512817383, -6.746520042419434, -6.485042095184326, -6.223564147949219, -5.962086200714111, -5.700608253479004, -5.4391303062438965, -5.177652359008789, -4.91617488861084, -4.654696941375732, -4.393218994140625, -4.131741046905518, -3.87026309967041, -3.608785629272461, -3.3473076820373535, -3.085829973220825, -2.8243520259857178, -2.5628743171691895, -2.301396369934082, -2.0399184226989746, -1.7784405946731567, -1.5169627666473389, -1.255484938621521, -0.9940070509910583, -0.7325291633605957, -0.47105133533477783, -0.20957350730895996, 0.05190443992614746, 0.31338226795196533, 0.5748605728149414, 0.8363384008407593, 1.0978162288665771, 1.3592941761016846, 1.6207720041275024, 1.8822498321533203, 2.1437277793884277, 2.405205726623535, 2.6666834354400635, 2.928161382675171, 3.189639091491699, 3.4511170387268066, 3.712594985961914, 3.9740726947784424, 4.235550880432129, 4.497028350830078, 4.7585062980651855, 5.019984245300293, 5.2814621925354, 5.542940139770508, 5.804417610168457, 6.0658955574035645, 6.327373504638672, 6.588851451873779, 6.850329399108887, 7.111807346343994, 7.373285293579102, 7.634762763977051, 7.896240711212158, 8.157718658447266, 8.419197082519531, 8.68067455291748, 8.94215202331543]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 6.0, 8.0, 14.0, 29.0, 39.0, 58.0, 109.0, 161.0, 256.0, 419.0, 711.0, 1110.0, 2024.0, 3678.0, 6984.0, 13523.0, 27632.0, 60126.0, 131351.0, 281410.0, 533054.0, 808181.0, 886019.0, 683525.0, 396494.0, 192249.0, 86834.0, 39473.0, 18392.0, 9127.0, 4844.0, 2706.0, 1384.0, 900.0, 536.0, 316.0, 223.0, 141.0, 92.0, 50.0, 40.0, 14.0, 13.0, 9.0, 5.0, 11.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.48828125, -7.23223876953125, -6.9761962890625, -6.72015380859375, -6.464111328125, -6.20806884765625, -5.9520263671875, -5.69598388671875, -5.43994140625, -5.18389892578125, -4.9278564453125, -4.67181396484375, -4.415771484375, -4.15972900390625, -3.9036865234375, -3.64764404296875, -3.3916015625, -3.13555908203125, -2.8795166015625, -2.62347412109375, -2.367431640625, -2.11138916015625, -1.8553466796875, -1.59930419921875, -1.34326171875, -1.08721923828125, -0.8311767578125, -0.57513427734375, -0.319091796875, -0.06304931640625, 0.1929931640625, 0.44903564453125, 0.705078125, 0.96112060546875, 1.2171630859375, 1.47320556640625, 1.729248046875, 1.98529052734375, 2.2413330078125, 2.49737548828125, 2.75341796875, 3.00946044921875, 3.2655029296875, 3.52154541015625, 3.777587890625, 4.03363037109375, 4.2896728515625, 4.54571533203125, 4.8017578125, 5.05780029296875, 5.3138427734375, 5.56988525390625, 5.825927734375, 6.08197021484375, 6.3380126953125, 6.59405517578125, 6.85009765625, 7.10614013671875, 7.3621826171875, 7.61822509765625, 7.874267578125, 8.13031005859375, 8.3863525390625, 8.64239501953125, 8.8984375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 7.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 9.0, 15.0, 10.0, 17.0, 13.0, 11.0, 25.0, 22.0, 34.0, 26.0, 19.0, 22.0, 38.0, 30.0, 43.0, 39.0, 42.0, 49.0, 41.0, 37.0, 39.0, 42.0, 40.0, 44.0, 35.0, 34.0, 29.0, 21.0, 22.0, 18.0, 20.0, 18.0, 12.0, 14.0, 13.0, 15.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.7578125, -6.52996826171875, -6.3021240234375, -6.07427978515625, -5.846435546875, -5.61859130859375, -5.3907470703125, -5.16290283203125, -4.93505859375, -4.70721435546875, -4.4793701171875, -4.25152587890625, -4.023681640625, -3.79583740234375, -3.5679931640625, -3.34014892578125, -3.1123046875, -2.88446044921875, -2.6566162109375, -2.42877197265625, -2.200927734375, -1.97308349609375, -1.7452392578125, -1.51739501953125, -1.28955078125, -1.06170654296875, -0.8338623046875, -0.60601806640625, -0.378173828125, -0.15032958984375, 0.0775146484375, 0.30535888671875, 0.533203125, 0.76104736328125, 0.9888916015625, 1.21673583984375, 1.444580078125, 1.67242431640625, 1.9002685546875, 2.12811279296875, 2.35595703125, 2.58380126953125, 2.8116455078125, 3.03948974609375, 3.267333984375, 3.49517822265625, 3.7230224609375, 3.95086669921875, 4.1787109375, 4.40655517578125, 4.6343994140625, 4.86224365234375, 5.090087890625, 5.31793212890625, 5.5457763671875, 5.77362060546875, 6.00146484375, 6.22930908203125, 6.4571533203125, 6.68499755859375, 6.912841796875, 7.14068603515625, 7.3685302734375, 7.59637451171875, 7.82421875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 13.0, 14.0, 21.0, 27.0, 70.0, 95.0, 135.0, 227.0, 378.0, 630.0, 1099.0, 1895.0, 3469.0, 6430.0, 12566.0, 25074.0, 52920.0, 112497.0, 235199.0, 460990.0, 754804.0, 903459.0, 740642.0, 446039.0, 226520.0, 108101.0, 50596.0, 24395.0, 12039.0, 6180.0, 3323.0, 1824.0, 1095.0, 597.0, 337.0, 211.0, 127.0, 72.0, 59.0, 35.0, 14.0, 19.0, 15.0, 5.0, 9.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.19580078125, -8.8837890625, -8.57177734375, -8.259765625, -7.94775390625, -7.6357421875, -7.32373046875, -7.01171875, -6.69970703125, -6.3876953125, -6.07568359375, -5.763671875, -5.45166015625, -5.1396484375, -4.82763671875, -4.515625, -4.20361328125, -3.8916015625, -3.57958984375, -3.267578125, -2.95556640625, -2.6435546875, -2.33154296875, -2.01953125, -1.70751953125, -1.3955078125, -1.08349609375, -0.771484375, -0.45947265625, -0.1474609375, 0.16455078125, 0.4765625, 0.78857421875, 1.1005859375, 1.41259765625, 1.724609375, 2.03662109375, 2.3486328125, 2.66064453125, 2.97265625, 3.28466796875, 3.5966796875, 3.90869140625, 4.220703125, 4.53271484375, 4.8447265625, 5.15673828125, 5.46875, 5.78076171875, 6.0927734375, 6.40478515625, 6.716796875, 7.02880859375, 7.3408203125, 7.65283203125, 7.96484375, 8.27685546875, 8.5888671875, 8.90087890625, 9.212890625, 9.52490234375, 9.8369140625, 10.14892578125, 10.4609375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 22.0, 27.0, 36.0, 51.0, 75.0, 103.0, 115.0, 149.0, 165.0, 236.0, 260.0, 254.0, 286.0, 312.0, 318.0, 271.0, 242.0, 250.0, 173.0, 178.0, 130.0, 89.0, 82.0, 73.0, 41.0, 34.0, 35.0, 15.0, 13.0, 4.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8551025390625, -2.729736328125, -2.6043701171875, -2.47900390625, -2.3536376953125, -2.228271484375, -2.1029052734375, -1.9775390625, -1.8521728515625, -1.726806640625, -1.6014404296875, -1.47607421875, -1.3507080078125, -1.225341796875, -1.0999755859375, -0.974609375, -0.8492431640625, -0.723876953125, -0.5985107421875, -0.47314453125, -0.3477783203125, -0.222412109375, -0.0970458984375, 0.0283203125, 0.1536865234375, 0.279052734375, 0.4044189453125, 0.52978515625, 0.6551513671875, 0.780517578125, 0.9058837890625, 1.03125, 1.1566162109375, 1.281982421875, 1.4073486328125, 1.53271484375, 1.6580810546875, 1.783447265625, 1.9088134765625, 2.0341796875, 2.1595458984375, 2.284912109375, 2.4102783203125, 2.53564453125, 2.6610107421875, 2.786376953125, 2.9117431640625, 3.037109375, 3.1624755859375, 3.287841796875, 3.4132080078125, 3.53857421875, 3.6639404296875, 3.789306640625, 3.9146728515625, 4.0400390625, 4.1654052734375, 4.290771484375, 4.4161376953125, 4.54150390625, 4.6668701171875, 4.792236328125, 4.9176025390625, 5.04296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 2.0, 1.0, 5.0, 12.0, 6.0, 10.0, 10.0, 14.0, 12.0, 13.0, 26.0, 24.0, 23.0, 28.0, 38.0, 32.0, 45.0, 35.0, 37.0, 41.0, 53.0, 35.0, 50.0, 46.0, 40.0, 38.0, 29.0, 36.0, 34.0, 27.0, 21.0, 22.0, 26.0, 15.0, 15.0, 16.0, 12.0, 16.0, 7.0, 8.0, 6.0, 5.0, 11.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-7.569426536560059, -7.347121238708496, -7.124815940856934, -6.902510643005371, -6.68020486831665, -6.457899570465088, -6.235594272613525, -6.013288974761963, -5.790983200073242, -5.56867790222168, -5.346372604370117, -5.124067306518555, -4.901761531829834, -4.6794562339782715, -4.457150936126709, -4.2348456382751465, -4.012540340423584, -3.7902350425720215, -3.56792950630188, -3.3456242084503174, -3.123318672180176, -2.9010133743286133, -2.678708076477051, -2.4564027786254883, -2.2340972423553467, -2.011791944503784, -1.7894864082336426, -1.56718111038208, -1.344875693321228, -1.122570276260376, -0.9002649784088135, -0.6779595613479614, -0.4556546211242676, -0.23334923386573792, -0.011043846607208252, 0.21126151084899902, 0.4335669279098511, 0.6558723449707031, 0.8781776428222656, 1.1004830598831177, 1.3227884769439697, 1.5450938940048218, 1.7673993110656738, 1.9897046089172363, 2.212009906768799, 2.4343154430389404, 2.656620740890503, 2.8789262771606445, 3.101231575012207, 3.3235368728637695, 3.545842409133911, 3.7681477069854736, 3.9904532432556152, 4.212758541107178, 4.43506383895874, 4.657369136810303, 4.879674911499023, 5.101980209350586, 5.324285507202148, 5.546590805053711, 5.768896579742432, 5.991201877593994, 6.213507175445557, 6.435812473297119, 6.658117771148682]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 3.0, 11.0, 16.0, 26.0, 11.0, 21.0, 24.0, 19.0, 23.0, 24.0, 33.0, 42.0, 37.0, 43.0, 39.0, 47.0, 45.0, 39.0, 57.0, 41.0, 45.0, 33.0, 32.0, 40.0, 32.0, 30.0, 28.0, 26.0, 19.0, 19.0, 16.0, 19.0, 8.0, 11.0, 8.0, 5.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.914515018463135, -7.643177509307861, -7.371840000152588, -7.1005024909973145, -6.829165458679199, -6.557827949523926, -6.286490440368652, -6.015152931213379, -5.7438154220581055, -5.472477912902832, -5.201140403747559, -4.929802894592285, -4.658465385437012, -4.387127876281738, -4.115790843963623, -3.8444533348083496, -3.573115825653076, -3.3017783164978027, -3.0304408073425293, -2.759103536605835, -2.4877660274505615, -2.216428518295288, -1.9450911283493042, -1.6737537384033203, -1.4024162292480469, -1.1310787200927734, -0.8597413301467896, -0.5884038805961609, -0.3170664310455322, -0.04572892189025879, 0.2256084680557251, 0.496945858001709, 0.7682838439941406, 1.039621353149414, 1.310958743095398, 1.5822961330413818, 1.8536336421966553, 2.1249711513519287, 2.396308422088623, 2.6676459312438965, 2.93898344039917, 3.2103209495544434, 3.481658458709717, 3.752995729446411, 4.0243330001831055, 4.295670509338379, 4.567008018493652, 4.838345527648926, 5.109683036804199, 5.381020545959473, 5.652358055114746, 5.9236955642700195, 6.195033073425293, 6.466370582580566, 6.737707614898682, 7.009045124053955, 7.2803826332092285, 7.551720142364502, 7.823057651519775, 8.09439468383789, 8.365732192993164, 8.637069702148438, 8.908407211303711, 9.179744720458984, 9.451082229614258]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 6.0, 10.0, 18.0, 23.0, 39.0, 64.0, 59.0, 77.0, 127.0, 192.0, 301.0, 460.0, 770.0, 1148.0, 2076.0, 3715.0, 7054.0, 14424.0, 29795.0, 61806.0, 118196.0, 190944.0, 224096.0, 178326.0, 106339.0, 54448.0, 26541.0, 12812.0, 6435.0, 3409.0, 1797.0, 1114.0, 648.0, 423.0, 297.0, 165.0, 125.0, 82.0, 48.0, 39.0, 40.0, 21.0, 14.0, 6.0, 7.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.2093505859375, -2.131591796875, -2.0538330078125, -1.97607421875, -1.8983154296875, -1.820556640625, -1.7427978515625, -1.6650390625, -1.5872802734375, -1.509521484375, -1.4317626953125, -1.35400390625, -1.2762451171875, -1.198486328125, -1.1207275390625, -1.04296875, -0.9652099609375, -0.887451171875, -0.8096923828125, -0.73193359375, -0.6541748046875, -0.576416015625, -0.4986572265625, -0.4208984375, -0.3431396484375, -0.265380859375, -0.1876220703125, -0.10986328125, -0.0321044921875, 0.045654296875, 0.1234130859375, 0.201171875, 0.2789306640625, 0.356689453125, 0.4344482421875, 0.51220703125, 0.5899658203125, 0.667724609375, 0.7454833984375, 0.8232421875, 0.9010009765625, 0.978759765625, 1.0565185546875, 1.13427734375, 1.2120361328125, 1.289794921875, 1.3675537109375, 1.4453125, 1.5230712890625, 1.600830078125, 1.6785888671875, 1.75634765625, 1.8341064453125, 1.911865234375, 1.9896240234375, 2.0673828125, 2.1451416015625, 2.222900390625, 2.3006591796875, 2.37841796875, 2.4561767578125, 2.533935546875, 2.6116943359375, 2.689453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 8.0, 5.0, 5.0, 14.0, 9.0, 18.0, 14.0, 25.0, 22.0, 29.0, 35.0, 28.0, 30.0, 38.0, 40.0, 44.0, 54.0, 40.0, 53.0, 56.0, 40.0, 39.0, 57.0, 39.0, 33.0, 30.0, 39.0, 32.0, 26.0, 21.0, 22.0, 9.0, 11.0, 10.0, 5.0, 8.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.048583984375, -7.74560546875, -7.442626953125, -7.1396484375, -6.836669921875, -6.53369140625, -6.230712890625, -5.927734375, -5.624755859375, -5.32177734375, -5.018798828125, -4.7158203125, -4.412841796875, -4.10986328125, -3.806884765625, -3.50390625, -3.200927734375, -2.89794921875, -2.594970703125, -2.2919921875, -1.989013671875, -1.68603515625, -1.383056640625, -1.080078125, -0.777099609375, -0.47412109375, -0.171142578125, 0.1318359375, 0.434814453125, 0.73779296875, 1.040771484375, 1.34375, 1.646728515625, 1.94970703125, 2.252685546875, 2.5556640625, 2.858642578125, 3.16162109375, 3.464599609375, 3.767578125, 4.070556640625, 4.37353515625, 4.676513671875, 4.9794921875, 5.282470703125, 5.58544921875, 5.888427734375, 6.19140625, 6.494384765625, 6.79736328125, 7.100341796875, 7.4033203125, 7.706298828125, 8.00927734375, 8.312255859375, 8.615234375, 8.918212890625, 9.22119140625, 9.524169921875, 9.8271484375, 10.130126953125, 10.43310546875, 10.736083984375, 11.0390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 6.0, 7.0, 3.0, 10.0, 18.0, 19.0, 28.0, 26.0, 29.0, 43.0, 76.0, 79.0, 112.0, 178.0, 277.0, 460.0, 867.0, 1823.0, 4401.0, 12210.0, 40183.0, 878208.0, 79611.0, 18338.0, 6271.0, 2447.0, 1124.0, 622.0, 325.0, 208.0, 148.0, 110.0, 70.0, 39.0, 39.0, 27.0, 19.0, 21.0, 15.0, 12.0, 0.0, 3.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.546875, -9.2357177734375, -8.924560546875, -8.6134033203125, -8.30224609375, -7.9910888671875, -7.679931640625, -7.3687744140625, -7.0576171875, -6.7464599609375, -6.435302734375, -6.1241455078125, -5.81298828125, -5.5018310546875, -5.190673828125, -4.8795166015625, -4.568359375, -4.2572021484375, -3.946044921875, -3.6348876953125, -3.32373046875, -3.0125732421875, -2.701416015625, -2.3902587890625, -2.0791015625, -1.7679443359375, -1.456787109375, -1.1456298828125, -0.83447265625, -0.5233154296875, -0.212158203125, 0.0989990234375, 0.41015625, 0.7213134765625, 1.032470703125, 1.3436279296875, 1.65478515625, 1.9659423828125, 2.277099609375, 2.5882568359375, 2.8994140625, 3.2105712890625, 3.521728515625, 3.8328857421875, 4.14404296875, 4.4552001953125, 4.766357421875, 5.0775146484375, 5.388671875, 5.6998291015625, 6.010986328125, 6.3221435546875, 6.63330078125, 6.9444580078125, 7.255615234375, 7.5667724609375, 7.8779296875, 8.1890869140625, 8.500244140625, 8.8114013671875, 9.12255859375, 9.4337158203125, 9.744873046875, 10.0560302734375, 10.3671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 7.0, 7.0, 8.0, 6.0, 8.0, 7.0, 16.0, 17.0, 14.0, 19.0, 24.0, 28.0, 37.0, 32.0, 36.0, 38.0, 43.0, 32.0, 45.0, 47.0, 36.0, 41.0, 32.0, 37.0, 39.0, 37.0, 36.0, 31.0, 30.0, 37.0, 37.0, 19.0, 19.0, 25.0, 11.0, 11.0, 16.0, 7.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-6.92578125, -6.73712158203125, -6.5484619140625, -6.35980224609375, -6.171142578125, -5.98248291015625, -5.7938232421875, -5.60516357421875, -5.41650390625, -5.22784423828125, -5.0391845703125, -4.85052490234375, -4.661865234375, -4.47320556640625, -4.2845458984375, -4.09588623046875, -3.9072265625, -3.71856689453125, -3.5299072265625, -3.34124755859375, -3.152587890625, -2.96392822265625, -2.7752685546875, -2.58660888671875, -2.39794921875, -2.20928955078125, -2.0206298828125, -1.83197021484375, -1.643310546875, -1.45465087890625, -1.2659912109375, -1.07733154296875, -0.888671875, -0.70001220703125, -0.5113525390625, -0.32269287109375, -0.134033203125, 0.05462646484375, 0.2432861328125, 0.43194580078125, 0.62060546875, 0.80926513671875, 0.9979248046875, 1.18658447265625, 1.375244140625, 1.56390380859375, 1.7525634765625, 1.94122314453125, 2.1298828125, 2.31854248046875, 2.5072021484375, 2.69586181640625, 2.884521484375, 3.07318115234375, 3.2618408203125, 3.45050048828125, 3.63916015625, 3.82781982421875, 4.0164794921875, 4.20513916015625, 4.393798828125, 4.58245849609375, 4.7711181640625, 4.95977783203125, 5.1484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 4.0, 7.0, 5.0, 11.0, 11.0, 11.0, 14.0, 22.0, 37.0, 48.0, 113.0, 167.0, 313.0, 681.0, 1711.0, 6541.0, 41914.0, 952709.0, 35389.0, 5730.0, 1637.0, 620.0, 333.0, 188.0, 115.0, 54.0, 42.0, 31.0, 23.0, 12.0, 14.0, 10.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6986541748046875, -1.646331787109375, -1.5940093994140625, -1.54168701171875, -1.4893646240234375, -1.437042236328125, -1.3847198486328125, -1.3323974609375, -1.2800750732421875, -1.227752685546875, -1.1754302978515625, -1.12310791015625, -1.0707855224609375, -1.018463134765625, -0.9661407470703125, -0.913818359375, -0.8614959716796875, -0.809173583984375, -0.7568511962890625, -0.70452880859375, -0.6522064208984375, -0.599884033203125, -0.5475616455078125, -0.4952392578125, -0.4429168701171875, -0.390594482421875, -0.3382720947265625, -0.28594970703125, -0.2336273193359375, -0.181304931640625, -0.1289825439453125, -0.07666015625, -0.0243377685546875, 0.027984619140625, 0.0803070068359375, 0.13262939453125, 0.1849517822265625, 0.237274169921875, 0.2895965576171875, 0.3419189453125, 0.3942413330078125, 0.446563720703125, 0.4988861083984375, 0.55120849609375, 0.6035308837890625, 0.655853271484375, 0.7081756591796875, 0.760498046875, 0.8128204345703125, 0.865142822265625, 0.9174652099609375, 0.96978759765625, 1.0221099853515625, 1.074432373046875, 1.1267547607421875, 1.1790771484375, 1.2313995361328125, 1.283721923828125, 1.3360443115234375, 1.38836669921875, 1.4406890869140625, 1.493011474609375, 1.5453338623046875, 1.59765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 11.0, 18.0, 16.0, 30.0, 34.0, 41.0, 49.0, 77.0, 78.0, 81.0, 79.0, 111.0, 84.0, 70.0, 46.0, 39.0, 23.0, 17.0, 17.0, 11.0, 10.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9385089874267578e-05, -2.7992762625217438e-05, -2.6600435376167297e-05, -2.5208108127117157e-05, -2.3815780878067017e-05, -2.2423453629016876e-05, -2.1031126379966736e-05, -1.9638799130916595e-05, -1.8246471881866455e-05, -1.6854144632816315e-05, -1.5461817383766174e-05, -1.4069490134716034e-05, -1.2677162885665894e-05, -1.1284835636615753e-05, -9.892508387565613e-06, -8.500181138515472e-06, -7.107853889465332e-06, -5.715526640415192e-06, -4.323199391365051e-06, -2.930872142314911e-06, -1.5385448932647705e-06, -1.4621764421463013e-07, 1.2461096048355103e-06, 2.6384368538856506e-06, 4.030764102935791e-06, 5.423091351985931e-06, 6.815418601036072e-06, 8.207745850086212e-06, 9.600073099136353e-06, 1.0992400348186493e-05, 1.2384727597236633e-05, 1.3777054846286774e-05, 1.5169382095336914e-05, 1.6561709344387054e-05, 1.7954036593437195e-05, 1.9346363842487335e-05, 2.0738691091537476e-05, 2.2131018340587616e-05, 2.3523345589637756e-05, 2.4915672838687897e-05, 2.6308000087738037e-05, 2.7700327336788177e-05, 2.9092654585838318e-05, 3.0484981834888458e-05, 3.18773090839386e-05, 3.326963633298874e-05, 3.466196358203888e-05, 3.605429083108902e-05, 3.744661808013916e-05, 3.88389453291893e-05, 4.023127257823944e-05, 4.162359982728958e-05, 4.301592707633972e-05, 4.440825432538986e-05, 4.580058157444e-05, 4.719290882349014e-05, 4.858523607254028e-05, 4.9977563321590424e-05, 5.1369890570640564e-05, 5.2762217819690704e-05, 5.4154545068740845e-05, 5.5546872317790985e-05, 5.6939199566841125e-05, 5.8331526815891266e-05, 5.9723854064941406e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 2.0, 7.0, 7.0, 10.0, 14.0, 18.0, 35.0, 42.0, 59.0, 91.0, 109.0, 163.0, 190.0, 269.0, 388.0, 507.0, 733.0, 915.0, 1320.0, 1876.0, 2855.0, 4994.0, 9640.0, 23523.0, 76717.0, 294025.0, 420513.0, 140432.0, 37269.0, 13790.0, 6540.0, 3666.0, 2343.0, 1527.0, 1114.0, 767.0, 584.0, 416.0, 306.0, 227.0, 157.0, 111.0, 87.0, 54.0, 41.0, 26.0, 22.0, 19.0, 11.0, 12.0, 3.0, 6.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.3876953125, -1.3446197509765625, -1.301544189453125, -1.2584686279296875, -1.21539306640625, -1.1723175048828125, -1.129241943359375, -1.0861663818359375, -1.0430908203125, -1.0000152587890625, -0.956939697265625, -0.9138641357421875, -0.87078857421875, -0.8277130126953125, -0.784637451171875, -0.7415618896484375, -0.698486328125, -0.6554107666015625, -0.612335205078125, -0.5692596435546875, -0.52618408203125, -0.4831085205078125, -0.440032958984375, -0.3969573974609375, -0.3538818359375, -0.3108062744140625, -0.267730712890625, -0.2246551513671875, -0.18157958984375, -0.1385040283203125, -0.095428466796875, -0.0523529052734375, -0.00927734375, 0.0337982177734375, 0.076873779296875, 0.1199493408203125, 0.16302490234375, 0.2061004638671875, 0.249176025390625, 0.2922515869140625, 0.3353271484375, 0.3784027099609375, 0.421478271484375, 0.4645538330078125, 0.50762939453125, 0.5507049560546875, 0.593780517578125, 0.6368560791015625, 0.679931640625, 0.7230072021484375, 0.766082763671875, 0.8091583251953125, 0.85223388671875, 0.8953094482421875, 0.938385009765625, 0.9814605712890625, 1.0245361328125, 1.0676116943359375, 1.110687255859375, 1.1537628173828125, 1.19683837890625, 1.2399139404296875, 1.282989501953125, 1.3260650634765625, 1.369140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 13.0, 17.0, 18.0, 32.0, 60.0, 81.0, 110.0, 152.0, 164.0, 100.0, 72.0, 51.0, 36.0, 28.0, 12.0, 11.0, 7.0, 6.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.4203338623046875, -0.406341552734375, -0.3923492431640625, -0.37835693359375, -0.3643646240234375, -0.350372314453125, -0.3363800048828125, -0.3223876953125, -0.3083953857421875, -0.294403076171875, -0.2804107666015625, -0.26641845703125, -0.2524261474609375, -0.238433837890625, -0.2244415283203125, -0.21044921875, -0.1964569091796875, -0.182464599609375, -0.1684722900390625, -0.15447998046875, -0.1404876708984375, -0.126495361328125, -0.1125030517578125, -0.0985107421875, -0.0845184326171875, -0.070526123046875, -0.0565338134765625, -0.04254150390625, -0.0285491943359375, -0.014556884765625, -0.0005645751953125, 0.013427734375, 0.0274200439453125, 0.041412353515625, 0.0554046630859375, 0.06939697265625, 0.0833892822265625, 0.097381591796875, 0.1113739013671875, 0.1253662109375, 0.1393585205078125, 0.153350830078125, 0.1673431396484375, 0.18133544921875, 0.1953277587890625, 0.209320068359375, 0.2233123779296875, 0.2373046875, 0.2512969970703125, 0.265289306640625, 0.2792816162109375, 0.29327392578125, 0.3072662353515625, 0.321258544921875, 0.3352508544921875, 0.3492431640625, 0.3632354736328125, 0.377227783203125, 0.3912200927734375, 0.40521240234375, 0.4192047119140625, 0.433197021484375, 0.4471893310546875, 0.461181640625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 3.0, 1.0, 6.0, 7.0, 5.0, 9.0, 9.0, 16.0, 12.0, 8.0, 15.0, 24.0, 20.0, 27.0, 25.0, 25.0, 27.0, 47.0, 44.0, 39.0, 34.0, 40.0, 42.0, 45.0, 38.0, 39.0, 38.0, 42.0, 32.0, 30.0, 36.0, 19.0, 20.0, 27.0, 22.0, 19.0, 11.0, 13.0, 14.0, 10.0, 11.0, 11.0, 6.0, 6.0, 6.0, 6.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0], "bins": [-7.060250282287598, -6.849306106567383, -6.638362407684326, -6.427418231964111, -6.2164740562438965, -6.00553035736084, -5.794586181640625, -5.58364200592041, -5.372697830200195, -5.1617536544799805, -4.950809955596924, -4.739865779876709, -4.528921604156494, -4.3179779052734375, -4.107033729553223, -3.896089553833008, -3.685145854949951, -3.4742019176483154, -3.2632577419281006, -3.052313804626465, -2.84136962890625, -2.6304256916046143, -2.4194817543029785, -2.2085375785827637, -1.997593641281128, -1.7866495847702026, -1.5757055282592773, -1.3647615909576416, -1.1538175344467163, -0.942873477935791, -0.7319295406341553, -0.52098548412323, -0.3100419044494629, -0.09909787774085999, 0.11184614896774292, 0.32279014587402344, 0.5337342023849487, 0.744678258895874, 0.9556221961975098, 1.166566252708435, 1.3775103092193604, 1.5884543657302856, 1.799398422241211, 2.0103423595428467, 2.2212862968444824, 2.4322304725646973, 2.643174409866333, 2.8541183471679688, 3.0650625228881836, 3.2760064601898193, 3.486950635910034, 3.69789457321167, 3.9088387489318848, 4.119782447814941, 4.330726623535156, 4.541670799255371, 4.752614974975586, 4.963559150695801, 5.174502849578857, 5.385447025299072, 5.596391201019287, 5.807334899902344, 6.018279075622559, 6.229223251342773, 6.44016695022583]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 6.0, 2.0, 10.0, 18.0, 20.0, 15.0, 22.0, 25.0, 17.0, 18.0, 32.0, 28.0, 44.0, 33.0, 38.0, 39.0, 49.0, 42.0, 44.0, 58.0, 42.0, 43.0, 32.0, 38.0, 29.0, 40.0, 28.0, 30.0, 21.0, 28.0, 14.0, 21.0, 14.0, 11.0, 11.0, 11.0, 5.0, 3.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.914395332336426, -7.645867824554443, -7.377339839935303, -7.10881233215332, -6.84028434753418, -6.571756839752197, -6.303229331970215, -6.034701347351074, -5.766173839569092, -5.497646331787109, -5.229118347167969, -4.960590839385986, -4.692063331604004, -4.423535346984863, -4.155007839202881, -3.8864800930023193, -3.617952346801758, -3.3494246006011963, -3.0808968544006348, -2.8123693466186523, -2.543841600418091, -2.2753138542175293, -2.006786346435547, -1.7382586002349854, -1.4697308540344238, -1.2012031078338623, -0.9326754808425903, -0.6641477942466736, -0.39562010765075684, -0.1270923614501953, 0.14143526554107666, 0.40996289253234863, 0.6784915924072266, 0.9470192790031433, 1.21554696559906, 1.484074592590332, 1.7526023387908936, 2.021130084991455, 2.2896575927734375, 2.558185338973999, 2.8267130851745605, 3.095240831375122, 3.3637685775756836, 3.632296085357666, 3.9008238315582275, 4.169351577758789, 4.4378790855407715, 4.706406593322754, 4.9749345779418945, 5.243462085723877, 5.511990070343018, 5.780517578125, 6.049045562744141, 6.317573070526123, 6.5861005783081055, 6.854628562927246, 7.1231560707092285, 7.391683578491211, 7.660211563110352, 7.928739070892334, 8.197266578674316, 8.465794563293457, 8.734322547912598, 9.002849578857422, 9.271377563476562]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 5.0, 6.0, 11.0, 14.0, 20.0, 22.0, 50.0, 71.0, 112.0, 166.0, 256.0, 436.0, 623.0, 1045.0, 1686.0, 2844.0, 4554.0, 7546.0, 12279.0, 19865.0, 30689.0, 45539.0, 65179.0, 87675.0, 106927.0, 119744.0, 121949.0, 110571.0, 92902.0, 71236.0, 51126.0, 34511.0, 22693.0, 14058.0, 8598.0, 5226.0, 3162.0, 1971.0, 1219.0, 724.0, 438.0, 289.0, 168.0, 120.0, 72.0, 47.0, 40.0, 27.0, 11.0, 11.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.45703125, -5.29718017578125, -5.1373291015625, -4.97747802734375, -4.817626953125, -4.65777587890625, -4.4979248046875, -4.33807373046875, -4.17822265625, -4.01837158203125, -3.8585205078125, -3.69866943359375, -3.538818359375, -3.37896728515625, -3.2191162109375, -3.05926513671875, -2.8994140625, -2.73956298828125, -2.5797119140625, -2.41986083984375, -2.260009765625, -2.10015869140625, -1.9403076171875, -1.78045654296875, -1.62060546875, -1.46075439453125, -1.3009033203125, -1.14105224609375, -0.981201171875, -0.82135009765625, -0.6614990234375, -0.50164794921875, -0.341796875, -0.18194580078125, -0.0220947265625, 0.13775634765625, 0.297607421875, 0.45745849609375, 0.6173095703125, 0.77716064453125, 0.93701171875, 1.09686279296875, 1.2567138671875, 1.41656494140625, 1.576416015625, 1.73626708984375, 1.8961181640625, 2.05596923828125, 2.2158203125, 2.37567138671875, 2.5355224609375, 2.69537353515625, 2.855224609375, 3.01507568359375, 3.1749267578125, 3.33477783203125, 3.49462890625, 3.65447998046875, 3.8143310546875, 3.97418212890625, 4.134033203125, 4.29388427734375, 4.4537353515625, 4.61358642578125, 4.7734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 2.0, 7.0, 3.0, 7.0, 14.0, 10.0, 24.0, 18.0, 24.0, 10.0, 14.0, 23.0, 36.0, 38.0, 43.0, 43.0, 37.0, 44.0, 45.0, 45.0, 56.0, 40.0, 31.0, 37.0, 40.0, 36.0, 34.0, 41.0, 27.0, 25.0, 21.0, 20.0, 17.0, 13.0, 13.0, 17.0, 11.0, 8.0, 9.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.93359375, -7.66265869140625, -7.3917236328125, -7.12078857421875, -6.849853515625, -6.57891845703125, -6.3079833984375, -6.03704833984375, -5.76611328125, -5.49517822265625, -5.2242431640625, -4.95330810546875, -4.682373046875, -4.41143798828125, -4.1405029296875, -3.86956787109375, -3.5986328125, -3.32769775390625, -3.0567626953125, -2.78582763671875, -2.514892578125, -2.24395751953125, -1.9730224609375, -1.70208740234375, -1.43115234375, -1.16021728515625, -0.8892822265625, -0.61834716796875, -0.347412109375, -0.07647705078125, 0.1944580078125, 0.46539306640625, 0.736328125, 1.00726318359375, 1.2781982421875, 1.54913330078125, 1.820068359375, 2.09100341796875, 2.3619384765625, 2.63287353515625, 2.90380859375, 3.17474365234375, 3.4456787109375, 3.71661376953125, 3.987548828125, 4.25848388671875, 4.5294189453125, 4.80035400390625, 5.0712890625, 5.34222412109375, 5.6131591796875, 5.88409423828125, 6.155029296875, 6.42596435546875, 6.6968994140625, 6.96783447265625, 7.23876953125, 7.50970458984375, 7.7806396484375, 8.05157470703125, 8.322509765625, 8.59344482421875, 8.8643798828125, 9.13531494140625, 9.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 9.0, 20.0, 18.0, 36.0, 79.0, 108.0, 172.0, 296.0, 510.0, 829.0, 1507.0, 2558.0, 4432.0, 7536.0, 12614.0, 20767.0, 33616.0, 51511.0, 75309.0, 100413.0, 122455.0, 132887.0, 127088.0, 108754.0, 84241.0, 59404.0, 39287.0, 25010.0, 15068.0, 8968.0, 5443.0, 3186.0, 1851.0, 1086.0, 588.0, 356.0, 200.0, 138.0, 81.0, 42.0, 32.0, 15.0, 16.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.26953125, -6.0833740234375, -5.897216796875, -5.7110595703125, -5.52490234375, -5.3387451171875, -5.152587890625, -4.9664306640625, -4.7802734375, -4.5941162109375, -4.407958984375, -4.2218017578125, -4.03564453125, -3.8494873046875, -3.663330078125, -3.4771728515625, -3.291015625, -3.1048583984375, -2.918701171875, -2.7325439453125, -2.54638671875, -2.3602294921875, -2.174072265625, -1.9879150390625, -1.8017578125, -1.6156005859375, -1.429443359375, -1.2432861328125, -1.05712890625, -0.8709716796875, -0.684814453125, -0.4986572265625, -0.3125, -0.1263427734375, 0.059814453125, 0.2459716796875, 0.43212890625, 0.6182861328125, 0.804443359375, 0.9906005859375, 1.1767578125, 1.3629150390625, 1.549072265625, 1.7352294921875, 1.92138671875, 2.1075439453125, 2.293701171875, 2.4798583984375, 2.666015625, 2.8521728515625, 3.038330078125, 3.2244873046875, 3.41064453125, 3.5968017578125, 3.782958984375, 3.9691162109375, 4.1552734375, 4.3414306640625, 4.527587890625, 4.7137451171875, 4.89990234375, 5.0860595703125, 5.272216796875, 5.4583740234375, 5.64453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 4.0, 13.0, 11.0, 16.0, 8.0, 18.0, 15.0, 18.0, 17.0, 20.0, 33.0, 38.0, 32.0, 37.0, 35.0, 48.0, 43.0, 54.0, 48.0, 44.0, 41.0, 41.0, 43.0, 35.0, 32.0, 39.0, 25.0, 23.0, 27.0, 25.0, 20.0, 11.0, 15.0, 11.0, 16.0, 8.0, 9.0, 4.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.37890625, -6.20123291015625, -6.0235595703125, -5.84588623046875, -5.668212890625, -5.49053955078125, -5.3128662109375, -5.13519287109375, -4.95751953125, -4.77984619140625, -4.6021728515625, -4.42449951171875, -4.246826171875, -4.06915283203125, -3.8914794921875, -3.71380615234375, -3.5361328125, -3.35845947265625, -3.1807861328125, -3.00311279296875, -2.825439453125, -2.64776611328125, -2.4700927734375, -2.29241943359375, -2.11474609375, -1.93707275390625, -1.7593994140625, -1.58172607421875, -1.404052734375, -1.22637939453125, -1.0487060546875, -0.87103271484375, -0.693359375, -0.51568603515625, -0.3380126953125, -0.16033935546875, 0.017333984375, 0.19500732421875, 0.3726806640625, 0.55035400390625, 0.72802734375, 0.90570068359375, 1.0833740234375, 1.26104736328125, 1.438720703125, 1.61639404296875, 1.7940673828125, 1.97174072265625, 2.1494140625, 2.32708740234375, 2.5047607421875, 2.68243408203125, 2.860107421875, 3.03778076171875, 3.2154541015625, 3.39312744140625, 3.57080078125, 3.74847412109375, 3.9261474609375, 4.10382080078125, 4.281494140625, 4.45916748046875, 4.6368408203125, 4.81451416015625, 4.9921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 15.0, 8.0, 24.0, 33.0, 55.0, 73.0, 127.0, 193.0, 300.0, 538.0, 898.0, 1836.0, 3550.0, 7839.0, 17643.0, 38526.0, 80838.0, 147753.0, 210036.0, 214855.0, 156771.0, 88045.0, 42374.0, 19025.0, 8618.0, 4017.0, 1998.0, 1084.0, 569.0, 314.0, 216.0, 109.0, 73.0, 47.0, 33.0, 27.0, 15.0, 19.0, 12.0, 6.0, 9.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.00390625, -3.88970947265625, -3.7755126953125, -3.66131591796875, -3.547119140625, -3.43292236328125, -3.3187255859375, -3.20452880859375, -3.09033203125, -2.97613525390625, -2.8619384765625, -2.74774169921875, -2.633544921875, -2.51934814453125, -2.4051513671875, -2.29095458984375, -2.1767578125, -2.06256103515625, -1.9483642578125, -1.83416748046875, -1.719970703125, -1.60577392578125, -1.4915771484375, -1.37738037109375, -1.26318359375, -1.14898681640625, -1.0347900390625, -0.92059326171875, -0.806396484375, -0.69219970703125, -0.5780029296875, -0.46380615234375, -0.349609375, -0.23541259765625, -0.1212158203125, -0.00701904296875, 0.107177734375, 0.22137451171875, 0.3355712890625, 0.44976806640625, 0.56396484375, 0.67816162109375, 0.7923583984375, 0.90655517578125, 1.020751953125, 1.13494873046875, 1.2491455078125, 1.36334228515625, 1.4775390625, 1.59173583984375, 1.7059326171875, 1.82012939453125, 1.934326171875, 2.04852294921875, 2.1627197265625, 2.27691650390625, 2.39111328125, 2.50531005859375, 2.6195068359375, 2.73370361328125, 2.847900390625, 2.96209716796875, 3.0762939453125, 3.19049072265625, 3.3046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 14.0, 16.0, 24.0, 33.0, 29.0, 59.0, 42.0, 52.0, 56.0, 64.0, 82.0, 72.0, 67.0, 67.0, 53.0, 51.0, 55.0, 25.0, 24.0, 25.0, 23.0, 15.0, 7.0, 10.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031876564025878906, -0.00030779093503952026, -0.00029681622982025146, -0.00028584152460098267, -0.00027486681938171387, -0.00026389211416244507, -0.00025291740894317627, -0.00024194270372390747, -0.00023096799850463867, -0.00021999329328536987, -0.00020901858806610107, -0.00019804388284683228, -0.00018706917762756348, -0.00017609447240829468, -0.00016511976718902588, -0.00015414506196975708, -0.00014317035675048828, -0.00013219565153121948, -0.00012122094631195068, -0.00011024624109268188, -9.927153587341309e-05, -8.829683065414429e-05, -7.732212543487549e-05, -6.634742021560669e-05, -5.537271499633789e-05, -4.439800977706909e-05, -3.342330455780029e-05, -2.2448599338531494e-05, -1.1473894119262695e-05, -4.991888999938965e-07, 1.0475516319274902e-05, 2.14502215385437e-05, 3.24249267578125e-05, 4.33996319770813e-05, 5.43743371963501e-05, 6.53490424156189e-05, 7.63237476348877e-05, 8.72984528541565e-05, 9.827315807342529e-05, 0.00010924786329269409, 0.00012022256851196289, 0.0001311972737312317, 0.0001421719789505005, 0.0001531466841697693, 0.00016412138938903809, 0.00017509609460830688, 0.00018607079982757568, 0.00019704550504684448, 0.00020802021026611328, 0.00021899491548538208, 0.00022996962070465088, 0.00024094432592391968, 0.0002519190311431885, 0.0002628937363624573, 0.0002738684415817261, 0.0002848431468009949, 0.00029581785202026367, 0.00030679255723953247, 0.00031776726245880127, 0.00032874196767807007, 0.00033971667289733887, 0.00035069137811660767, 0.00036166608333587646, 0.00037264078855514526, 0.00038361549377441406]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 10.0, 18.0, 21.0, 26.0, 45.0, 76.0, 98.0, 158.0, 240.0, 381.0, 584.0, 1029.0, 1820.0, 3270.0, 6243.0, 12269.0, 24550.0, 48499.0, 90600.0, 145800.0, 191193.0, 190111.0, 144833.0, 88770.0, 47695.0, 24149.0, 12018.0, 6121.0, 3316.0, 1743.0, 1066.0, 660.0, 384.0, 274.0, 157.0, 90.0, 64.0, 61.0, 32.0, 19.0, 18.0, 10.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.552734375, -3.445037841796875, -3.33734130859375, -3.229644775390625, -3.1219482421875, -3.014251708984375, -2.90655517578125, -2.798858642578125, -2.691162109375, -2.583465576171875, -2.47576904296875, -2.368072509765625, -2.2603759765625, -2.152679443359375, -2.04498291015625, -1.937286376953125, -1.82958984375, -1.721893310546875, -1.61419677734375, -1.506500244140625, -1.3988037109375, -1.291107177734375, -1.18341064453125, -1.075714111328125, -0.968017578125, -0.860321044921875, -0.75262451171875, -0.644927978515625, -0.5372314453125, -0.429534912109375, -0.32183837890625, -0.214141845703125, -0.1064453125, 0.001251220703125, 0.10894775390625, 0.216644287109375, 0.3243408203125, 0.432037353515625, 0.53973388671875, 0.647430419921875, 0.755126953125, 0.862823486328125, 0.97052001953125, 1.078216552734375, 1.1859130859375, 1.293609619140625, 1.40130615234375, 1.509002685546875, 1.61669921875, 1.724395751953125, 1.83209228515625, 1.939788818359375, 2.0474853515625, 2.155181884765625, 2.26287841796875, 2.370574951171875, 2.478271484375, 2.585968017578125, 2.69366455078125, 2.801361083984375, 2.9090576171875, 3.016754150390625, 3.12445068359375, 3.232147216796875, 3.33984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 1.0, 9.0, 6.0, 6.0, 7.0, 4.0, 5.0, 14.0, 16.0, 14.0, 21.0, 20.0, 16.0, 24.0, 16.0, 48.0, 35.0, 27.0, 44.0, 36.0, 48.0, 48.0, 40.0, 45.0, 51.0, 46.0, 50.0, 32.0, 40.0, 33.0, 30.0, 28.0, 23.0, 18.0, 15.0, 12.0, 10.0, 13.0, 13.0, 4.0, 8.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.90185546875, -0.8736343383789062, -0.8454132080078125, -0.8171920776367188, -0.788970947265625, -0.7607498168945312, -0.7325286865234375, -0.7043075561523438, -0.67608642578125, -0.6478652954101562, -0.6196441650390625, -0.5914230346679688, -0.563201904296875, -0.5349807739257812, -0.5067596435546875, -0.47853851318359375, -0.4503173828125, -0.42209625244140625, -0.3938751220703125, -0.36565399169921875, -0.337432861328125, -0.30921173095703125, -0.2809906005859375, -0.25276947021484375, -0.22454833984375, -0.19632720947265625, -0.1681060791015625, -0.13988494873046875, -0.111663818359375, -0.08344268798828125, -0.0552215576171875, -0.02700042724609375, 0.001220703125, 0.02944183349609375, 0.0576629638671875, 0.08588409423828125, 0.114105224609375, 0.14232635498046875, 0.1705474853515625, 0.19876861572265625, 0.22698974609375, 0.25521087646484375, 0.2834320068359375, 0.31165313720703125, 0.339874267578125, 0.36809539794921875, 0.3963165283203125, 0.42453765869140625, 0.4527587890625, 0.48097991943359375, 0.5092010498046875, 0.5374221801757812, 0.565643310546875, 0.5938644409179688, 0.6220855712890625, 0.6503067016601562, 0.67852783203125, 0.7067489624023438, 0.7349700927734375, 0.7631912231445312, 0.791412353515625, 0.8196334838867188, 0.8478546142578125, 0.8760757446289062, 0.904296875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 8.0, 9.0, 8.0, 10.0, 12.0, 18.0, 16.0, 22.0, 26.0, 27.0, 28.0, 32.0, 46.0, 48.0, 44.0, 58.0, 56.0, 47.0, 54.0, 42.0, 40.0, 37.0, 34.0, 26.0, 37.0, 32.0, 19.0, 26.0, 18.0, 21.0, 16.0, 11.0, 11.0, 13.0, 11.0, 7.0, 3.0, 0.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0], "bins": [-8.940248489379883, -8.697125434875488, -8.454002380371094, -8.2108793258667, -7.967756748199463, -7.724633693695068, -7.481510639190674, -7.238387584686279, -6.995264530181885, -6.75214147567749, -6.509018421173096, -6.265895843505859, -6.022772789001465, -5.77964973449707, -5.536526679992676, -5.293403625488281, -5.050280570983887, -4.807157516479492, -4.564034461975098, -4.320911407470703, -4.077788829803467, -3.8346657752990723, -3.5915427207946777, -3.348419666290283, -3.105297088623047, -2.8621740341186523, -2.619051218032837, -2.3759281635284424, -2.132805109024048, -1.8896821737289429, -1.646559238433838, -1.4034361839294434, -1.1603131294250488, -0.9171901345252991, -0.6740671396255493, -0.43094420433044434, -0.18782120943069458, 0.055301785469055176, 0.29842472076416016, 0.5415477752685547, 0.7846707105636597, 1.0277936458587646, 1.2709167003631592, 1.5140396356582642, 1.7571625709533691, 2.0002856254577637, 2.243408679962158, 2.4865317344665527, 2.729654550552368, 2.9727776050567627, 3.215900421142578, 3.4590234756469727, 3.702146530151367, 3.9452695846557617, 4.188392639160156, 4.431515693664551, 4.674638271331787, 4.917761325836182, 5.160884380340576, 5.4040069580078125, 5.647130012512207, 5.890253067016602, 6.133376121520996, 6.376499176025391, 6.619622230529785]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 3.0, 7.0, 6.0, 12.0, 13.0, 14.0, 20.0, 11.0, 18.0, 34.0, 24.0, 38.0, 25.0, 37.0, 40.0, 43.0, 59.0, 37.0, 46.0, 48.0, 52.0, 52.0, 47.0, 39.0, 40.0, 33.0, 23.0, 28.0, 26.0, 24.0, 20.0, 14.0, 13.0, 9.0, 7.0, 10.0, 3.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.129925727844238, -8.834258079528809, -8.538590431213379, -8.24292278289795, -7.9472551345825195, -7.65158748626709, -7.355920314788818, -7.060252666473389, -6.764585018157959, -6.468917369842529, -6.1732497215271, -5.87758207321167, -5.581914901733398, -5.286247253417969, -4.990579605102539, -4.694911956787109, -4.39924430847168, -4.10357666015625, -3.8079090118408203, -3.5122416019439697, -3.21657395362854, -2.9209063053131104, -2.6252388954162598, -2.32957124710083, -2.0339035987854004, -1.7382359504699707, -1.4425684213638306, -1.1469008922576904, -0.8512332439422607, -0.555565595626831, -0.2598980665206909, 0.03576946258544922, 0.3314371109008789, 0.6271046996116638, 0.9227722883224487, 1.2184398174285889, 1.5141074657440186, 1.8097751140594482, 2.105442523956299, 2.4011101722717285, 2.696777820587158, 2.992445468902588, 3.2881131172180176, 3.583780527114868, 3.879448175430298, 4.175115585327148, 4.470783233642578, 4.766450881958008, 5.0621185302734375, 5.357786178588867, 5.653453826904297, 5.949121475219727, 6.244789123535156, 6.540456771850586, 6.836123943328857, 7.131791591644287, 7.427459239959717, 7.7231268882751465, 8.018794059753418, 8.314461708068848, 8.610129356384277, 8.905797004699707, 9.201464653015137, 9.497132301330566, 9.792799949645996]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 5.0, 13.0, 12.0, 24.0, 47.0, 73.0, 126.0, 169.0, 251.0, 368.0, 524.0, 867.0, 1331.0, 2049.0, 3288.0, 5354.0, 9176.0, 16409.0, 29807.0, 56114.0, 108532.0, 204566.0, 364165.0, 566429.0, 721924.0, 723567.0, 571226.0, 366963.0, 206365.0, 108472.0, 56298.0, 29591.0, 16144.0, 9245.0, 5341.0, 3399.0, 2051.0, 1300.0, 864.0, 590.0, 383.0, 259.0, 168.0, 146.0, 97.0, 61.0, 42.0, 34.0, 19.0, 16.0, 8.0, 5.0, 7.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-6.22265625, -6.00811767578125, -5.7935791015625, -5.57904052734375, -5.364501953125, -5.14996337890625, -4.9354248046875, -4.72088623046875, -4.50634765625, -4.29180908203125, -4.0772705078125, -3.86273193359375, -3.648193359375, -3.43365478515625, -3.2191162109375, -3.00457763671875, -2.7900390625, -2.57550048828125, -2.3609619140625, -2.14642333984375, -1.931884765625, -1.71734619140625, -1.5028076171875, -1.28826904296875, -1.07373046875, -0.85919189453125, -0.6446533203125, -0.43011474609375, -0.215576171875, -0.00103759765625, 0.2135009765625, 0.42803955078125, 0.642578125, 0.85711669921875, 1.0716552734375, 1.28619384765625, 1.500732421875, 1.71527099609375, 1.9298095703125, 2.14434814453125, 2.35888671875, 2.57342529296875, 2.7879638671875, 3.00250244140625, 3.217041015625, 3.43157958984375, 3.6461181640625, 3.86065673828125, 4.0751953125, 4.28973388671875, 4.5042724609375, 4.71881103515625, 4.933349609375, 5.14788818359375, 5.3624267578125, 5.57696533203125, 5.79150390625, 6.00604248046875, 6.2205810546875, 6.43511962890625, 6.649658203125, 6.86419677734375, 7.0787353515625, 7.29327392578125, 7.5078125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 5.0, 5.0, 13.0, 6.0, 9.0, 11.0, 19.0, 16.0, 13.0, 22.0, 22.0, 30.0, 32.0, 34.0, 47.0, 29.0, 29.0, 47.0, 43.0, 47.0, 51.0, 42.0, 41.0, 39.0, 28.0, 37.0, 40.0, 25.0, 29.0, 27.0, 24.0, 24.0, 14.0, 21.0, 17.0, 15.0, 9.0, 7.0, 3.0, 7.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0], "bins": [-8.7421875, -8.50634765625, -8.2705078125, -8.03466796875, -7.798828125, -7.56298828125, -7.3271484375, -7.09130859375, -6.85546875, -6.61962890625, -6.3837890625, -6.14794921875, -5.912109375, -5.67626953125, -5.4404296875, -5.20458984375, -4.96875, -4.73291015625, -4.4970703125, -4.26123046875, -4.025390625, -3.78955078125, -3.5537109375, -3.31787109375, -3.08203125, -2.84619140625, -2.6103515625, -2.37451171875, -2.138671875, -1.90283203125, -1.6669921875, -1.43115234375, -1.1953125, -0.95947265625, -0.7236328125, -0.48779296875, -0.251953125, -0.01611328125, 0.2197265625, 0.45556640625, 0.69140625, 0.92724609375, 1.1630859375, 1.39892578125, 1.634765625, 1.87060546875, 2.1064453125, 2.34228515625, 2.578125, 2.81396484375, 3.0498046875, 3.28564453125, 3.521484375, 3.75732421875, 3.9931640625, 4.22900390625, 4.46484375, 4.70068359375, 4.9365234375, 5.17236328125, 5.408203125, 5.64404296875, 5.8798828125, 6.11572265625, 6.3515625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 14.0, 18.0, 14.0, 28.0, 30.0, 49.0, 89.0, 133.0, 228.0, 381.0, 660.0, 1220.0, 2303.0, 4706.0, 9651.0, 21187.0, 48836.0, 116572.0, 278280.0, 589495.0, 949829.0, 983970.0, 642712.0, 311963.0, 132003.0, 54669.0, 23649.0, 10777.0, 5107.0, 2512.0, 1393.0, 725.0, 412.0, 241.0, 131.0, 97.0, 69.0, 37.0, 34.0, 19.0, 12.0, 11.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0], "bins": [-12.765625, -12.401611328125, -12.03759765625, -11.673583984375, -11.3095703125, -10.945556640625, -10.58154296875, -10.217529296875, -9.853515625, -9.489501953125, -9.12548828125, -8.761474609375, -8.3974609375, -8.033447265625, -7.66943359375, -7.305419921875, -6.94140625, -6.577392578125, -6.21337890625, -5.849365234375, -5.4853515625, -5.121337890625, -4.75732421875, -4.393310546875, -4.029296875, -3.665283203125, -3.30126953125, -2.937255859375, -2.5732421875, -2.209228515625, -1.84521484375, -1.481201171875, -1.1171875, -0.753173828125, -0.38916015625, -0.025146484375, 0.3388671875, 0.702880859375, 1.06689453125, 1.430908203125, 1.794921875, 2.158935546875, 2.52294921875, 2.886962890625, 3.2509765625, 3.614990234375, 3.97900390625, 4.343017578125, 4.70703125, 5.071044921875, 5.43505859375, 5.799072265625, 6.1630859375, 6.527099609375, 6.89111328125, 7.255126953125, 7.619140625, 7.983154296875, 8.34716796875, 8.711181640625, 9.0751953125, 9.439208984375, 9.80322265625, 10.167236328125, 10.53125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 21.0, 19.0, 16.0, 33.0, 26.0, 43.0, 62.0, 69.0, 110.0, 106.0, 147.0, 161.0, 177.0, 201.0, 211.0, 262.0, 226.0, 223.0, 252.0, 244.0, 215.0, 205.0, 176.0, 165.0, 128.0, 129.0, 99.0, 80.0, 68.0, 37.0, 39.0, 27.0, 24.0, 15.0, 12.0, 10.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.650390625, -3.54449462890625, -3.4385986328125, -3.33270263671875, -3.226806640625, -3.12091064453125, -3.0150146484375, -2.90911865234375, -2.80322265625, -2.69732666015625, -2.5914306640625, -2.48553466796875, -2.379638671875, -2.27374267578125, -2.1678466796875, -2.06195068359375, -1.9560546875, -1.85015869140625, -1.7442626953125, -1.63836669921875, -1.532470703125, -1.42657470703125, -1.3206787109375, -1.21478271484375, -1.10888671875, -1.00299072265625, -0.8970947265625, -0.79119873046875, -0.685302734375, -0.57940673828125, -0.4735107421875, -0.36761474609375, -0.26171875, -0.15582275390625, -0.0499267578125, 0.05596923828125, 0.161865234375, 0.26776123046875, 0.3736572265625, 0.47955322265625, 0.58544921875, 0.69134521484375, 0.7972412109375, 0.90313720703125, 1.009033203125, 1.11492919921875, 1.2208251953125, 1.32672119140625, 1.4326171875, 1.53851318359375, 1.6444091796875, 1.75030517578125, 1.856201171875, 1.96209716796875, 2.0679931640625, 2.17388916015625, 2.27978515625, 2.38568115234375, 2.4915771484375, 2.59747314453125, 2.703369140625, 2.80926513671875, 2.9151611328125, 3.02105712890625, 3.126953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 7.0, 10.0, 11.0, 8.0, 10.0, 17.0, 21.0, 22.0, 21.0, 26.0, 20.0, 33.0, 27.0, 49.0, 45.0, 44.0, 38.0, 39.0, 53.0, 39.0, 33.0, 32.0, 38.0, 39.0, 39.0, 38.0, 25.0, 25.0, 27.0, 28.0, 18.0, 18.0, 14.0, 14.0, 11.0, 7.0, 9.0, 5.0, 5.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.112786769866943, -6.889453411102295, -6.666120529174805, -6.442787170410156, -6.219453811645508, -5.996120452880859, -5.772787570953369, -5.549454212188721, -5.3261213302612305, -5.102787971496582, -4.879455089569092, -4.656121730804443, -4.432788372039795, -4.209455490112305, -3.9861221313476562, -3.762788772583008, -3.5394554138183594, -3.31612229347229, -3.0927889347076416, -2.8694558143615723, -2.646122455596924, -2.4227893352508545, -2.199456214904785, -1.9761229753494263, -1.7527897357940674, -1.5294564962387085, -1.3061232566833496, -1.0827901363372803, -0.8594568967819214, -0.6361236572265625, -0.41279053688049316, -0.18945729732513428, 0.03387641906738281, 0.2572096288204193, 0.4805428385734558, 0.7038760185241699, 0.9272092580795288, 1.1505424976348877, 1.373875617980957, 1.597208857536316, 1.8205420970916748, 2.043875217437744, 2.2672085762023926, 2.490541696548462, 2.7138748168945312, 2.9372081756591797, 3.160541296005249, 3.3838744163513184, 3.607207775115967, 3.830540895462036, 4.0538740158081055, 4.277207374572754, 4.500540733337402, 4.723874092102051, 4.947206974029541, 5.1705403327941895, 5.39387321472168, 5.617206573486328, 5.840539455413818, 6.063872814178467, 6.287206172943115, 6.5105390548706055, 6.733872413635254, 6.957205772399902, 7.180539131164551]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 11.0, 6.0, 5.0, 11.0, 10.0, 9.0, 14.0, 13.0, 21.0, 21.0, 27.0, 13.0, 29.0, 29.0, 28.0, 36.0, 35.0, 40.0, 31.0, 48.0, 42.0, 34.0, 41.0, 41.0, 37.0, 37.0, 49.0, 34.0, 36.0, 26.0, 22.0, 14.0, 27.0, 15.0, 9.0, 15.0, 23.0, 13.0, 9.0, 11.0, 7.0, 4.0, 1.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.118122577667236, -6.868508815765381, -6.618894577026367, -6.369280815124512, -6.119667053222656, -5.870053291320801, -5.620439529418945, -5.370825290679932, -5.121211528778076, -4.871597766876221, -4.621983528137207, -4.372369766235352, -4.122756004333496, -3.8731422424316406, -3.623528242111206, -3.3739142417907715, -3.124300479888916, -2.8746867179870605, -2.625072717666626, -2.3754587173461914, -2.125844955444336, -1.876231074333191, -1.626617193222046, -1.3770033121109009, -1.1273894309997559, -0.8777755498886108, -0.6281616687774658, -0.3785477876663208, -0.12893390655517578, 0.12067997455596924, 0.37029385566711426, 0.6199077367782593, 0.8695220947265625, 1.1191359758377075, 1.3687498569488525, 1.6183637380599976, 1.8679776191711426, 2.117591381072998, 2.3672053813934326, 2.616819381713867, 2.8664331436157227, 3.116046905517578, 3.3656609058380127, 3.6152749061584473, 3.8648886680603027, 4.114502429962158, 4.364116668701172, 4.613730430603027, 4.863344192504883, 5.112957954406738, 5.362571716308594, 5.612185955047607, 5.861799716949463, 6.111413478851318, 6.361027717590332, 6.6106414794921875, 6.860255241394043, 7.109869003295898, 7.359482765197754, 7.609097003936768, 7.858710765838623, 8.108325004577637, 8.357938766479492, 8.607552528381348, 8.857166290283203]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 10.0, 13.0, 21.0, 20.0, 27.0, 45.0, 67.0, 115.0, 164.0, 280.0, 387.0, 689.0, 1143.0, 1904.0, 3420.0, 6159.0, 11094.0, 20248.0, 37364.0, 67561.0, 112041.0, 162863.0, 187782.0, 165093.0, 114866.0, 69332.0, 38488.0, 21159.0, 11483.0, 6277.0, 3394.0, 2053.0, 1134.0, 720.0, 416.0, 276.0, 159.0, 97.0, 66.0, 42.0, 28.0, 17.0, 12.0, 9.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.633026123046875, -1.57952880859375, -1.526031494140625, -1.4725341796875, -1.419036865234375, -1.36553955078125, -1.312042236328125, -1.258544921875, -1.205047607421875, -1.15155029296875, -1.098052978515625, -1.0445556640625, -0.991058349609375, -0.93756103515625, -0.884063720703125, -0.83056640625, -0.777069091796875, -0.72357177734375, -0.670074462890625, -0.6165771484375, -0.563079833984375, -0.50958251953125, -0.456085205078125, -0.402587890625, -0.349090576171875, -0.29559326171875, -0.242095947265625, -0.1885986328125, -0.135101318359375, -0.08160400390625, -0.028106689453125, 0.025390625, 0.078887939453125, 0.13238525390625, 0.185882568359375, 0.2393798828125, 0.292877197265625, 0.34637451171875, 0.399871826171875, 0.453369140625, 0.506866455078125, 0.56036376953125, 0.613861083984375, 0.6673583984375, 0.720855712890625, 0.77435302734375, 0.827850341796875, 0.88134765625, 0.934844970703125, 0.98834228515625, 1.041839599609375, 1.0953369140625, 1.148834228515625, 1.20233154296875, 1.255828857421875, 1.309326171875, 1.362823486328125, 1.41632080078125, 1.469818115234375, 1.5233154296875, 1.576812744140625, 1.63031005859375, 1.683807373046875, 1.7373046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 12.0, 4.0, 12.0, 7.0, 11.0, 13.0, 21.0, 14.0, 19.0, 31.0, 32.0, 31.0, 29.0, 38.0, 28.0, 34.0, 44.0, 46.0, 32.0, 47.0, 44.0, 47.0, 35.0, 44.0, 42.0, 48.0, 36.0, 24.0, 22.0, 14.0, 19.0, 19.0, 13.0, 13.0, 18.0, 13.0, 7.0, 4.0, 10.0, 0.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7891845703125, -7.515869140625, -7.2425537109375, -6.96923828125, -6.6959228515625, -6.422607421875, -6.1492919921875, -5.8759765625, -5.6026611328125, -5.329345703125, -5.0560302734375, -4.78271484375, -4.5093994140625, -4.236083984375, -3.9627685546875, -3.689453125, -3.4161376953125, -3.142822265625, -2.8695068359375, -2.59619140625, -2.3228759765625, -2.049560546875, -1.7762451171875, -1.5029296875, -1.2296142578125, -0.956298828125, -0.6829833984375, -0.40966796875, -0.1363525390625, 0.136962890625, 0.4102783203125, 0.68359375, 0.9569091796875, 1.230224609375, 1.5035400390625, 1.77685546875, 2.0501708984375, 2.323486328125, 2.5968017578125, 2.8701171875, 3.1434326171875, 3.416748046875, 3.6900634765625, 3.96337890625, 4.2366943359375, 4.510009765625, 4.7833251953125, 5.056640625, 5.3299560546875, 5.603271484375, 5.8765869140625, 6.14990234375, 6.4232177734375, 6.696533203125, 6.9698486328125, 7.2431640625, 7.5164794921875, 7.789794921875, 8.0631103515625, 8.33642578125, 8.6097412109375, 8.883056640625, 9.1563720703125, 9.4296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 10.0, 10.0, 16.0, 24.0, 32.0, 39.0, 66.0, 99.0, 200.0, 344.0, 738.0, 2173.0, 7842.0, 32743.0, 888643.0, 93824.0, 15529.0, 3907.0, 1181.0, 502.0, 227.0, 133.0, 76.0, 48.0, 37.0, 25.0, 17.0, 14.0, 8.0, 9.0, 5.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.658203125, -9.36328125, -9.068359375, -8.7734375, -8.478515625, -8.18359375, -7.888671875, -7.59375, -7.298828125, -7.00390625, -6.708984375, -6.4140625, -6.119140625, -5.82421875, -5.529296875, -5.234375, -4.939453125, -4.64453125, -4.349609375, -4.0546875, -3.759765625, -3.46484375, -3.169921875, -2.875, -2.580078125, -2.28515625, -1.990234375, -1.6953125, -1.400390625, -1.10546875, -0.810546875, -0.515625, -0.220703125, 0.07421875, 0.369140625, 0.6640625, 0.958984375, 1.25390625, 1.548828125, 1.84375, 2.138671875, 2.43359375, 2.728515625, 3.0234375, 3.318359375, 3.61328125, 3.908203125, 4.203125, 4.498046875, 4.79296875, 5.087890625, 5.3828125, 5.677734375, 5.97265625, 6.267578125, 6.5625, 6.857421875, 7.15234375, 7.447265625, 7.7421875, 8.037109375, 8.33203125, 8.626953125, 8.921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 1.0, 0.0, 6.0, 7.0, 9.0, 5.0, 4.0, 17.0, 16.0, 13.0, 25.0, 25.0, 39.0, 35.0, 30.0, 37.0, 33.0, 31.0, 42.0, 36.0, 56.0, 36.0, 35.0, 50.0, 43.0, 37.0, 38.0, 29.0, 34.0, 21.0, 31.0, 25.0, 29.0, 23.0, 26.0, 14.0, 12.0, 12.0, 10.0, 13.0, 2.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1953125, -6.00079345703125, -5.8062744140625, -5.61175537109375, -5.417236328125, -5.22271728515625, -5.0281982421875, -4.83367919921875, -4.63916015625, -4.44464111328125, -4.2501220703125, -4.05560302734375, -3.861083984375, -3.66656494140625, -3.4720458984375, -3.27752685546875, -3.0830078125, -2.88848876953125, -2.6939697265625, -2.49945068359375, -2.304931640625, -2.11041259765625, -1.9158935546875, -1.72137451171875, -1.52685546875, -1.33233642578125, -1.1378173828125, -0.94329833984375, -0.748779296875, -0.55426025390625, -0.3597412109375, -0.16522216796875, 0.029296875, 0.22381591796875, 0.4183349609375, 0.61285400390625, 0.807373046875, 1.00189208984375, 1.1964111328125, 1.39093017578125, 1.58544921875, 1.77996826171875, 1.9744873046875, 2.16900634765625, 2.363525390625, 2.55804443359375, 2.7525634765625, 2.94708251953125, 3.1416015625, 3.33612060546875, 3.5306396484375, 3.72515869140625, 3.919677734375, 4.11419677734375, 4.3087158203125, 4.50323486328125, 4.69775390625, 4.89227294921875, 5.0867919921875, 5.28131103515625, 5.475830078125, 5.67034912109375, 5.8648681640625, 6.05938720703125, 6.25390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 2.0, 10.0, 11.0, 10.0, 13.0, 27.0, 24.0, 34.0, 53.0, 89.0, 112.0, 169.0, 313.0, 444.0, 788.0, 1374.0, 2585.0, 5090.0, 10344.0, 22291.0, 72548.0, 841994.0, 51022.0, 19736.0, 9308.0, 4574.0, 2386.0, 1289.0, 673.0, 415.0, 261.0, 174.0, 115.0, 82.0, 39.0, 33.0, 25.0, 24.0, 15.0, 14.0, 11.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486328125, -0.47084808349609375, -0.4553680419921875, -0.43988800048828125, -0.424407958984375, -0.40892791748046875, -0.3934478759765625, -0.37796783447265625, -0.36248779296875, -0.34700775146484375, -0.3315277099609375, -0.31604766845703125, -0.300567626953125, -0.28508758544921875, -0.2696075439453125, -0.25412750244140625, -0.2386474609375, -0.22316741943359375, -0.2076873779296875, -0.19220733642578125, -0.176727294921875, -0.16124725341796875, -0.1457672119140625, -0.13028717041015625, -0.11480712890625, -0.09932708740234375, -0.0838470458984375, -0.06836700439453125, -0.052886962890625, -0.03740692138671875, -0.0219268798828125, -0.00644683837890625, 0.009033203125, 0.02451324462890625, 0.0399932861328125, 0.05547332763671875, 0.070953369140625, 0.08643341064453125, 0.1019134521484375, 0.11739349365234375, 0.13287353515625, 0.14835357666015625, 0.1638336181640625, 0.17931365966796875, 0.194793701171875, 0.21027374267578125, 0.2257537841796875, 0.24123382568359375, 0.2567138671875, 0.27219390869140625, 0.2876739501953125, 0.30315399169921875, 0.318634033203125, 0.33411407470703125, 0.3495941162109375, 0.36507415771484375, 0.38055419921875, 0.39603424072265625, 0.4115142822265625, 0.42699432373046875, 0.442474365234375, 0.45795440673828125, 0.4734344482421875, 0.48891448974609375, 0.50439453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 11.0, 5.0, 11.0, 16.0, 21.0, 30.0, 34.0, 25.0, 48.0, 56.0, 52.0, 76.0, 84.0, 67.0, 58.0, 72.0, 60.0, 47.0, 43.0, 33.0, 28.0, 24.0, 26.0, 15.0, 9.0, 9.0, 9.0, 9.0, 3.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1398067474365234e-05, -2.0743347704410553e-05, -2.008862793445587e-05, -1.943390816450119e-05, -1.877918839454651e-05, -1.8124468624591827e-05, -1.7469748854637146e-05, -1.6815029084682465e-05, -1.6160309314727783e-05, -1.5505589544773102e-05, -1.485086977481842e-05, -1.4196150004863739e-05, -1.3541430234909058e-05, -1.2886710464954376e-05, -1.2231990694999695e-05, -1.1577270925045013e-05, -1.0922551155090332e-05, -1.026783138513565e-05, -9.61311161518097e-06, -8.958391845226288e-06, -8.303672075271606e-06, -7.648952305316925e-06, -6.994232535362244e-06, -6.339512765407562e-06, -5.684792995452881e-06, -5.0300732254981995e-06, -4.375353455543518e-06, -3.7206336855888367e-06, -3.0659139156341553e-06, -2.411194145679474e-06, -1.7564743757247925e-06, -1.101754605770111e-06, -4.470348358154297e-07, 2.076849341392517e-07, 8.624047040939331e-07, 1.5171244740486145e-06, 2.171844244003296e-06, 2.8265640139579773e-06, 3.4812837839126587e-06, 4.13600355386734e-06, 4.7907233238220215e-06, 5.445443093776703e-06, 6.100162863731384e-06, 6.754882633686066e-06, 7.409602403640747e-06, 8.064322173595428e-06, 8.71904194355011e-06, 9.373761713504791e-06, 1.0028481483459473e-05, 1.0683201253414154e-05, 1.1337921023368835e-05, 1.1992640793323517e-05, 1.2647360563278198e-05, 1.330208033323288e-05, 1.3956800103187561e-05, 1.4611519873142242e-05, 1.5266239643096924e-05, 1.5920959413051605e-05, 1.6575679183006287e-05, 1.7230398952960968e-05, 1.788511872291565e-05, 1.853983849287033e-05, 1.9194558262825012e-05, 1.9849278032779694e-05, 2.0503997802734375e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 1.0, 8.0, 3.0, 13.0, 12.0, 21.0, 36.0, 51.0, 80.0, 117.0, 155.0, 262.0, 401.0, 583.0, 820.0, 1188.0, 1820.0, 2965.0, 4471.0, 6742.0, 10367.0, 15289.0, 22650.0, 33535.0, 48727.0, 70078.0, 95313.0, 120714.0, 134665.0, 126899.0, 103875.0, 76625.0, 55006.0, 37898.0, 25888.0, 17117.0, 11658.0, 7719.0, 4901.0, 3425.0, 2192.0, 1397.0, 953.0, 619.0, 421.0, 264.0, 175.0, 138.0, 104.0, 57.0, 49.0, 30.0, 15.0, 18.0, 11.0, 6.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.264404296875, -0.2557792663574219, -0.24715423583984375, -0.23852920532226562, -0.2299041748046875, -0.22127914428710938, -0.21265411376953125, -0.20402908325195312, -0.195404052734375, -0.18677902221679688, -0.17815399169921875, -0.16952896118164062, -0.1609039306640625, -0.15227890014648438, -0.14365386962890625, -0.13502883911132812, -0.12640380859375, -0.11777877807617188, -0.10915374755859375, -0.10052871704101562, -0.0919036865234375, -0.08327865600585938, -0.07465362548828125, -0.06602859497070312, -0.057403564453125, -0.048778533935546875, -0.04015350341796875, -0.031528472900390625, -0.0229034423828125, -0.014278411865234375, -0.00565338134765625, 0.002971649169921875, 0.0115966796875, 0.020221710205078125, 0.02884674072265625, 0.037471771240234375, 0.0460968017578125, 0.054721832275390625, 0.06334686279296875, 0.07197189331054688, 0.080596923828125, 0.08922195434570312, 0.09784698486328125, 0.10647201538085938, 0.1150970458984375, 0.12372207641601562, 0.13234710693359375, 0.14097213745117188, 0.14959716796875, 0.15822219848632812, 0.16684722900390625, 0.17547225952148438, 0.1840972900390625, 0.19272232055664062, 0.20134735107421875, 0.20997238159179688, 0.218597412109375, 0.22722244262695312, 0.23584747314453125, 0.24447250366210938, 0.2530975341796875, 0.2617225646972656, 0.27034759521484375, 0.2789726257324219, 0.28759765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 12.0, 10.0, 12.0, 14.0, 15.0, 16.0, 24.0, 34.0, 31.0, 24.0, 29.0, 48.0, 25.0, 23.0, 28.0, 41.0, 40.0, 33.0, 34.0, 37.0, 34.0, 43.0, 28.0, 39.0, 43.0, 33.0, 31.0, 28.0, 23.0, 14.0, 26.0, 17.0, 16.0, 12.0, 21.0, 12.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10870361328125, -0.10487842559814453, -0.10105323791503906, -0.0972280502319336, -0.09340286254882812, -0.08957767486572266, -0.08575248718261719, -0.08192729949951172, -0.07810211181640625, -0.07427692413330078, -0.07045173645019531, -0.06662654876708984, -0.06280136108398438, -0.058976173400878906, -0.05515098571777344, -0.05132579803466797, -0.0475006103515625, -0.04367542266845703, -0.03985023498535156, -0.036025047302246094, -0.032199859619140625, -0.028374671936035156, -0.024549484252929688, -0.02072429656982422, -0.01689910888671875, -0.013073921203613281, -0.009248733520507812, -0.005423545837402344, -0.001598358154296875, 0.0022268295288085938, 0.0060520172119140625, 0.009877204895019531, 0.013702392578125, 0.01752758026123047, 0.021352767944335938, 0.025177955627441406, 0.029003143310546875, 0.032828330993652344, 0.03665351867675781, 0.04047870635986328, 0.04430389404296875, 0.04812908172607422, 0.05195426940917969, 0.055779457092285156, 0.059604644775390625, 0.0634298324584961, 0.06725502014160156, 0.07108020782470703, 0.0749053955078125, 0.07873058319091797, 0.08255577087402344, 0.0863809585571289, 0.09020614624023438, 0.09403133392333984, 0.09785652160644531, 0.10168170928955078, 0.10550689697265625, 0.10933208465576172, 0.11315727233886719, 0.11698246002197266, 0.12080764770507812, 0.1246328353881836, 0.12845802307128906, 0.13228321075439453, 0.1361083984375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 6.0, 7.0, 6.0, 10.0, 7.0, 11.0, 14.0, 11.0, 19.0, 17.0, 22.0, 21.0, 21.0, 30.0, 24.0, 43.0, 42.0, 45.0, 45.0, 38.0, 33.0, 48.0, 46.0, 34.0, 35.0, 38.0, 46.0, 32.0, 31.0, 29.0, 28.0, 23.0, 23.0, 19.0, 18.0, 20.0, 9.0, 7.0, 6.0, 11.0, 5.0, 4.0, 7.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.970053195953369, -6.748722553253174, -6.5273919105529785, -6.306061267852783, -6.084730625152588, -5.863399982452393, -5.642068862915039, -5.420738220214844, -5.199407577514648, -4.978076934814453, -4.756746292114258, -4.5354156494140625, -4.314085006713867, -4.092754364013672, -3.8714234828948975, -3.650092840194702, -3.428762435913086, -3.2074317932128906, -2.9861011505126953, -2.7647705078125, -2.5434398651123047, -2.3221092224121094, -2.100778341293335, -1.8794476985931396, -1.6581170558929443, -1.436786413192749, -1.2154557704925537, -0.9941250085830688, -0.7727943658828735, -0.5514637231826782, -0.33013296127319336, -0.10880231857299805, 0.11252784729003906, 0.33385851979255676, 0.5551891922950745, 0.7765198945999146, 0.9978505373001099, 1.2191811800003052, 1.44051194190979, 1.6618425846099854, 1.8831732273101807, 2.104503870010376, 2.3258345127105713, 2.5471653938293457, 2.768496036529541, 2.9898266792297363, 3.2111573219299316, 3.432487964630127, 3.6538186073303223, 3.8751492500305176, 4.096479892730713, 4.317810535430908, 4.5391411781311035, 4.760471820831299, 4.981802940368652, 5.203133583068848, 5.424464225769043, 5.645794868469238, 5.867125511169434, 6.088456153869629, 6.309786796569824, 6.5311174392700195, 6.752448081970215, 6.97377872467041, 7.1951093673706055]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 14.0, 5.0, 8.0, 9.0, 11.0, 10.0, 13.0, 19.0, 19.0, 20.0, 22.0, 24.0, 27.0, 30.0, 28.0, 37.0, 40.0, 32.0, 41.0, 46.0, 38.0, 34.0, 46.0, 33.0, 39.0, 48.0, 32.0, 41.0, 31.0, 27.0, 16.0, 21.0, 23.0, 13.0, 13.0, 18.0, 12.0, 16.0, 7.0, 12.0, 6.0, 3.0, 2.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.983174800872803, -6.734507083892822, -6.485838890075684, -6.237171173095703, -5.9885029792785645, -5.739835262298584, -5.491167068481445, -5.242499351501465, -4.993831634521484, -4.745163917541504, -4.496495723724365, -4.247828006744385, -3.999159812927246, -3.7504920959472656, -3.501824140548706, -3.2531561851501465, -3.004487991333008, -2.7558200359344482, -2.5071520805358887, -2.258484363555908, -2.0098161697387695, -1.7611483335494995, -1.5124804973602295, -1.26381254196167, -1.0151445865631104, -0.7664766311645508, -0.517808735370636, -0.2691408395767212, -0.02047288417816162, 0.22819507122039795, 0.47686290740966797, 0.7255308628082275, 0.9741983413696289, 1.2228662967681885, 1.471534252166748, 1.720202088356018, 1.9688700437545776, 2.2175378799438477, 2.4662058353424072, 2.714873790740967, 2.9635417461395264, 3.212209701538086, 3.4608776569366455, 3.709545612335205, 3.9582133293151855, 4.206881523132324, 4.455549240112305, 4.704216957092285, 4.952885150909424, 5.201552867889404, 5.450221061706543, 5.698888778686523, 5.947556972503662, 6.196224689483643, 6.444892883300781, 6.693560600280762, 6.942228317260742, 7.190896034240723, 7.439564228057861, 7.688231945037842, 7.9369001388549805, 8.185567855834961, 8.434235572814941, 8.682903289794922, 8.931571960449219]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 12.0, 13.0, 22.0, 29.0, 58.0, 119.0, 210.0, 345.0, 602.0, 1246.0, 2416.0, 4863.0, 9311.0, 17732.0, 32452.0, 54439.0, 85115.0, 120328.0, 146984.0, 154134.0, 138950.0, 106639.0, 72855.0, 44901.0, 25960.0, 13671.0, 7258.0, 3774.0, 1902.0, 1034.0, 486.0, 317.0, 164.0, 82.0, 48.0, 42.0, 20.0, 12.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23828125, -5.03131103515625, -4.8243408203125, -4.61737060546875, -4.410400390625, -4.20343017578125, -3.9964599609375, -3.78948974609375, -3.58251953125, -3.37554931640625, -3.1685791015625, -2.96160888671875, -2.754638671875, -2.54766845703125, -2.3406982421875, -2.13372802734375, -1.9267578125, -1.71978759765625, -1.5128173828125, -1.30584716796875, -1.098876953125, -0.89190673828125, -0.6849365234375, -0.47796630859375, -0.27099609375, -0.06402587890625, 0.1429443359375, 0.34991455078125, 0.556884765625, 0.76385498046875, 0.9708251953125, 1.17779541015625, 1.384765625, 1.59173583984375, 1.7987060546875, 2.00567626953125, 2.212646484375, 2.41961669921875, 2.6265869140625, 2.83355712890625, 3.04052734375, 3.24749755859375, 3.4544677734375, 3.66143798828125, 3.868408203125, 4.07537841796875, 4.2823486328125, 4.48931884765625, 4.6962890625, 4.90325927734375, 5.1102294921875, 5.31719970703125, 5.524169921875, 5.73114013671875, 5.9381103515625, 6.14508056640625, 6.35205078125, 6.55902099609375, 6.7659912109375, 6.97296142578125, 7.179931640625, 7.38690185546875, 7.5938720703125, 7.80084228515625, 8.0078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 8.0, 3.0, 4.0, 13.0, 8.0, 12.0, 11.0, 18.0, 18.0, 14.0, 28.0, 28.0, 30.0, 25.0, 34.0, 33.0, 34.0, 45.0, 42.0, 53.0, 41.0, 41.0, 41.0, 39.0, 35.0, 38.0, 32.0, 39.0, 32.0, 29.0, 22.0, 21.0, 17.0, 25.0, 21.0, 18.0, 7.0, 10.0, 12.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.10498046875, -7.8349609375, -7.56494140625, -7.294921875, -7.02490234375, -6.7548828125, -6.48486328125, -6.21484375, -5.94482421875, -5.6748046875, -5.40478515625, -5.134765625, -4.86474609375, -4.5947265625, -4.32470703125, -4.0546875, -3.78466796875, -3.5146484375, -3.24462890625, -2.974609375, -2.70458984375, -2.4345703125, -2.16455078125, -1.89453125, -1.62451171875, -1.3544921875, -1.08447265625, -0.814453125, -0.54443359375, -0.2744140625, -0.00439453125, 0.265625, 0.53564453125, 0.8056640625, 1.07568359375, 1.345703125, 1.61572265625, 1.8857421875, 2.15576171875, 2.42578125, 2.69580078125, 2.9658203125, 3.23583984375, 3.505859375, 3.77587890625, 4.0458984375, 4.31591796875, 4.5859375, 4.85595703125, 5.1259765625, 5.39599609375, 5.666015625, 5.93603515625, 6.2060546875, 6.47607421875, 6.74609375, 7.01611328125, 7.2861328125, 7.55615234375, 7.826171875, 8.09619140625, 8.3662109375, 8.63623046875, 8.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 9.0, 17.0, 17.0, 41.0, 54.0, 89.0, 124.0, 210.0, 374.0, 632.0, 948.0, 1641.0, 2727.0, 4160.0, 6649.0, 10554.0, 16037.0, 24863.0, 36981.0, 52607.0, 71073.0, 90798.0, 106470.0, 115200.0, 113476.0, 102448.0, 84597.0, 65309.0, 47170.0, 32678.0, 22086.0, 14168.0, 9325.0, 5794.0, 3555.0, 2247.0, 1313.0, 827.0, 493.0, 291.0, 184.0, 131.0, 74.0, 51.0, 29.0, 20.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.39453125, -5.23028564453125, -5.0660400390625, -4.90179443359375, -4.737548828125, -4.57330322265625, -4.4090576171875, -4.24481201171875, -4.08056640625, -3.91632080078125, -3.7520751953125, -3.58782958984375, -3.423583984375, -3.25933837890625, -3.0950927734375, -2.93084716796875, -2.7666015625, -2.60235595703125, -2.4381103515625, -2.27386474609375, -2.109619140625, -1.94537353515625, -1.7811279296875, -1.61688232421875, -1.45263671875, -1.28839111328125, -1.1241455078125, -0.95989990234375, -0.795654296875, -0.63140869140625, -0.4671630859375, -0.30291748046875, -0.138671875, 0.02557373046875, 0.1898193359375, 0.35406494140625, 0.518310546875, 0.68255615234375, 0.8468017578125, 1.01104736328125, 1.17529296875, 1.33953857421875, 1.5037841796875, 1.66802978515625, 1.832275390625, 1.99652099609375, 2.1607666015625, 2.32501220703125, 2.4892578125, 2.65350341796875, 2.8177490234375, 2.98199462890625, 3.146240234375, 3.31048583984375, 3.4747314453125, 3.63897705078125, 3.80322265625, 3.96746826171875, 4.1317138671875, 4.29595947265625, 4.460205078125, 4.62445068359375, 4.7886962890625, 4.95294189453125, 5.1171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 9.0, 9.0, 10.0, 11.0, 10.0, 17.0, 33.0, 16.0, 27.0, 24.0, 34.0, 30.0, 42.0, 42.0, 39.0, 52.0, 46.0, 54.0, 35.0, 47.0, 37.0, 38.0, 31.0, 41.0, 23.0, 27.0, 28.0, 28.0, 21.0, 30.0, 22.0, 9.0, 9.0, 13.0, 10.0, 17.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.1456298828125, -4.970947265625, -4.7962646484375, -4.62158203125, -4.4468994140625, -4.272216796875, -4.0975341796875, -3.9228515625, -3.7481689453125, -3.573486328125, -3.3988037109375, -3.22412109375, -3.0494384765625, -2.874755859375, -2.7000732421875, -2.525390625, -2.3507080078125, -2.176025390625, -2.0013427734375, -1.82666015625, -1.6519775390625, -1.477294921875, -1.3026123046875, -1.1279296875, -0.9532470703125, -0.778564453125, -0.6038818359375, -0.42919921875, -0.2545166015625, -0.079833984375, 0.0948486328125, 0.26953125, 0.4442138671875, 0.618896484375, 0.7935791015625, 0.96826171875, 1.1429443359375, 1.317626953125, 1.4923095703125, 1.6669921875, 1.8416748046875, 2.016357421875, 2.1910400390625, 2.36572265625, 2.5404052734375, 2.715087890625, 2.8897705078125, 3.064453125, 3.2391357421875, 3.413818359375, 3.5885009765625, 3.76318359375, 3.9378662109375, 4.112548828125, 4.2872314453125, 4.4619140625, 4.6365966796875, 4.811279296875, 4.9859619140625, 5.16064453125, 5.3353271484375, 5.510009765625, 5.6846923828125, 5.859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 10.0, 8.0, 18.0, 11.0, 13.0, 33.0, 34.0, 48.0, 74.0, 99.0, 104.0, 145.0, 219.0, 202.0, 299.0, 425.0, 599.0, 877.0, 1548.0, 3195.0, 8136.0, 22271.0, 61260.0, 142584.0, 242671.0, 259198.0, 172741.0, 80678.0, 30491.0, 10846.0, 4156.0, 1938.0, 1025.0, 650.0, 475.0, 322.0, 256.0, 211.0, 172.0, 142.0, 87.0, 85.0, 65.0, 49.0, 28.0, 18.0, 13.0, 14.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.1953125, -4.05615234375, -3.9169921875, -3.77783203125, -3.638671875, -3.49951171875, -3.3603515625, -3.22119140625, -3.08203125, -2.94287109375, -2.8037109375, -2.66455078125, -2.525390625, -2.38623046875, -2.2470703125, -2.10791015625, -1.96875, -1.82958984375, -1.6904296875, -1.55126953125, -1.412109375, -1.27294921875, -1.1337890625, -0.99462890625, -0.85546875, -0.71630859375, -0.5771484375, -0.43798828125, -0.298828125, -0.15966796875, -0.0205078125, 0.11865234375, 0.2578125, 0.39697265625, 0.5361328125, 0.67529296875, 0.814453125, 0.95361328125, 1.0927734375, 1.23193359375, 1.37109375, 1.51025390625, 1.6494140625, 1.78857421875, 1.927734375, 2.06689453125, 2.2060546875, 2.34521484375, 2.484375, 2.62353515625, 2.7626953125, 2.90185546875, 3.041015625, 3.18017578125, 3.3193359375, 3.45849609375, 3.59765625, 3.73681640625, 3.8759765625, 4.01513671875, 4.154296875, 4.29345703125, 4.4326171875, 4.57177734375, 4.7109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 29.0, 53.0, 72.0, 109.0, 124.0, 147.0, 135.0, 111.0, 69.0, 58.0, 40.0, 15.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00057220458984375, -0.0005498304963111877, -0.0005274564027786255, -0.0005050823092460632, -0.000482708215713501, -0.0004603341221809387, -0.00043796002864837646, -0.0004155859351158142, -0.00039321184158325195, -0.0003708377480506897, -0.00034846365451812744, -0.0003260895609855652, -0.00030371546745300293, -0.0002813413739204407, -0.0002589672803878784, -0.00023659318685531616, -0.0002142190933227539, -0.00019184499979019165, -0.0001694709062576294, -0.00014709681272506714, -0.00012472271919250488, -0.00010234862565994263, -7.997453212738037e-05, -5.7600438594818115e-05, -3.522634506225586e-05, -1.2852251529693604e-05, 9.521842002868652e-06, 3.189593553543091e-05, 5.4270029067993164e-05, 7.664412260055542e-05, 9.901821613311768e-05, 0.00012139230966567993, 0.0001437664031982422, 0.00016614049673080444, 0.0001885145902633667, 0.00021088868379592896, 0.0002332627773284912, 0.00025563687086105347, 0.0002780109643936157, 0.000300385057926178, 0.00032275915145874023, 0.0003451332449913025, 0.00036750733852386475, 0.000389881432056427, 0.00041225552558898926, 0.0004346296191215515, 0.00045700371265411377, 0.000479377806186676, 0.0005017518997192383, 0.0005241259932518005, 0.0005465000867843628, 0.000568874180316925, 0.0005912482738494873, 0.0006136223673820496, 0.0006359964609146118, 0.0006583705544471741, 0.0006807446479797363, 0.0007031187415122986, 0.0007254928350448608, 0.0007478669285774231, 0.0007702410221099854, 0.0007926151156425476, 0.0008149892091751099, 0.0008373633027076721, 0.0008597373962402344]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 6.0, 3.0, 2.0, 6.0, 1.0, 7.0, 12.0, 18.0, 17.0, 23.0, 37.0, 41.0, 72.0, 88.0, 143.0, 160.0, 226.0, 356.0, 432.0, 719.0, 1137.0, 2084.0, 4668.0, 14505.0, 53294.0, 171285.0, 332568.0, 291104.0, 122352.0, 35169.0, 9819.0, 3481.0, 1632.0, 998.0, 600.0, 443.0, 291.0, 203.0, 139.0, 106.0, 74.0, 58.0, 44.0, 39.0, 25.0, 27.0, 14.0, 5.0, 6.0, 14.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.71209716796875, -5.5140380859375, -5.31597900390625, -5.117919921875, -4.91986083984375, -4.7218017578125, -4.52374267578125, -4.32568359375, -4.12762451171875, -3.9295654296875, -3.73150634765625, -3.533447265625, -3.33538818359375, -3.1373291015625, -2.93927001953125, -2.7412109375, -2.54315185546875, -2.3450927734375, -2.14703369140625, -1.948974609375, -1.75091552734375, -1.5528564453125, -1.35479736328125, -1.15673828125, -0.95867919921875, -0.7606201171875, -0.56256103515625, -0.364501953125, -0.16644287109375, 0.0316162109375, 0.22967529296875, 0.427734375, 0.62579345703125, 0.8238525390625, 1.02191162109375, 1.219970703125, 1.41802978515625, 1.6160888671875, 1.81414794921875, 2.01220703125, 2.21026611328125, 2.4083251953125, 2.60638427734375, 2.804443359375, 3.00250244140625, 3.2005615234375, 3.39862060546875, 3.5966796875, 3.79473876953125, 3.9927978515625, 4.19085693359375, 4.388916015625, 4.58697509765625, 4.7850341796875, 4.98309326171875, 5.18115234375, 5.37921142578125, 5.5772705078125, 5.77532958984375, 5.973388671875, 6.17144775390625, 6.3695068359375, 6.56756591796875, 6.765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 6.0, 9.0, 24.0, 35.0, 32.0, 50.0, 49.0, 76.0, 58.0, 75.0, 78.0, 73.0, 65.0, 72.0, 62.0, 46.0, 42.0, 28.0, 31.0, 17.0, 15.0, 12.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.315826416015625, -1.27032470703125, -1.224822998046875, -1.1793212890625, -1.133819580078125, -1.08831787109375, -1.042816162109375, -0.997314453125, -0.951812744140625, -0.90631103515625, -0.860809326171875, -0.8153076171875, -0.769805908203125, -0.72430419921875, -0.678802490234375, -0.63330078125, -0.587799072265625, -0.54229736328125, -0.496795654296875, -0.4512939453125, -0.405792236328125, -0.36029052734375, -0.314788818359375, -0.269287109375, -0.223785400390625, -0.17828369140625, -0.132781982421875, -0.0872802734375, -0.041778564453125, 0.00372314453125, 0.049224853515625, 0.0947265625, 0.140228271484375, 0.18572998046875, 0.231231689453125, 0.2767333984375, 0.322235107421875, 0.36773681640625, 0.413238525390625, 0.458740234375, 0.504241943359375, 0.54974365234375, 0.595245361328125, 0.6407470703125, 0.686248779296875, 0.73175048828125, 0.777252197265625, 0.82275390625, 0.868255615234375, 0.91375732421875, 0.959259033203125, 1.0047607421875, 1.050262451171875, 1.09576416015625, 1.141265869140625, 1.186767578125, 1.232269287109375, 1.27777099609375, 1.323272705078125, 1.3687744140625, 1.414276123046875, 1.45977783203125, 1.505279541015625, 1.55078125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 3.0, 6.0, 11.0, 6.0, 11.0, 15.0, 12.0, 15.0, 24.0, 18.0, 27.0, 27.0, 29.0, 39.0, 35.0, 45.0, 39.0, 34.0, 43.0, 29.0, 47.0, 39.0, 41.0, 45.0, 37.0, 38.0, 45.0, 27.0, 37.0, 20.0, 12.0, 15.0, 23.0, 14.0, 17.0, 20.0, 17.0, 8.0, 3.0, 11.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.595223426818848, -7.367879390716553, -7.140535354614258, -6.913191318511963, -6.685847282409668, -6.458503723144531, -6.231159687042236, -6.003815650939941, -5.7764716148376465, -5.549127578735352, -5.321783542633057, -5.094439506530762, -4.867095947265625, -4.639751434326172, -4.412407875061035, -4.18506383895874, -3.9577198028564453, -3.7303757667541504, -3.5030317306518555, -3.2756879329681396, -3.0483438968658447, -2.82099986076355, -2.593656063079834, -2.366312026977539, -2.138967990875244, -1.9116239547729492, -1.6842800378799438, -1.4569361209869385, -1.2295920848846436, -1.0022480487823486, -0.7749041318893433, -0.5475602149963379, -0.32021665573120117, -0.09287267923355103, 0.13447129726409912, 0.36181527376174927, 0.5891592502593994, 0.8165032863616943, 1.0438472032546997, 1.271191120147705, 1.49853515625, 1.725879192352295, 1.9532231092453003, 2.1805670261383057, 2.4079110622406006, 2.6352550983428955, 2.8625988960266113, 3.0899429321289062, 3.317286968231201, 3.544631004333496, 3.771975040435791, 3.999318838119507, 4.226662635803223, 4.454007148742676, 4.6813507080078125, 4.908694744110107, 5.136038780212402, 5.363382816314697, 5.590726852416992, 5.818070888519287, 6.045414924621582, 6.272758483886719, 6.500102519989014, 6.727446556091309, 6.9547905921936035]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 8.0, 7.0, 9.0, 15.0, 5.0, 13.0, 8.0, 28.0, 22.0, 11.0, 22.0, 22.0, 31.0, 28.0, 34.0, 52.0, 23.0, 31.0, 46.0, 36.0, 37.0, 42.0, 37.0, 41.0, 31.0, 28.0, 33.0, 34.0, 32.0, 31.0, 19.0, 18.0, 24.0, 21.0, 15.0, 15.0, 10.0, 12.0, 10.0, 3.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.609628200531006, -7.362005233764648, -7.114382266998291, -6.866759300231934, -6.619136333465576, -6.371513366699219, -6.123889923095703, -5.876267433166504, -5.628643989562988, -5.381021022796631, -5.133398056030273, -4.885775089263916, -4.638152122497559, -4.390529155731201, -4.142906188964844, -3.8952829837799072, -3.647660255432129, -3.4000372886657715, -3.152414321899414, -2.9047913551330566, -2.657168388366699, -2.409545421600342, -2.1619222164154053, -1.9142992496490479, -1.6666762828826904, -1.419053316116333, -1.1714303493499756, -0.9238072633743286, -0.6761842966079712, -0.42856132984161377, -0.1809382438659668, 0.06668472290039062, 0.31430721282958984, 0.5619301795959473, 0.8095532059669495, 1.0571762323379517, 1.304799199104309, 1.5524221658706665, 1.8000452518463135, 2.047668218612671, 2.2952911853790283, 2.5429141521453857, 2.790537118911743, 3.0381603240966797, 3.285783290863037, 3.5334062576293945, 3.781029224395752, 4.028652191162109, 4.276275157928467, 4.523898124694824, 4.771521091461182, 5.019144058227539, 5.2667670249938965, 5.514389991760254, 5.7620134353637695, 6.009635925292969, 6.257259368896484, 6.504882335662842, 6.752505302429199, 7.000128269195557, 7.247751235961914, 7.4953742027282715, 7.742997169494629, 7.9906206130981445, 8.238243103027344]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 9.0, 17.0, 21.0, 47.0, 69.0, 99.0, 155.0, 227.0, 314.0, 490.0, 783.0, 1117.0, 1725.0, 2705.0, 4052.0, 6608.0, 10880.0, 17950.0, 31846.0, 58187.0, 107615.0, 198754.0, 346950.0, 538522.0, 696946.0, 713958.0, 578149.0, 383212.0, 220802.0, 120742.0, 64229.0, 35411.0, 19783.0, 11660.0, 7085.0, 4476.0, 2891.0, 1835.0, 1237.0, 814.0, 549.0, 418.0, 281.0, 197.0, 144.0, 99.0, 59.0, 44.0, 36.0, 31.0, 19.0, 12.0, 7.0, 9.0, 3.0, 6.0, 3.0, 3.0], "bins": [-6.93359375, -6.71063232421875, -6.4876708984375, -6.26470947265625, -6.041748046875, -5.81878662109375, -5.5958251953125, -5.37286376953125, -5.14990234375, -4.92694091796875, -4.7039794921875, -4.48101806640625, -4.258056640625, -4.03509521484375, -3.8121337890625, -3.58917236328125, -3.3662109375, -3.14324951171875, -2.9202880859375, -2.69732666015625, -2.474365234375, -2.25140380859375, -2.0284423828125, -1.80548095703125, -1.58251953125, -1.35955810546875, -1.1365966796875, -0.91363525390625, -0.690673828125, -0.46771240234375, -0.2447509765625, -0.02178955078125, 0.201171875, 0.42413330078125, 0.6470947265625, 0.87005615234375, 1.093017578125, 1.31597900390625, 1.5389404296875, 1.76190185546875, 1.98486328125, 2.20782470703125, 2.4307861328125, 2.65374755859375, 2.876708984375, 3.09967041015625, 3.3226318359375, 3.54559326171875, 3.7685546875, 3.99151611328125, 4.2144775390625, 4.43743896484375, 4.660400390625, 4.88336181640625, 5.1063232421875, 5.32928466796875, 5.55224609375, 5.77520751953125, 5.9981689453125, 6.22113037109375, 6.444091796875, 6.66705322265625, 6.8900146484375, 7.11297607421875, 7.3359375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 1.0, 11.0, 5.0, 4.0, 4.0, 7.0, 9.0, 12.0, 14.0, 15.0, 19.0, 16.0, 21.0, 10.0, 23.0, 22.0, 23.0, 36.0, 30.0, 37.0, 41.0, 27.0, 41.0, 38.0, 40.0, 28.0, 47.0, 37.0, 27.0, 41.0, 36.0, 27.0, 22.0, 29.0, 34.0, 21.0, 23.0, 11.0, 15.0, 20.0, 14.0, 11.0, 6.0, 9.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.56640625, -6.341796875, -6.1171875, -5.892578125, -5.66796875, -5.443359375, -5.21875, -4.994140625, -4.76953125, -4.544921875, -4.3203125, -4.095703125, -3.87109375, -3.646484375, -3.421875, -3.197265625, -2.97265625, -2.748046875, -2.5234375, -2.298828125, -2.07421875, -1.849609375, -1.625, -1.400390625, -1.17578125, -0.951171875, -0.7265625, -0.501953125, -0.27734375, -0.052734375, 0.171875, 0.396484375, 0.62109375, 0.845703125, 1.0703125, 1.294921875, 1.51953125, 1.744140625, 1.96875, 2.193359375, 2.41796875, 2.642578125, 2.8671875, 3.091796875, 3.31640625, 3.541015625, 3.765625, 3.990234375, 4.21484375, 4.439453125, 4.6640625, 4.888671875, 5.11328125, 5.337890625, 5.5625, 5.787109375, 6.01171875, 6.236328125, 6.4609375, 6.685546875, 6.91015625, 7.134765625, 7.359375, 7.583984375, 7.80859375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 6.0, 5.0, 15.0, 11.0, 20.0, 25.0, 50.0, 81.0, 109.0, 179.0, 273.0, 433.0, 629.0, 947.0, 1595.0, 2758.0, 4681.0, 8342.0, 14675.0, 27442.0, 52369.0, 100500.0, 193632.0, 353711.0, 578828.0, 765455.0, 763066.0, 572614.0, 349901.0, 190333.0, 99008.0, 51350.0, 27104.0, 14442.0, 8064.0, 4585.0, 2672.0, 1671.0, 976.0, 620.0, 366.0, 255.0, 169.0, 108.0, 68.0, 48.0, 36.0, 20.0, 12.0, 11.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.90625, -8.6092529296875, -8.312255859375, -8.0152587890625, -7.71826171875, -7.4212646484375, -7.124267578125, -6.8272705078125, -6.5302734375, -6.2332763671875, -5.936279296875, -5.6392822265625, -5.34228515625, -5.0452880859375, -4.748291015625, -4.4512939453125, -4.154296875, -3.8572998046875, -3.560302734375, -3.2633056640625, -2.96630859375, -2.6693115234375, -2.372314453125, -2.0753173828125, -1.7783203125, -1.4813232421875, -1.184326171875, -0.8873291015625, -0.59033203125, -0.2933349609375, 0.003662109375, 0.3006591796875, 0.59765625, 0.8946533203125, 1.191650390625, 1.4886474609375, 1.78564453125, 2.0826416015625, 2.379638671875, 2.6766357421875, 2.9736328125, 3.2706298828125, 3.567626953125, 3.8646240234375, 4.16162109375, 4.4586181640625, 4.755615234375, 5.0526123046875, 5.349609375, 5.6466064453125, 5.943603515625, 6.2406005859375, 6.53759765625, 6.8345947265625, 7.131591796875, 7.4285888671875, 7.7255859375, 8.0225830078125, 8.319580078125, 8.6165771484375, 8.91357421875, 9.2105712890625, 9.507568359375, 9.8045654296875, 10.1015625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 1.0, 7.0, 9.0, 15.0, 12.0, 19.0, 24.0, 36.0, 30.0, 41.0, 44.0, 65.0, 75.0, 88.0, 105.0, 136.0, 132.0, 156.0, 189.0, 194.0, 198.0, 210.0, 215.0, 194.0, 182.0, 188.0, 207.0, 182.0, 171.0, 133.0, 138.0, 129.0, 98.0, 92.0, 69.0, 57.0, 52.0, 42.0, 25.0, 24.0, 23.0, 16.0, 19.0, 2.0, 10.0, 4.0, 3.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.9105224609375, -2.811279296875, -2.7120361328125, -2.61279296875, -2.5135498046875, -2.414306640625, -2.3150634765625, -2.2158203125, -2.1165771484375, -2.017333984375, -1.9180908203125, -1.81884765625, -1.7196044921875, -1.620361328125, -1.5211181640625, -1.421875, -1.3226318359375, -1.223388671875, -1.1241455078125, -1.02490234375, -0.9256591796875, -0.826416015625, -0.7271728515625, -0.6279296875, -0.5286865234375, -0.429443359375, -0.3302001953125, -0.23095703125, -0.1317138671875, -0.032470703125, 0.0667724609375, 0.166015625, 0.2652587890625, 0.364501953125, 0.4637451171875, 0.56298828125, 0.6622314453125, 0.761474609375, 0.8607177734375, 0.9599609375, 1.0592041015625, 1.158447265625, 1.2576904296875, 1.35693359375, 1.4561767578125, 1.555419921875, 1.6546630859375, 1.75390625, 1.8531494140625, 1.952392578125, 2.0516357421875, 2.15087890625, 2.2501220703125, 2.349365234375, 2.4486083984375, 2.5478515625, 2.6470947265625, 2.746337890625, 2.8455810546875, 2.94482421875, 3.0440673828125, 3.143310546875, 3.2425537109375, 3.341796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 3.0, 2.0, 5.0, 5.0, 8.0, 18.0, 18.0, 25.0, 21.0, 29.0, 30.0, 28.0, 33.0, 32.0, 43.0, 42.0, 47.0, 46.0, 41.0, 35.0, 46.0, 49.0, 40.0, 34.0, 41.0, 29.0, 31.0, 24.0, 35.0, 32.0, 18.0, 15.0, 9.0, 13.0, 15.0, 12.0, 10.0, 6.0, 2.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.041964530944824, -7.7941999435424805, -7.546435356140137, -7.298671245574951, -7.050906658172607, -6.803142070770264, -6.55537748336792, -6.307613372802734, -6.059848785400391, -5.812084197998047, -5.564319610595703, -5.316555500030518, -5.068790912628174, -4.82102632522583, -4.573261737823486, -4.325497627258301, -4.077733039855957, -3.8299684524536133, -3.5822041034698486, -3.334439516067505, -3.0866751670837402, -2.8389105796813965, -2.5911459922790527, -2.343381643295288, -2.0956168174743652, -1.847852349281311, -1.6000878810882568, -1.352323293685913, -1.1045589447021484, -0.8567943572998047, -0.6090298891067505, -0.3612654209136963, -0.11350107192993164, 0.13426341116428375, 0.38202789425849915, 0.6297923922538757, 0.8775568604469299, 1.125321388244629, 1.373085856437683, 1.6208503246307373, 1.8686147928237915, 2.1163792610168457, 2.3641438484191895, 2.611908197402954, 2.859672784805298, 3.1074371337890625, 3.3552017211914062, 3.60296630859375, 3.8507306575775146, 4.098495006561279, 4.346259593963623, 4.594024181365967, 4.8417887687683105, 5.089552879333496, 5.33731746673584, 5.585082054138184, 5.832846641540527, 6.080611228942871, 6.328375816345215, 6.5761399269104, 6.823904514312744, 7.071669101715088, 7.319433689117432, 7.567197799682617, 7.814962387084961]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 7.0, 5.0, 4.0, 5.0, 10.0, 12.0, 11.0, 11.0, 16.0, 13.0, 19.0, 18.0, 25.0, 21.0, 21.0, 31.0, 31.0, 30.0, 32.0, 31.0, 40.0, 29.0, 34.0, 25.0, 32.0, 29.0, 35.0, 41.0, 45.0, 44.0, 17.0, 32.0, 23.0, 20.0, 20.0, 19.0, 24.0, 24.0, 12.0, 15.0, 11.0, 15.0, 8.0, 10.0, 7.0, 6.0, 7.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-7.477407932281494, -7.238779067993164, -7.000150203704834, -6.761521339416504, -6.522892951965332, -6.284264087677002, -6.045635223388672, -5.807006359100342, -5.568377494812012, -5.329748630523682, -5.091119766235352, -4.85249137878418, -4.61386251449585, -4.3752336502075195, -4.1366047859191895, -3.8979759216308594, -3.6593472957611084, -3.4207184314727783, -3.1820898056030273, -2.9434609413146973, -2.704832077026367, -2.466203212738037, -2.227574586868286, -1.988945722579956, -1.7503169775009155, -1.511688232421875, -1.273059368133545, -1.0344306230545044, -0.7958018183708191, -0.5571730136871338, -0.31854426860809326, -0.07991540431976318, 0.15871334075927734, 0.39734214544296265, 0.635970950126648, 0.8745996952056885, 1.1132285594940186, 1.351857304573059, 1.5904860496520996, 1.8291149139404297, 2.0677437782287598, 2.30637264251709, 2.545001268386841, 2.783630132675171, 3.022258996963501, 3.260887622833252, 3.499516487121582, 3.738145351409912, 3.976773977279663, 4.215402603149414, 4.454031467437744, 4.692660331726074, 4.931289196014404, 5.169918060302734, 5.408546447753906, 5.6471757888793945, 5.885804176330566, 6.1244330406188965, 6.363061904907227, 6.601690292358398, 6.8403191566467285, 7.078948020935059, 7.317576885223389, 7.556205749511719, 7.794834613800049]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 15.0, 11.0, 31.0, 43.0, 89.0, 151.0, 269.0, 542.0, 1001.0, 2037.0, 4064.0, 7982.0, 16243.0, 31710.0, 61478.0, 109264.0, 167821.0, 201664.0, 178363.0, 121340.0, 69760.0, 36919.0, 18955.0, 9273.0, 4646.0, 2321.0, 1198.0, 642.0, 312.0, 181.0, 83.0, 55.0, 36.0, 21.0, 11.0, 5.0, 5.0, 0.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.451171875, -1.3986053466796875, -1.346038818359375, -1.2934722900390625, -1.24090576171875, -1.1883392333984375, -1.135772705078125, -1.0832061767578125, -1.0306396484375, -0.9780731201171875, -0.925506591796875, -0.8729400634765625, -0.82037353515625, -0.7678070068359375, -0.715240478515625, -0.6626739501953125, -0.610107421875, -0.5575408935546875, -0.504974365234375, -0.4524078369140625, -0.39984130859375, -0.3472747802734375, -0.294708251953125, -0.2421417236328125, -0.1895751953125, -0.1370086669921875, -0.084442138671875, -0.0318756103515625, 0.02069091796875, 0.0732574462890625, 0.125823974609375, 0.1783905029296875, 0.23095703125, 0.2835235595703125, 0.336090087890625, 0.3886566162109375, 0.44122314453125, 0.4937896728515625, 0.546356201171875, 0.5989227294921875, 0.6514892578125, 0.7040557861328125, 0.756622314453125, 0.8091888427734375, 0.86175537109375, 0.9143218994140625, 0.966888427734375, 1.0194549560546875, 1.072021484375, 1.1245880126953125, 1.177154541015625, 1.2297210693359375, 1.28228759765625, 1.3348541259765625, 1.387420654296875, 1.4399871826171875, 1.4925537109375, 1.5451202392578125, 1.597686767578125, 1.6502532958984375, 1.70281982421875, 1.7553863525390625, 1.807952880859375, 1.8605194091796875, 1.9130859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 6.0, 9.0, 7.0, 7.0, 9.0, 15.0, 6.0, 10.0, 9.0, 17.0, 19.0, 28.0, 24.0, 32.0, 37.0, 29.0, 36.0, 47.0, 30.0, 38.0, 31.0, 29.0, 34.0, 42.0, 47.0, 41.0, 30.0, 36.0, 39.0, 26.0, 22.0, 24.0, 19.0, 22.0, 22.0, 18.0, 14.0, 16.0, 16.0, 11.0, 7.0, 8.0, 8.0, 2.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.1484375, -7.8807373046875, -7.613037109375, -7.3453369140625, -7.07763671875, -6.8099365234375, -6.542236328125, -6.2745361328125, -6.0068359375, -5.7391357421875, -5.471435546875, -5.2037353515625, -4.93603515625, -4.6683349609375, -4.400634765625, -4.1329345703125, -3.865234375, -3.5975341796875, -3.329833984375, -3.0621337890625, -2.79443359375, -2.5267333984375, -2.259033203125, -1.9913330078125, -1.7236328125, -1.4559326171875, -1.188232421875, -0.9205322265625, -0.65283203125, -0.3851318359375, -0.117431640625, 0.1502685546875, 0.41796875, 0.6856689453125, 0.953369140625, 1.2210693359375, 1.48876953125, 1.7564697265625, 2.024169921875, 2.2918701171875, 2.5595703125, 2.8272705078125, 3.094970703125, 3.3626708984375, 3.63037109375, 3.8980712890625, 4.165771484375, 4.4334716796875, 4.701171875, 4.9688720703125, 5.236572265625, 5.5042724609375, 5.77197265625, 6.0396728515625, 6.307373046875, 6.5750732421875, 6.8427734375, 7.1104736328125, 7.378173828125, 7.6458740234375, 7.91357421875, 8.1812744140625, 8.448974609375, 8.7166748046875, 8.984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 16.0, 13.0, 18.0, 31.0, 48.0, 80.0, 92.0, 154.0, 199.0, 382.0, 625.0, 1056.0, 1789.0, 3145.0, 5170.0, 9049.0, 15808.0, 31839.0, 181280.0, 673648.0, 69625.0, 23424.0, 12959.0, 7421.0, 4301.0, 2595.0, 1445.0, 863.0, 521.0, 316.0, 222.0, 133.0, 78.0, 46.0, 52.0, 27.0, 18.0, 18.0, 10.0, 10.0, 5.0, 4.0, 5.0, 2.0, 2.0], "bins": [-3.3828125, -3.29449462890625, -3.2061767578125, -3.11785888671875, -3.029541015625, -2.94122314453125, -2.8529052734375, -2.76458740234375, -2.67626953125, -2.58795166015625, -2.4996337890625, -2.41131591796875, -2.322998046875, -2.23468017578125, -2.1463623046875, -2.05804443359375, -1.9697265625, -1.88140869140625, -1.7930908203125, -1.70477294921875, -1.616455078125, -1.52813720703125, -1.4398193359375, -1.35150146484375, -1.26318359375, -1.17486572265625, -1.0865478515625, -0.99822998046875, -0.909912109375, -0.82159423828125, -0.7332763671875, -0.64495849609375, -0.556640625, -0.46832275390625, -0.3800048828125, -0.29168701171875, -0.203369140625, -0.11505126953125, -0.0267333984375, 0.06158447265625, 0.14990234375, 0.23822021484375, 0.3265380859375, 0.41485595703125, 0.503173828125, 0.59149169921875, 0.6798095703125, 0.76812744140625, 0.8564453125, 0.94476318359375, 1.0330810546875, 1.12139892578125, 1.209716796875, 1.29803466796875, 1.3863525390625, 1.47467041015625, 1.56298828125, 1.65130615234375, 1.7396240234375, 1.82794189453125, 1.916259765625, 2.00457763671875, 2.0928955078125, 2.18121337890625, 2.26953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 3.0, 6.0, 2.0, 5.0, 9.0, 10.0, 7.0, 16.0, 18.0, 19.0, 29.0, 20.0, 24.0, 17.0, 33.0, 27.0, 29.0, 24.0, 31.0, 45.0, 23.0, 41.0, 38.0, 52.0, 28.0, 28.0, 39.0, 34.0, 40.0, 36.0, 33.0, 29.0, 27.0, 18.0, 18.0, 18.0, 26.0, 22.0, 9.0, 12.0, 6.0, 8.0, 7.0, 12.0, 4.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0], "bins": [-5.5859375, -5.4075927734375, -5.229248046875, -5.0509033203125, -4.87255859375, -4.6942138671875, -4.515869140625, -4.3375244140625, -4.1591796875, -3.9808349609375, -3.802490234375, -3.6241455078125, -3.44580078125, -3.2674560546875, -3.089111328125, -2.9107666015625, -2.732421875, -2.5540771484375, -2.375732421875, -2.1973876953125, -2.01904296875, -1.8406982421875, -1.662353515625, -1.4840087890625, -1.3056640625, -1.1273193359375, -0.948974609375, -0.7706298828125, -0.59228515625, -0.4139404296875, -0.235595703125, -0.0572509765625, 0.12109375, 0.2994384765625, 0.477783203125, 0.6561279296875, 0.83447265625, 1.0128173828125, 1.191162109375, 1.3695068359375, 1.5478515625, 1.7261962890625, 1.904541015625, 2.0828857421875, 2.26123046875, 2.4395751953125, 2.617919921875, 2.7962646484375, 2.974609375, 3.1529541015625, 3.331298828125, 3.5096435546875, 3.68798828125, 3.8663330078125, 4.044677734375, 4.2230224609375, 4.4013671875, 4.5797119140625, 4.758056640625, 4.9364013671875, 5.11474609375, 5.2930908203125, 5.471435546875, 5.6497802734375, 5.828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 12.0, 9.0, 24.0, 29.0, 44.0, 55.0, 96.0, 144.0, 219.0, 295.0, 483.0, 857.0, 1359.0, 2460.0, 4121.0, 7626.0, 13757.0, 25766.0, 100055.0, 792290.0, 50662.0, 21458.0, 11405.0, 6425.0, 3678.0, 2077.0, 1176.0, 735.0, 433.0, 289.0, 180.0, 104.0, 72.0, 46.0, 44.0, 16.0, 24.0, 13.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39501953125, -0.38242340087890625, -0.3698272705078125, -0.35723114013671875, -0.344635009765625, -0.33203887939453125, -0.3194427490234375, -0.30684661865234375, -0.29425048828125, -0.28165435791015625, -0.2690582275390625, -0.25646209716796875, -0.243865966796875, -0.23126983642578125, -0.2186737060546875, -0.20607757568359375, -0.1934814453125, -0.18088531494140625, -0.1682891845703125, -0.15569305419921875, -0.143096923828125, -0.13050079345703125, -0.1179046630859375, -0.10530853271484375, -0.09271240234375, -0.08011627197265625, -0.0675201416015625, -0.05492401123046875, -0.042327880859375, -0.02973175048828125, -0.0171356201171875, -0.00453948974609375, 0.008056640625, 0.02065277099609375, 0.0332489013671875, 0.04584503173828125, 0.058441162109375, 0.07103729248046875, 0.0836334228515625, 0.09622955322265625, 0.10882568359375, 0.12142181396484375, 0.1340179443359375, 0.14661407470703125, 0.159210205078125, 0.17180633544921875, 0.1844024658203125, 0.19699859619140625, 0.2095947265625, 0.22219085693359375, 0.2347869873046875, 0.24738311767578125, 0.259979248046875, 0.27257537841796875, 0.2851715087890625, 0.29776763916015625, 0.31036376953125, 0.32295989990234375, 0.3355560302734375, 0.34815216064453125, 0.360748291015625, 0.37334442138671875, 0.3859405517578125, 0.39853668212890625, 0.4111328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 5.0, 3.0, 4.0, 4.0, 11.0, 18.0, 16.0, 32.0, 16.0, 30.0, 34.0, 38.0, 33.0, 60.0, 39.0, 61.0, 50.0, 41.0, 50.0, 57.0, 57.0, 34.0, 63.0, 34.0, 33.0, 22.0, 28.0, 26.0, 18.0, 14.0, 19.0, 11.0, 7.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.531839370727539e-05, -1.4890916645526886e-05, -1.4463439583778381e-05, -1.4035962522029877e-05, -1.3608485460281372e-05, -1.3181008398532867e-05, -1.2753531336784363e-05, -1.2326054275035858e-05, -1.1898577213287354e-05, -1.1471100151538849e-05, -1.1043623089790344e-05, -1.061614602804184e-05, -1.0188668966293335e-05, -9.76119190454483e-06, -9.333714842796326e-06, -8.906237781047821e-06, -8.478760719299316e-06, -8.051283657550812e-06, -7.623806595802307e-06, -7.1963295340538025e-06, -6.768852472305298e-06, -6.341375410556793e-06, -5.9138983488082886e-06, -5.486421287059784e-06, -5.058944225311279e-06, -4.631467163562775e-06, -4.20399010181427e-06, -3.7765130400657654e-06, -3.3490359783172607e-06, -2.921558916568756e-06, -2.4940818548202515e-06, -2.066604793071747e-06, -1.6391277313232422e-06, -1.2116506695747375e-06, -7.841736078262329e-07, -3.5669654607772827e-07, 7.078051567077637e-08, 4.98257577419281e-07, 9.257346391677856e-07, 1.3532117009162903e-06, 1.780688762664795e-06, 2.2081658244132996e-06, 2.635642886161804e-06, 3.063119947910309e-06, 3.4905970096588135e-06, 3.918074071407318e-06, 4.345551133155823e-06, 4.773028194904327e-06, 5.200505256652832e-06, 5.627982318401337e-06, 6.055459380149841e-06, 6.482936441898346e-06, 6.910413503646851e-06, 7.337890565395355e-06, 7.76536762714386e-06, 8.192844688892365e-06, 8.620321750640869e-06, 9.047798812389374e-06, 9.475275874137878e-06, 9.902752935886383e-06, 1.0330229997634888e-05, 1.0757707059383392e-05, 1.1185184121131897e-05, 1.1612661182880402e-05, 1.2040138244628906e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 10.0, 19.0, 26.0, 44.0, 65.0, 117.0, 153.0, 203.0, 364.0, 568.0, 878.0, 1270.0, 1976.0, 2878.0, 4552.0, 6823.0, 10285.0, 15832.0, 24779.0, 37925.0, 57638.0, 87065.0, 123261.0, 154185.0, 152398.0, 120345.0, 84206.0, 55799.0, 36449.0, 23692.0, 15424.0, 10246.0, 6549.0, 4281.0, 2902.0, 1830.0, 1207.0, 781.0, 537.0, 360.0, 211.0, 152.0, 120.0, 60.0, 32.0, 26.0, 18.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28125, -0.2724494934082031, -0.26364898681640625, -0.2548484802246094, -0.2460479736328125, -0.23724746704101562, -0.22844696044921875, -0.21964645385742188, -0.210845947265625, -0.20204544067382812, -0.19324493408203125, -0.18444442749023438, -0.1756439208984375, -0.16684341430664062, -0.15804290771484375, -0.14924240112304688, -0.14044189453125, -0.13164138793945312, -0.12284088134765625, -0.11404037475585938, -0.1052398681640625, -0.09643936157226562, -0.08763885498046875, -0.07883834838867188, -0.070037841796875, -0.061237335205078125, -0.05243682861328125, -0.043636322021484375, -0.0348358154296875, -0.026035308837890625, -0.01723480224609375, -0.008434295654296875, 0.0003662109375, 0.009166717529296875, 0.01796722412109375, 0.026767730712890625, 0.0355682373046875, 0.044368743896484375, 0.05316925048828125, 0.061969757080078125, 0.070770263671875, 0.07957077026367188, 0.08837127685546875, 0.09717178344726562, 0.1059722900390625, 0.11477279663085938, 0.12357330322265625, 0.13237380981445312, 0.14117431640625, 0.14997482299804688, 0.15877532958984375, 0.16757583618164062, 0.1763763427734375, 0.18517684936523438, 0.19397735595703125, 0.20277786254882812, 0.211578369140625, 0.22037887573242188, 0.22917938232421875, 0.23797988891601562, 0.2467803955078125, 0.2555809020996094, 0.26438140869140625, 0.2731819152832031, 0.281982421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 9.0, 4.0, 8.0, 11.0, 13.0, 22.0, 16.0, 19.0, 17.0, 22.0, 37.0, 22.0, 44.0, 36.0, 33.0, 32.0, 51.0, 35.0, 43.0, 50.0, 43.0, 48.0, 40.0, 35.0, 44.0, 40.0, 23.0, 18.0, 23.0, 20.0, 14.0, 21.0, 10.0, 13.0, 10.0, 13.0, 11.0, 13.0, 6.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0965576171875, -0.0932912826538086, -0.09002494812011719, -0.08675861358642578, -0.08349227905273438, -0.08022594451904297, -0.07695960998535156, -0.07369327545166016, -0.07042694091796875, -0.06716060638427734, -0.06389427185058594, -0.06062793731689453, -0.057361602783203125, -0.05409526824951172, -0.05082893371582031, -0.047562599182128906, -0.0442962646484375, -0.041029930114746094, -0.03776359558105469, -0.03449726104736328, -0.031230926513671875, -0.02796459197998047, -0.024698257446289062, -0.021431922912597656, -0.01816558837890625, -0.014899253845214844, -0.011632919311523438, -0.008366584777832031, -0.005100250244140625, -0.0018339157104492188, 0.0014324188232421875, 0.004698753356933594, 0.007965087890625, 0.011231422424316406, 0.014497756958007812, 0.01776409149169922, 0.021030426025390625, 0.02429676055908203, 0.027563095092773438, 0.030829429626464844, 0.03409576416015625, 0.037362098693847656, 0.04062843322753906, 0.04389476776123047, 0.047161102294921875, 0.05042743682861328, 0.05369377136230469, 0.056960105895996094, 0.0602264404296875, 0.0634927749633789, 0.06675910949707031, 0.07002544403076172, 0.07329177856445312, 0.07655811309814453, 0.07982444763183594, 0.08309078216552734, 0.08635711669921875, 0.08962345123291016, 0.09288978576660156, 0.09615612030029297, 0.09942245483398438, 0.10268878936767578, 0.10595512390136719, 0.1092214584350586, 0.11248779296875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 5.0, 4.0, 2.0, 6.0, 7.0, 11.0, 18.0, 20.0, 15.0, 28.0, 26.0, 34.0, 32.0, 34.0, 41.0, 34.0, 48.0, 46.0, 49.0, 38.0, 35.0, 48.0, 50.0, 34.0, 43.0, 31.0, 36.0, 32.0, 18.0, 38.0, 23.0, 18.0, 13.0, 8.0, 12.0, 12.0, 17.0, 7.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.928347110748291, -7.68032169342041, -7.432296276092529, -7.184270858764648, -6.936245918273926, -6.688220024108887, -6.440195083618164, -6.192169666290283, -5.944144248962402, -5.6961188316345215, -5.448093414306641, -5.20006799697876, -4.952042579650879, -4.704017639160156, -4.455992221832275, -4.2079668045043945, -3.9599413871765137, -3.711915969848633, -3.463890552520752, -3.21586537361145, -2.9678399562835693, -2.7198145389556885, -2.4717893600463867, -2.223763942718506, -1.975738525390625, -1.7277131080627441, -1.4796878099441528, -1.2316625118255615, -0.9836370944976807, -0.7356116771697998, -0.4875863790512085, -0.2395610809326172, 0.008463859558105469, 0.25648921728134155, 0.5045145750045776, 0.7525399327278137, 1.0005652904510498, 1.2485907077789307, 1.496616005897522, 1.7446413040161133, 1.9926667213439941, 2.240692138671875, 2.488717555999756, 2.7367427349090576, 2.9847681522369385, 3.2327935695648193, 3.480818748474121, 3.728844165802002, 3.976869583129883, 4.224895000457764, 4.4729204177856445, 4.720945835113525, 4.968971252441406, 5.216996192932129, 5.46502161026001, 5.713047027587891, 5.9610724449157715, 6.209097862243652, 6.457123279571533, 6.705148696899414, 6.953173637390137, 7.201199531555176, 7.449224472045898, 7.697249889373779, 7.94527530670166]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 6.0, 5.0, 6.0, 4.0, 9.0, 12.0, 10.0, 13.0, 15.0, 16.0, 15.0, 21.0, 24.0, 19.0, 23.0, 29.0, 35.0, 23.0, 35.0, 29.0, 42.0, 30.0, 35.0, 28.0, 27.0, 27.0, 40.0, 39.0, 39.0, 51.0, 14.0, 31.0, 27.0, 21.0, 20.0, 17.0, 25.0, 25.0, 12.0, 12.0, 13.0, 16.0, 6.0, 12.0, 6.0, 7.0, 6.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-7.467939376831055, -7.229875087738037, -6.991811275482178, -6.75374698638916, -6.515683174133301, -6.277618885040283, -6.039554595947266, -5.801490783691406, -5.563426971435547, -5.325362682342529, -5.08729887008667, -4.849234580993652, -4.611170768737793, -4.373106479644775, -4.135042190551758, -3.8969783782958984, -3.658914089202881, -3.4208500385284424, -3.182785987854004, -2.9447216987609863, -2.706657886505127, -2.4685935974121094, -2.230529546737671, -1.9924654960632324, -1.754401445388794, -1.5163373947143555, -1.278273344039917, -1.040209174156189, -0.8021451234817505, -0.564081072807312, -0.326016902923584, -0.08795285224914551, 0.15011119842529297, 0.38817527890205383, 0.6262393593788147, 0.864303469657898, 1.1023675203323364, 1.340431571006775, 1.578495740890503, 1.8165597915649414, 2.05462384223938, 2.2926878929138184, 2.530751943588257, 2.7688159942626953, 3.006880283355713, 3.2449440956115723, 3.48300838470459, 3.7210724353790283, 3.959136486053467, 4.197200775146484, 4.435264587402344, 4.673328876495361, 4.911392688751221, 5.149456977844238, 5.387520790100098, 5.625585079193115, 5.863649368286133, 6.10171365737915, 6.33977746963501, 6.577841758728027, 6.815905570983887, 7.053969860076904, 7.292034149169922, 7.530097961425781, 7.768161773681641]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 11.0, 26.0, 33.0, 67.0, 74.0, 118.0, 228.0, 357.0, 482.0, 790.0, 1275.0, 1891.0, 3150.0, 4729.0, 7241.0, 10884.0, 16328.0, 23965.0, 33901.0, 46144.0, 60845.0, 76198.0, 89891.0, 99724.0, 102874.0, 98900.0, 89103.0, 74882.0, 58822.0, 44857.0, 32485.0, 22609.0, 15673.0, 10352.0, 7011.0, 4499.0, 2963.0, 1853.0, 1166.0, 791.0, 489.0, 316.0, 202.0, 116.0, 81.0, 50.0, 30.0, 33.0, 18.0, 9.0, 2.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.08984375, -3.95550537109375, -3.8211669921875, -3.68682861328125, -3.552490234375, -3.41815185546875, -3.2838134765625, -3.14947509765625, -3.01513671875, -2.88079833984375, -2.7464599609375, -2.61212158203125, -2.477783203125, -2.34344482421875, -2.2091064453125, -2.07476806640625, -1.9404296875, -1.80609130859375, -1.6717529296875, -1.53741455078125, -1.403076171875, -1.26873779296875, -1.1343994140625, -1.00006103515625, -0.86572265625, -0.73138427734375, -0.5970458984375, -0.46270751953125, -0.328369140625, -0.19403076171875, -0.0596923828125, 0.07464599609375, 0.208984375, 0.34332275390625, 0.4776611328125, 0.61199951171875, 0.746337890625, 0.88067626953125, 1.0150146484375, 1.14935302734375, 1.28369140625, 1.41802978515625, 1.5523681640625, 1.68670654296875, 1.821044921875, 1.95538330078125, 2.0897216796875, 2.22406005859375, 2.3583984375, 2.49273681640625, 2.6270751953125, 2.76141357421875, 2.895751953125, 3.03009033203125, 3.1644287109375, 3.29876708984375, 3.43310546875, 3.56744384765625, 3.7017822265625, 3.83612060546875, 3.970458984375, 4.10479736328125, 4.2391357421875, 4.37347412109375, 4.5078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 4.0, 12.0, 4.0, 5.0, 10.0, 15.0, 11.0, 13.0, 13.0, 25.0, 22.0, 24.0, 30.0, 30.0, 29.0, 30.0, 32.0, 39.0, 39.0, 45.0, 32.0, 37.0, 34.0, 45.0, 33.0, 40.0, 26.0, 35.0, 30.0, 22.0, 25.0, 31.0, 30.0, 25.0, 21.0, 12.0, 17.0, 10.0, 10.0, 12.0, 9.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.461181640625, -7.19580078125, -6.930419921875, -6.6650390625, -6.399658203125, -6.13427734375, -5.868896484375, -5.603515625, -5.338134765625, -5.07275390625, -4.807373046875, -4.5419921875, -4.276611328125, -4.01123046875, -3.745849609375, -3.48046875, -3.215087890625, -2.94970703125, -2.684326171875, -2.4189453125, -2.153564453125, -1.88818359375, -1.622802734375, -1.357421875, -1.092041015625, -0.82666015625, -0.561279296875, -0.2958984375, -0.030517578125, 0.23486328125, 0.500244140625, 0.765625, 1.031005859375, 1.29638671875, 1.561767578125, 1.8271484375, 2.092529296875, 2.35791015625, 2.623291015625, 2.888671875, 3.154052734375, 3.41943359375, 3.684814453125, 3.9501953125, 4.215576171875, 4.48095703125, 4.746337890625, 5.01171875, 5.277099609375, 5.54248046875, 5.807861328125, 6.0732421875, 6.338623046875, 6.60400390625, 6.869384765625, 7.134765625, 7.400146484375, 7.66552734375, 7.930908203125, 8.1962890625, 8.461669921875, 8.72705078125, 8.992431640625, 9.2578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 10.0, 26.0, 31.0, 50.0, 64.0, 128.0, 201.0, 269.0, 478.0, 811.0, 1170.0, 1810.0, 2901.0, 4156.0, 6554.0, 9733.0, 14556.0, 21125.0, 30521.0, 42205.0, 56773.0, 72403.0, 87677.0, 99809.0, 103985.0, 101700.0, 92210.0, 78408.0, 62776.0, 47092.0, 34476.0, 24461.0, 16815.0, 11351.0, 7578.0, 4907.0, 3343.0, 2142.0, 1380.0, 937.0, 571.0, 359.0, 200.0, 139.0, 88.0, 66.0, 37.0, 28.0, 11.0, 10.0, 9.0, 7.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.8515625, -4.703125, -4.5546875, -4.40625, -4.2578125, -4.109375, -3.9609375, -3.8125, -3.6640625, -3.515625, -3.3671875, -3.21875, -3.0703125, -2.921875, -2.7734375, -2.625, -2.4765625, -2.328125, -2.1796875, -2.03125, -1.8828125, -1.734375, -1.5859375, -1.4375, -1.2890625, -1.140625, -0.9921875, -0.84375, -0.6953125, -0.546875, -0.3984375, -0.25, -0.1015625, 0.046875, 0.1953125, 0.34375, 0.4921875, 0.640625, 0.7890625, 0.9375, 1.0859375, 1.234375, 1.3828125, 1.53125, 1.6796875, 1.828125, 1.9765625, 2.125, 2.2734375, 2.421875, 2.5703125, 2.71875, 2.8671875, 3.015625, 3.1640625, 3.3125, 3.4609375, 3.609375, 3.7578125, 3.90625, 4.0546875, 4.203125, 4.3515625, 4.5, 4.6484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 8.0, 16.0, 16.0, 10.0, 9.0, 23.0, 25.0, 28.0, 25.0, 26.0, 33.0, 34.0, 50.0, 37.0, 44.0, 42.0, 56.0, 34.0, 36.0, 45.0, 31.0, 35.0, 37.0, 26.0, 43.0, 18.0, 29.0, 26.0, 21.0, 22.0, 11.0, 10.0, 8.0, 10.0, 5.0, 12.0, 13.0, 9.0, 3.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.4765625, -6.2877197265625, -6.098876953125, -5.9100341796875, -5.72119140625, -5.5323486328125, -5.343505859375, -5.1546630859375, -4.9658203125, -4.7769775390625, -4.588134765625, -4.3992919921875, -4.21044921875, -4.0216064453125, -3.832763671875, -3.6439208984375, -3.455078125, -3.2662353515625, -3.077392578125, -2.8885498046875, -2.69970703125, -2.5108642578125, -2.322021484375, -2.1331787109375, -1.9443359375, -1.7554931640625, -1.566650390625, -1.3778076171875, -1.18896484375, -1.0001220703125, -0.811279296875, -0.6224365234375, -0.43359375, -0.2447509765625, -0.055908203125, 0.1329345703125, 0.32177734375, 0.5106201171875, 0.699462890625, 0.8883056640625, 1.0771484375, 1.2659912109375, 1.454833984375, 1.6436767578125, 1.83251953125, 2.0213623046875, 2.210205078125, 2.3990478515625, 2.587890625, 2.7767333984375, 2.965576171875, 3.1544189453125, 3.34326171875, 3.5321044921875, 3.720947265625, 3.9097900390625, 4.0986328125, 4.2874755859375, 4.476318359375, 4.6651611328125, 4.85400390625, 5.0428466796875, 5.231689453125, 5.4205322265625, 5.609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 16.0, 24.0, 32.0, 42.0, 74.0, 103.0, 167.0, 275.0, 385.0, 621.0, 996.0, 1563.0, 2444.0, 3535.0, 5368.0, 8525.0, 12835.0, 19073.0, 27672.0, 39360.0, 52731.0, 68250.0, 82997.0, 95746.0, 103093.0, 102372.0, 95336.0, 83149.0, 67411.0, 52358.0, 38876.0, 27525.0, 18898.0, 12639.0, 8353.0, 5637.0, 3541.0, 2324.0, 1506.0, 944.0, 628.0, 384.0, 249.0, 188.0, 108.0, 62.0, 44.0, 36.0, 19.0, 11.0, 9.0, 6.0, 10.0], "bins": [-1.95703125, -1.90264892578125, -1.8482666015625, -1.79388427734375, -1.739501953125, -1.68511962890625, -1.6307373046875, -1.57635498046875, -1.52197265625, -1.46759033203125, -1.4132080078125, -1.35882568359375, -1.304443359375, -1.25006103515625, -1.1956787109375, -1.14129638671875, -1.0869140625, -1.03253173828125, -0.9781494140625, -0.92376708984375, -0.869384765625, -0.81500244140625, -0.7606201171875, -0.70623779296875, -0.65185546875, -0.59747314453125, -0.5430908203125, -0.48870849609375, -0.434326171875, -0.37994384765625, -0.3255615234375, -0.27117919921875, -0.216796875, -0.16241455078125, -0.1080322265625, -0.05364990234375, 0.000732421875, 0.05511474609375, 0.1094970703125, 0.16387939453125, 0.21826171875, 0.27264404296875, 0.3270263671875, 0.38140869140625, 0.435791015625, 0.49017333984375, 0.5445556640625, 0.59893798828125, 0.6533203125, 0.70770263671875, 0.7620849609375, 0.81646728515625, 0.870849609375, 0.92523193359375, 0.9796142578125, 1.03399658203125, 1.08837890625, 1.14276123046875, 1.1971435546875, 1.25152587890625, 1.305908203125, 1.36029052734375, 1.4146728515625, 1.46905517578125, 1.5234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 8.0, 14.0, 9.0, 18.0, 18.0, 23.0, 22.0, 28.0, 39.0, 27.0, 43.0, 34.0, 42.0, 41.0, 57.0, 49.0, 47.0, 41.0, 59.0, 38.0, 48.0, 39.0, 40.0, 28.0, 17.0, 25.0, 21.0, 18.0, 24.0, 13.0, 11.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021839141845703125, -0.00021095946431159973, -0.0002035275101661682, -0.0001960955560207367, -0.00018866360187530518, -0.00018123164772987366, -0.00017379969358444214, -0.00016636773943901062, -0.0001589357852935791, -0.00015150383114814758, -0.00014407187700271606, -0.00013663992285728455, -0.00012920796871185303, -0.00012177601456642151, -0.00011434406042098999, -0.00010691210627555847, -9.948015213012695e-05, -9.204819798469543e-05, -8.461624383926392e-05, -7.71842896938324e-05, -6.975233554840088e-05, -6.232038140296936e-05, -5.488842725753784e-05, -4.745647311210632e-05, -4.0024518966674805e-05, -3.2592564821243286e-05, -2.5160610675811768e-05, -1.772865653038025e-05, -1.029670238494873e-05, -2.864748239517212e-06, 4.567205905914307e-06, 1.1999160051345825e-05, 1.9431114196777344e-05, 2.6863068342208862e-05, 3.429502248764038e-05, 4.17269766330719e-05, 4.915893077850342e-05, 5.6590884923934937e-05, 6.402283906936646e-05, 7.145479321479797e-05, 7.888674736022949e-05, 8.631870150566101e-05, 9.375065565109253e-05, 0.00010118260979652405, 0.00010861456394195557, 0.00011604651808738708, 0.0001234784722328186, 0.00013091042637825012, 0.00013834238052368164, 0.00014577433466911316, 0.00015320628881454468, 0.0001606382429599762, 0.00016807019710540771, 0.00017550215125083923, 0.00018293410539627075, 0.00019036605954170227, 0.0001977980136871338, 0.0002052299678325653, 0.00021266192197799683, 0.00022009387612342834, 0.00022752583026885986, 0.00023495778441429138, 0.0002423897385597229, 0.0002498216927051544, 0.00025725364685058594]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 2.0, 8.0, 13.0, 23.0, 37.0, 88.0, 110.0, 206.0, 320.0, 570.0, 887.0, 1504.0, 2517.0, 4202.0, 7291.0, 12235.0, 20352.0, 33275.0, 51673.0, 74825.0, 101523.0, 123024.0, 133184.0, 127667.0, 110120.0, 84351.0, 59384.0, 38853.0, 24225.0, 14776.0, 8673.0, 5147.0, 3018.0, 1760.0, 1100.0, 678.0, 364.0, 232.0, 138.0, 68.0, 65.0, 36.0, 15.0, 10.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3046875, -2.22955322265625, -2.1544189453125, -2.07928466796875, -2.004150390625, -1.92901611328125, -1.8538818359375, -1.77874755859375, -1.70361328125, -1.62847900390625, -1.5533447265625, -1.47821044921875, -1.403076171875, -1.32794189453125, -1.2528076171875, -1.17767333984375, -1.1025390625, -1.02740478515625, -0.9522705078125, -0.87713623046875, -0.802001953125, -0.72686767578125, -0.6517333984375, -0.57659912109375, -0.50146484375, -0.42633056640625, -0.3511962890625, -0.27606201171875, -0.200927734375, -0.12579345703125, -0.0506591796875, 0.02447509765625, 0.099609375, 0.17474365234375, 0.2498779296875, 0.32501220703125, 0.400146484375, 0.47528076171875, 0.5504150390625, 0.62554931640625, 0.70068359375, 0.77581787109375, 0.8509521484375, 0.92608642578125, 1.001220703125, 1.07635498046875, 1.1514892578125, 1.22662353515625, 1.3017578125, 1.37689208984375, 1.4520263671875, 1.52716064453125, 1.602294921875, 1.67742919921875, 1.7525634765625, 1.82769775390625, 1.90283203125, 1.97796630859375, 2.0531005859375, 2.12823486328125, 2.203369140625, 2.27850341796875, 2.3536376953125, 2.42877197265625, 2.50390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 6.0, 7.0, 9.0, 11.0, 12.0, 18.0, 14.0, 22.0, 35.0, 28.0, 28.0, 37.0, 32.0, 40.0, 48.0, 53.0, 37.0, 44.0, 37.0, 40.0, 44.0, 43.0, 38.0, 22.0, 29.0, 45.0, 31.0, 27.0, 22.0, 21.0, 16.0, 13.0, 19.0, 9.0, 10.0, 3.0, 9.0, 2.0, 4.0, 5.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88427734375, -0.856048583984375, -0.82781982421875, -0.799591064453125, -0.7713623046875, -0.743133544921875, -0.71490478515625, -0.686676025390625, -0.658447265625, -0.630218505859375, -0.60198974609375, -0.573760986328125, -0.5455322265625, -0.517303466796875, -0.48907470703125, -0.460845947265625, -0.4326171875, -0.404388427734375, -0.37615966796875, -0.347930908203125, -0.3197021484375, -0.291473388671875, -0.26324462890625, -0.235015869140625, -0.206787109375, -0.178558349609375, -0.15032958984375, -0.122100830078125, -0.0938720703125, -0.065643310546875, -0.03741455078125, -0.009185791015625, 0.01904296875, 0.047271728515625, 0.07550048828125, 0.103729248046875, 0.1319580078125, 0.160186767578125, 0.18841552734375, 0.216644287109375, 0.244873046875, 0.273101806640625, 0.30133056640625, 0.329559326171875, 0.3577880859375, 0.386016845703125, 0.41424560546875, 0.442474365234375, 0.470703125, 0.498931884765625, 0.52716064453125, 0.555389404296875, 0.5836181640625, 0.611846923828125, 0.64007568359375, 0.668304443359375, 0.696533203125, 0.724761962890625, 0.75299072265625, 0.781219482421875, 0.8094482421875, 0.837677001953125, 0.86590576171875, 0.894134521484375, 0.92236328125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 11.0, 11.0, 16.0, 18.0, 22.0, 23.0, 22.0, 36.0, 33.0, 31.0, 51.0, 39.0, 46.0, 37.0, 51.0, 38.0, 52.0, 48.0, 52.0, 45.0, 35.0, 32.0, 31.0, 25.0, 31.0, 18.0, 22.0, 12.0, 20.0, 9.0, 14.0, 4.0, 4.0, 13.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.693584442138672, -7.441046237945557, -7.188507556915283, -6.935969352722168, -6.6834306716918945, -6.430892467498779, -6.178354263305664, -5.925815582275391, -5.673277378082275, -5.42073917388916, -5.168200492858887, -4.9156622886657715, -4.663124084472656, -4.410585403442383, -4.158047199249268, -3.9055087566375732, -3.652970314025879, -3.4004318714141846, -3.1478934288024902, -2.895355224609375, -2.6428167819976807, -2.3902783393859863, -2.137740135192871, -1.8852016925811768, -1.6326632499694824, -1.380124807357788, -1.1275864839553833, -0.8750481009483337, -0.6225097179412842, -0.36997127532958984, -0.11743295192718506, 0.13510537147521973, 0.38764286041259766, 0.6401812434196472, 0.8927196264266968, 1.1452579498291016, 1.397796392440796, 1.6503348350524902, 1.902873158454895, 2.1554114818573, 2.407949924468994, 2.6604883670806885, 2.913026809692383, 3.165565013885498, 3.4181034564971924, 3.6706418991088867, 3.923180103302002, 4.175718307495117, 4.428256988525391, 4.680795192718506, 4.933333873748779, 5.1858720779418945, 5.438410758972168, 5.690948963165283, 5.943487167358398, 6.196025848388672, 6.448564052581787, 6.701102256774902, 6.953640937805176, 7.206179141998291, 7.458717346191406, 7.71125602722168, 7.963794231414795, 8.21633243560791, 8.468871116638184]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 8.0, 4.0, 8.0, 14.0, 10.0, 8.0, 13.0, 18.0, 19.0, 24.0, 16.0, 22.0, 25.0, 26.0, 36.0, 45.0, 34.0, 32.0, 29.0, 43.0, 30.0, 53.0, 35.0, 37.0, 39.0, 38.0, 34.0, 29.0, 31.0, 31.0, 20.0, 29.0, 26.0, 17.0, 25.0, 14.0, 11.0, 9.0, 11.0, 14.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.92663860321045, -8.634382247924805, -8.342124938964844, -8.0498685836792, -7.757611274719238, -7.465354919433594, -7.173098087310791, -6.880841255187988, -6.5885844230651855, -6.296327590942383, -6.00407075881958, -5.711813926696777, -5.419557571411133, -5.127300262451172, -4.835043907165527, -4.542787075042725, -4.250530242919922, -3.958273410797119, -3.6660165786743164, -3.3737599849700928, -3.08150315284729, -2.7892463207244873, -2.4969897270202637, -2.204732894897461, -1.9124760627746582, -1.6202192306518555, -1.3279625177383423, -1.035705804824829, -0.7434489727020264, -0.45119214057922363, -0.15893542766571045, 0.13332128524780273, 0.42557811737060547, 0.7178348898887634, 1.0100916624069214, 1.3023483753204346, 1.5946052074432373, 1.88686203956604, 2.1791186332702637, 2.4713754653930664, 2.763632297515869, 3.055889129638672, 3.3481459617614746, 3.6404025554656982, 3.932659387588501, 4.224916458129883, 4.517172813415527, 4.80942964553833, 5.101686477661133, 5.3939433097839355, 5.686200141906738, 5.978456974029541, 6.270713806152344, 6.562970161437988, 6.855226993560791, 7.147483825683594, 7.4397406578063965, 7.731997489929199, 8.024253845214844, 8.316511154174805, 8.60876750946045, 8.90102481842041, 9.193281173706055, 9.485538482666016, 9.77779483795166]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 11.0, 9.0, 30.0, 27.0, 54.0, 55.0, 91.0, 137.0, 200.0, 359.0, 495.0, 731.0, 1157.0, 1739.0, 2788.0, 4526.0, 7349.0, 12112.0, 20186.0, 35150.0, 62621.0, 113206.0, 203183.0, 344364.0, 523847.0, 671296.0, 690997.0, 569327.0, 387708.0, 232835.0, 130863.0, 72820.0, 41053.0, 23879.0, 14200.0, 8627.0, 5417.0, 3379.0, 2357.0, 1495.0, 1044.0, 661.0, 493.0, 379.0, 282.0, 208.0, 148.0, 102.0, 69.0, 55.0, 49.0, 29.0, 20.0, 21.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 4.0], "bins": [-7.36328125, -7.11053466796875, -6.8577880859375, -6.60504150390625, -6.352294921875, -6.09954833984375, -5.8468017578125, -5.59405517578125, -5.34130859375, -5.08856201171875, -4.8358154296875, -4.58306884765625, -4.330322265625, -4.07757568359375, -3.8248291015625, -3.57208251953125, -3.3193359375, -3.06658935546875, -2.8138427734375, -2.56109619140625, -2.308349609375, -2.05560302734375, -1.8028564453125, -1.55010986328125, -1.29736328125, -1.04461669921875, -0.7918701171875, -0.53912353515625, -0.286376953125, -0.03363037109375, 0.2191162109375, 0.47186279296875, 0.724609375, 0.97735595703125, 1.2301025390625, 1.48284912109375, 1.735595703125, 1.98834228515625, 2.2410888671875, 2.49383544921875, 2.74658203125, 2.99932861328125, 3.2520751953125, 3.50482177734375, 3.757568359375, 4.01031494140625, 4.2630615234375, 4.51580810546875, 4.7685546875, 5.02130126953125, 5.2740478515625, 5.52679443359375, 5.779541015625, 6.03228759765625, 6.2850341796875, 6.53778076171875, 6.79052734375, 7.04327392578125, 7.2960205078125, 7.54876708984375, 7.801513671875, 8.05426025390625, 8.3070068359375, 8.55975341796875, 8.8125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 7.0, 10.0, 11.0, 16.0, 10.0, 17.0, 15.0, 18.0, 26.0, 23.0, 27.0, 26.0, 32.0, 36.0, 47.0, 29.0, 44.0, 37.0, 40.0, 45.0, 32.0, 35.0, 39.0, 32.0, 37.0, 39.0, 27.0, 29.0, 23.0, 26.0, 28.0, 17.0, 17.0, 22.0, 9.0, 13.0, 10.0, 8.0, 7.0, 9.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0625, -7.7884521484375, -7.514404296875, -7.2403564453125, -6.96630859375, -6.6922607421875, -6.418212890625, -6.1441650390625, -5.8701171875, -5.5960693359375, -5.322021484375, -5.0479736328125, -4.77392578125, -4.4998779296875, -4.225830078125, -3.9517822265625, -3.677734375, -3.4036865234375, -3.129638671875, -2.8555908203125, -2.58154296875, -2.3074951171875, -2.033447265625, -1.7593994140625, -1.4853515625, -1.2113037109375, -0.937255859375, -0.6632080078125, -0.38916015625, -0.1151123046875, 0.158935546875, 0.4329833984375, 0.70703125, 0.9810791015625, 1.255126953125, 1.5291748046875, 1.80322265625, 2.0772705078125, 2.351318359375, 2.6253662109375, 2.8994140625, 3.1734619140625, 3.447509765625, 3.7215576171875, 3.99560546875, 4.2696533203125, 4.543701171875, 4.8177490234375, 5.091796875, 5.3658447265625, 5.639892578125, 5.9139404296875, 6.18798828125, 6.4620361328125, 6.736083984375, 7.0101318359375, 7.2841796875, 7.5582275390625, 7.832275390625, 8.1063232421875, 8.38037109375, 8.6544189453125, 8.928466796875, 9.2025146484375, 9.4765625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 11.0, 14.0, 20.0, 27.0, 38.0, 63.0, 105.0, 167.0, 244.0, 396.0, 579.0, 863.0, 1420.0, 2308.0, 3889.0, 6554.0, 11512.0, 20833.0, 39032.0, 76035.0, 149406.0, 283658.0, 490468.0, 711953.0, 792944.0, 663907.0, 431446.0, 241360.0, 125753.0, 63890.0, 33184.0, 17756.0, 9898.0, 5657.0, 3440.0, 1990.0, 1270.0, 788.0, 507.0, 310.0, 200.0, 131.0, 99.0, 58.0, 41.0, 21.0, 16.0, 12.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.2421875, -10.8948974609375, -10.547607421875, -10.2003173828125, -9.85302734375, -9.5057373046875, -9.158447265625, -8.8111572265625, -8.4638671875, -8.1165771484375, -7.769287109375, -7.4219970703125, -7.07470703125, -6.7274169921875, -6.380126953125, -6.0328369140625, -5.685546875, -5.3382568359375, -4.990966796875, -4.6436767578125, -4.29638671875, -3.9490966796875, -3.601806640625, -3.2545166015625, -2.9072265625, -2.5599365234375, -2.212646484375, -1.8653564453125, -1.51806640625, -1.1707763671875, -0.823486328125, -0.4761962890625, -0.12890625, 0.2183837890625, 0.565673828125, 0.9129638671875, 1.26025390625, 1.6075439453125, 1.954833984375, 2.3021240234375, 2.6494140625, 2.9967041015625, 3.343994140625, 3.6912841796875, 4.03857421875, 4.3858642578125, 4.733154296875, 5.0804443359375, 5.427734375, 5.7750244140625, 6.122314453125, 6.4696044921875, 6.81689453125, 7.1641845703125, 7.511474609375, 7.8587646484375, 8.2060546875, 8.5533447265625, 8.900634765625, 9.2479248046875, 9.59521484375, 9.9425048828125, 10.289794921875, 10.6370849609375, 10.984375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 13.0, 13.0, 8.0, 23.0, 37.0, 29.0, 37.0, 52.0, 78.0, 107.0, 116.0, 132.0, 167.0, 202.0, 187.0, 229.0, 249.0, 265.0, 263.0, 243.0, 243.0, 227.0, 182.0, 182.0, 160.0, 137.0, 113.0, 77.0, 60.0, 65.0, 60.0, 26.0, 24.0, 16.0, 16.0, 9.0, 9.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.91229248046875, -3.7698974609375, -3.62750244140625, -3.485107421875, -3.34271240234375, -3.2003173828125, -3.05792236328125, -2.91552734375, -2.77313232421875, -2.6307373046875, -2.48834228515625, -2.345947265625, -2.20355224609375, -2.0611572265625, -1.91876220703125, -1.7763671875, -1.63397216796875, -1.4915771484375, -1.34918212890625, -1.206787109375, -1.06439208984375, -0.9219970703125, -0.77960205078125, -0.63720703125, -0.49481201171875, -0.3524169921875, -0.21002197265625, -0.067626953125, 0.07476806640625, 0.2171630859375, 0.35955810546875, 0.501953125, 0.64434814453125, 0.7867431640625, 0.92913818359375, 1.071533203125, 1.21392822265625, 1.3563232421875, 1.49871826171875, 1.64111328125, 1.78350830078125, 1.9259033203125, 2.06829833984375, 2.210693359375, 2.35308837890625, 2.4954833984375, 2.63787841796875, 2.7802734375, 2.92266845703125, 3.0650634765625, 3.20745849609375, 3.349853515625, 3.49224853515625, 3.6346435546875, 3.77703857421875, 3.91943359375, 4.06182861328125, 4.2042236328125, 4.34661865234375, 4.489013671875, 4.63140869140625, 4.7738037109375, 4.91619873046875, 5.05859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 19.0, 12.0, 9.0, 12.0, 21.0, 24.0, 23.0, 34.0, 35.0, 51.0, 37.0, 63.0, 64.0, 47.0, 52.0, 58.0, 53.0, 54.0, 44.0, 42.0, 48.0, 28.0, 20.0, 16.0, 17.0, 16.0, 20.0, 16.0, 11.0, 11.0, 7.0, 7.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.95535659790039, -10.61943244934082, -10.28350830078125, -9.94758415222168, -9.611659049987793, -9.275734901428223, -8.939810752868652, -8.603886604309082, -8.267962455749512, -7.932038307189941, -7.596113681793213, -7.260189533233643, -6.924265384674072, -6.588340759277344, -6.252416610717773, -5.916492462158203, -5.580567836761475, -5.244643688201904, -4.908719062805176, -4.5727949142456055, -4.236870765686035, -3.9009463787078857, -3.5650219917297363, -3.229097843170166, -2.8931734561920166, -2.557249069213867, -2.221324920654297, -1.8854005336761475, -1.5494762659072876, -1.2135519981384277, -0.8776276111602783, -0.541703462600708, -0.2057790756225586, 0.13014522194862366, 0.4660695195198059, 0.8019938468933105, 1.1379181146621704, 1.4738423824310303, 1.8097667694091797, 2.14569091796875, 2.4816153049468994, 2.817539691925049, 3.153463840484619, 3.4893882274627686, 3.825312614440918, 4.161236763000488, 4.497160911560059, 4.833085060119629, 5.169009685516357, 5.504933834075928, 5.840858459472656, 6.176782608032227, 6.512706756591797, 6.848630905151367, 7.184555530548096, 7.520479679107666, 7.8564043045043945, 8.192328453063965, 8.528252601623535, 8.864177703857422, 9.200101852416992, 9.536026000976562, 9.871950149536133, 10.207874298095703, 10.543798446655273]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 1.0, 5.0, 9.0, 8.0, 6.0, 8.0, 16.0, 9.0, 12.0, 13.0, 23.0, 14.0, 25.0, 28.0, 27.0, 25.0, 34.0, 31.0, 40.0, 36.0, 43.0, 44.0, 20.0, 35.0, 43.0, 33.0, 44.0, 28.0, 43.0, 33.0, 22.0, 29.0, 39.0, 28.0, 21.0, 24.0, 13.0, 13.0, 13.0, 13.0, 8.0, 9.0, 5.0, 10.0, 9.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.206802368164062, -8.891074180603027, -8.575345039367676, -8.25961685180664, -7.943887710571289, -7.628159523010254, -7.3124308586120605, -6.996702194213867, -6.680973529815674, -6.3652448654174805, -6.049516201019287, -5.733787536621094, -5.418059349060059, -5.102330207824707, -4.786602020263672, -4.4708733558654785, -4.155144691467285, -3.839416027069092, -3.5236873626708984, -3.207958936691284, -2.892230272293091, -2.5765016078948975, -2.260773181915283, -1.9450445175170898, -1.6293158531188965, -1.3135871887207031, -0.9978586435317993, -0.6821300387382507, -0.36640143394470215, -0.05067276954650879, 0.265055775642395, 0.5807843208312988, 0.8965120315551758, 1.2122406959533691, 1.527969241142273, 1.8436977863311768, 2.15942645072937, 2.4751551151275635, 2.7908835411071777, 3.106612205505371, 3.4223408699035645, 3.738069534301758, 4.053798198699951, 4.3695268630981445, 4.68525505065918, 5.000984191894531, 5.316712379455566, 5.63244104385376, 5.948169708251953, 6.2638983726501465, 6.57962703704834, 6.895355701446533, 7.211084365844727, 7.526812553405762, 7.842541217803955, 8.158269882202148, 8.4739990234375, 8.789727210998535, 9.105456352233887, 9.421184539794922, 9.736913681030273, 10.052641868591309, 10.36837100982666, 10.684099197387695, 10.99982738494873]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 7.0, 11.0, 11.0, 27.0, 27.0, 39.0, 77.0, 111.0, 177.0, 292.0, 495.0, 808.0, 1344.0, 2201.0, 3858.0, 6469.0, 11359.0, 19038.0, 32500.0, 53905.0, 85353.0, 123288.0, 155941.0, 162468.0, 135900.0, 97050.0, 62403.0, 38292.0, 22827.0, 13466.0, 7683.0, 4495.0, 2618.0, 1560.0, 916.0, 606.0, 353.0, 226.0, 129.0, 84.0, 61.0, 32.0, 14.0, 17.0, 7.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7041015625, -1.6527099609375, -1.601318359375, -1.5499267578125, -1.49853515625, -1.4471435546875, -1.395751953125, -1.3443603515625, -1.29296875, -1.2415771484375, -1.190185546875, -1.1387939453125, -1.08740234375, -1.0360107421875, -0.984619140625, -0.9332275390625, -0.8818359375, -0.8304443359375, -0.779052734375, -0.7276611328125, -0.67626953125, -0.6248779296875, -0.573486328125, -0.5220947265625, -0.470703125, -0.4193115234375, -0.367919921875, -0.3165283203125, -0.26513671875, -0.2137451171875, -0.162353515625, -0.1109619140625, -0.0595703125, -0.0081787109375, 0.043212890625, 0.0946044921875, 0.14599609375, 0.1973876953125, 0.248779296875, 0.3001708984375, 0.3515625, 0.4029541015625, 0.454345703125, 0.5057373046875, 0.55712890625, 0.6085205078125, 0.659912109375, 0.7113037109375, 0.7626953125, 0.8140869140625, 0.865478515625, 0.9168701171875, 0.96826171875, 1.0196533203125, 1.071044921875, 1.1224365234375, 1.173828125, 1.2252197265625, 1.276611328125, 1.3280029296875, 1.37939453125, 1.4307861328125, 1.482177734375, 1.5335693359375, 1.5849609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 4.0, 5.0, 3.0, 9.0, 14.0, 13.0, 12.0, 16.0, 17.0, 20.0, 17.0, 30.0, 30.0, 43.0, 35.0, 41.0, 35.0, 37.0, 37.0, 33.0, 39.0, 36.0, 48.0, 41.0, 27.0, 36.0, 36.0, 34.0, 27.0, 26.0, 32.0, 23.0, 19.0, 19.0, 16.0, 18.0, 11.0, 16.0, 8.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.7420654296875, -9.406005859375, -9.0699462890625, -8.73388671875, -8.3978271484375, -8.061767578125, -7.7257080078125, -7.3896484375, -7.0535888671875, -6.717529296875, -6.3814697265625, -6.04541015625, -5.7093505859375, -5.373291015625, -5.0372314453125, -4.701171875, -4.3651123046875, -4.029052734375, -3.6929931640625, -3.35693359375, -3.0208740234375, -2.684814453125, -2.3487548828125, -2.0126953125, -1.6766357421875, -1.340576171875, -1.0045166015625, -0.66845703125, -0.3323974609375, 0.003662109375, 0.3397216796875, 0.67578125, 1.0118408203125, 1.347900390625, 1.6839599609375, 2.02001953125, 2.3560791015625, 2.692138671875, 3.0281982421875, 3.3642578125, 3.7003173828125, 4.036376953125, 4.3724365234375, 4.70849609375, 5.0445556640625, 5.380615234375, 5.7166748046875, 6.052734375, 6.3887939453125, 6.724853515625, 7.0609130859375, 7.39697265625, 7.7330322265625, 8.069091796875, 8.4051513671875, 8.7412109375, 9.0772705078125, 9.413330078125, 9.7493896484375, 10.08544921875, 10.4215087890625, 10.757568359375, 11.0936279296875, 11.4296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 7.0, 15.0, 30.0, 46.0, 75.0, 124.0, 198.0, 365.0, 674.0, 1268.0, 2382.0, 4515.0, 8434.0, 16642.0, 38842.0, 373214.0, 518630.0, 45310.0, 18224.0, 9192.0, 4855.0, 2589.0, 1309.0, 690.0, 381.0, 215.0, 111.0, 85.0, 54.0, 31.0, 14.0, 9.0, 6.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.962493896484375, -2.84881591796875, -2.735137939453125, -2.6214599609375, -2.507781982421875, -2.39410400390625, -2.280426025390625, -2.166748046875, -2.053070068359375, -1.93939208984375, -1.825714111328125, -1.7120361328125, -1.598358154296875, -1.48468017578125, -1.371002197265625, -1.25732421875, -1.143646240234375, -1.02996826171875, -0.916290283203125, -0.8026123046875, -0.688934326171875, -0.57525634765625, -0.461578369140625, -0.347900390625, -0.234222412109375, -0.12054443359375, -0.006866455078125, 0.1068115234375, 0.220489501953125, 0.33416748046875, 0.447845458984375, 0.5615234375, 0.675201416015625, 0.78887939453125, 0.902557373046875, 1.0162353515625, 1.129913330078125, 1.24359130859375, 1.357269287109375, 1.470947265625, 1.584625244140625, 1.69830322265625, 1.811981201171875, 1.9256591796875, 2.039337158203125, 2.15301513671875, 2.266693115234375, 2.38037109375, 2.494049072265625, 2.60772705078125, 2.721405029296875, 2.8350830078125, 2.948760986328125, 3.06243896484375, 3.176116943359375, 3.289794921875, 3.403472900390625, 3.51715087890625, 3.630828857421875, 3.7445068359375, 3.858184814453125, 3.97186279296875, 4.085540771484375, 4.19921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 11.0, 12.0, 5.0, 17.0, 13.0, 35.0, 22.0, 28.0, 32.0, 31.0, 36.0, 45.0, 40.0, 46.0, 41.0, 42.0, 50.0, 46.0, 37.0, 33.0, 35.0, 33.0, 32.0, 29.0, 40.0, 31.0, 22.0, 25.0, 25.0, 20.0, 13.0, 11.0, 9.0, 11.0, 4.0, 4.0, 2.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.15625, -7.897705078125, -7.63916015625, -7.380615234375, -7.1220703125, -6.863525390625, -6.60498046875, -6.346435546875, -6.087890625, -5.829345703125, -5.57080078125, -5.312255859375, -5.0537109375, -4.795166015625, -4.53662109375, -4.278076171875, -4.01953125, -3.760986328125, -3.50244140625, -3.243896484375, -2.9853515625, -2.726806640625, -2.46826171875, -2.209716796875, -1.951171875, -1.692626953125, -1.43408203125, -1.175537109375, -0.9169921875, -0.658447265625, -0.39990234375, -0.141357421875, 0.1171875, 0.375732421875, 0.63427734375, 0.892822265625, 1.1513671875, 1.409912109375, 1.66845703125, 1.927001953125, 2.185546875, 2.444091796875, 2.70263671875, 2.961181640625, 3.2197265625, 3.478271484375, 3.73681640625, 3.995361328125, 4.25390625, 4.512451171875, 4.77099609375, 5.029541015625, 5.2880859375, 5.546630859375, 5.80517578125, 6.063720703125, 6.322265625, 6.580810546875, 6.83935546875, 7.097900390625, 7.3564453125, 7.614990234375, 7.87353515625, 8.132080078125, 8.390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 4.0, 9.0, 7.0, 16.0, 35.0, 33.0, 48.0, 64.0, 90.0, 162.0, 201.0, 309.0, 446.0, 665.0, 1052.0, 1785.0, 2622.0, 4306.0, 7030.0, 11329.0, 19659.0, 39231.0, 579930.0, 302434.0, 32588.0, 17047.0, 10263.0, 6340.0, 3864.0, 2464.0, 1522.0, 961.0, 657.0, 422.0, 285.0, 186.0, 144.0, 94.0, 73.0, 57.0, 34.0, 21.0, 22.0, 9.0, 12.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.4065666198730469, -0.39296722412109375, -0.3793678283691406, -0.3657684326171875, -0.3521690368652344, -0.33856964111328125, -0.3249702453613281, -0.311370849609375, -0.2977714538574219, -0.28417205810546875, -0.2705726623535156, -0.2569732666015625, -0.24337387084960938, -0.22977447509765625, -0.21617507934570312, -0.20257568359375, -0.18897628784179688, -0.17537689208984375, -0.16177749633789062, -0.1481781005859375, -0.13457870483398438, -0.12097930908203125, -0.10737991333007812, -0.093780517578125, -0.08018112182617188, -0.06658172607421875, -0.052982330322265625, -0.0393829345703125, -0.025783538818359375, -0.01218414306640625, 0.001415252685546875, 0.0150146484375, 0.028614044189453125, 0.04221343994140625, 0.055812835693359375, 0.0694122314453125, 0.08301162719726562, 0.09661102294921875, 0.11021041870117188, 0.123809814453125, 0.13740921020507812, 0.15100860595703125, 0.16460800170898438, 0.1782073974609375, 0.19180679321289062, 0.20540618896484375, 0.21900558471679688, 0.23260498046875, 0.24620437622070312, 0.25980377197265625, 0.2734031677246094, 0.2870025634765625, 0.3006019592285156, 0.31420135498046875, 0.3278007507324219, 0.341400146484375, 0.3549995422363281, 0.36859893798828125, 0.3821983337402344, 0.3957977294921875, 0.4093971252441406, 0.42299652099609375, 0.4365959167480469, 0.4501953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 7.0, 8.0, 4.0, 2.0, 2.0, 7.0, 7.0, 10.0, 15.0, 21.0, 20.0, 30.0, 31.0, 28.0, 35.0, 37.0, 34.0, 61.0, 47.0, 58.0, 51.0, 56.0, 53.0, 55.0, 43.0, 42.0, 49.0, 38.0, 29.0, 21.0, 24.0, 22.0, 12.0, 15.0, 10.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5079975128173828e-05, -1.4567747712135315e-05, -1.4055520296096802e-05, -1.3543292880058289e-05, -1.3031065464019775e-05, -1.2518838047981262e-05, -1.2006610631942749e-05, -1.1494383215904236e-05, -1.0982155799865723e-05, -1.046992838382721e-05, -9.957700967788696e-06, -9.445473551750183e-06, -8.93324613571167e-06, -8.421018719673157e-06, -7.908791303634644e-06, -7.39656388759613e-06, -6.884336471557617e-06, -6.372109055519104e-06, -5.859881639480591e-06, -5.347654223442078e-06, -4.8354268074035645e-06, -4.323199391365051e-06, -3.810971975326538e-06, -3.298744559288025e-06, -2.7865171432495117e-06, -2.2742897272109985e-06, -1.7620623111724854e-06, -1.2498348951339722e-06, -7.37607479095459e-07, -2.253800630569458e-07, 2.868473529815674e-07, 7.990747690200806e-07, 1.3113021850585938e-06, 1.823529601097107e-06, 2.33575701713562e-06, 2.8479844331741333e-06, 3.3602118492126465e-06, 3.87243926525116e-06, 4.384666681289673e-06, 4.896894097328186e-06, 5.409121513366699e-06, 5.921348929405212e-06, 6.433576345443726e-06, 6.945803761482239e-06, 7.458031177520752e-06, 7.970258593559265e-06, 8.482486009597778e-06, 8.994713425636292e-06, 9.506940841674805e-06, 1.0019168257713318e-05, 1.0531395673751831e-05, 1.1043623089790344e-05, 1.1555850505828857e-05, 1.206807792186737e-05, 1.2580305337905884e-05, 1.3092532753944397e-05, 1.360476016998291e-05, 1.4116987586021423e-05, 1.4629215002059937e-05, 1.514144241809845e-05, 1.5653669834136963e-05, 1.6165897250175476e-05, 1.667812466621399e-05, 1.7190352082252502e-05, 1.7702579498291016e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 20.0, 26.0, 39.0, 55.0, 91.0, 147.0, 182.0, 287.0, 456.0, 624.0, 919.0, 1366.0, 1899.0, 2878.0, 4312.0, 6516.0, 9748.0, 14864.0, 22556.0, 34825.0, 53183.0, 81440.0, 120740.0, 158868.0, 161979.0, 124132.0, 84432.0, 55532.0, 36348.0, 23658.0, 15519.0, 10286.0, 6647.0, 4599.0, 3062.0, 1966.0, 1372.0, 934.0, 679.0, 419.0, 299.0, 194.0, 149.0, 107.0, 60.0, 46.0, 25.0, 22.0, 11.0, 9.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.33447265625, -0.323699951171875, -0.31292724609375, -0.302154541015625, -0.2913818359375, -0.280609130859375, -0.26983642578125, -0.259063720703125, -0.248291015625, -0.237518310546875, -0.22674560546875, -0.215972900390625, -0.2052001953125, -0.194427490234375, -0.18365478515625, -0.172882080078125, -0.162109375, -0.151336669921875, -0.14056396484375, -0.129791259765625, -0.1190185546875, -0.108245849609375, -0.09747314453125, -0.086700439453125, -0.075927734375, -0.065155029296875, -0.05438232421875, -0.043609619140625, -0.0328369140625, -0.022064208984375, -0.01129150390625, -0.000518798828125, 0.01025390625, 0.021026611328125, 0.03179931640625, 0.042572021484375, 0.0533447265625, 0.064117431640625, 0.07489013671875, 0.085662841796875, 0.096435546875, 0.107208251953125, 0.11798095703125, 0.128753662109375, 0.1395263671875, 0.150299072265625, 0.16107177734375, 0.171844482421875, 0.1826171875, 0.193389892578125, 0.20416259765625, 0.214935302734375, 0.2257080078125, 0.236480712890625, 0.24725341796875, 0.258026123046875, 0.268798828125, 0.279571533203125, 0.29034423828125, 0.301116943359375, 0.3118896484375, 0.322662353515625, 0.33343505859375, 0.344207763671875, 0.35498046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 6.0, 6.0, 14.0, 16.0, 10.0, 10.0, 20.0, 16.0, 20.0, 35.0, 36.0, 41.0, 51.0, 43.0, 40.0, 57.0, 60.0, 61.0, 53.0, 50.0, 61.0, 38.0, 35.0, 43.0, 31.0, 23.0, 20.0, 27.0, 11.0, 21.0, 9.0, 12.0, 4.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1507568359375, -0.1459789276123047, -0.14120101928710938, -0.13642311096191406, -0.13164520263671875, -0.12686729431152344, -0.12208938598632812, -0.11731147766113281, -0.1125335693359375, -0.10775566101074219, -0.10297775268554688, -0.09819984436035156, -0.09342193603515625, -0.08864402770996094, -0.08386611938476562, -0.07908821105957031, -0.074310302734375, -0.06953239440917969, -0.06475448608398438, -0.05997657775878906, -0.05519866943359375, -0.05042076110839844, -0.045642852783203125, -0.04086494445800781, -0.0360870361328125, -0.03130912780761719, -0.026531219482421875, -0.021753311157226562, -0.01697540283203125, -0.012197494506835938, -0.007419586181640625, -0.0026416778564453125, 0.00213623046875, 0.0069141387939453125, 0.011692047119140625, 0.016469955444335938, 0.02124786376953125, 0.026025772094726562, 0.030803680419921875, 0.03558158874511719, 0.0403594970703125, 0.04513740539550781, 0.049915313720703125, 0.05469322204589844, 0.05947113037109375, 0.06424903869628906, 0.06902694702148438, 0.07380485534667969, 0.078582763671875, 0.08336067199707031, 0.08813858032226562, 0.09291648864746094, 0.09769439697265625, 0.10247230529785156, 0.10725021362304688, 0.11202812194824219, 0.1168060302734375, 0.12158393859863281, 0.12636184692382812, 0.13113975524902344, 0.13591766357421875, 0.14069557189941406, 0.14547348022460938, 0.1502513885498047, 0.155029296875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 10.0, 15.0, 14.0, 9.0, 11.0, 22.0, 20.0, 27.0, 33.0, 35.0, 46.0, 51.0, 59.0, 58.0, 61.0, 49.0, 66.0, 49.0, 57.0, 38.0, 53.0, 45.0, 21.0, 20.0, 17.0, 19.0, 17.0, 15.0, 18.0, 12.0, 4.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.823431015014648, -10.47871208190918, -10.133993148803711, -9.789275169372559, -9.44455623626709, -9.099837303161621, -8.755118370056152, -8.410400390625, -8.065681457519531, -7.7209625244140625, -7.376244068145752, -7.031525135040283, -6.686806678771973, -6.342087745666504, -5.997368812561035, -5.652650356292725, -5.307931423187256, -4.963212490081787, -4.618494033813477, -4.273775100708008, -3.9290566444396973, -3.5843377113342285, -3.239619016647339, -2.894900321960449, -2.5501816272735596, -2.20546293258667, -1.8607442378997803, -1.516025424003601, -1.1713067293167114, -0.8265880346298218, -0.4818692207336426, -0.13715052604675293, 0.20756816864013672, 0.5522868633270264, 0.8970056176185608, 1.2417243719100952, 1.5864430665969849, 1.9311617612838745, 2.2758805751800537, 2.6205992698669434, 2.965317964553833, 3.3100366592407227, 3.6547553539276123, 3.999474048614502, 4.344192981719971, 4.688911437988281, 5.03363037109375, 5.378349304199219, 5.723067760467529, 6.067786693572998, 6.412505149841309, 6.757224082946777, 7.101942539215088, 7.446661472320557, 7.791379928588867, 8.136098861694336, 8.480817794799805, 8.825536727905273, 9.170255661010742, 9.514973640441895, 9.859692573547363, 10.204411506652832, 10.5491304397583, 10.893848419189453, 11.238567352294922]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 10.0, 1.0, 3.0, 4.0, 14.0, 3.0, 11.0, 8.0, 15.0, 14.0, 10.0, 24.0, 12.0, 20.0, 28.0, 25.0, 27.0, 29.0, 36.0, 29.0, 49.0, 43.0, 40.0, 26.0, 32.0, 46.0, 33.0, 42.0, 31.0, 36.0, 37.0, 22.0, 30.0, 30.0, 38.0, 24.0, 25.0, 13.0, 10.0, 17.0, 10.0, 10.0, 10.0, 6.0, 8.0, 10.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.361050605773926, -9.04484748840332, -8.728645324707031, -8.412442207336426, -8.09623908996582, -7.780035972595215, -7.463833332061768, -7.14763069152832, -6.831427574157715, -6.515224456787109, -6.199021816253662, -5.882819175720215, -5.566616058349609, -5.250412940979004, -4.934210300445557, -4.618007659912109, -4.301804542541504, -3.9856016635894775, -3.669398784637451, -3.353195905685425, -3.0369930267333984, -2.720790147781372, -2.4045872688293457, -2.0883843898773193, -1.772181510925293, -1.4559786319732666, -1.1397757530212402, -0.8235728740692139, -0.5073699951171875, -0.19116711616516113, 0.12503576278686523, 0.4412386417388916, 0.757441520690918, 1.0736443996429443, 1.3898472785949707, 1.706050157546997, 2.0222530364990234, 2.33845591545105, 2.654658794403076, 2.9708616733551025, 3.287064552307129, 3.6032674312591553, 3.9194703102111816, 4.235672950744629, 4.551876068115234, 4.86807918548584, 5.184281826019287, 5.500484466552734, 5.81668758392334, 6.132890701293945, 6.449093341827393, 6.76529598236084, 7.081499099731445, 7.397702217102051, 7.713904857635498, 8.030107498168945, 8.34631061553955, 8.662513732910156, 8.978715896606445, 9.29491901397705, 9.611122131347656, 9.927325248718262, 10.243528366088867, 10.559730529785156, 10.875933647155762]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 20.0, 36.0, 60.0, 70.0, 142.0, 218.0, 345.0, 453.0, 685.0, 1058.0, 1726.0, 2712.0, 4358.0, 7002.0, 11306.0, 18443.0, 29275.0, 45380.0, 66283.0, 90862.0, 113156.0, 127259.0, 128163.0, 114401.0, 91374.0, 67372.0, 46037.0, 30068.0, 18854.0, 11756.0, 7314.0, 4581.0, 2808.0, 1749.0, 1125.0, 690.0, 480.0, 307.0, 206.0, 145.0, 95.0, 63.0, 26.0, 20.0, 16.0, 10.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.65277099609375, -6.4383544921875, -6.22393798828125, -6.009521484375, -5.79510498046875, -5.5806884765625, -5.36627197265625, -5.15185546875, -4.93743896484375, -4.7230224609375, -4.50860595703125, -4.294189453125, -4.07977294921875, -3.8653564453125, -3.65093994140625, -3.4365234375, -3.22210693359375, -3.0076904296875, -2.79327392578125, -2.578857421875, -2.36444091796875, -2.1500244140625, -1.93560791015625, -1.72119140625, -1.50677490234375, -1.2923583984375, -1.07794189453125, -0.863525390625, -0.64910888671875, -0.4346923828125, -0.22027587890625, -0.005859375, 0.20855712890625, 0.4229736328125, 0.63739013671875, 0.851806640625, 1.06622314453125, 1.2806396484375, 1.49505615234375, 1.70947265625, 1.92388916015625, 2.1383056640625, 2.35272216796875, 2.567138671875, 2.78155517578125, 2.9959716796875, 3.21038818359375, 3.4248046875, 3.63922119140625, 3.8536376953125, 4.06805419921875, 4.282470703125, 4.49688720703125, 4.7113037109375, 4.92572021484375, 5.14013671875, 5.35455322265625, 5.5689697265625, 5.78338623046875, 5.997802734375, 6.21221923828125, 6.4266357421875, 6.64105224609375, 6.85546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 3.0, 5.0, 10.0, 2.0, 9.0, 11.0, 7.0, 12.0, 21.0, 19.0, 13.0, 28.0, 18.0, 27.0, 27.0, 31.0, 45.0, 36.0, 41.0, 36.0, 43.0, 37.0, 40.0, 40.0, 50.0, 47.0, 28.0, 28.0, 45.0, 30.0, 22.0, 30.0, 28.0, 20.0, 16.0, 21.0, 10.0, 13.0, 13.0, 6.0, 13.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5078125, -9.1844482421875, -8.861083984375, -8.5377197265625, -8.21435546875, -7.8909912109375, -7.567626953125, -7.2442626953125, -6.9208984375, -6.5975341796875, -6.274169921875, -5.9508056640625, -5.62744140625, -5.3040771484375, -4.980712890625, -4.6573486328125, -4.333984375, -4.0106201171875, -3.687255859375, -3.3638916015625, -3.04052734375, -2.7171630859375, -2.393798828125, -2.0704345703125, -1.7470703125, -1.4237060546875, -1.100341796875, -0.7769775390625, -0.45361328125, -0.1302490234375, 0.193115234375, 0.5164794921875, 0.83984375, 1.1632080078125, 1.486572265625, 1.8099365234375, 2.13330078125, 2.4566650390625, 2.780029296875, 3.1033935546875, 3.4267578125, 3.7501220703125, 4.073486328125, 4.3968505859375, 4.72021484375, 5.0435791015625, 5.366943359375, 5.6903076171875, 6.013671875, 6.3370361328125, 6.660400390625, 6.9837646484375, 7.30712890625, 7.6304931640625, 7.953857421875, 8.2772216796875, 8.6005859375, 8.9239501953125, 9.247314453125, 9.5706787109375, 9.89404296875, 10.2174072265625, 10.540771484375, 10.8641357421875, 11.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 4.0, 8.0, 13.0, 20.0, 49.0, 61.0, 84.0, 160.0, 241.0, 308.0, 531.0, 761.0, 1176.0, 1693.0, 2721.0, 4084.0, 6162.0, 9554.0, 14058.0, 20919.0, 30683.0, 43008.0, 58727.0, 76137.0, 92502.0, 104095.0, 108652.0, 105184.0, 92896.0, 76110.0, 59951.0, 43262.0, 30999.0, 21358.0, 14211.0, 9602.0, 6421.0, 4171.0, 2753.0, 1845.0, 1201.0, 756.0, 484.0, 327.0, 198.0, 159.0, 97.0, 48.0, 40.0, 28.0, 21.0, 13.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -6.03009033203125, -5.8258056640625, -5.62152099609375, -5.417236328125, -5.21295166015625, -5.0086669921875, -4.80438232421875, -4.60009765625, -4.39581298828125, -4.1915283203125, -3.98724365234375, -3.782958984375, -3.57867431640625, -3.3743896484375, -3.17010498046875, -2.9658203125, -2.76153564453125, -2.5572509765625, -2.35296630859375, -2.148681640625, -1.94439697265625, -1.7401123046875, -1.53582763671875, -1.33154296875, -1.12725830078125, -0.9229736328125, -0.71868896484375, -0.514404296875, -0.31011962890625, -0.1058349609375, 0.09844970703125, 0.302734375, 0.50701904296875, 0.7113037109375, 0.91558837890625, 1.119873046875, 1.32415771484375, 1.5284423828125, 1.73272705078125, 1.93701171875, 2.14129638671875, 2.3455810546875, 2.54986572265625, 2.754150390625, 2.95843505859375, 3.1627197265625, 3.36700439453125, 3.5712890625, 3.77557373046875, 3.9798583984375, 4.18414306640625, 4.388427734375, 4.59271240234375, 4.7969970703125, 5.00128173828125, 5.20556640625, 5.40985107421875, 5.6141357421875, 5.81842041015625, 6.022705078125, 6.22698974609375, 6.4312744140625, 6.63555908203125, 6.83984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 9.0, 6.0, 7.0, 10.0, 7.0, 13.0, 9.0, 16.0, 17.0, 15.0, 18.0, 21.0, 22.0, 22.0, 23.0, 32.0, 33.0, 37.0, 31.0, 25.0, 32.0, 28.0, 29.0, 42.0, 42.0, 34.0, 35.0, 35.0, 28.0, 29.0, 32.0, 29.0, 18.0, 26.0, 22.0, 22.0, 23.0, 22.0, 19.0, 11.0, 13.0, 8.0, 11.0, 7.0, 5.0, 2.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0], "bins": [-6.1484375, -5.967041015625, -5.78564453125, -5.604248046875, -5.4228515625, -5.241455078125, -5.06005859375, -4.878662109375, -4.697265625, -4.515869140625, -4.33447265625, -4.153076171875, -3.9716796875, -3.790283203125, -3.60888671875, -3.427490234375, -3.24609375, -3.064697265625, -2.88330078125, -2.701904296875, -2.5205078125, -2.339111328125, -2.15771484375, -1.976318359375, -1.794921875, -1.613525390625, -1.43212890625, -1.250732421875, -1.0693359375, -0.887939453125, -0.70654296875, -0.525146484375, -0.34375, -0.162353515625, 0.01904296875, 0.200439453125, 0.3818359375, 0.563232421875, 0.74462890625, 0.926025390625, 1.107421875, 1.288818359375, 1.47021484375, 1.651611328125, 1.8330078125, 2.014404296875, 2.19580078125, 2.377197265625, 2.55859375, 2.739990234375, 2.92138671875, 3.102783203125, 3.2841796875, 3.465576171875, 3.64697265625, 3.828369140625, 4.009765625, 4.191162109375, 4.37255859375, 4.553955078125, 4.7353515625, 4.916748046875, 5.09814453125, 5.279541015625, 5.4609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 2.0, 4.0, 6.0, 10.0, 15.0, 19.0, 22.0, 32.0, 65.0, 104.0, 146.0, 266.0, 379.0, 686.0, 1020.0, 1818.0, 3173.0, 5515.0, 10928.0, 21996.0, 45277.0, 89409.0, 155509.0, 211145.0, 202434.0, 141205.0, 77862.0, 39013.0, 19107.0, 9523.0, 4994.0, 2742.0, 1546.0, 944.0, 572.0, 388.0, 222.0, 146.0, 91.0, 65.0, 56.0, 22.0, 25.0, 16.0, 10.0, 14.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-6.1796875, -5.99737548828125, -5.8150634765625, -5.63275146484375, -5.450439453125, -5.26812744140625, -5.0858154296875, -4.90350341796875, -4.72119140625, -4.53887939453125, -4.3565673828125, -4.17425537109375, -3.991943359375, -3.80963134765625, -3.6273193359375, -3.44500732421875, -3.2626953125, -3.08038330078125, -2.8980712890625, -2.71575927734375, -2.533447265625, -2.35113525390625, -2.1688232421875, -1.98651123046875, -1.80419921875, -1.62188720703125, -1.4395751953125, -1.25726318359375, -1.074951171875, -0.89263916015625, -0.7103271484375, -0.52801513671875, -0.345703125, -0.16339111328125, 0.0189208984375, 0.20123291015625, 0.383544921875, 0.56585693359375, 0.7481689453125, 0.93048095703125, 1.11279296875, 1.29510498046875, 1.4774169921875, 1.65972900390625, 1.842041015625, 2.02435302734375, 2.2066650390625, 2.38897705078125, 2.5712890625, 2.75360107421875, 2.9359130859375, 3.11822509765625, 3.300537109375, 3.48284912109375, 3.6651611328125, 3.84747314453125, 4.02978515625, 4.21209716796875, 4.3944091796875, 4.57672119140625, 4.759033203125, 4.94134521484375, 5.1236572265625, 5.30596923828125, 5.48828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 10.0, 4.0, 16.0, 16.0, 24.0, 37.0, 35.0, 34.0, 47.0, 60.0, 47.0, 75.0, 73.0, 71.0, 72.0, 59.0, 61.0, 62.0, 40.0, 42.0, 16.0, 27.0, 21.0, 14.0, 15.0, 4.0, 6.0, 5.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006961822509765625, -0.0006779134273529053, -0.000659644603729248, -0.0006413757801055908, -0.0006231069564819336, -0.0006048381328582764, -0.0005865693092346191, -0.0005683004856109619, -0.0005500316619873047, -0.0005317628383636475, -0.0005134940147399902, -0.000495225191116333, -0.0004769563674926758, -0.00045868754386901855, -0.00044041872024536133, -0.0004221498966217041, -0.0004038810729980469, -0.00038561224937438965, -0.0003673434257507324, -0.0003490746021270752, -0.00033080577850341797, -0.00031253695487976074, -0.0002942681312561035, -0.0002759993076324463, -0.00025773048400878906, -0.00023946166038513184, -0.0002211928367614746, -0.00020292401313781738, -0.00018465518951416016, -0.00016638636589050293, -0.0001481175422668457, -0.00012984871864318848, -0.00011157989501953125, -9.331107139587402e-05, -7.50422477722168e-05, -5.677342414855957e-05, -3.8504600524902344e-05, -2.0235776901245117e-05, -1.9669532775878906e-06, 1.6301870346069336e-05, 3.457069396972656e-05, 5.283951759338379e-05, 7.110834121704102e-05, 8.937716484069824e-05, 0.00010764598846435547, 0.0001259148120880127, 0.00014418363571166992, 0.00016245245933532715, 0.00018072128295898438, 0.0001989901065826416, 0.00021725893020629883, 0.00023552775382995605, 0.0002537965774536133, 0.0002720654010772705, 0.00029033422470092773, 0.00030860304832458496, 0.0003268718719482422, 0.0003451406955718994, 0.00036340951919555664, 0.00038167834281921387, 0.0003999471664428711, 0.0004182159900665283, 0.00043648481369018555, 0.0004547536373138428, 0.0004730224609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 8.0, 8.0, 14.0, 19.0, 42.0, 48.0, 87.0, 105.0, 187.0, 308.0, 410.0, 685.0, 1142.0, 1877.0, 3085.0, 5186.0, 9303.0, 17130.0, 32140.0, 58224.0, 100605.0, 149514.0, 181847.0, 172850.0, 129741.0, 81654.0, 46133.0, 24914.0, 13171.0, 7235.0, 4335.0, 2484.0, 1472.0, 940.0, 599.0, 396.0, 226.0, 141.0, 96.0, 76.0, 41.0, 30.0, 18.0, 9.0, 8.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.22265625, -5.06341552734375, -4.9041748046875, -4.74493408203125, -4.585693359375, -4.42645263671875, -4.2672119140625, -4.10797119140625, -3.94873046875, -3.78948974609375, -3.6302490234375, -3.47100830078125, -3.311767578125, -3.15252685546875, -2.9932861328125, -2.83404541015625, -2.6748046875, -2.51556396484375, -2.3563232421875, -2.19708251953125, -2.037841796875, -1.87860107421875, -1.7193603515625, -1.56011962890625, -1.40087890625, -1.24163818359375, -1.0823974609375, -0.92315673828125, -0.763916015625, -0.60467529296875, -0.4454345703125, -0.28619384765625, -0.126953125, 0.03228759765625, 0.1915283203125, 0.35076904296875, 0.510009765625, 0.66925048828125, 0.8284912109375, 0.98773193359375, 1.14697265625, 1.30621337890625, 1.4654541015625, 1.62469482421875, 1.783935546875, 1.94317626953125, 2.1024169921875, 2.26165771484375, 2.4208984375, 2.58013916015625, 2.7393798828125, 2.89862060546875, 3.057861328125, 3.21710205078125, 3.3763427734375, 3.53558349609375, 3.69482421875, 3.85406494140625, 4.0133056640625, 4.17254638671875, 4.331787109375, 4.49102783203125, 4.6502685546875, 4.80950927734375, 4.96875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 8.0, 11.0, 15.0, 13.0, 16.0, 25.0, 32.0, 34.0, 42.0, 48.0, 51.0, 51.0, 59.0, 55.0, 72.0, 57.0, 56.0, 44.0, 64.0, 33.0, 35.0, 37.0, 28.0, 19.0, 16.0, 17.0, 13.0, 5.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.685546875, -1.63519287109375, -1.5848388671875, -1.53448486328125, -1.484130859375, -1.43377685546875, -1.3834228515625, -1.33306884765625, -1.28271484375, -1.23236083984375, -1.1820068359375, -1.13165283203125, -1.081298828125, -1.03094482421875, -0.9805908203125, -0.93023681640625, -0.8798828125, -0.82952880859375, -0.7791748046875, -0.72882080078125, -0.678466796875, -0.62811279296875, -0.5777587890625, -0.52740478515625, -0.47705078125, -0.42669677734375, -0.3763427734375, -0.32598876953125, -0.275634765625, -0.22528076171875, -0.1749267578125, -0.12457275390625, -0.07421875, -0.02386474609375, 0.0264892578125, 0.07684326171875, 0.127197265625, 0.17755126953125, 0.2279052734375, 0.27825927734375, 0.32861328125, 0.37896728515625, 0.4293212890625, 0.47967529296875, 0.530029296875, 0.58038330078125, 0.6307373046875, 0.68109130859375, 0.7314453125, 0.78179931640625, 0.8321533203125, 0.88250732421875, 0.932861328125, 0.98321533203125, 1.0335693359375, 1.08392333984375, 1.13427734375, 1.18463134765625, 1.2349853515625, 1.28533935546875, 1.335693359375, 1.38604736328125, 1.4364013671875, 1.48675537109375, 1.537109375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 10.0, 14.0, 11.0, 18.0, 25.0, 26.0, 22.0, 33.0, 37.0, 40.0, 41.0, 59.0, 41.0, 50.0, 54.0, 47.0, 55.0, 53.0, 52.0, 36.0, 33.0, 33.0, 32.0, 30.0, 24.0, 20.0, 14.0, 16.0, 13.0, 10.0, 8.0, 8.0, 1.0, 11.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.82801628112793, -9.502305030822754, -9.176593780517578, -8.850882530212402, -8.525171279907227, -8.19946002960205, -7.873749256134033, -7.548038005828857, -7.222326755523682, -6.896615505218506, -6.57090425491333, -6.245193004608154, -5.919482231140137, -5.593770980834961, -5.268059730529785, -4.942348480224609, -4.616637229919434, -4.290925979614258, -3.965214729309082, -3.6395037174224854, -3.3137924671173096, -2.988081216812134, -2.662370204925537, -2.3366589546203613, -2.0109477043151855, -1.6852364540100098, -1.3595253229141235, -1.0338141918182373, -0.7081029415130615, -0.38239169120788574, -0.05668056011199951, 0.2690305709838867, 0.5947408676147461, 0.9204520583152771, 1.246163249015808, 1.5718743801116943, 1.8975856304168701, 2.223296880722046, 2.5490078926086426, 2.8747191429138184, 3.200430393218994, 3.52614164352417, 3.8518528938293457, 4.1775641441345215, 4.503274917602539, 4.828986167907715, 5.154697418212891, 5.480408668518066, 5.806119918823242, 6.131831169128418, 6.457542419433594, 6.7832536697387695, 7.108964920043945, 7.434676170349121, 7.760386943817139, 8.086097717285156, 8.411809921264648, 8.737521171569824, 9.063232421875, 9.388943672180176, 9.714654922485352, 10.040366172790527, 10.366077423095703, 10.691787719726562, 11.017498970031738]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 2.0, 6.0, 3.0, 8.0, 6.0, 14.0, 14.0, 10.0, 14.0, 24.0, 16.0, 25.0, 22.0, 23.0, 33.0, 26.0, 35.0, 24.0, 23.0, 34.0, 38.0, 40.0, 27.0, 30.0, 27.0, 35.0, 35.0, 32.0, 29.0, 28.0, 30.0, 42.0, 28.0, 20.0, 30.0, 17.0, 13.0, 25.0, 23.0, 13.0, 13.0, 16.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0], "bins": [-10.502972602844238, -10.168293952941895, -9.83361530303955, -9.498936653137207, -9.164257049560547, -8.829578399658203, -8.49489974975586, -8.160221099853516, -7.825542449951172, -7.490863800048828, -7.156185150146484, -6.821506023406982, -6.486827373504639, -6.152148723602295, -5.817469596862793, -5.482790946960449, -5.1481122970581055, -4.813433647155762, -4.478754997253418, -4.144075870513916, -3.8093972206115723, -3.4747185707092285, -3.1400396823883057, -2.805360794067383, -2.470682144165039, -2.1360034942626953, -1.8013246059417725, -1.4666458368301392, -1.1319670677185059, -0.7972882986068726, -0.46260952949523926, -0.1279306411743164, 0.20674705505371094, 0.5414258241653442, 0.8761045932769775, 1.2107833623886108, 1.5454621315002441, 1.8801409006118774, 2.2148196697235107, 2.5494985580444336, 2.8841772079467773, 3.218855857849121, 3.553534746170044, 3.888213634490967, 4.2228922843933105, 4.557570934295654, 4.892250061035156, 5.2269287109375, 5.561607360839844, 5.8962860107421875, 6.230964660644531, 6.565643787384033, 6.900322437286377, 7.235001087188721, 7.569680213928223, 7.904358863830566, 8.23903751373291, 8.573716163635254, 8.908394813537598, 9.243073463439941, 9.577753067016602, 9.912431716918945, 10.247110366821289, 10.581789016723633, 10.916467666625977]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 4.0, 5.0, 17.0, 14.0, 18.0, 28.0, 30.0, 55.0, 68.0, 99.0, 137.0, 272.0, 579.0, 1287.0, 3017.0, 8907.0, 1023208.0, 7742.0, 2793.0, 1067.0, 517.0, 237.0, 171.0, 102.0, 60.0, 51.0, 27.0, 23.0, 15.0, 15.0, 9.0, 6.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-254.05751037597656, -246.45989990234375, -238.8623046875, -231.26470947265625, -223.66709899902344, -216.06948852539062, -208.47189331054688, -200.87429809570312, -193.2766876220703, -185.6790771484375, -178.08148193359375, -170.48388671875, -162.8862762451172, -155.28866577148438, -147.69107055664062, -140.09347534179688, -132.49586486816406, -124.89826202392578, -117.3006591796875, -109.70305633544922, -102.10545349121094, -94.50785064697266, -86.91024780273438, -79.3126449584961, -71.71504211425781, -64.11743927001953, -56.51983642578125, -48.92223358154297, -41.32463073730469, -33.727027893066406, -26.129425048828125, -18.531822204589844, -10.934234619140625, -3.3366317749023438, 4.2609710693359375, 11.858573913574219, 19.4561767578125, 27.05377960205078, 34.65138244628906, 42.248985290527344, 49.846588134765625, 57.444190979003906, 65.04179382324219, 72.63939666748047, 80.23699951171875, 87.83460235595703, 95.43220520019531, 103.0298080444336, 110.62741088867188, 118.22501373291016, 125.82261657714844, 133.42022705078125, 141.017822265625, 148.61541748046875, 156.21302795410156, 163.81063842773438, 171.40823364257812, 179.00582885742188, 186.6034393310547, 194.2010498046875, 201.79864501953125, 209.396240234375, 216.9938507080078, 224.59146118164062, 232.18905639648438]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 7.0, 12.0, 4.0, 16.0, 20.0, 40.0, 50.0, 87.0, 148.0, 201.0, 326.0, 561.0, 877.0, 1336.0, 1886.0, 3122.0, 5205.0, 11358.0, 65778.0, 51344392.0, 18745.0, 6811.0, 3698.0, 2242.0, 1578.0, 995.0, 699.0, 455.0, 250.0, 171.0, 79.0, 58.0, 42.0, 25.0, 19.0, 11.0, 7.0, 12.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-215.9821319580078, -209.27438354492188, -202.566650390625, -195.85891723632812, -189.1511688232422, -182.44342041015625, -175.73568725585938, -169.0279541015625, -162.32020568847656, -155.61245727539062, -148.90472412109375, -142.19699096679688, -135.48924255371094, -128.781494140625, -122.07376098632812, -115.36602020263672, -108.65827941894531, -101.9505386352539, -95.2427978515625, -88.5350570678711, -81.82731628417969, -75.11957550048828, -68.41183471679688, -61.70409393310547, -54.99635314941406, -48.288612365722656, -41.58087158203125, -34.873130798339844, -28.165390014648438, -21.45764923095703, -14.749908447265625, -8.042167663574219, -1.334442138671875, 5.373298645019531, 12.081039428710938, 18.788780212402344, 25.49652099609375, 32.204261779785156, 38.91200256347656, 45.61974334716797, 52.327484130859375, 59.03522491455078, 65.74296569824219, 72.4507064819336, 79.158447265625, 85.8661880493164, 92.57392883300781, 99.28166961669922, 105.98941040039062, 112.69715118408203, 119.40489196777344, 126.11263275146484, 132.82037353515625, 139.52810668945312, 146.23585510253906, 152.943603515625, 159.65133666992188, 166.35906982421875, 173.0668182373047, 179.77456665039062, 186.4822998046875, 193.19003295898438, 199.8977813720703, 206.60552978515625, 213.31326293945312]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 13.0, 16.0, 20.0, 26.0, 33.0, 33.0, 44.0, 55.0, 61.0, 87.0, 94.0, 82.0, 98.0, 62.0, 56.0, 55.0, 31.0, 29.0, 24.0, 20.0, 16.0, 8.0, 5.0, 6.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-252.26809692382812, -244.88331604003906, -237.49855041503906, -230.11376953125, -222.72900390625, -215.34422302246094, -207.95944213867188, -200.57467651367188, -193.1898956298828, -185.80511474609375, -178.42034912109375, -171.0355682373047, -163.65078735351562, -156.26602172851562, -148.88124084472656, -141.4964599609375, -134.1116943359375, -126.72692108154297, -119.34214782714844, -111.95736694335938, -104.57259368896484, -97.18782043457031, -89.80303955078125, -82.41826629638672, -75.03349304199219, -67.64871978759766, -60.26394271850586, -52.87916564941406, -45.49439239501953, -38.109619140625, -30.724842071533203, -23.340065002441406, -15.955291748046875, -8.570516586303711, -1.1857414245605469, 6.199033737182617, 13.583808898925781, 20.968582153320312, 28.35335922241211, 35.738136291503906, 43.12290954589844, 50.50768280029297, 57.892459869384766, 65.27723693847656, 72.6620101928711, 80.04678344726562, 87.43156433105469, 94.81633758544922, 102.20111083984375, 109.58588409423828, 116.97065734863281, 124.35543823242188, 131.74020385742188, 139.12498474121094, 146.509765625, 153.89453125, 161.27931213378906, 168.66409301757812, 176.04885864257812, 183.4336395263672, 190.81842041015625, 198.20318603515625, 205.5879669189453, 212.97274780273438, 220.35751342773438]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 9.0, 7.0, 6.0, 17.0, 8.0, 13.0, 19.0, 18.0, 22.0, 22.0, 34.0, 34.0, 38.0, 37.0, 61.0, 56.0, 85.0, 70.0, 61.0, 42.0, 43.0, 40.0, 25.0, 37.0, 30.0, 20.0, 14.0, 11.0, 15.0, 17.0, 6.0, 7.0, 11.0, 4.0, 2.0, 8.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-262.26580810546875, -254.90625, -247.54669189453125, -240.1871337890625, -232.82757568359375, -225.468017578125, -218.1084747314453, -210.74891662597656, -203.3893585205078, -196.02980041503906, -188.6702423095703, -181.31068420410156, -173.95114135742188, -166.59158325195312, -159.23202514648438, -151.87246704101562, -144.51290893554688, -137.15335083007812, -129.79379272460938, -122.43424224853516, -115.0746841430664, -107.71512603759766, -100.35557556152344, -92.99601745605469, -85.63645935058594, -78.27690124511719, -70.91734313964844, -63.55779266357422, -56.19823455810547, -48.83867645263672, -41.479122161865234, -34.11956787109375, -26.760009765625, -19.400453567504883, -12.040897369384766, -4.681341171264648, 2.6782150268554688, 10.037773132324219, 17.397327423095703, 24.756881713867188, 32.11643981933594, 39.47599792480469, 46.83555221557617, 54.195106506347656, 61.554664611816406, 68.91422271728516, 76.27377319335938, 83.63333129882812, 90.99288940429688, 98.35244750976562, 105.71200561523438, 113.0715560913086, 120.43111419677734, 127.7906723022461, 135.1502227783203, 142.50978088378906, 149.8693389892578, 157.22889709472656, 164.5884552001953, 171.94801330566406, 179.30755615234375, 186.6671142578125, 194.02667236328125, 201.38623046875, 208.74578857421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 10.0, 6.0, 3.0, 8.0, 12.0, 13.0, 22.0, 29.0, 40.0, 63.0, 89.0, 111.0, 160.0, 237.0, 366.0, 566.0, 830.0, 1272.0, 1869.0, 2921.0, 4713.0, 7546.0, 12634.0, 21670.0, 39091.0, 73539.0, 145802.0, 308505.0, 722654.0, 1631404.0, 652793.0, 279477.0, 132035.0, 67101.0, 36078.0, 20145.0, 11674.0, 7009.0, 4201.0, 2615.0, 1750.0, 1114.0, 689.0, 465.0, 332.0, 197.0, 136.0, 94.0, 73.0, 41.0, 28.0, 21.0, 14.0, 9.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0], "bins": [-2.81640625, -2.732208251953125, -2.64801025390625, -2.563812255859375, -2.4796142578125, -2.395416259765625, -2.31121826171875, -2.227020263671875, -2.142822265625, -2.058624267578125, -1.97442626953125, -1.890228271484375, -1.8060302734375, -1.721832275390625, -1.63763427734375, -1.553436279296875, -1.46923828125, -1.385040283203125, -1.30084228515625, -1.216644287109375, -1.1324462890625, -1.048248291015625, -0.96405029296875, -0.879852294921875, -0.795654296875, -0.711456298828125, -0.62725830078125, -0.543060302734375, -0.4588623046875, -0.374664306640625, -0.29046630859375, -0.206268310546875, -0.1220703125, -0.037872314453125, 0.04632568359375, 0.130523681640625, 0.2147216796875, 0.298919677734375, 0.38311767578125, 0.467315673828125, 0.551513671875, 0.635711669921875, 0.71990966796875, 0.804107666015625, 0.8883056640625, 0.972503662109375, 1.05670166015625, 1.140899658203125, 1.22509765625, 1.309295654296875, 1.39349365234375, 1.477691650390625, 1.5618896484375, 1.646087646484375, 1.73028564453125, 1.814483642578125, 1.898681640625, 1.982879638671875, 2.06707763671875, 2.151275634765625, 2.2354736328125, 2.319671630859375, 2.40386962890625, 2.488067626953125, 2.572265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 10.0, 14.0, 24.0, 25.0, 22.0, 30.0, 37.0, 42.0, 55.0, 61.0, 82.0, 67.0, 77.0, 87.0, 81.0, 50.0, 41.0, 45.0, 28.0, 19.0, 19.0, 16.0, 10.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47607421875, -0.4616889953613281, -0.44730377197265625, -0.4329185485839844, -0.4185333251953125, -0.4041481018066406, -0.38976287841796875, -0.3753776550292969, -0.360992431640625, -0.3466072082519531, -0.33222198486328125, -0.3178367614746094, -0.3034515380859375, -0.2890663146972656, -0.27468109130859375, -0.2602958679199219, -0.24591064453125, -0.23152542114257812, -0.21714019775390625, -0.20275497436523438, -0.1883697509765625, -0.17398452758789062, -0.15959930419921875, -0.14521408081054688, -0.130828857421875, -0.11644363403320312, -0.10205841064453125, -0.08767318725585938, -0.0732879638671875, -0.058902740478515625, -0.04451751708984375, -0.030132293701171875, -0.0157470703125, -0.001361846923828125, 0.01302337646484375, 0.027408599853515625, 0.0417938232421875, 0.056179046630859375, 0.07056427001953125, 0.08494949340820312, 0.099334716796875, 0.11371994018554688, 0.12810516357421875, 0.14249038696289062, 0.1568756103515625, 0.17126083374023438, 0.18564605712890625, 0.20003128051757812, 0.21441650390625, 0.22880172729492188, 0.24318695068359375, 0.2575721740722656, 0.2719573974609375, 0.2863426208496094, 0.30072784423828125, 0.3151130676269531, 0.329498291015625, 0.3438835144042969, 0.35826873779296875, 0.3726539611816406, 0.3870391845703125, 0.4014244079589844, 0.41580963134765625, 0.4301948547363281, 0.444580078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 11.0, 12.0, 14.0, 17.0, 28.0, 27.0, 66.0, 67.0, 133.0, 166.0, 275.0, 441.0, 787.0, 1403.0, 2647.0, 5325.0, 11133.0, 24019.0, 54886.0, 130373.0, 321559.0, 783181.0, 1507114.0, 796917.0, 324336.0, 130078.0, 53549.0, 23738.0, 10808.0, 5139.0, 2645.0, 1439.0, 735.0, 430.0, 265.0, 166.0, 121.0, 51.0, 54.0, 28.0, 27.0, 28.0, 8.0, 8.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.2578125, -2.1904296875, -2.123046875, -2.0556640625, -1.98828125, -1.9208984375, -1.853515625, -1.7861328125, -1.71875, -1.6513671875, -1.583984375, -1.5166015625, -1.44921875, -1.3818359375, -1.314453125, -1.2470703125, -1.1796875, -1.1123046875, -1.044921875, -0.9775390625, -0.91015625, -0.8427734375, -0.775390625, -0.7080078125, -0.640625, -0.5732421875, -0.505859375, -0.4384765625, -0.37109375, -0.3037109375, -0.236328125, -0.1689453125, -0.1015625, -0.0341796875, 0.033203125, 0.1005859375, 0.16796875, 0.2353515625, 0.302734375, 0.3701171875, 0.4375, 0.5048828125, 0.572265625, 0.6396484375, 0.70703125, 0.7744140625, 0.841796875, 0.9091796875, 0.9765625, 1.0439453125, 1.111328125, 1.1787109375, 1.24609375, 1.3134765625, 1.380859375, 1.4482421875, 1.515625, 1.5830078125, 1.650390625, 1.7177734375, 1.78515625, 1.8525390625, 1.919921875, 1.9873046875, 2.0546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 10.0, 12.0, 18.0, 24.0, 18.0, 28.0, 30.0, 46.0, 56.0, 56.0, 69.0, 100.0, 108.0, 134.0, 175.0, 209.0, 237.0, 271.0, 325.0, 363.0, 304.0, 265.0, 241.0, 181.0, 150.0, 121.0, 114.0, 85.0, 79.0, 44.0, 40.0, 31.0, 25.0, 37.0, 19.0, 10.0, 10.0, 6.0, 7.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.82763671875, -0.8028182983398438, -0.7779998779296875, -0.7531814575195312, -0.728363037109375, -0.7035446166992188, -0.6787261962890625, -0.6539077758789062, -0.62908935546875, -0.6042709350585938, -0.5794525146484375, -0.5546340942382812, -0.529815673828125, -0.5049972534179688, -0.4801788330078125, -0.45536041259765625, -0.4305419921875, -0.40572357177734375, -0.3809051513671875, -0.35608673095703125, -0.331268310546875, -0.30644989013671875, -0.2816314697265625, -0.25681304931640625, -0.23199462890625, -0.20717620849609375, -0.1823577880859375, -0.15753936767578125, -0.132720947265625, -0.10790252685546875, -0.0830841064453125, -0.05826568603515625, -0.033447265625, -0.00862884521484375, 0.0161895751953125, 0.04100799560546875, 0.065826416015625, 0.09064483642578125, 0.1154632568359375, 0.14028167724609375, 0.16510009765625, 0.18991851806640625, 0.2147369384765625, 0.23955535888671875, 0.264373779296875, 0.28919219970703125, 0.3140106201171875, 0.33882904052734375, 0.3636474609375, 0.38846588134765625, 0.4132843017578125, 0.43810272216796875, 0.462921142578125, 0.48773956298828125, 0.5125579833984375, 0.5373764038085938, 0.56219482421875, 0.5870132446289062, 0.6118316650390625, 0.6366500854492188, 0.661468505859375, 0.6862869262695312, 0.7111053466796875, 0.7359237670898438, 0.7607421875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 14.0, 26.0, 21.0, 44.0, 49.0, 74.0, 104.0, 107.0, 103.0, 106.0, 104.0, 74.0, 44.0, 34.0, 32.0, 13.0, 13.0, 4.0, 10.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.388839721679688, -11.077253341674805, -10.765666007995605, -10.454078674316406, -10.142492294311523, -9.83090591430664, -9.519318580627441, -9.207731246948242, -8.89614486694336, -8.584558486938477, -8.272971153259277, -7.961384296417236, -7.649797439575195, -7.338210582733154, -7.026623725891113, -6.715036869049072, -6.403450012207031, -6.09186315536499, -5.780276298522949, -5.468689441680908, -5.157102584838867, -4.845515727996826, -4.533928871154785, -4.222342014312744, -3.910755157470703, -3.599168300628662, -3.287581443786621, -2.97599458694458, -2.664407730102539, -2.352820873260498, -2.041234016418457, -1.729647159576416, -1.4180593490600586, -1.1064724922180176, -0.7948856353759766, -0.48329877853393555, -0.17171192169189453, 0.13987493515014648, 0.4514617919921875, 0.7630486488342285, 1.0746355056762695, 1.3862223625183105, 1.6978092193603516, 2.0093960762023926, 2.3209829330444336, 2.6325697898864746, 2.9441566467285156, 3.2557435035705566, 3.5673303604125977, 3.8789172172546387, 4.19050407409668, 4.502090930938721, 4.813677787780762, 5.125264644622803, 5.436851501464844, 5.748438358306885, 6.060025215148926, 6.371612071990967, 6.683198928833008, 6.994785785675049, 7.30637264251709, 7.617959499359131, 7.929546356201172, 8.241132736206055, 8.552720069885254]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 6.0, 7.0, 10.0, 5.0, 18.0, 19.0, 13.0, 18.0, 25.0, 30.0, 25.0, 40.0, 33.0, 43.0, 52.0, 47.0, 64.0, 50.0, 39.0, 63.0, 46.0, 45.0, 44.0, 36.0, 42.0, 33.0, 29.0, 18.0, 22.0, 15.0, 19.0, 9.0, 8.0, 7.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.017878532409668, -5.813581943511963, -5.609285354614258, -5.404989242553711, -5.200692653656006, -4.996396064758301, -4.792099475860596, -4.587802886962891, -4.3835062980651855, -4.1792097091674805, -3.9749133586883545, -3.7706167697906494, -3.5663201808929443, -3.3620238304138184, -3.1577272415161133, -2.953430652618408, -2.7491343021392822, -2.544837713241577, -2.340541362762451, -2.136244773864746, -1.931948184967041, -1.7276517152786255, -1.52335524559021, -1.3190586566925049, -1.1147621870040894, -0.910465657711029, -0.7061691284179688, -0.5018726587295532, -0.2975761294364929, -0.09327960014343262, 0.11101686954498291, 0.315313458442688, 0.5196099281311035, 0.7239064574241638, 0.9282029867172241, 1.1324994564056396, 1.3367960453033447, 1.5410925149917603, 1.7453889846801758, 1.9496855735778809, 2.153982162475586, 2.358278751373291, 2.562575101852417, 2.766871690750122, 2.971168279647827, 3.175464630126953, 3.379761219024658, 3.5840578079223633, 3.7883541584014893, 3.9926507472991943, 4.19694709777832, 4.401243686676025, 4.6055402755737305, 4.8098368644714355, 5.014133453369141, 5.2184295654296875, 5.422726154327393, 5.627022743225098, 5.831319332122803, 6.035615921020508, 6.239912033081055, 6.44420862197876, 6.648505210876465, 6.85280179977417, 7.057098388671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 11.0, 21.0, 23.0, 31.0, 42.0, 58.0, 95.0, 131.0, 176.0, 275.0, 355.0, 545.0, 858.0, 1395.0, 2143.0, 3473.0, 5774.0, 10200.0, 17986.0, 33186.0, 62743.0, 118936.0, 204653.0, 235327.0, 159956.0, 86716.0, 45739.0, 24265.0, 13404.0, 7659.0, 4652.0, 2716.0, 1750.0, 1095.0, 680.0, 465.0, 324.0, 211.0, 142.0, 109.0, 62.0, 50.0, 33.0, 23.0, 25.0, 10.0, 13.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.1091766357421875, -1.069915771484375, -1.0306549072265625, -0.99139404296875, -0.9521331787109375, -0.912872314453125, -0.8736114501953125, -0.8343505859375, -0.7950897216796875, -0.755828857421875, -0.7165679931640625, -0.67730712890625, -0.6380462646484375, -0.598785400390625, -0.5595245361328125, -0.520263671875, -0.4810028076171875, -0.441741943359375, -0.4024810791015625, -0.36322021484375, -0.3239593505859375, -0.284698486328125, -0.2454376220703125, -0.2061767578125, -0.1669158935546875, -0.127655029296875, -0.0883941650390625, -0.04913330078125, -0.0098724365234375, 0.029388427734375, 0.0686492919921875, 0.10791015625, 0.1471710205078125, 0.186431884765625, 0.2256927490234375, 0.26495361328125, 0.3042144775390625, 0.343475341796875, 0.3827362060546875, 0.4219970703125, 0.4612579345703125, 0.500518798828125, 0.5397796630859375, 0.57904052734375, 0.6183013916015625, 0.657562255859375, 0.6968231201171875, 0.736083984375, 0.7753448486328125, 0.814605712890625, 0.8538665771484375, 0.89312744140625, 0.9323883056640625, 0.971649169921875, 1.0109100341796875, 1.0501708984375, 1.0894317626953125, 1.128692626953125, 1.1679534912109375, 1.20721435546875, 1.2464752197265625, 1.285736083984375, 1.3249969482421875, 1.3642578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 10.0, 7.0, 23.0, 10.0, 25.0, 24.0, 32.0, 30.0, 35.0, 46.0, 53.0, 71.0, 60.0, 59.0, 57.0, 66.0, 62.0, 43.0, 43.0, 44.0, 39.0, 32.0, 17.0, 17.0, 16.0, 17.0, 11.0, 14.0, 6.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424072265625, -0.41042327880859375, -0.3967742919921875, -0.38312530517578125, -0.369476318359375, -0.35582733154296875, -0.3421783447265625, -0.32852935791015625, -0.31488037109375, -0.30123138427734375, -0.2875823974609375, -0.27393341064453125, -0.260284423828125, -0.24663543701171875, -0.2329864501953125, -0.21933746337890625, -0.2056884765625, -0.19203948974609375, -0.1783905029296875, -0.16474151611328125, -0.151092529296875, -0.13744354248046875, -0.1237945556640625, -0.11014556884765625, -0.09649658203125, -0.08284759521484375, -0.0691986083984375, -0.05554962158203125, -0.041900634765625, -0.02825164794921875, -0.0146026611328125, -0.00095367431640625, 0.0126953125, 0.02634429931640625, 0.0399932861328125, 0.05364227294921875, 0.067291259765625, 0.08094024658203125, 0.0945892333984375, 0.10823822021484375, 0.12188720703125, 0.13553619384765625, 0.1491851806640625, 0.16283416748046875, 0.176483154296875, 0.19013214111328125, 0.2037811279296875, 0.21743011474609375, 0.2310791015625, 0.24472808837890625, 0.2583770751953125, 0.27202606201171875, 0.285675048828125, 0.29932403564453125, 0.3129730224609375, 0.32662200927734375, 0.34027099609375, 0.35391998291015625, 0.3675689697265625, 0.38121795654296875, 0.394866943359375, 0.40851593017578125, 0.4221649169921875, 0.43581390380859375, 0.449462890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 8.0, 14.0, 10.0, 32.0, 19.0, 32.0, 62.0, 119.0, 163.0, 327.0, 535.0, 1127.0, 2630.0, 6915.0, 20800.0, 80812.0, 380511.0, 425037.0, 93213.0, 23198.0, 7468.0, 2745.0, 1285.0, 623.0, 323.0, 191.0, 109.0, 67.0, 43.0, 28.0, 15.0, 17.0, 12.0, 21.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.134765625, -3.050140380859375, -2.96551513671875, -2.880889892578125, -2.7962646484375, -2.711639404296875, -2.62701416015625, -2.542388916015625, -2.457763671875, -2.373138427734375, -2.28851318359375, -2.203887939453125, -2.1192626953125, -2.034637451171875, -1.95001220703125, -1.865386962890625, -1.78076171875, -1.696136474609375, -1.61151123046875, -1.526885986328125, -1.4422607421875, -1.357635498046875, -1.27301025390625, -1.188385009765625, -1.103759765625, -1.019134521484375, -0.93450927734375, -0.849884033203125, -0.7652587890625, -0.680633544921875, -0.59600830078125, -0.511383056640625, -0.4267578125, -0.342132568359375, -0.25750732421875, -0.172882080078125, -0.0882568359375, -0.003631591796875, 0.08099365234375, 0.165618896484375, 0.250244140625, 0.334869384765625, 0.41949462890625, 0.504119873046875, 0.5887451171875, 0.673370361328125, 0.75799560546875, 0.842620849609375, 0.92724609375, 1.011871337890625, 1.09649658203125, 1.181121826171875, 1.2657470703125, 1.350372314453125, 1.43499755859375, 1.519622802734375, 1.604248046875, 1.688873291015625, 1.77349853515625, 1.858123779296875, 1.9427490234375, 2.027374267578125, 2.11199951171875, 2.196624755859375, 2.28125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 10.0, 3.0, 10.0, 9.0, 15.0, 18.0, 18.0, 21.0, 28.0, 34.0, 29.0, 33.0, 32.0, 41.0, 35.0, 32.0, 47.0, 48.0, 41.0, 47.0, 51.0, 40.0, 33.0, 47.0, 42.0, 36.0, 37.0, 23.0, 27.0, 25.0, 19.0, 13.0, 7.0, 11.0, 8.0, 8.0, 9.0, 9.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.7518463134765625, -1.690216064453125, -1.6285858154296875, -1.56695556640625, -1.5053253173828125, -1.443695068359375, -1.3820648193359375, -1.3204345703125, -1.2588043212890625, -1.197174072265625, -1.1355438232421875, -1.07391357421875, -1.0122833251953125, -0.950653076171875, -0.8890228271484375, -0.827392578125, -0.7657623291015625, -0.704132080078125, -0.6425018310546875, -0.58087158203125, -0.5192413330078125, -0.457611083984375, -0.3959808349609375, -0.3343505859375, -0.2727203369140625, -0.211090087890625, -0.1494598388671875, -0.08782958984375, -0.0261993408203125, 0.035430908203125, 0.0970611572265625, 0.15869140625, 0.2203216552734375, 0.281951904296875, 0.3435821533203125, 0.40521240234375, 0.4668426513671875, 0.528472900390625, 0.5901031494140625, 0.6517333984375, 0.7133636474609375, 0.774993896484375, 0.8366241455078125, 0.89825439453125, 0.9598846435546875, 1.021514892578125, 1.0831451416015625, 1.144775390625, 1.2064056396484375, 1.268035888671875, 1.3296661376953125, 1.39129638671875, 1.4529266357421875, 1.514556884765625, 1.5761871337890625, 1.6378173828125, 1.6994476318359375, 1.761077880859375, 1.8227081298828125, 1.88433837890625, 1.9459686279296875, 2.007598876953125, 2.0692291259765625, 2.130859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 0.0, 4.0, 1.0, 2.0, 7.0, 10.0, 14.0, 28.0, 33.0, 54.0, 45.0, 104.0, 182.0, 310.0, 636.0, 1456.0, 3909.0, 14621.0, 130666.0, 807018.0, 73133.0, 10760.0, 3146.0, 1186.0, 541.0, 258.0, 161.0, 90.0, 64.0, 34.0, 28.0, 15.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.7091064453125, -5.508056640625, -5.3070068359375, -5.10595703125, -4.9049072265625, -4.703857421875, -4.5028076171875, -4.3017578125, -4.1007080078125, -3.899658203125, -3.6986083984375, -3.49755859375, -3.2965087890625, -3.095458984375, -2.8944091796875, -2.693359375, -2.4923095703125, -2.291259765625, -2.0902099609375, -1.88916015625, -1.6881103515625, -1.487060546875, -1.2860107421875, -1.0849609375, -0.8839111328125, -0.682861328125, -0.4818115234375, -0.28076171875, -0.0797119140625, 0.121337890625, 0.3223876953125, 0.5234375, 0.7244873046875, 0.925537109375, 1.1265869140625, 1.32763671875, 1.5286865234375, 1.729736328125, 1.9307861328125, 2.1318359375, 2.3328857421875, 2.533935546875, 2.7349853515625, 2.93603515625, 3.1370849609375, 3.338134765625, 3.5391845703125, 3.740234375, 3.9412841796875, 4.142333984375, 4.3433837890625, 4.54443359375, 4.7454833984375, 4.946533203125, 5.1475830078125, 5.3486328125, 5.5496826171875, 5.750732421875, 5.9517822265625, 6.15283203125, 6.3538818359375, 6.554931640625, 6.7559814453125, 6.95703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 11.0, 17.0, 28.0, 28.0, 40.0, 57.0, 75.0, 88.0, 86.0, 114.0, 103.0, 89.0, 69.0, 58.0, 31.0, 26.0, 19.0, 8.0, 14.0, 9.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001404285430908203, -0.0001338757574558258, -0.0001273229718208313, -0.00012077018618583679, -0.00011421740055084229, -0.00010766461491584778, -0.00010111182928085327, -9.455904364585876e-05, -8.800625801086426e-05, -8.145347237586975e-05, -7.490068674087524e-05, -6.834790110588074e-05, -6.179511547088623e-05, -5.5242329835891724e-05, -4.868954420089722e-05, -4.213675856590271e-05, -3.55839729309082e-05, -2.9031187295913696e-05, -2.247840166091919e-05, -1.5925616025924683e-05, -9.372830390930176e-06, -2.820044755935669e-06, 3.732740879058838e-06, 1.0285526514053345e-05, 1.683831214904785e-05, 2.339109778404236e-05, 2.9943883419036865e-05, 3.649666905403137e-05, 4.304945468902588e-05, 4.9602240324020386e-05, 5.615502595901489e-05, 6.27078115940094e-05, 6.92605972290039e-05, 7.581338286399841e-05, 8.236616849899292e-05, 8.891895413398743e-05, 9.547173976898193e-05, 0.00010202452540397644, 0.00010857731103897095, 0.00011513009667396545, 0.00012168288230895996, 0.00012823566794395447, 0.00013478845357894897, 0.00014134123921394348, 0.000147894024848938, 0.0001544468104839325, 0.000160999596118927, 0.0001675523817539215, 0.00017410516738891602, 0.00018065795302391052, 0.00018721073865890503, 0.00019376352429389954, 0.00020031630992889404, 0.00020686909556388855, 0.00021342188119888306, 0.00021997466683387756, 0.00022652745246887207, 0.00023308023810386658, 0.00023963302373886108, 0.0002461858093738556, 0.0002527385950088501, 0.0002592913806438446, 0.0002658441662788391, 0.0002723969519138336, 0.0002789497375488281]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 2.0, 5.0, 13.0, 20.0, 26.0, 30.0, 51.0, 65.0, 102.0, 134.0, 182.0, 291.0, 459.0, 804.0, 1249.0, 2217.0, 4152.0, 8586.0, 22076.0, 80842.0, 511638.0, 329122.0, 54415.0, 16845.0, 7007.0, 3402.0, 1788.0, 1050.0, 637.0, 429.0, 290.0, 200.0, 109.0, 89.0, 58.0, 51.0, 27.0, 18.0, 20.0, 14.0, 5.0, 10.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.734375, -3.6171875, -3.5, -3.3828125, -3.265625, -3.1484375, -3.03125, -2.9140625, -2.796875, -2.6796875, -2.5625, -2.4453125, -2.328125, -2.2109375, -2.09375, -1.9765625, -1.859375, -1.7421875, -1.625, -1.5078125, -1.390625, -1.2734375, -1.15625, -1.0390625, -0.921875, -0.8046875, -0.6875, -0.5703125, -0.453125, -0.3359375, -0.21875, -0.1015625, 0.015625, 0.1328125, 0.25, 0.3671875, 0.484375, 0.6015625, 0.71875, 0.8359375, 0.953125, 1.0703125, 1.1875, 1.3046875, 1.421875, 1.5390625, 1.65625, 1.7734375, 1.890625, 2.0078125, 2.125, 2.2421875, 2.359375, 2.4765625, 2.59375, 2.7109375, 2.828125, 2.9453125, 3.0625, 3.1796875, 3.296875, 3.4140625, 3.53125, 3.6484375, 3.765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 5.0, 3.0, 8.0, 14.0, 18.0, 26.0, 53.0, 64.0, 104.0, 108.0, 138.0, 117.0, 116.0, 53.0, 36.0, 31.0, 20.0, 16.0, 9.0, 6.0, 8.0, 3.0, 6.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.03125, -3.92645263671875, -3.8216552734375, -3.71685791015625, -3.612060546875, -3.50726318359375, -3.4024658203125, -3.29766845703125, -3.19287109375, -3.08807373046875, -2.9832763671875, -2.87847900390625, -2.773681640625, -2.66888427734375, -2.5640869140625, -2.45928955078125, -2.3544921875, -2.24969482421875, -2.1448974609375, -2.04010009765625, -1.935302734375, -1.83050537109375, -1.7257080078125, -1.62091064453125, -1.51611328125, -1.41131591796875, -1.3065185546875, -1.20172119140625, -1.096923828125, -0.99212646484375, -0.8873291015625, -0.78253173828125, -0.677734375, -0.57293701171875, -0.4681396484375, -0.36334228515625, -0.258544921875, -0.15374755859375, -0.0489501953125, 0.05584716796875, 0.16064453125, 0.26544189453125, 0.3702392578125, 0.47503662109375, 0.579833984375, 0.68463134765625, 0.7894287109375, 0.89422607421875, 0.9990234375, 1.10382080078125, 1.2086181640625, 1.31341552734375, 1.418212890625, 1.52301025390625, 1.6278076171875, 1.73260498046875, 1.83740234375, 1.94219970703125, 2.0469970703125, 2.15179443359375, 2.256591796875, 2.36138916015625, 2.4661865234375, 2.57098388671875, 2.67578125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 13.0, 18.0, 29.0, 53.0, 103.0, 155.0, 198.0, 175.0, 112.0, 60.0, 32.0, 15.0, 9.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.592954635620117, -29.657163619995117, -28.721370697021484, -27.785579681396484, -26.84978675842285, -25.91399574279785, -24.97820281982422, -24.04241180419922, -23.106618881225586, -22.170827865600586, -21.235034942626953, -20.299243927001953, -19.36345100402832, -18.42765998840332, -17.491867065429688, -16.556076049804688, -15.620284080505371, -14.684492111206055, -13.748700141906738, -12.812908172607422, -11.877116203308105, -10.941324234008789, -10.005533218383789, -9.069740295410156, -8.133949279785156, -7.19815731048584, -6.262365341186523, -5.326573371887207, -4.390781402587891, -3.4549899101257324, -2.519197940826416, -1.5834059715270996, -0.647613525390625, 0.28817838430404663, 1.2239702939987183, 2.159762144088745, 3.0955541133880615, 4.031345844268799, 4.967137813568115, 5.902929782867432, 6.838721752166748, 7.7745137214660645, 8.710305213928223, 9.646097183227539, 10.581889152526855, 11.517681121826172, 12.453473091125488, 13.389265060424805, 14.325057029724121, 15.260848999023438, 16.196640014648438, 17.13243293762207, 18.06822395324707, 19.004016876220703, 19.939807891845703, 20.875600814819336, 21.811391830444336, 22.747182846069336, 23.68297576904297, 24.61876678466797, 25.5545597076416, 26.4903507232666, 27.426143646240234, 28.361934661865234, 29.297727584838867]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 6.0, 13.0, 16.0, 19.0, 31.0, 58.0, 65.0, 89.0, 109.0, 113.0, 109.0, 104.0, 64.0, 46.0, 40.0, 24.0, 17.0, 10.0, 6.0, 6.0, 1.0, 5.0, 7.0, 6.0, 8.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-37.261329650878906, -36.241424560546875, -35.221519470214844, -34.20161437988281, -33.18170928955078, -32.16180419921875, -31.14189910888672, -30.121994018554688, -29.102088928222656, -28.082183837890625, -27.062278747558594, -26.042373657226562, -25.02246856689453, -24.0025634765625, -22.98265838623047, -21.962753295898438, -20.942848205566406, -19.922943115234375, -18.903038024902344, -17.883132934570312, -16.86322784423828, -15.84332275390625, -14.823417663574219, -13.803512573242188, -12.783607482910156, -11.763702392578125, -10.743797302246094, -9.723892211914062, -8.703987121582031, -7.68408203125, -6.664176940917969, -5.6442718505859375, -4.624366760253906, -3.604461669921875, -2.5845565795898438, -1.5646514892578125, -0.5447463989257812, 0.47515869140625, 1.4950637817382812, 2.5149688720703125, 3.5348739624023438, 4.554779052734375, 5.574684143066406, 6.5945892333984375, 7.614494323730469, 8.6343994140625, 9.654304504394531, 10.674209594726562, 11.694114685058594, 12.714019775390625, 13.733924865722656, 14.753829956054688, 15.773735046386719, 16.79364013671875, 17.81354522705078, 18.833450317382812, 19.853355407714844, 20.873260498046875, 21.893165588378906, 22.913070678710938, 23.93297576904297, 24.952880859375, 25.97278594970703, 26.992691040039062, 28.012596130371094]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 0.0, 6.0, 3.0, 4.0, 13.0, 13.0, 11.0, 31.0, 34.0, 56.0, 82.0, 137.0, 222.0, 467.0, 951.0, 1967.0, 4728.0, 11654.0, 32715.0, 111761.0, 714555.0, 3018725.0, 211643.0, 53947.0, 18223.0, 6778.0, 2955.0, 1257.0, 611.0, 291.0, 138.0, 82.0, 62.0, 40.0, 30.0, 21.0, 13.0, 13.0, 10.0, 6.0, 5.0, 2.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.59375, -7.3651123046875, -7.136474609375, -6.9078369140625, -6.67919921875, -6.4505615234375, -6.221923828125, -5.9932861328125, -5.7646484375, -5.5360107421875, -5.307373046875, -5.0787353515625, -4.85009765625, -4.6214599609375, -4.392822265625, -4.1641845703125, -3.935546875, -3.7069091796875, -3.478271484375, -3.2496337890625, -3.02099609375, -2.7923583984375, -2.563720703125, -2.3350830078125, -2.1064453125, -1.8778076171875, -1.649169921875, -1.4205322265625, -1.19189453125, -0.9632568359375, -0.734619140625, -0.5059814453125, -0.27734375, -0.0487060546875, 0.179931640625, 0.4085693359375, 0.63720703125, 0.8658447265625, 1.094482421875, 1.3231201171875, 1.5517578125, 1.7803955078125, 2.009033203125, 2.2376708984375, 2.46630859375, 2.6949462890625, 2.923583984375, 3.1522216796875, 3.380859375, 3.6094970703125, 3.838134765625, 4.0667724609375, 4.29541015625, 4.5240478515625, 4.752685546875, 4.9813232421875, 5.2099609375, 5.4385986328125, 5.667236328125, 5.8958740234375, 6.12451171875, 6.3531494140625, 6.581787109375, 6.8104248046875, 7.0390625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 11.0, 7.0, 15.0, 16.0, 20.0, 16.0, 28.0, 25.0, 26.0, 31.0, 33.0, 31.0, 52.0, 46.0, 43.0, 58.0, 49.0, 41.0, 49.0, 41.0, 47.0, 36.0, 36.0, 30.0, 33.0, 21.0, 21.0, 16.0, 17.0, 11.0, 23.0, 12.0, 11.0, 7.0, 3.0, 8.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353759765625, -0.3422393798828125, -0.330718994140625, -0.3191986083984375, -0.30767822265625, -0.2961578369140625, -0.284637451171875, -0.2731170654296875, -0.2615966796875, -0.2500762939453125, -0.238555908203125, -0.2270355224609375, -0.21551513671875, -0.2039947509765625, -0.192474365234375, -0.1809539794921875, -0.16943359375, -0.1579132080078125, -0.146392822265625, -0.1348724365234375, -0.12335205078125, -0.1118316650390625, -0.100311279296875, -0.0887908935546875, -0.0772705078125, -0.0657501220703125, -0.054229736328125, -0.0427093505859375, -0.03118896484375, -0.0196685791015625, -0.008148193359375, 0.0033721923828125, 0.014892578125, 0.0264129638671875, 0.037933349609375, 0.0494537353515625, 0.06097412109375, 0.0724945068359375, 0.084014892578125, 0.0955352783203125, 0.1070556640625, 0.1185760498046875, 0.130096435546875, 0.1416168212890625, 0.15313720703125, 0.1646575927734375, 0.176177978515625, 0.1876983642578125, 0.19921875, 0.2107391357421875, 0.222259521484375, 0.2337799072265625, 0.24530029296875, 0.2568206787109375, 0.268341064453125, 0.2798614501953125, 0.2913818359375, 0.3029022216796875, 0.314422607421875, 0.3259429931640625, 0.33746337890625, 0.3489837646484375, 0.360504150390625, 0.3720245361328125, 0.383544921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 20.0, 16.0, 37.0, 44.0, 58.0, 91.0, 152.0, 201.0, 373.0, 617.0, 1018.0, 1814.0, 3267.0, 5794.0, 11013.0, 22458.0, 46800.0, 108222.0, 295651.0, 1591978.0, 1606506.0, 297076.0, 108049.0, 46559.0, 21730.0, 10984.0, 5828.0, 3277.0, 1801.0, 1081.0, 641.0, 426.0, 231.0, 149.0, 110.0, 55.0, 40.0, 22.0, 31.0, 14.0, 10.0, 6.0, 2.0, 3.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9609375, -3.840911865234375, -3.72088623046875, -3.600860595703125, -3.4808349609375, -3.360809326171875, -3.24078369140625, -3.120758056640625, -3.000732421875, -2.880706787109375, -2.76068115234375, -2.640655517578125, -2.5206298828125, -2.400604248046875, -2.28057861328125, -2.160552978515625, -2.04052734375, -1.920501708984375, -1.80047607421875, -1.680450439453125, -1.5604248046875, -1.440399169921875, -1.32037353515625, -1.200347900390625, -1.080322265625, -0.960296630859375, -0.84027099609375, -0.720245361328125, -0.6002197265625, -0.480194091796875, -0.36016845703125, -0.240142822265625, -0.1201171875, -9.1552734375e-05, 0.11993408203125, 0.239959716796875, 0.3599853515625, 0.480010986328125, 0.60003662109375, 0.720062255859375, 0.840087890625, 0.960113525390625, 1.08013916015625, 1.200164794921875, 1.3201904296875, 1.440216064453125, 1.56024169921875, 1.680267333984375, 1.80029296875, 1.920318603515625, 2.04034423828125, 2.160369873046875, 2.2803955078125, 2.400421142578125, 2.52044677734375, 2.640472412109375, 2.760498046875, 2.880523681640625, 3.00054931640625, 3.120574951171875, 3.2406005859375, 3.360626220703125, 3.48065185546875, 3.600677490234375, 3.720703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 12.0, 7.0, 8.0, 15.0, 14.0, 22.0, 26.0, 33.0, 44.0, 62.0, 82.0, 99.0, 155.0, 240.0, 369.0, 908.0, 849.0, 362.0, 211.0, 151.0, 104.0, 72.0, 49.0, 46.0, 30.0, 23.0, 14.0, 18.0, 8.0, 8.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.85107421875, -0.8252716064453125, -0.799468994140625, -0.7736663818359375, -0.74786376953125, -0.7220611572265625, -0.696258544921875, -0.6704559326171875, -0.6446533203125, -0.6188507080078125, -0.593048095703125, -0.5672454833984375, -0.54144287109375, -0.5156402587890625, -0.489837646484375, -0.4640350341796875, -0.438232421875, -0.4124298095703125, -0.386627197265625, -0.3608245849609375, -0.33502197265625, -0.3092193603515625, -0.283416748046875, -0.2576141357421875, -0.2318115234375, -0.2060089111328125, -0.180206298828125, -0.1544036865234375, -0.12860107421875, -0.1027984619140625, -0.076995849609375, -0.0511932373046875, -0.025390625, 0.0004119873046875, 0.026214599609375, 0.0520172119140625, 0.07781982421875, 0.1036224365234375, 0.129425048828125, 0.1552276611328125, 0.1810302734375, 0.2068328857421875, 0.232635498046875, 0.2584381103515625, 0.28424072265625, 0.3100433349609375, 0.335845947265625, 0.3616485595703125, 0.387451171875, 0.4132537841796875, 0.439056396484375, 0.4648590087890625, 0.49066162109375, 0.5164642333984375, 0.542266845703125, 0.5680694580078125, 0.5938720703125, 0.6196746826171875, 0.645477294921875, 0.6712799072265625, 0.69708251953125, 0.7228851318359375, 0.748687744140625, 0.7744903564453125, 0.80029296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 4.0, 9.0, 23.0, 43.0, 70.0, 115.0, 147.0, 177.0, 144.0, 113.0, 58.0, 35.0, 19.0, 15.0, 10.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97010612487793, -4.688153266906738, -4.406199932098389, -4.124247074127197, -3.8422939777374268, -3.5603408813476562, -3.278388023376465, -2.9964349269866943, -2.714481830596924, -2.4325287342071533, -2.150575637817383, -1.8686227798461914, -1.586669683456421, -1.3047165870666504, -1.0227636098861694, -0.7408106327056885, -0.45885753631591797, -0.17690449953079224, 0.1050485372543335, 0.38700157403945923, 0.668954610824585, 0.9509077072143555, 1.2328606843948364, 1.5148136615753174, 1.796766757965088, 2.0787198543548584, 2.360672950744629, 2.6426258087158203, 2.924578905105591, 3.2065320014953613, 3.4884848594665527, 3.7704379558563232, 4.052390098571777, 4.334342956542969, 4.616296291351318, 4.89824914932251, 5.180202484130859, 5.462155342102051, 5.744108200073242, 6.026061058044434, 6.308014392852783, 6.589967250823975, 6.871920585632324, 7.153873443603516, 7.435826301574707, 7.717779636383057, 7.999732494354248, 8.281685829162598, 8.563638687133789, 8.84559154510498, 9.127544403076172, 9.40949821472168, 9.691451072692871, 9.973403930664062, 10.255356788635254, 10.537309646606445, 10.819263458251953, 11.101216316223145, 11.383169174194336, 11.665122985839844, 11.947075843811035, 12.229028701782227, 12.510981559753418, 12.79293441772461, 13.0748872756958]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 14.0, 10.0, 20.0, 11.0, 23.0, 30.0, 42.0, 55.0, 56.0, 59.0, 62.0, 62.0, 69.0, 62.0, 67.0, 61.0, 49.0, 39.0, 36.0, 42.0, 35.0, 22.0, 18.0, 14.0, 13.0, 7.0, 5.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.490595817565918, -4.343323230743408, -4.196050643920898, -4.048778057098389, -3.901505470275879, -3.754232883453369, -3.6069605350494385, -3.4596879482269287, -3.312415361404419, -3.165142774581909, -3.0178701877593994, -2.8705976009368896, -2.723325252532959, -2.576052665710449, -2.4287800788879395, -2.2815074920654297, -2.13423490524292, -1.9869623184204102, -1.8396897315979004, -1.6924172639846802, -1.5451446771621704, -1.3978720903396606, -1.2505996227264404, -1.1033270359039307, -0.9560544490814209, -0.8087818622589111, -0.6615093350410461, -0.5142368078231812, -0.3669642210006714, -0.21969163417816162, -0.07241910696029663, 0.07485342025756836, 0.22212600708007812, 0.3693985641002655, 0.5166711211204529, 0.6639436483383179, 0.8112162351608276, 0.9584888219833374, 1.1057612895965576, 1.2530338764190674, 1.4003064632415771, 1.547579050064087, 1.6948516368865967, 1.842124104499817, 1.9893966913223267, 2.136669158935547, 2.2839417457580566, 2.4312143325805664, 2.578486919403076, 2.725759506225586, 2.8730320930480957, 3.0203046798706055, 3.1675772666931152, 3.314849853515625, 3.4621222019195557, 3.6093947887420654, 3.756667375564575, 3.903939962387085, 4.051212310791016, 4.198484897613525, 4.345757484436035, 4.493030071258545, 4.640302658081055, 4.7875752449035645, 4.934847831726074]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 8.0, 14.0, 15.0, 22.0, 24.0, 50.0, 77.0, 153.0, 349.0, 1039.0, 3274.0, 11980.0, 52321.0, 247265.0, 510074.0, 172695.0, 36413.0, 8874.0, 2495.0, 775.0, 255.0, 134.0, 60.0, 44.0, 36.0, 18.0, 16.0, 12.0, 18.0, 6.0, 3.0, 7.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.58697509765625, -6.3770751953125, -6.16717529296875, -5.957275390625, -5.74737548828125, -5.5374755859375, -5.32757568359375, -5.11767578125, -4.90777587890625, -4.6978759765625, -4.48797607421875, -4.278076171875, -4.06817626953125, -3.8582763671875, -3.64837646484375, -3.4384765625, -3.22857666015625, -3.0186767578125, -2.80877685546875, -2.598876953125, -2.38897705078125, -2.1790771484375, -1.96917724609375, -1.75927734375, -1.54937744140625, -1.3394775390625, -1.12957763671875, -0.919677734375, -0.70977783203125, -0.4998779296875, -0.28997802734375, -0.080078125, 0.12982177734375, 0.3397216796875, 0.54962158203125, 0.759521484375, 0.96942138671875, 1.1793212890625, 1.38922119140625, 1.59912109375, 1.80902099609375, 2.0189208984375, 2.22882080078125, 2.438720703125, 2.64862060546875, 2.8585205078125, 3.06842041015625, 3.2783203125, 3.48822021484375, 3.6981201171875, 3.90802001953125, 4.117919921875, 4.32781982421875, 4.5377197265625, 4.74761962890625, 4.95751953125, 5.16741943359375, 5.3773193359375, 5.58721923828125, 5.797119140625, 6.00701904296875, 6.2169189453125, 6.42681884765625, 6.63671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 10.0, 9.0, 16.0, 23.0, 19.0, 20.0, 20.0, 31.0, 42.0, 32.0, 42.0, 37.0, 58.0, 64.0, 50.0, 44.0, 50.0, 60.0, 37.0, 35.0, 37.0, 40.0, 32.0, 35.0, 18.0, 20.0, 20.0, 17.0, 7.0, 14.0, 10.0, 4.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.402587890625, -0.3901023864746094, -0.37761688232421875, -0.3651313781738281, -0.3526458740234375, -0.3401603698730469, -0.32767486572265625, -0.3151893615722656, -0.302703857421875, -0.2902183532714844, -0.27773284912109375, -0.2652473449707031, -0.2527618408203125, -0.24027633666992188, -0.22779083251953125, -0.21530532836914062, -0.20281982421875, -0.19033432006835938, -0.17784881591796875, -0.16536331176757812, -0.1528778076171875, -0.14039230346679688, -0.12790679931640625, -0.11542129516601562, -0.102935791015625, -0.09045028686523438, -0.07796478271484375, -0.06547927856445312, -0.0529937744140625, -0.040508270263671875, -0.02802276611328125, -0.015537261962890625, -0.0030517578125, 0.009433746337890625, 0.02191925048828125, 0.034404754638671875, 0.0468902587890625, 0.059375762939453125, 0.07186126708984375, 0.08434677124023438, 0.096832275390625, 0.10931777954101562, 0.12180328369140625, 0.13428878784179688, 0.1467742919921875, 0.15925979614257812, 0.17174530029296875, 0.18423080444335938, 0.19671630859375, 0.20920181274414062, 0.22168731689453125, 0.23417282104492188, 0.2466583251953125, 0.2591438293457031, 0.27162933349609375, 0.2841148376464844, 0.296600341796875, 0.3090858459472656, 0.32157135009765625, 0.3340568542480469, 0.3465423583984375, 0.3590278625488281, 0.37151336669921875, 0.3839988708496094, 0.396484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 13.0, 22.0, 53.0, 111.0, 350.0, 1327.0, 5552.0, 31691.0, 285063.0, 628807.0, 80426.0, 11736.0, 2444.0, 600.0, 197.0, 78.0, 38.0, 15.0, 7.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8046875, -8.56817626953125, -8.3316650390625, -8.09515380859375, -7.858642578125, -7.62213134765625, -7.3856201171875, -7.14910888671875, -6.91259765625, -6.67608642578125, -6.4395751953125, -6.20306396484375, -5.966552734375, -5.73004150390625, -5.4935302734375, -5.25701904296875, -5.0205078125, -4.78399658203125, -4.5474853515625, -4.31097412109375, -4.074462890625, -3.83795166015625, -3.6014404296875, -3.36492919921875, -3.12841796875, -2.89190673828125, -2.6553955078125, -2.41888427734375, -2.182373046875, -1.94586181640625, -1.7093505859375, -1.47283935546875, -1.236328125, -0.99981689453125, -0.7633056640625, -0.52679443359375, -0.290283203125, -0.05377197265625, 0.1827392578125, 0.41925048828125, 0.65576171875, 0.89227294921875, 1.1287841796875, 1.36529541015625, 1.601806640625, 1.83831787109375, 2.0748291015625, 2.31134033203125, 2.5478515625, 2.78436279296875, 3.0208740234375, 3.25738525390625, 3.493896484375, 3.73040771484375, 3.9669189453125, 4.20343017578125, 4.43994140625, 4.67645263671875, 4.9129638671875, 5.14947509765625, 5.385986328125, 5.62249755859375, 5.8590087890625, 6.09552001953125, 6.33203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 10.0, 8.0, 8.0, 15.0, 10.0, 18.0, 9.0, 22.0, 23.0, 33.0, 26.0, 32.0, 31.0, 42.0, 45.0, 54.0, 50.0, 55.0, 54.0, 50.0, 24.0, 41.0, 48.0, 29.0, 31.0, 31.0, 35.0, 23.0, 27.0, 18.0, 13.0, 24.0, 8.0, 2.0, 13.0, 9.0, 7.0, 5.0, 7.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.01953125, -1.955780029296875, -1.89202880859375, -1.828277587890625, -1.7645263671875, -1.700775146484375, -1.63702392578125, -1.573272705078125, -1.509521484375, -1.445770263671875, -1.38201904296875, -1.318267822265625, -1.2545166015625, -1.190765380859375, -1.12701416015625, -1.063262939453125, -0.99951171875, -0.935760498046875, -0.87200927734375, -0.808258056640625, -0.7445068359375, -0.680755615234375, -0.61700439453125, -0.553253173828125, -0.489501953125, -0.425750732421875, -0.36199951171875, -0.298248291015625, -0.2344970703125, -0.170745849609375, -0.10699462890625, -0.043243408203125, 0.0205078125, 0.084259033203125, 0.14801025390625, 0.211761474609375, 0.2755126953125, 0.339263916015625, 0.40301513671875, 0.466766357421875, 0.530517578125, 0.594268798828125, 0.65802001953125, 0.721771240234375, 0.7855224609375, 0.849273681640625, 0.91302490234375, 0.976776123046875, 1.04052734375, 1.104278564453125, 1.16802978515625, 1.231781005859375, 1.2955322265625, 1.359283447265625, 1.42303466796875, 1.486785888671875, 1.550537109375, 1.614288330078125, 1.67803955078125, 1.741790771484375, 1.8055419921875, 1.869293212890625, 1.93304443359375, 1.996795654296875, 2.060546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 16.0, 27.0, 54.0, 94.0, 243.0, 636.0, 2020.0, 11543.0, 851747.0, 174246.0, 5820.0, 1318.0, 427.0, 169.0, 86.0, 37.0, 29.0, 12.0, 10.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.875, -39.942626953125, -39.01025390625, -38.077880859375, -37.1455078125, -36.213134765625, -35.28076171875, -34.348388671875, -33.416015625, -32.483642578125, -31.55126953125, -30.618896484375, -29.6865234375, -28.754150390625, -27.82177734375, -26.889404296875, -25.95703125, -25.024658203125, -24.09228515625, -23.159912109375, -22.2275390625, -21.295166015625, -20.36279296875, -19.430419921875, -18.498046875, -17.565673828125, -16.63330078125, -15.700927734375, -14.7685546875, -13.836181640625, -12.90380859375, -11.971435546875, -11.0390625, -10.106689453125, -9.17431640625, -8.241943359375, -7.3095703125, -6.377197265625, -5.44482421875, -4.512451171875, -3.580078125, -2.647705078125, -1.71533203125, -0.782958984375, 0.1494140625, 1.081787109375, 2.01416015625, 2.946533203125, 3.87890625, 4.811279296875, 5.74365234375, 6.676025390625, 7.6083984375, 8.540771484375, 9.47314453125, 10.405517578125, 11.337890625, 12.270263671875, 13.20263671875, 14.135009765625, 15.0673828125, 15.999755859375, 16.93212890625, 17.864501953125, 18.796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 17.0, 24.0, 56.0, 124.0, 307.0, 270.0, 94.0, 47.0, 29.0, 10.0, 6.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00146484375, -0.0014174580574035645, -0.001370072364807129, -0.0013226866722106934, -0.0012753009796142578, -0.0012279152870178223, -0.0011805295944213867, -0.0011331439018249512, -0.0010857582092285156, -0.00103837251663208, -0.0009909868240356445, -0.000943601131439209, -0.0008962154388427734, -0.0008488297462463379, -0.0008014440536499023, -0.0007540583610534668, -0.0007066726684570312, -0.0006592869758605957, -0.0006119012832641602, -0.0005645155906677246, -0.0005171298980712891, -0.0004697442054748535, -0.00042235851287841797, -0.0003749728202819824, -0.0003275871276855469, -0.00028020143508911133, -0.00023281574249267578, -0.00018543004989624023, -0.0001380443572998047, -9.065866470336914e-05, -4.3272972106933594e-05, 4.112720489501953e-06, 5.14984130859375e-05, 9.888410568237305e-05, 0.0001462697982788086, 0.00019365549087524414, 0.0002410411834716797, 0.00028842687606811523, 0.0003358125686645508, 0.00038319826126098633, 0.0004305839538574219, 0.0004779696464538574, 0.000525355339050293, 0.0005727410316467285, 0.0006201267242431641, 0.0006675124168395996, 0.0007148981094360352, 0.0007622838020324707, 0.0008096694946289062, 0.0008570551872253418, 0.0009044408798217773, 0.0009518265724182129, 0.0009992122650146484, 0.001046597957611084, 0.0010939836502075195, 0.001141369342803955, 0.0011887550354003906, 0.0012361407279968262, 0.0012835264205932617, 0.0013309121131896973, 0.0013782978057861328, 0.0014256834983825684, 0.001473069190979004, 0.0015204548835754395, 0.001567840576171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 8.0, 12.0, 12.0, 23.0, 32.0, 44.0, 90.0, 133.0, 207.0, 314.0, 554.0, 1018.0, 2007.0, 4492.0, 12802.0, 72045.0, 703358.0, 214795.0, 23985.0, 6662.0, 2821.0, 1334.0, 726.0, 403.0, 237.0, 149.0, 96.0, 52.0, 50.0, 23.0, 21.0, 15.0, 8.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8125, -10.46044921875, -10.1083984375, -9.75634765625, -9.404296875, -9.05224609375, -8.7001953125, -8.34814453125, -7.99609375, -7.64404296875, -7.2919921875, -6.93994140625, -6.587890625, -6.23583984375, -5.8837890625, -5.53173828125, -5.1796875, -4.82763671875, -4.4755859375, -4.12353515625, -3.771484375, -3.41943359375, -3.0673828125, -2.71533203125, -2.36328125, -2.01123046875, -1.6591796875, -1.30712890625, -0.955078125, -0.60302734375, -0.2509765625, 0.10107421875, 0.453125, 0.80517578125, 1.1572265625, 1.50927734375, 1.861328125, 2.21337890625, 2.5654296875, 2.91748046875, 3.26953125, 3.62158203125, 3.9736328125, 4.32568359375, 4.677734375, 5.02978515625, 5.3818359375, 5.73388671875, 6.0859375, 6.43798828125, 6.7900390625, 7.14208984375, 7.494140625, 7.84619140625, 8.1982421875, 8.55029296875, 8.90234375, 9.25439453125, 9.6064453125, 9.95849609375, 10.310546875, 10.66259765625, 11.0146484375, 11.36669921875, 11.71875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 9.0, 8.0, 4.0, 9.0, 16.0, 17.0, 40.0, 68.0, 123.0, 191.0, 184.0, 130.0, 79.0, 43.0, 20.0, 22.0, 11.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7265625, -6.51715087890625, -6.3077392578125, -6.09832763671875, -5.888916015625, -5.67950439453125, -5.4700927734375, -5.26068115234375, -5.05126953125, -4.84185791015625, -4.6324462890625, -4.42303466796875, -4.213623046875, -4.00421142578125, -3.7947998046875, -3.58538818359375, -3.3759765625, -3.16656494140625, -2.9571533203125, -2.74774169921875, -2.538330078125, -2.32891845703125, -2.1195068359375, -1.91009521484375, -1.70068359375, -1.49127197265625, -1.2818603515625, -1.07244873046875, -0.863037109375, -0.65362548828125, -0.4442138671875, -0.23480224609375, -0.025390625, 0.18402099609375, 0.3934326171875, 0.60284423828125, 0.812255859375, 1.02166748046875, 1.2310791015625, 1.44049072265625, 1.64990234375, 1.85931396484375, 2.0687255859375, 2.27813720703125, 2.487548828125, 2.69696044921875, 2.9063720703125, 3.11578369140625, 3.3251953125, 3.53460693359375, 3.7440185546875, 3.95343017578125, 4.162841796875, 4.37225341796875, 4.5816650390625, 4.79107666015625, 5.00048828125, 5.20989990234375, 5.4193115234375, 5.62872314453125, 5.838134765625, 6.04754638671875, 6.2569580078125, 6.46636962890625, 6.67578125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 13.0, 19.0, 38.0, 63.0, 109.0, 180.0, 193.0, 171.0, 88.0, 57.0, 29.0, 18.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.536346435546875, -39.24641036987305, -37.95647048950195, -36.666534423828125, -35.37659454345703, -34.0866584777832, -32.796722412109375, -31.50678253173828, -30.216846466064453, -28.926908493041992, -27.63697052001953, -26.347034454345703, -25.057096481323242, -23.76715850830078, -22.47722053527832, -21.18728256225586, -19.8973445892334, -18.607406616210938, -17.317468643188477, -16.027530670166016, -14.737594604492188, -13.447656631469727, -12.157718658447266, -10.867781639099121, -9.57784366607666, -8.2879056930542, -6.997968673706055, -5.708030700683594, -4.418093204498291, -3.1281557083129883, -1.8382177352905273, -0.5482807159423828, 0.7416572570800781, 2.031594753265381, 3.3215324878692627, 4.6114702224731445, 5.901407718658447, 7.19134521484375, 8.481283187866211, 9.771220207214355, 11.061158180236816, 12.351096153259277, 13.641033172607422, 14.930971145629883, 16.220909118652344, 17.510845184326172, 18.800785064697266, 20.090721130371094, 21.380659103393555, 22.670597076416016, 23.960535049438477, 25.250473022460938, 26.540409088134766, 27.830347061157227, 29.120285034179688, 30.410221099853516, 31.70016098022461, 32.99009704589844, 34.28003692626953, 35.56997299194336, 36.85991287231445, 38.14984893798828, 39.439788818359375, 40.7297248840332, 42.01966094970703]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 0.0, 1.0, 5.0, 10.0, 15.0, 13.0, 18.0, 28.0, 28.0, 53.0, 43.0, 57.0, 78.0, 101.0, 92.0, 102.0, 64.0, 72.0, 70.0, 34.0, 29.0, 23.0, 21.0, 12.0, 9.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.149734497070312, -28.30647087097168, -27.463207244873047, -26.619943618774414, -25.77667999267578, -24.933414459228516, -24.090150833129883, -23.24688720703125, -22.403623580932617, -21.560359954833984, -20.71709632873535, -19.87383270263672, -19.030567169189453, -18.187305450439453, -17.344039916992188, -16.500776290893555, -15.657512664794922, -14.814249038696289, -13.970985412597656, -13.127720832824707, -12.284457206726074, -11.441193580627441, -10.597929000854492, -9.75466537475586, -8.911401748657227, -8.068138122558594, -7.224874019622803, -6.381609916687012, -5.538346290588379, -4.695082664489746, -3.851818561553955, -3.008554458618164, -2.1652908325195312, -1.3220269680023193, -0.4787631034851074, 0.3645007610321045, 1.2077646255493164, 2.051028251647949, 2.8942923545837402, 3.7375564575195312, 4.580820083618164, 5.424083709716797, 6.267347812652588, 7.110611915588379, 7.953875541687012, 8.797139167785645, 9.640403747558594, 10.483667373657227, 11.32693099975586, 12.170194625854492, 13.013458251953125, 13.856722831726074, 14.699986457824707, 15.54325008392334, 16.38651466369629, 17.229778289794922, 18.073041915893555, 18.916305541992188, 19.75956916809082, 20.602832794189453, 21.44609832763672, 22.28936004638672, 23.132625579833984, 23.975889205932617, 24.81915283203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 15.0, 13.0, 9.0, 47.0, 97.0, 165.0, 314.0, 543.0, 1129.0, 2124.0, 4337.0, 9099.0, 20292.0, 48795.0, 140064.0, 605070.0, 2808496.0, 380550.0, 103429.0, 38048.0, 16308.0, 7511.0, 3629.0, 1874.0, 937.0, 514.0, 293.0, 185.0, 112.0, 66.0, 49.0, 37.0, 25.0, 13.0, 13.0, 12.0, 12.0, 14.0, 7.0, 7.0, 8.0, 5.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.78515625, -4.56121826171875, -4.3372802734375, -4.11334228515625, -3.889404296875, -3.66546630859375, -3.4415283203125, -3.21759033203125, -2.99365234375, -2.76971435546875, -2.5457763671875, -2.32183837890625, -2.097900390625, -1.87396240234375, -1.6500244140625, -1.42608642578125, -1.2021484375, -0.97821044921875, -0.7542724609375, -0.53033447265625, -0.306396484375, -0.08245849609375, 0.1414794921875, 0.36541748046875, 0.58935546875, 0.81329345703125, 1.0372314453125, 1.26116943359375, 1.485107421875, 1.70904541015625, 1.9329833984375, 2.15692138671875, 2.380859375, 2.60479736328125, 2.8287353515625, 3.05267333984375, 3.276611328125, 3.50054931640625, 3.7244873046875, 3.94842529296875, 4.17236328125, 4.39630126953125, 4.6202392578125, 4.84417724609375, 5.068115234375, 5.29205322265625, 5.5159912109375, 5.73992919921875, 5.9638671875, 6.18780517578125, 6.4117431640625, 6.63568115234375, 6.859619140625, 7.08355712890625, 7.3074951171875, 7.53143310546875, 7.75537109375, 7.97930908203125, 8.2032470703125, 8.42718505859375, 8.651123046875, 8.87506103515625, 9.0989990234375, 9.32293701171875, 9.546875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 3.0, 6.0, 7.0, 7.0, 8.0, 8.0, 18.0, 23.0, 22.0, 25.0, 32.0, 38.0, 41.0, 46.0, 31.0, 59.0, 39.0, 43.0, 52.0, 51.0, 55.0, 38.0, 42.0, 53.0, 26.0, 36.0, 31.0, 24.0, 16.0, 21.0, 17.0, 14.0, 11.0, 12.0, 9.0, 18.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40869140625, -0.3954124450683594, -0.38213348388671875, -0.3688545227050781, -0.3555755615234375, -0.3422966003417969, -0.32901763916015625, -0.3157386779785156, -0.302459716796875, -0.2891807556152344, -0.27590179443359375, -0.2626228332519531, -0.2493438720703125, -0.23606491088867188, -0.22278594970703125, -0.20950698852539062, -0.19622802734375, -0.18294906616210938, -0.16967010498046875, -0.15639114379882812, -0.1431121826171875, -0.12983322143554688, -0.11655426025390625, -0.10327529907226562, -0.089996337890625, -0.07671737670898438, -0.06343841552734375, -0.050159454345703125, -0.0368804931640625, -0.023601531982421875, -0.01032257080078125, 0.002956390380859375, 0.0162353515625, 0.029514312744140625, 0.04279327392578125, 0.056072235107421875, 0.0693511962890625, 0.08263015747070312, 0.09590911865234375, 0.10918807983398438, 0.122467041015625, 0.13574600219726562, 0.14902496337890625, 0.16230392456054688, 0.1755828857421875, 0.18886184692382812, 0.20214080810546875, 0.21541976928710938, 0.22869873046875, 0.24197769165039062, 0.25525665283203125, 0.2685356140136719, 0.2818145751953125, 0.2950935363769531, 0.30837249755859375, 0.3216514587402344, 0.334930419921875, 0.3482093811035156, 0.36148834228515625, 0.3747673034667969, 0.3880462646484375, 0.4013252258300781, 0.41460418701171875, 0.4278831481933594, 0.441162109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 3.0, 6.0, 9.0, 18.0, 23.0, 34.0, 52.0, 61.0, 102.0, 238.0, 1203.0, 50560.0, 4044090.0, 95619.0, 1623.0, 276.0, 116.0, 70.0, 50.0, 32.0, 32.0, 23.0, 16.0, 11.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.515625, -29.408447265625, -28.30126953125, -27.194091796875, -26.0869140625, -24.979736328125, -23.87255859375, -22.765380859375, -21.658203125, -20.551025390625, -19.44384765625, -18.336669921875, -17.2294921875, -16.122314453125, -15.01513671875, -13.907958984375, -12.80078125, -11.693603515625, -10.58642578125, -9.479248046875, -8.3720703125, -7.264892578125, -6.15771484375, -5.050537109375, -3.943359375, -2.836181640625, -1.72900390625, -0.621826171875, 0.4853515625, 1.592529296875, 2.69970703125, 3.806884765625, 4.9140625, 6.021240234375, 7.12841796875, 8.235595703125, 9.3427734375, 10.449951171875, 11.55712890625, 12.664306640625, 13.771484375, 14.878662109375, 15.98583984375, 17.093017578125, 18.2001953125, 19.307373046875, 20.41455078125, 21.521728515625, 22.62890625, 23.736083984375, 24.84326171875, 25.950439453125, 27.0576171875, 28.164794921875, 29.27197265625, 30.379150390625, 31.486328125, 32.593505859375, 33.70068359375, 34.807861328125, 35.9150390625, 37.022216796875, 38.12939453125, 39.236572265625, 40.34375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 5.0, 5.0, 13.0, 22.0, 32.0, 66.0, 158.0, 242.0, 593.0, 1517.0, 757.0, 335.0, 168.0, 78.0, 39.0, 25.0, 13.0, 12.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0478515625, -0.9647674560546875, -0.881683349609375, -0.7985992431640625, -0.71551513671875, -0.6324310302734375, -0.549346923828125, -0.4662628173828125, -0.3831787109375, -0.3000946044921875, -0.217010498046875, -0.1339263916015625, -0.05084228515625, 0.0322418212890625, 0.115325927734375, 0.1984100341796875, 0.281494140625, 0.3645782470703125, 0.447662353515625, 0.5307464599609375, 0.61383056640625, 0.6969146728515625, 0.779998779296875, 0.8630828857421875, 0.9461669921875, 1.0292510986328125, 1.112335205078125, 1.1954193115234375, 1.27850341796875, 1.3615875244140625, 1.444671630859375, 1.5277557373046875, 1.61083984375, 1.6939239501953125, 1.777008056640625, 1.8600921630859375, 1.94317626953125, 2.0262603759765625, 2.109344482421875, 2.1924285888671875, 2.2755126953125, 2.3585968017578125, 2.441680908203125, 2.5247650146484375, 2.60784912109375, 2.6909332275390625, 2.774017333984375, 2.8571014404296875, 2.940185546875, 3.0232696533203125, 3.106353759765625, 3.1894378662109375, 3.27252197265625, 3.3556060791015625, 3.438690185546875, 3.5217742919921875, 3.6048583984375, 3.6879425048828125, 3.771026611328125, 3.8541107177734375, 3.93719482421875, 4.0202789306640625, 4.103363037109375, 4.1864471435546875, 4.26953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 15.0, 47.0, 88.0, 246.0, 342.0, 178.0, 58.0, 18.0, 9.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.49464797973633, -44.33457946777344, -43.17451477050781, -42.01444625854492, -40.85437774658203, -39.694313049316406, -38.534244537353516, -37.374176025390625, -36.214111328125, -35.05404281616211, -33.893978118896484, -32.733909606933594, -31.573843002319336, -30.413776397705078, -29.253707885742188, -28.09364128112793, -26.93357276916504, -25.77350616455078, -24.61343765258789, -23.453371047973633, -22.293304443359375, -21.133235931396484, -19.973169326782227, -18.81310272216797, -17.653034210205078, -16.49296760559082, -15.332900047302246, -14.172832489013672, -13.012765884399414, -11.85269832611084, -10.692630767822266, -9.532564163208008, -8.37249755859375, -7.212430477142334, -6.052363395690918, -4.892295837402344, -3.7322287559509277, -2.5721616744995117, -1.4120941162109375, -0.2520275115966797, 0.9080400466918945, 2.0681071281433105, 3.2281744480133057, 4.388241767883301, 5.548308849334717, 6.708375930786133, 7.868443489074707, 9.028510093688965, 10.188577651977539, 11.348645210266113, 12.508711814880371, 13.668779373168945, 14.828845977783203, 15.988913536071777, 17.14898109436035, 18.30904769897461, 19.4691162109375, 20.629182815551758, 21.78925132751465, 22.949317932128906, 24.109384536743164, 25.269451141357422, 26.429519653320312, 27.58958625793457, 28.749652862548828]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 13.0, 23.0, 38.0, 75.0, 106.0, 170.0, 177.0, 146.0, 106.0, 78.0, 43.0, 20.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.124515533447266, -11.244817733764648, -10.365119934082031, -9.485422134399414, -8.605724334716797, -7.72602653503418, -6.8463287353515625, -5.966630935668945, -5.086933135986328, -4.207235336303711, -3.3275375366210938, -2.4478397369384766, -1.5681419372558594, -0.6884441375732422, 0.191253662109375, 1.0709514617919922, 1.9506492614746094, 2.8303470611572266, 3.7100448608398438, 4.589742660522461, 5.469440460205078, 6.349138259887695, 7.2288360595703125, 8.10853385925293, 8.988231658935547, 9.867929458618164, 10.747627258300781, 11.627325057983398, 12.507022857666016, 13.386720657348633, 14.26641845703125, 15.146116256713867, 16.025814056396484, 16.9055118560791, 17.78520965576172, 18.664907455444336, 19.544605255126953, 20.42430305480957, 21.304000854492188, 22.183698654174805, 23.063396453857422, 23.94309425354004, 24.822792053222656, 25.702489852905273, 26.58218765258789, 27.461885452270508, 28.341583251953125, 29.221281051635742, 30.10097885131836, 30.980676651000977, 31.860374450683594, 32.740074157714844, 33.61977005004883, 34.49946594238281, 35.37916564941406, 36.25886535644531, 37.1385612487793, 38.01825714111328, 38.89795684814453, 39.77765655517578, 40.657352447509766, 41.53704833984375, 42.416748046875, 43.29644775390625, 44.176143646240234]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 9.0, 6.0, 3.0, 7.0, 8.0, 9.0, 13.0, 15.0, 15.0, 21.0, 25.0, 32.0, 37.0, 60.0, 48.0, 41.0, 43.0, 149.0, 1043289.0, 4270.0, 62.0, 58.0, 55.0, 46.0, 32.0, 35.0, 44.0, 23.0, 28.0, 20.0, 18.0, 11.0, 9.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.8125, -89.78515625, -86.7578125, -83.73046875, -80.703125, -77.67578125, -74.6484375, -71.62109375, -68.59375, -65.56640625, -62.5390625, -59.51171875, -56.484375, -53.45703125, -50.4296875, -47.40234375, -44.375, -41.34765625, -38.3203125, -35.29296875, -32.265625, -29.23828125, -26.2109375, -23.18359375, -20.15625, -17.12890625, -14.1015625, -11.07421875, -8.046875, -5.01953125, -1.9921875, 1.03515625, 4.0625, 7.08984375, 10.1171875, 13.14453125, 16.171875, 19.19921875, 22.2265625, 25.25390625, 28.28125, 31.30859375, 34.3359375, 37.36328125, 40.390625, 43.41796875, 46.4453125, 49.47265625, 52.5, 55.52734375, 58.5546875, 61.58203125, 64.609375, 67.63671875, 70.6640625, 73.69140625, 76.71875, 79.74609375, 82.7734375, 85.80078125, 88.828125, 91.85546875, 94.8828125, 97.91015625, 100.9375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [12.0, 121.0, 355.0, 407.0, 113.0, 14.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44287109375, -0.29898834228515625, -0.1551055908203125, -0.01122283935546875, 0.132659912109375, 0.27654266357421875, 0.4204254150390625, 0.5643081665039062, 0.70819091796875, 0.8520736694335938, 0.9959564208984375, 1.1398391723632812, 1.283721923828125, 1.4276046752929688, 1.5714874267578125, 1.7153701782226562, 1.8592529296875, 2.0031356811523438, 2.1470184326171875, 2.2909011840820312, 2.434783935546875, 2.5786666870117188, 2.7225494384765625, 2.8664321899414062, 3.01031494140625, 3.1541976928710938, 3.2980804443359375, 3.4419631958007812, 3.585845947265625, 3.7297286987304688, 3.8736114501953125, 4.017494201660156, 4.161376953125, 4.305259704589844, 4.4491424560546875, 4.593025207519531, 4.736907958984375, 4.880790710449219, 5.0246734619140625, 5.168556213378906, 5.31243896484375, 5.456321716308594, 5.6002044677734375, 5.744087219238281, 5.887969970703125, 6.031852722167969, 6.1757354736328125, 6.319618225097656, 6.4635009765625, 6.607383728027344, 6.7512664794921875, 6.895149230957031, 7.039031982421875, 7.182914733886719, 7.3267974853515625, 7.470680236816406, 7.61456298828125, 7.758445739746094, 7.9023284912109375, 8.046211242675781, 8.190093994140625, 8.333976745605469, 8.477859497070312, 8.621742248535156, 8.765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 12.0, 5.0, 14.0, 19.0, 38.0, 48.0, 71.0, 104.0, 155.0, 321.0, 538.0, 1173.0, 3255.0, 11088.0, 65912.0, 580111.0, 337839.0, 36022.0, 7390.0, 2258.0, 995.0, 486.0, 249.0, 148.0, 79.0, 47.0, 44.0, 39.0, 15.0, 18.0, 13.0, 7.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.21875, -22.48974609375, -21.7607421875, -21.03173828125, -20.302734375, -19.57373046875, -18.8447265625, -18.11572265625, -17.38671875, -16.65771484375, -15.9287109375, -15.19970703125, -14.470703125, -13.74169921875, -13.0126953125, -12.28369140625, -11.5546875, -10.82568359375, -10.0966796875, -9.36767578125, -8.638671875, -7.90966796875, -7.1806640625, -6.45166015625, -5.72265625, -4.99365234375, -4.2646484375, -3.53564453125, -2.806640625, -2.07763671875, -1.3486328125, -0.61962890625, 0.109375, 0.83837890625, 1.5673828125, 2.29638671875, 3.025390625, 3.75439453125, 4.4833984375, 5.21240234375, 5.94140625, 6.67041015625, 7.3994140625, 8.12841796875, 8.857421875, 9.58642578125, 10.3154296875, 11.04443359375, 11.7734375, 12.50244140625, 13.2314453125, 13.96044921875, 14.689453125, 15.41845703125, 16.1474609375, 16.87646484375, 17.60546875, 18.33447265625, 19.0634765625, 19.79248046875, 20.521484375, 21.25048828125, 21.9794921875, 22.70849609375, 23.4375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 1.0, 12.0, 6.0, 10.0, 13.0, 12.0, 17.0, 33.0, 30.0, 31.0, 42.0, 56.0, 42.0, 49.0, 52.0, 44.0, 60.0, 52.0, 74.0, 47.0, 46.0, 38.0, 43.0, 41.0, 25.0, 28.0, 19.0, 18.0, 5.0, 12.0, 4.0, 5.0, 5.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.4815673828125, -6.275634765625, -6.0697021484375, -5.86376953125, -5.6578369140625, -5.451904296875, -5.2459716796875, -5.0400390625, -4.8341064453125, -4.628173828125, -4.4222412109375, -4.21630859375, -4.0103759765625, -3.804443359375, -3.5985107421875, -3.392578125, -3.1866455078125, -2.980712890625, -2.7747802734375, -2.56884765625, -2.3629150390625, -2.156982421875, -1.9510498046875, -1.7451171875, -1.5391845703125, -1.333251953125, -1.1273193359375, -0.92138671875, -0.7154541015625, -0.509521484375, -0.3035888671875, -0.09765625, 0.1082763671875, 0.314208984375, 0.5201416015625, 0.72607421875, 0.9320068359375, 1.137939453125, 1.3438720703125, 1.5498046875, 1.7557373046875, 1.961669921875, 2.1676025390625, 2.37353515625, 2.5794677734375, 2.785400390625, 2.9913330078125, 3.197265625, 3.4031982421875, 3.609130859375, 3.8150634765625, 4.02099609375, 4.2269287109375, 4.432861328125, 4.6387939453125, 4.8447265625, 5.0506591796875, 5.256591796875, 5.4625244140625, 5.66845703125, 5.8743896484375, 6.080322265625, 6.2862548828125, 6.4921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 6.0, 13.0, 15.0, 27.0, 26.0, 57.0, 110.0, 175.0, 324.0, 654.0, 1546.0, 3510.0, 9390.0, 28146.0, 98453.0, 381898.0, 381343.0, 98576.0, 28149.0, 9524.0, 3558.0, 1539.0, 716.0, 319.0, 203.0, 106.0, 53.0, 35.0, 22.0, 16.0, 12.0, 5.0, 6.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.8701171875, -8.583984375, -8.2978515625, -8.01171875, -7.7255859375, -7.439453125, -7.1533203125, -6.8671875, -6.5810546875, -6.294921875, -6.0087890625, -5.72265625, -5.4365234375, -5.150390625, -4.8642578125, -4.578125, -4.2919921875, -4.005859375, -3.7197265625, -3.43359375, -3.1474609375, -2.861328125, -2.5751953125, -2.2890625, -2.0029296875, -1.716796875, -1.4306640625, -1.14453125, -0.8583984375, -0.572265625, -0.2861328125, 0.0, 0.2861328125, 0.572265625, 0.8583984375, 1.14453125, 1.4306640625, 1.716796875, 2.0029296875, 2.2890625, 2.5751953125, 2.861328125, 3.1474609375, 3.43359375, 3.7197265625, 4.005859375, 4.2919921875, 4.578125, 4.8642578125, 5.150390625, 5.4365234375, 5.72265625, 6.0087890625, 6.294921875, 6.5810546875, 6.8671875, 7.1533203125, 7.439453125, 7.7255859375, 8.01171875, 8.2978515625, 8.583984375, 8.8701171875, 9.15625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 6.0, 4.0, 8.0, 22.0, 21.0, 24.0, 34.0, 41.0, 69.0, 98.0, 127.0, 143.0, 101.0, 69.0, 55.0, 60.0, 27.0, 26.0, 24.0, 12.0, 3.0, 2.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001590728759765625, -0.0015393942594528198, -0.0014880597591400146, -0.0014367252588272095, -0.0013853907585144043, -0.0013340562582015991, -0.001282721757888794, -0.0012313872575759888, -0.0011800527572631836, -0.0011287182569503784, -0.0010773837566375732, -0.001026049256324768, -0.0009747147560119629, -0.0009233802556991577, -0.0008720457553863525, -0.0008207112550735474, -0.0007693767547607422, -0.000718042254447937, -0.0006667077541351318, -0.0006153732538223267, -0.0005640387535095215, -0.0005127042531967163, -0.00046136975288391113, -0.00041003525257110596, -0.0003587007522583008, -0.0003073662519454956, -0.00025603175163269043, -0.00020469725131988525, -0.00015336275100708008, -0.0001020282506942749, -5.0693750381469727e-05, 6.407499313354492e-07, 5.1975250244140625e-05, 0.0001033097505569458, 0.00015464425086975098, 0.00020597875118255615, 0.00025731325149536133, 0.0003086477518081665, 0.0003599822521209717, 0.00041131675243377686, 0.00046265125274658203, 0.0005139857530593872, 0.0005653202533721924, 0.0006166547536849976, 0.0006679892539978027, 0.0007193237543106079, 0.0007706582546234131, 0.0008219927549362183, 0.0008733272552490234, 0.0009246617555618286, 0.0009759962558746338, 0.001027330756187439, 0.0010786652565002441, 0.0011299997568130493, 0.0011813342571258545, 0.0012326687574386597, 0.0012840032577514648, 0.00133533775806427, 0.0013866722583770752, 0.0014380067586898804, 0.0014893412590026855, 0.0015406757593154907, 0.001592010259628296, 0.001643344759941101, 0.0016946792602539062]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 12.0, 12.0, 20.0, 19.0, 22.0, 33.0, 50.0, 60.0, 100.0, 145.0, 244.0, 359.0, 624.0, 1251.0, 2538.0, 5335.0, 12384.0, 34571.0, 121810.0, 448355.0, 304575.0, 74566.0, 23665.0, 9292.0, 4051.0, 1996.0, 972.0, 562.0, 306.0, 180.0, 136.0, 74.0, 69.0, 40.0, 32.0, 20.0, 13.0, 15.0, 7.0, 12.0, 8.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.09375, -8.816650390625, -8.53955078125, -8.262451171875, -7.9853515625, -7.708251953125, -7.43115234375, -7.154052734375, -6.876953125, -6.599853515625, -6.32275390625, -6.045654296875, -5.7685546875, -5.491455078125, -5.21435546875, -4.937255859375, -4.66015625, -4.383056640625, -4.10595703125, -3.828857421875, -3.5517578125, -3.274658203125, -2.99755859375, -2.720458984375, -2.443359375, -2.166259765625, -1.88916015625, -1.612060546875, -1.3349609375, -1.057861328125, -0.78076171875, -0.503662109375, -0.2265625, 0.050537109375, 0.32763671875, 0.604736328125, 0.8818359375, 1.158935546875, 1.43603515625, 1.713134765625, 1.990234375, 2.267333984375, 2.54443359375, 2.821533203125, 3.0986328125, 3.375732421875, 3.65283203125, 3.929931640625, 4.20703125, 4.484130859375, 4.76123046875, 5.038330078125, 5.3154296875, 5.592529296875, 5.86962890625, 6.146728515625, 6.423828125, 6.700927734375, 6.97802734375, 7.255126953125, 7.5322265625, 7.809326171875, 8.08642578125, 8.363525390625, 8.640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 6.0, 8.0, 8.0, 16.0, 26.0, 33.0, 30.0, 37.0, 38.0, 51.0, 59.0, 70.0, 65.0, 53.0, 86.0, 64.0, 56.0, 41.0, 48.0, 35.0, 20.0, 30.0, 18.0, 13.0, 8.0, 8.0, 7.0, 9.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0], "bins": [-3.927734375, -3.813140869140625, -3.69854736328125, -3.583953857421875, -3.4693603515625, -3.354766845703125, -3.24017333984375, -3.125579833984375, -3.010986328125, -2.896392822265625, -2.78179931640625, -2.667205810546875, -2.5526123046875, -2.438018798828125, -2.32342529296875, -2.208831787109375, -2.09423828125, -1.979644775390625, -1.86505126953125, -1.750457763671875, -1.6358642578125, -1.521270751953125, -1.40667724609375, -1.292083740234375, -1.177490234375, -1.062896728515625, -0.94830322265625, -0.833709716796875, -0.7191162109375, -0.604522705078125, -0.48992919921875, -0.375335693359375, -0.2607421875, -0.146148681640625, -0.03155517578125, 0.083038330078125, 0.1976318359375, 0.312225341796875, 0.42681884765625, 0.541412353515625, 0.656005859375, 0.770599365234375, 0.88519287109375, 0.999786376953125, 1.1143798828125, 1.228973388671875, 1.34356689453125, 1.458160400390625, 1.57275390625, 1.687347412109375, 1.80194091796875, 1.916534423828125, 2.0311279296875, 2.145721435546875, 2.26031494140625, 2.374908447265625, 2.489501953125, 2.604095458984375, 2.71868896484375, 2.833282470703125, 2.9478759765625, 3.062469482421875, 3.17706298828125, 3.291656494140625, 3.40625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 4.0, 14.0, 20.0, 22.0, 27.0, 35.0, 52.0, 74.0, 93.0, 108.0, 136.0, 110.0, 89.0, 61.0, 43.0, 32.0, 17.0, 9.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.47447204589844, -61.74241638183594, -60.01036071777344, -58.27830505371094, -56.54624938964844, -54.81419372558594, -53.08213424682617, -51.35007858276367, -49.61802291870117, -47.88596725463867, -46.15391159057617, -44.42185592651367, -42.689796447753906, -40.957740783691406, -39.225685119628906, -37.493629455566406, -35.761573791503906, -34.029518127441406, -32.297462463378906, -30.565404891967773, -28.833349227905273, -27.101293563842773, -25.36923599243164, -23.63718032836914, -21.90512466430664, -20.17306900024414, -18.44101333618164, -16.708955764770508, -14.976900100708008, -13.244844436645508, -11.512787818908691, -9.780731201171875, -8.04867172241211, -6.316615581512451, -4.584559440612793, -2.8525032997131348, -1.1204471588134766, 0.6116085052490234, 2.34366512298584, 4.075721740722656, 5.807777404785156, 7.5398335456848145, 9.271889686584473, 11.003946304321289, 12.736001968383789, 14.468057632446289, 16.200115203857422, 17.932170867919922, 19.664226531982422, 21.396282196044922, 23.128337860107422, 24.860395431518555, 26.592451095581055, 28.324506759643555, 30.056564331054688, 31.788619995117188, 33.52067565917969, 35.25273132324219, 36.98478698730469, 38.71684265136719, 40.44889831542969, 42.18095397949219, 43.91301345825195, 45.64506912231445, 47.37712478637695]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 11.0, 8.0, 3.0, 8.0, 10.0, 11.0, 11.0, 16.0, 16.0, 29.0, 26.0, 30.0, 39.0, 36.0, 25.0, 40.0, 34.0, 44.0, 52.0, 41.0, 41.0, 47.0, 52.0, 43.0, 32.0, 38.0, 40.0, 39.0, 20.0, 28.0, 25.0, 13.0, 20.0, 17.0, 12.0, 11.0, 8.0, 8.0, 5.0, 1.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.61534881591797, -33.503578186035156, -32.39180374145508, -31.280033111572266, -30.16826057434082, -29.056488037109375, -27.944717407226562, -26.832944869995117, -25.721172332763672, -24.609399795532227, -23.49762725830078, -22.38585662841797, -21.274084091186523, -20.162311553955078, -19.050540924072266, -17.93876838684082, -16.826995849609375, -15.71522331237793, -14.6034517288208, -13.491680145263672, -12.379907608032227, -11.268135070800781, -10.156363487243652, -9.044591903686523, -7.932819366455078, -6.821047306060791, -5.709275245666504, -4.597503185272217, -3.4857311248779297, -2.3739590644836426, -1.2621870040893555, -0.15041494369506836, 0.9613533020019531, 2.0731253623962402, 3.1848974227905273, 4.2966694831848145, 5.408441543579102, 6.520213603973389, 7.631985664367676, 8.743757247924805, 9.85552978515625, 10.967302322387695, 12.079073905944824, 13.190845489501953, 14.302618026733398, 15.414390563964844, 16.526161193847656, 17.6379337310791, 18.749706268310547, 19.861478805541992, 20.973251342773438, 22.08502197265625, 23.196794509887695, 24.30856704711914, 25.420337677001953, 26.5321102142334, 27.643882751464844, 28.75565528869629, 29.867427825927734, 30.979198455810547, 32.090972900390625, 33.20274353027344, 34.31451416015625, 35.42628860473633, 36.53805923461914]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [56.0, 3156.0, 4035387.0, 154478.0, 626.0, 53.0, 31.0, 33.0, 31.0, 26.0, 23.0, 44.0, 31.0, 18.0, 20.0, 34.0, 21.0, 21.0, 23.0, 15.0, 18.0, 13.0, 15.0, 7.0, 11.0, 10.0, 13.0, 12.0, 9.0, 8.0, 4.0, 7.0, 6.0, 6.0, 3.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.03125, -4.53466796875, -2.0380859375, 0.45849609375, 2.955078125, 5.45166015625, 7.9482421875, 10.44482421875, 12.94140625, 15.43798828125, 17.9345703125, 20.43115234375, 22.927734375, 25.42431640625, 27.9208984375, 30.41748046875, 32.9140625, 35.41064453125, 37.9072265625, 40.40380859375, 42.900390625, 45.39697265625, 47.8935546875, 50.39013671875, 52.88671875, 55.38330078125, 57.8798828125, 60.37646484375, 62.873046875, 65.36962890625, 67.8662109375, 70.36279296875, 72.859375, 75.35595703125, 77.8525390625, 80.34912109375, 82.845703125, 85.34228515625, 87.8388671875, 90.33544921875, 92.83203125, 95.32861328125, 97.8251953125, 100.32177734375, 102.818359375, 105.31494140625, 107.8115234375, 110.30810546875, 112.8046875, 115.30126953125, 117.7978515625, 120.29443359375, 122.791015625, 125.28759765625, 127.7841796875, 130.28076171875, 132.77734375, 135.27392578125, 137.7705078125, 140.26708984375, 142.763671875, 145.26025390625, 147.7568359375, 150.25341796875, 152.75]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [6.0, 12.0, 90.0, 236.0, 285.0, 255.0, 113.0, 21.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.703125, -0.552001953125, -0.40087890625, -0.249755859375, -0.0986328125, 0.052490234375, 0.20361328125, 0.354736328125, 0.505859375, 0.656982421875, 0.80810546875, 0.959228515625, 1.1103515625, 1.261474609375, 1.41259765625, 1.563720703125, 1.71484375, 1.865966796875, 2.01708984375, 2.168212890625, 2.3193359375, 2.470458984375, 2.62158203125, 2.772705078125, 2.923828125, 3.074951171875, 3.22607421875, 3.377197265625, 3.5283203125, 3.679443359375, 3.83056640625, 3.981689453125, 4.1328125, 4.283935546875, 4.43505859375, 4.586181640625, 4.7373046875, 4.888427734375, 5.03955078125, 5.190673828125, 5.341796875, 5.492919921875, 5.64404296875, 5.795166015625, 5.9462890625, 6.097412109375, 6.24853515625, 6.399658203125, 6.55078125, 6.701904296875, 6.85302734375, 7.004150390625, 7.1552734375, 7.306396484375, 7.45751953125, 7.608642578125, 7.759765625, 7.910888671875, 8.06201171875, 8.213134765625, 8.3642578125, 8.515380859375, 8.66650390625, 8.817626953125, 8.96875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 13.0, 26.0, 29.0, 43.0, 48.0, 49.0, 62.0, 196.0, 4021374.0, 171862.0, 168.0, 94.0, 63.0, 54.0, 48.0, 38.0, 45.0, 17.0, 16.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-269.5, -257.21875, -244.9375, -232.65625, -220.375, -208.09375, -195.8125, -183.53125, -171.25, -158.96875, -146.6875, -134.40625, -122.125, -109.84375, -97.5625, -85.28125, -73.0, -60.71875, -48.4375, -36.15625, -23.875, -11.59375, 0.6875, 12.96875, 25.25, 37.53125, 49.8125, 62.09375, 74.375, 86.65625, 98.9375, 111.21875, 123.5, 135.78125, 148.0625, 160.34375, 172.625, 184.90625, 197.1875, 209.46875, 221.75, 234.03125, 246.3125, 258.59375, 270.875, 283.15625, 295.4375, 307.71875, 320.0, 332.28125, 344.5625, 356.84375, 369.125, 381.40625, 393.6875, 405.96875, 418.25, 430.53125, 442.8125, 455.09375, 467.375, 479.65625, 491.9375, 504.21875, 516.5]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 9.0, 33.0, 216.0, 3457.0, 309.0, 59.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -4.47003173828125, -3.4908447265625, -2.51165771484375, -1.532470703125, -0.55328369140625, 0.4259033203125, 1.40509033203125, 2.38427734375, 3.36346435546875, 4.3426513671875, 5.32183837890625, 6.301025390625, 7.28021240234375, 8.2593994140625, 9.23858642578125, 10.2177734375, 11.19696044921875, 12.1761474609375, 13.15533447265625, 14.134521484375, 15.11370849609375, 16.0928955078125, 17.07208251953125, 18.05126953125, 19.03045654296875, 20.0096435546875, 20.98883056640625, 21.968017578125, 22.94720458984375, 23.9263916015625, 24.90557861328125, 25.884765625, 26.86395263671875, 27.8431396484375, 28.82232666015625, 29.801513671875, 30.78070068359375, 31.7598876953125, 32.73907470703125, 33.71826171875, 34.69744873046875, 35.6766357421875, 36.65582275390625, 37.635009765625, 38.61419677734375, 39.5933837890625, 40.57257080078125, 41.5517578125, 42.53094482421875, 43.5101318359375, 44.48931884765625, 45.468505859375, 46.44769287109375, 47.4268798828125, 48.40606689453125, 49.38525390625, 50.36444091796875, 51.3436279296875, 52.32281494140625, 53.302001953125, 54.28118896484375, 55.2603759765625, 56.23956298828125, 57.21875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 9.0, 51.0, 705.0, 221.0, 20.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-599.5783081054688, -584.8592529296875, -570.1401977539062, -555.421142578125, -540.7020263671875, -525.9829711914062, -511.263916015625, -496.54486083984375, -481.8258056640625, -467.10675048828125, -452.3876647949219, -437.6686096191406, -422.9495544433594, -408.23046875, -393.51141357421875, -378.7923583984375, -364.0732727050781, -349.3542175292969, -334.6351318359375, -319.91607666015625, -305.197021484375, -290.47796630859375, -275.7588806152344, -261.0398254394531, -246.3207550048828, -231.6016845703125, -216.88262939453125, -202.16355895996094, -187.44448852539062, -172.72543334960938, -158.00636291503906, -143.28729248046875, -128.56826782226562, -113.84920501708984, -99.13014221191406, -84.41107177734375, -69.69200897216797, -54.97294616699219, -40.253875732421875, -25.534812927246094, -10.815750122070312, 3.9033145904541016, 18.622379302978516, 33.34144592285156, 48.060508728027344, 62.779571533203125, 77.49864196777344, 92.21770477294922, 106.936767578125, 121.65583038330078, 136.37489318847656, 151.09396362304688, 165.81301879882812, 180.53208923339844, 195.25115966796875, 209.97021484375, 224.6892852783203, 239.40835571289062, 254.12741088867188, 268.84649658203125, 283.5655517578125, 298.28460693359375, 313.003662109375, 327.7227478027344, 342.4418029785156]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 15.0, 41.0, 57.0, 82.0, 103.0, 121.0, 131.0, 118.0, 119.0, 84.0, 51.0, 31.0, 14.0, 11.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-119.50402069091797, -116.36165618896484, -113.21928405761719, -110.07691955566406, -106.93455505371094, -103.79219055175781, -100.64981842041016, -97.50745391845703, -94.36508178710938, -91.22271728515625, -88.0803451538086, -84.93798065185547, -81.79561614990234, -78.65324401855469, -75.51087951660156, -72.36851501464844, -69.22615051269531, -66.08378601074219, -62.9414176940918, -59.799049377441406, -56.65668487548828, -53.51431655883789, -50.3719482421875, -47.229583740234375, -44.087215423583984, -40.944847106933594, -37.80248260498047, -34.66011428833008, -31.51774787902832, -28.375381469726562, -25.233013153076172, -22.090646743774414, -18.948280334472656, -15.805913925170898, -12.663546562194824, -9.52117919921875, -6.378812789916992, -3.2364463806152344, -0.09407806396484375, 3.048288345336914, 6.190654754638672, 9.33302116394043, 12.475388526916504, 15.617755889892578, 18.760122299194336, 21.902488708496094, 25.044857025146484, 28.187223434448242, 31.32958984375, 34.47195816040039, 37.614322662353516, 40.756690979003906, 43.89905548095703, 47.04142379760742, 50.18379211425781, 53.32615661621094, 56.46852493286133, 59.61089324951172, 62.753257751464844, 65.8956298828125, 69.03799438476562, 72.18035888671875, 75.32272338867188, 78.46509552001953, 81.60746002197266]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 2.0, 5.0, 8.0, 6.0, 14.0, 15.0, 20.0, 13.0, 34.0, 45.0, 54.0, 103.0, 175.0, 441.0, 1322.0, 7253.0, 239847.0, 781616.0, 14427.0, 1960.0, 553.0, 257.0, 119.0, 67.0, 42.0, 37.0, 21.0, 22.0, 16.0, 14.0, 7.0, 11.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.5625, -74.251953125, -71.94140625, -69.630859375, -67.3203125, -65.009765625, -62.69921875, -60.388671875, -58.078125, -55.767578125, -53.45703125, -51.146484375, -48.8359375, -46.525390625, -44.21484375, -41.904296875, -39.59375, -37.283203125, -34.97265625, -32.662109375, -30.3515625, -28.041015625, -25.73046875, -23.419921875, -21.109375, -18.798828125, -16.48828125, -14.177734375, -11.8671875, -9.556640625, -7.24609375, -4.935546875, -2.625, -0.314453125, 1.99609375, 4.306640625, 6.6171875, 8.927734375, 11.23828125, 13.548828125, 15.859375, 18.169921875, 20.48046875, 22.791015625, 25.1015625, 27.412109375, 29.72265625, 32.033203125, 34.34375, 36.654296875, 38.96484375, 41.275390625, 43.5859375, 45.896484375, 48.20703125, 50.517578125, 52.828125, 55.138671875, 57.44921875, 59.759765625, 62.0703125, 64.380859375, 66.69140625, 69.001953125, 71.3125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 24.0, 40.0, 104.0, 197.0, 229.0, 193.0, 90.0, 68.0, 33.0, 6.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.169921875, -2.967803955078125, -2.76568603515625, -2.563568115234375, -2.3614501953125, -2.159332275390625, -1.95721435546875, -1.755096435546875, -1.552978515625, -1.350860595703125, -1.14874267578125, -0.946624755859375, -0.7445068359375, -0.542388916015625, -0.34027099609375, -0.138153076171875, 0.06396484375, 0.266082763671875, 0.46820068359375, 0.670318603515625, 0.8724365234375, 1.074554443359375, 1.27667236328125, 1.478790283203125, 1.680908203125, 1.883026123046875, 2.08514404296875, 2.287261962890625, 2.4893798828125, 2.691497802734375, 2.89361572265625, 3.095733642578125, 3.2978515625, 3.499969482421875, 3.70208740234375, 3.904205322265625, 4.1063232421875, 4.308441162109375, 4.51055908203125, 4.712677001953125, 4.914794921875, 5.116912841796875, 5.31903076171875, 5.521148681640625, 5.7232666015625, 5.925384521484375, 6.12750244140625, 6.329620361328125, 6.53173828125, 6.733856201171875, 6.93597412109375, 7.138092041015625, 7.3402099609375, 7.542327880859375, 7.74444580078125, 7.946563720703125, 8.148681640625, 8.350799560546875, 8.55291748046875, 8.755035400390625, 8.9571533203125, 9.159271240234375, 9.36138916015625, 9.563507080078125, 9.765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 7.0, 22.0, 23.0, 34.0, 34.0, 56.0, 86.0, 131.0, 204.0, 320.0, 689.0, 1412.0, 3790.0, 14781.0, 87205.0, 598917.0, 289931.0, 38182.0, 7932.0, 2522.0, 995.0, 507.0, 270.0, 136.0, 88.0, 79.0, 37.0, 36.0, 28.0, 20.0, 15.0, 11.0, 8.0, 3.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.734375, -26.80322265625, -25.8720703125, -24.94091796875, -24.009765625, -23.07861328125, -22.1474609375, -21.21630859375, -20.28515625, -19.35400390625, -18.4228515625, -17.49169921875, -16.560546875, -15.62939453125, -14.6982421875, -13.76708984375, -12.8359375, -11.90478515625, -10.9736328125, -10.04248046875, -9.111328125, -8.18017578125, -7.2490234375, -6.31787109375, -5.38671875, -4.45556640625, -3.5244140625, -2.59326171875, -1.662109375, -0.73095703125, 0.2001953125, 1.13134765625, 2.0625, 2.99365234375, 3.9248046875, 4.85595703125, 5.787109375, 6.71826171875, 7.6494140625, 8.58056640625, 9.51171875, 10.44287109375, 11.3740234375, 12.30517578125, 13.236328125, 14.16748046875, 15.0986328125, 16.02978515625, 16.9609375, 17.89208984375, 18.8232421875, 19.75439453125, 20.685546875, 21.61669921875, 22.5478515625, 23.47900390625, 24.41015625, 25.34130859375, 26.2724609375, 27.20361328125, 28.134765625, 29.06591796875, 29.9970703125, 30.92822265625, 31.859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 7.0, 7.0, 6.0, 12.0, 17.0, 18.0, 29.0, 23.0, 28.0, 29.0, 42.0, 49.0, 41.0, 57.0, 47.0, 55.0, 50.0, 55.0, 42.0, 46.0, 44.0, 44.0, 44.0, 31.0, 27.0, 27.0, 25.0, 22.0, 19.0, 14.0, 12.0, 3.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.309326171875, -9.96240234375, -9.615478515625, -9.2685546875, -8.921630859375, -8.57470703125, -8.227783203125, -7.880859375, -7.533935546875, -7.18701171875, -6.840087890625, -6.4931640625, -6.146240234375, -5.79931640625, -5.452392578125, -5.10546875, -4.758544921875, -4.41162109375, -4.064697265625, -3.7177734375, -3.370849609375, -3.02392578125, -2.677001953125, -2.330078125, -1.983154296875, -1.63623046875, -1.289306640625, -0.9423828125, -0.595458984375, -0.24853515625, 0.098388671875, 0.4453125, 0.792236328125, 1.13916015625, 1.486083984375, 1.8330078125, 2.179931640625, 2.52685546875, 2.873779296875, 3.220703125, 3.567626953125, 3.91455078125, 4.261474609375, 4.6083984375, 4.955322265625, 5.30224609375, 5.649169921875, 5.99609375, 6.343017578125, 6.68994140625, 7.036865234375, 7.3837890625, 7.730712890625, 8.07763671875, 8.424560546875, 8.771484375, 9.118408203125, 9.46533203125, 9.812255859375, 10.1591796875, 10.506103515625, 10.85302734375, 11.199951171875, 11.546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 13.0, 14.0, 17.0, 21.0, 22.0, 32.0, 44.0, 85.0, 135.0, 219.0, 509.0, 1380.0, 4767.0, 25273.0, 290373.0, 661995.0, 52051.0, 8109.0, 2031.0, 692.0, 284.0, 142.0, 98.0, 70.0, 34.0, 23.0, 28.0, 11.0, 15.0, 14.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.515625, -20.825439453125, -20.13525390625, -19.445068359375, -18.7548828125, -18.064697265625, -17.37451171875, -16.684326171875, -15.994140625, -15.303955078125, -14.61376953125, -13.923583984375, -13.2333984375, -12.543212890625, -11.85302734375, -11.162841796875, -10.47265625, -9.782470703125, -9.09228515625, -8.402099609375, -7.7119140625, -7.021728515625, -6.33154296875, -5.641357421875, -4.951171875, -4.260986328125, -3.57080078125, -2.880615234375, -2.1904296875, -1.500244140625, -0.81005859375, -0.119873046875, 0.5703125, 1.260498046875, 1.95068359375, 2.640869140625, 3.3310546875, 4.021240234375, 4.71142578125, 5.401611328125, 6.091796875, 6.781982421875, 7.47216796875, 8.162353515625, 8.8525390625, 9.542724609375, 10.23291015625, 10.923095703125, 11.61328125, 12.303466796875, 12.99365234375, 13.683837890625, 14.3740234375, 15.064208984375, 15.75439453125, 16.444580078125, 17.134765625, 17.824951171875, 18.51513671875, 19.205322265625, 19.8955078125, 20.585693359375, 21.27587890625, 21.966064453125, 22.65625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 9.0, 23.0, 27.0, 48.0, 72.0, 151.0, 246.0, 174.0, 95.0, 56.0, 30.0, 24.0, 14.0, 7.0, 12.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031375885009765625, -0.003010302782058716, -0.002883017063140869, -0.0027557313442230225, -0.0026284456253051758, -0.002501159906387329, -0.0023738741874694824, -0.0022465884685516357, -0.002119302749633789, -0.0019920170307159424, -0.0018647313117980957, -0.001737445592880249, -0.0016101598739624023, -0.0014828741550445557, -0.001355588436126709, -0.0012283027172088623, -0.0011010169982910156, -0.0009737312793731689, -0.0008464455604553223, -0.0007191598415374756, -0.0005918741226196289, -0.0004645884037017822, -0.00033730268478393555, -0.00021001696586608887, -8.273124694824219e-05, 4.455447196960449e-05, 0.00017184019088745117, 0.00029912590980529785, 0.00042641162872314453, 0.0005536973476409912, 0.0006809830665588379, 0.0008082687854766846, 0.0009355545043945312, 0.001062840223312378, 0.0011901259422302246, 0.0013174116611480713, 0.001444697380065918, 0.0015719830989837646, 0.0016992688179016113, 0.001826554536819458, 0.0019538402557373047, 0.0020811259746551514, 0.002208411693572998, 0.0023356974124908447, 0.0024629831314086914, 0.002590268850326538, 0.0027175545692443848, 0.0028448402881622314, 0.002972126007080078, 0.003099411725997925, 0.0032266974449157715, 0.003353983163833618, 0.003481268882751465, 0.0036085546016693115, 0.003735840320587158, 0.003863126039505005, 0.0039904117584228516, 0.004117697477340698, 0.004244983196258545, 0.004372268915176392, 0.004499554634094238, 0.004626840353012085, 0.004754126071929932, 0.004881411790847778, 0.005008697509765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 2.0, 11.0, 9.0, 16.0, 31.0, 43.0, 42.0, 110.0, 194.0, 390.0, 1025.0, 3094.0, 15127.0, 612734.0, 398725.0, 12523.0, 2758.0, 888.0, 368.0, 195.0, 95.0, 58.0, 43.0, 14.0, 18.0, 10.0, 5.0, 1.0, 4.0, 4.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.84375, -47.52197265625, -46.2001953125, -44.87841796875, -43.556640625, -42.23486328125, -40.9130859375, -39.59130859375, -38.26953125, -36.94775390625, -35.6259765625, -34.30419921875, -32.982421875, -31.66064453125, -30.3388671875, -29.01708984375, -27.6953125, -26.37353515625, -25.0517578125, -23.72998046875, -22.408203125, -21.08642578125, -19.7646484375, -18.44287109375, -17.12109375, -15.79931640625, -14.4775390625, -13.15576171875, -11.833984375, -10.51220703125, -9.1904296875, -7.86865234375, -6.546875, -5.22509765625, -3.9033203125, -2.58154296875, -1.259765625, 0.06201171875, 1.3837890625, 2.70556640625, 4.02734375, 5.34912109375, 6.6708984375, 7.99267578125, 9.314453125, 10.63623046875, 11.9580078125, 13.27978515625, 14.6015625, 15.92333984375, 17.2451171875, 18.56689453125, 19.888671875, 21.21044921875, 22.5322265625, 23.85400390625, 25.17578125, 26.49755859375, 27.8193359375, 29.14111328125, 30.462890625, 31.78466796875, 33.1064453125, 34.42822265625, 35.75]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 17.0, 19.0, 39.0, 60.0, 96.0, 119.0, 128.0, 160.0, 124.0, 89.0, 48.0, 36.0, 23.0, 13.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8984375, -14.4605712890625, -14.022705078125, -13.5848388671875, -13.14697265625, -12.7091064453125, -12.271240234375, -11.8333740234375, -11.3955078125, -10.9576416015625, -10.519775390625, -10.0819091796875, -9.64404296875, -9.2061767578125, -8.768310546875, -8.3304443359375, -7.892578125, -7.4547119140625, -7.016845703125, -6.5789794921875, -6.14111328125, -5.7032470703125, -5.265380859375, -4.8275146484375, -4.3896484375, -3.9517822265625, -3.513916015625, -3.0760498046875, -2.63818359375, -2.2003173828125, -1.762451171875, -1.3245849609375, -0.88671875, -0.4488525390625, -0.010986328125, 0.4268798828125, 0.86474609375, 1.3026123046875, 1.740478515625, 2.1783447265625, 2.6162109375, 3.0540771484375, 3.491943359375, 3.9298095703125, 4.36767578125, 4.8055419921875, 5.243408203125, 5.6812744140625, 6.119140625, 6.5570068359375, 6.994873046875, 7.4327392578125, 7.87060546875, 8.3084716796875, 8.746337890625, 9.1842041015625, 9.6220703125, 10.0599365234375, 10.497802734375, 10.9356689453125, 11.37353515625, 11.8114013671875, 12.249267578125, 12.6871337890625, 13.125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 16.0, 59.0, 163.0, 356.0, 263.0, 101.0, 27.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-363.7420654296875, -354.343505859375, -344.9449768066406, -335.5464172363281, -326.14788818359375, -316.74932861328125, -307.35076904296875, -297.95220947265625, -288.5536804199219, -279.1551208496094, -269.756591796875, -260.3580322265625, -250.95948791503906, -241.56094360351562, -232.16238403320312, -222.7638397216797, -213.36529541015625, -203.9667510986328, -194.56820678710938, -185.16964721679688, -175.77110290527344, -166.37255859375, -156.9739990234375, -147.57545471191406, -138.17691040039062, -128.7783660888672, -119.37981414794922, -109.98126220703125, -100.58271789550781, -91.18417358398438, -81.7856216430664, -72.38706970214844, -62.988555908203125, -53.59000778198242, -44.19145965576172, -34.792911529541016, -25.394363403320312, -15.99581527709961, -6.597267150878906, 2.8012847900390625, 12.1998291015625, 21.598377227783203, 30.996925354003906, 40.39547348022461, 49.79402160644531, 59.192569732666016, 68.59111785888672, 77.98966979980469, 87.38821411132812, 96.78675842285156, 106.18531036376953, 115.5838623046875, 124.98240661621094, 134.38095092773438, 143.77951049804688, 153.1780548095703, 162.57659912109375, 171.9751434326172, 181.37368774414062, 190.77224731445312, 200.17079162597656, 209.5693359375, 218.9678955078125, 228.36643981933594, 237.76498413085938]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 9.0, 7.0, 4.0, 17.0, 17.0, 14.0, 24.0, 52.0, 44.0, 51.0, 53.0, 74.0, 65.0, 60.0, 64.0, 66.0, 75.0, 55.0, 55.0, 46.0, 31.0, 30.0, 20.0, 21.0, 18.0, 10.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.52098846435547, -118.16458892822266, -114.80819702148438, -111.45179748535156, -108.09539794921875, -104.73900604248047, -101.38260650634766, -98.02621459960938, -94.66981506347656, -91.31341552734375, -87.95702362060547, -84.60062408447266, -81.24422454833984, -77.88783264160156, -74.53143310546875, -71.17503356933594, -67.81863403320312, -64.46223449707031, -61.105838775634766, -57.74944305419922, -54.39304733276367, -51.036651611328125, -47.68025207519531, -44.323856353759766, -40.96746063232422, -37.61106491088867, -34.25466537475586, -30.898269653320312, -27.541873931884766, -24.185476303100586, -20.829078674316406, -17.47268295288086, -14.116287231445312, -10.75989055633545, -7.403493404388428, -4.047096252441406, -0.690699577331543, 2.6656970977783203, 6.0220947265625, 9.378490447998047, 12.734888076782227, 16.091285705566406, 19.447681427001953, 22.804079055786133, 26.160476684570312, 29.51687240600586, 32.873268127441406, 36.22966766357422, 39.586063385009766, 42.94245910644531, 46.298858642578125, 49.65525436401367, 53.01165008544922, 56.36804962158203, 59.72444534301758, 63.080841064453125, 66.43724060058594, 69.79364013671875, 73.15003204345703, 76.50643157958984, 79.86283111572266, 83.21922302246094, 86.57562255859375, 89.93202209472656, 93.28841400146484]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 4.0, 9.0, 15.0, 22.0, 42.0, 100.0, 234.0, 555.0, 2146.0, 14948.0, 3926665.0, 239440.0, 7800.0, 1390.0, 373.0, 152.0, 84.0, 66.0, 39.0, 25.0, 24.0, 12.0, 25.0, 12.0, 15.0, 9.0, 8.0, 11.0, 10.0, 12.0, 11.0, 6.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -35.73828125, -33.1640625, -30.58984375, -28.015625, -25.44140625, -22.8671875, -20.29296875, -17.71875, -15.14453125, -12.5703125, -9.99609375, -7.421875, -4.84765625, -2.2734375, 0.30078125, 2.875, 5.44921875, 8.0234375, 10.59765625, 13.171875, 15.74609375, 18.3203125, 20.89453125, 23.46875, 26.04296875, 28.6171875, 31.19140625, 33.765625, 36.33984375, 38.9140625, 41.48828125, 44.0625, 46.63671875, 49.2109375, 51.78515625, 54.359375, 56.93359375, 59.5078125, 62.08203125, 64.65625, 67.23046875, 69.8046875, 72.37890625, 74.953125, 77.52734375, 80.1015625, 82.67578125, 85.25, 87.82421875, 90.3984375, 92.97265625, 95.546875, 98.12109375, 100.6953125, 103.26953125, 105.84375, 108.41796875, 110.9921875, 113.56640625, 116.140625, 118.71484375, 121.2890625, 123.86328125, 126.4375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 15.0, 25.0, 57.0, 100.0, 143.0, 167.0, 175.0, 127.0, 87.0, 64.0, 24.0, 16.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.33270263671875, -2.1536865234375, -1.97467041015625, -1.795654296875, -1.61663818359375, -1.4376220703125, -1.25860595703125, -1.07958984375, -0.90057373046875, -0.7215576171875, -0.54254150390625, -0.363525390625, -0.18450927734375, -0.0054931640625, 0.17352294921875, 0.3525390625, 0.53155517578125, 0.7105712890625, 0.88958740234375, 1.068603515625, 1.24761962890625, 1.4266357421875, 1.60565185546875, 1.78466796875, 1.96368408203125, 2.1427001953125, 2.32171630859375, 2.500732421875, 2.67974853515625, 2.8587646484375, 3.03778076171875, 3.216796875, 3.39581298828125, 3.5748291015625, 3.75384521484375, 3.932861328125, 4.11187744140625, 4.2908935546875, 4.46990966796875, 4.64892578125, 4.82794189453125, 5.0069580078125, 5.18597412109375, 5.364990234375, 5.54400634765625, 5.7230224609375, 5.90203857421875, 6.0810546875, 6.26007080078125, 6.4390869140625, 6.61810302734375, 6.797119140625, 6.97613525390625, 7.1551513671875, 7.33416748046875, 7.51318359375, 7.69219970703125, 7.8712158203125, 8.05023193359375, 8.229248046875, 8.40826416015625, 8.5872802734375, 8.76629638671875, 8.9453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 16.0, 32.0, 28.0, 45.0, 69.0, 120.0, 229.0, 666.0, 3126.0, 30008.0, 4071759.0, 80724.0, 5570.0, 1078.0, 330.0, 166.0, 98.0, 65.0, 53.0, 35.0, 21.0, 18.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75, -50.8671875, -47.984375, -45.1015625, -42.21875, -39.3359375, -36.453125, -33.5703125, -30.6875, -27.8046875, -24.921875, -22.0390625, -19.15625, -16.2734375, -13.390625, -10.5078125, -7.625, -4.7421875, -1.859375, 1.0234375, 3.90625, 6.7890625, 9.671875, 12.5546875, 15.4375, 18.3203125, 21.203125, 24.0859375, 26.96875, 29.8515625, 32.734375, 35.6171875, 38.5, 41.3828125, 44.265625, 47.1484375, 50.03125, 52.9140625, 55.796875, 58.6796875, 61.5625, 64.4453125, 67.328125, 70.2109375, 73.09375, 75.9765625, 78.859375, 81.7421875, 84.625, 87.5078125, 90.390625, 93.2734375, 96.15625, 99.0390625, 101.921875, 104.8046875, 107.6875, 110.5703125, 113.453125, 116.3359375, 119.21875, 122.1015625, 124.984375, 127.8671875, 130.75]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 5.0, 12.0, 15.0, 29.0, 53.0, 86.0, 219.0, 1126.0, 2095.0, 227.0, 71.0, 44.0, 40.0, 12.0, 10.0, 12.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -5.9500732421875, -5.579833984375, -5.2095947265625, -4.83935546875, -4.4691162109375, -4.098876953125, -3.7286376953125, -3.3583984375, -2.9881591796875, -2.617919921875, -2.2476806640625, -1.87744140625, -1.5072021484375, -1.136962890625, -0.7667236328125, -0.396484375, -0.0262451171875, 0.343994140625, 0.7142333984375, 1.08447265625, 1.4547119140625, 1.824951171875, 2.1951904296875, 2.5654296875, 2.9356689453125, 3.305908203125, 3.6761474609375, 4.04638671875, 4.4166259765625, 4.786865234375, 5.1571044921875, 5.52734375, 5.8975830078125, 6.267822265625, 6.6380615234375, 7.00830078125, 7.3785400390625, 7.748779296875, 8.1190185546875, 8.4892578125, 8.8594970703125, 9.229736328125, 9.5999755859375, 9.97021484375, 10.3404541015625, 10.710693359375, 11.0809326171875, 11.451171875, 11.8214111328125, 12.191650390625, 12.5618896484375, 12.93212890625, 13.3023681640625, 13.672607421875, 14.0428466796875, 14.4130859375, 14.7833251953125, 15.153564453125, 15.5238037109375, 15.89404296875, 16.2642822265625, 16.634521484375, 17.0047607421875, 17.375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 25.0, 71.0, 300.0, 440.0, 119.0, 34.0, 14.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.32054138183594, -35.01451110839844, -30.70848274230957, -26.402454376220703, -22.096424102783203, -17.790393829345703, -13.484365463256836, -9.178337097167969, -4.872306823730469, -0.5662775039672852, 3.7397518157958984, 8.045781135559082, 12.351810455322266, 16.657840728759766, 20.963869094848633, 25.2698974609375, 29.575927734375, 33.8819580078125, 38.18798828125, 42.494014739990234, 46.800045013427734, 51.106075286865234, 55.41210174560547, 59.71813201904297, 64.02416229248047, 68.33019256591797, 72.63622283935547, 76.94225311279297, 81.24827575683594, 85.55430603027344, 89.86033630371094, 94.16636657714844, 98.472412109375, 102.7784423828125, 107.08447265625, 111.3905029296875, 115.696533203125, 120.0025634765625, 124.30858612060547, 128.6146240234375, 132.920654296875, 137.2266845703125, 141.53271484375, 145.8387451171875, 150.144775390625, 154.4508056640625, 158.7568359375, 163.0628662109375, 167.36888122558594, 171.67491149902344, 175.98094177246094, 180.28697204589844, 184.59300231933594, 188.89903259277344, 193.20506286621094, 197.51107788085938, 201.81710815429688, 206.12313842773438, 210.42916870117188, 214.73519897460938, 219.04122924804688, 223.34725952148438, 227.65328979492188, 231.95932006835938, 236.26535034179688]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 13.0, 12.0, 17.0, 17.0, 20.0, 29.0, 31.0, 46.0, 37.0, 63.0, 51.0, 68.0, 68.0, 67.0, 86.0, 63.0, 40.0, 58.0, 49.0, 40.0, 24.0, 25.0, 18.0, 11.0, 19.0, 11.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.883390426635742, -26.872522354125977, -25.861652374267578, -24.850784301757812, -23.839916229248047, -22.82904815673828, -21.818180084228516, -20.807310104370117, -19.79644203186035, -18.785573959350586, -17.774703979492188, -16.763835906982422, -15.752967834472656, -14.74209976196289, -13.731230735778809, -12.720361709594727, -11.709493637084961, -10.698625564575195, -9.687756538391113, -8.676887512207031, -7.666019439697266, -6.655150890350342, -5.644282341003418, -4.633413791656494, -3.6225452423095703, -2.6116766929626465, -1.6008081436157227, -0.5899395942687988, 0.420928955078125, 1.4317975044250488, 2.4426660537719727, 3.4535346031188965, 4.464405059814453, 5.475273609161377, 6.486142158508301, 7.497010707855225, 8.507879257202148, 9.518747329711914, 10.529616355895996, 11.540485382080078, 12.551353454589844, 13.56222152709961, 14.573090553283691, 15.583959579467773, 16.59482765197754, 17.605695724487305, 18.616565704345703, 19.62743377685547, 20.638301849365234, 21.649169921875, 22.660037994384766, 23.670907974243164, 24.68177604675293, 25.692644119262695, 26.703514099121094, 27.71438217163086, 28.725250244140625, 29.73611831665039, 30.746986389160156, 31.757856369018555, 32.76872253417969, 33.77959442138672, 34.790462493896484, 35.80133056640625, 36.812198638916016]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 3.0, 6.0, 5.0, 8.0, 12.0, 18.0, 18.0, 21.0, 20.0, 32.0, 41.0, 63.0, 101.0, 163.0, 342.0, 829.0, 3179.0, 20500.0, 435712.0, 557144.0, 25012.0, 3556.0, 882.0, 351.0, 158.0, 106.0, 69.0, 46.0, 34.0, 29.0, 21.0, 13.0, 6.0, 4.0, 4.0, 8.0, 5.0, 3.0, 7.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-51.0, -49.54443359375, -48.0888671875, -46.63330078125, -45.177734375, -43.72216796875, -42.2666015625, -40.81103515625, -39.35546875, -37.89990234375, -36.4443359375, -34.98876953125, -33.533203125, -32.07763671875, -30.6220703125, -29.16650390625, -27.7109375, -26.25537109375, -24.7998046875, -23.34423828125, -21.888671875, -20.43310546875, -18.9775390625, -17.52197265625, -16.06640625, -14.61083984375, -13.1552734375, -11.69970703125, -10.244140625, -8.78857421875, -7.3330078125, -5.87744140625, -4.421875, -2.96630859375, -1.5107421875, -0.05517578125, 1.400390625, 2.85595703125, 4.3115234375, 5.76708984375, 7.22265625, 8.67822265625, 10.1337890625, 11.58935546875, 13.044921875, 14.50048828125, 15.9560546875, 17.41162109375, 18.8671875, 20.32275390625, 21.7783203125, 23.23388671875, 24.689453125, 26.14501953125, 27.6005859375, 29.05615234375, 30.51171875, 31.96728515625, 33.4228515625, 34.87841796875, 36.333984375, 37.78955078125, 39.2451171875, 40.70068359375, 42.15625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 11.0, 10.0, 40.0, 57.0, 99.0, 126.0, 161.0, 137.0, 124.0, 91.0, 63.0, 39.0, 30.0, 12.0, 8.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.797454833984375, -2.62420654296875, -2.450958251953125, -2.2777099609375, -2.104461669921875, -1.93121337890625, -1.757965087890625, -1.584716796875, -1.411468505859375, -1.23822021484375, -1.064971923828125, -0.8917236328125, -0.718475341796875, -0.54522705078125, -0.371978759765625, -0.19873046875, -0.025482177734375, 0.14776611328125, 0.321014404296875, 0.4942626953125, 0.667510986328125, 0.84075927734375, 1.014007568359375, 1.187255859375, 1.360504150390625, 1.53375244140625, 1.707000732421875, 1.8802490234375, 2.053497314453125, 2.22674560546875, 2.399993896484375, 2.5732421875, 2.746490478515625, 2.91973876953125, 3.092987060546875, 3.2662353515625, 3.439483642578125, 3.61273193359375, 3.785980224609375, 3.959228515625, 4.132476806640625, 4.30572509765625, 4.478973388671875, 4.6522216796875, 4.825469970703125, 4.99871826171875, 5.171966552734375, 5.34521484375, 5.518463134765625, 5.69171142578125, 5.864959716796875, 6.0382080078125, 6.211456298828125, 6.38470458984375, 6.557952880859375, 6.731201171875, 6.904449462890625, 7.07769775390625, 7.250946044921875, 7.4241943359375, 7.597442626953125, 7.77069091796875, 7.943939208984375, 8.1171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 15.0, 16.0, 22.0, 11.0, 24.0, 37.0, 55.0, 56.0, 78.0, 108.0, 155.0, 271.0, 363.0, 715.0, 1328.0, 2717.0, 6705.0, 18474.0, 60835.0, 254195.0, 501954.0, 141398.0, 37477.0, 12332.0, 4688.0, 1932.0, 980.0, 533.0, 304.0, 214.0, 171.0, 93.0, 61.0, 62.0, 38.0, 28.0, 21.0, 19.0, 15.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.217041015625, -16.68408203125, -16.151123046875, -15.6181640625, -15.085205078125, -14.55224609375, -14.019287109375, -13.486328125, -12.953369140625, -12.42041015625, -11.887451171875, -11.3544921875, -10.821533203125, -10.28857421875, -9.755615234375, -9.22265625, -8.689697265625, -8.15673828125, -7.623779296875, -7.0908203125, -6.557861328125, -6.02490234375, -5.491943359375, -4.958984375, -4.426025390625, -3.89306640625, -3.360107421875, -2.8271484375, -2.294189453125, -1.76123046875, -1.228271484375, -0.6953125, -0.162353515625, 0.37060546875, 0.903564453125, 1.4365234375, 1.969482421875, 2.50244140625, 3.035400390625, 3.568359375, 4.101318359375, 4.63427734375, 5.167236328125, 5.7001953125, 6.233154296875, 6.76611328125, 7.299072265625, 7.83203125, 8.364990234375, 8.89794921875, 9.430908203125, 9.9638671875, 10.496826171875, 11.02978515625, 11.562744140625, 12.095703125, 12.628662109375, 13.16162109375, 13.694580078125, 14.2275390625, 14.760498046875, 15.29345703125, 15.826416015625, 16.359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 10.0, 7.0, 7.0, 10.0, 10.0, 9.0, 13.0, 16.0, 17.0, 22.0, 18.0, 19.0, 39.0, 28.0, 47.0, 40.0, 38.0, 37.0, 31.0, 43.0, 41.0, 46.0, 40.0, 38.0, 38.0, 31.0, 34.0, 43.0, 33.0, 19.0, 31.0, 25.0, 21.0, 14.0, 13.0, 8.0, 11.0, 9.0, 4.0, 9.0, 3.0, 10.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0], "bins": [-8.9375, -8.658935546875, -8.38037109375, -8.101806640625, -7.8232421875, -7.544677734375, -7.26611328125, -6.987548828125, -6.708984375, -6.430419921875, -6.15185546875, -5.873291015625, -5.5947265625, -5.316162109375, -5.03759765625, -4.759033203125, -4.48046875, -4.201904296875, -3.92333984375, -3.644775390625, -3.3662109375, -3.087646484375, -2.80908203125, -2.530517578125, -2.251953125, -1.973388671875, -1.69482421875, -1.416259765625, -1.1376953125, -0.859130859375, -0.58056640625, -0.302001953125, -0.0234375, 0.255126953125, 0.53369140625, 0.812255859375, 1.0908203125, 1.369384765625, 1.64794921875, 1.926513671875, 2.205078125, 2.483642578125, 2.76220703125, 3.040771484375, 3.3193359375, 3.597900390625, 3.87646484375, 4.155029296875, 4.43359375, 4.712158203125, 4.99072265625, 5.269287109375, 5.5478515625, 5.826416015625, 6.10498046875, 6.383544921875, 6.662109375, 6.940673828125, 7.21923828125, 7.497802734375, 7.7763671875, 8.054931640625, 8.33349609375, 8.612060546875, 8.890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 14.0, 8.0, 19.0, 26.0, 32.0, 52.0, 100.0, 191.0, 342.0, 998.0, 3483.0, 18009.0, 205189.0, 744037.0, 64316.0, 8518.0, 1906.0, 653.0, 299.0, 137.0, 71.0, 47.0, 33.0, 32.0, 14.0, 10.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.379150390625, -9.00830078125, -8.637451171875, -8.2666015625, -7.895751953125, -7.52490234375, -7.154052734375, -6.783203125, -6.412353515625, -6.04150390625, -5.670654296875, -5.2998046875, -4.928955078125, -4.55810546875, -4.187255859375, -3.81640625, -3.445556640625, -3.07470703125, -2.703857421875, -2.3330078125, -1.962158203125, -1.59130859375, -1.220458984375, -0.849609375, -0.478759765625, -0.10791015625, 0.262939453125, 0.6337890625, 1.004638671875, 1.37548828125, 1.746337890625, 2.1171875, 2.488037109375, 2.85888671875, 3.229736328125, 3.6005859375, 3.971435546875, 4.34228515625, 4.713134765625, 5.083984375, 5.454833984375, 5.82568359375, 6.196533203125, 6.5673828125, 6.938232421875, 7.30908203125, 7.679931640625, 8.05078125, 8.421630859375, 8.79248046875, 9.163330078125, 9.5341796875, 9.905029296875, 10.27587890625, 10.646728515625, 11.017578125, 11.388427734375, 11.75927734375, 12.130126953125, 12.5009765625, 12.871826171875, 13.24267578125, 13.613525390625, 13.984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 13.0, 17.0, 21.0, 33.0, 50.0, 86.0, 147.0, 206.0, 157.0, 91.0, 63.0, 43.0, 25.0, 16.0, 6.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019083023071289062, -0.001830950379371643, -0.0017535984516143799, -0.0016762465238571167, -0.0015988945960998535, -0.0015215426683425903, -0.0014441907405853271, -0.001366838812828064, -0.0012894868850708008, -0.0012121349573135376, -0.0011347830295562744, -0.0010574311017990112, -0.000980079174041748, -0.0009027272462844849, -0.0008253753185272217, -0.0007480233907699585, -0.0006706714630126953, -0.0005933195352554321, -0.0005159676074981689, -0.00043861567974090576, -0.0003612637519836426, -0.0002839118242263794, -0.0002065598964691162, -0.00012920796871185303, -5.1856040954589844e-05, 2.549588680267334e-05, 0.00010284781455993652, 0.0001801997423171997, 0.0002575516700744629, 0.0003349035978317261, 0.00041225552558898926, 0.0004896074533462524, 0.0005669593811035156, 0.0006443113088607788, 0.000721663236618042, 0.0007990151643753052, 0.0008763670921325684, 0.0009537190198898315, 0.0010310709476470947, 0.001108422875404358, 0.001185774803161621, 0.0012631267309188843, 0.0013404786586761475, 0.0014178305864334106, 0.0014951825141906738, 0.001572534441947937, 0.0016498863697052002, 0.0017272382974624634, 0.0018045902252197266, 0.0018819421529769897, 0.001959294080734253, 0.002036646008491516, 0.0021139979362487793, 0.0021913498640060425, 0.0022687017917633057, 0.002346053719520569, 0.002423405647277832, 0.002500757575035095, 0.0025781095027923584, 0.0026554614305496216, 0.0027328133583068848, 0.002810165286064148, 0.002887517213821411, 0.0029648691415786743, 0.0030422210693359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 10.0, 5.0, 15.0, 22.0, 21.0, 31.0, 52.0, 59.0, 107.0, 176.0, 261.0, 551.0, 981.0, 2244.0, 5292.0, 16400.0, 73616.0, 483974.0, 384822.0, 57220.0, 13920.0, 4635.0, 1995.0, 906.0, 467.0, 281.0, 146.0, 84.0, 78.0, 43.0, 34.0, 29.0, 15.0, 13.0, 10.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.109375, -7.870361328125, -7.63134765625, -7.392333984375, -7.1533203125, -6.914306640625, -6.67529296875, -6.436279296875, -6.197265625, -5.958251953125, -5.71923828125, -5.480224609375, -5.2412109375, -5.002197265625, -4.76318359375, -4.524169921875, -4.28515625, -4.046142578125, -3.80712890625, -3.568115234375, -3.3291015625, -3.090087890625, -2.85107421875, -2.612060546875, -2.373046875, -2.134033203125, -1.89501953125, -1.656005859375, -1.4169921875, -1.177978515625, -0.93896484375, -0.699951171875, -0.4609375, -0.221923828125, 0.01708984375, 0.256103515625, 0.4951171875, 0.734130859375, 0.97314453125, 1.212158203125, 1.451171875, 1.690185546875, 1.92919921875, 2.168212890625, 2.4072265625, 2.646240234375, 2.88525390625, 3.124267578125, 3.36328125, 3.602294921875, 3.84130859375, 4.080322265625, 4.3193359375, 4.558349609375, 4.79736328125, 5.036376953125, 5.275390625, 5.514404296875, 5.75341796875, 5.992431640625, 6.2314453125, 6.470458984375, 6.70947265625, 6.948486328125, 7.1875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 7.0, 13.0, 15.0, 21.0, 11.0, 27.0, 35.0, 33.0, 44.0, 71.0, 52.0, 62.0, 82.0, 70.0, 71.0, 81.0, 49.0, 48.0, 32.0, 30.0, 30.0, 15.0, 10.0, 12.0, 15.0, 5.0, 5.0, 5.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.3046875, -3.197845458984375, -3.09100341796875, -2.984161376953125, -2.8773193359375, -2.770477294921875, -2.66363525390625, -2.556793212890625, -2.449951171875, -2.343109130859375, -2.23626708984375, -2.129425048828125, -2.0225830078125, -1.915740966796875, -1.80889892578125, -1.702056884765625, -1.59521484375, -1.488372802734375, -1.38153076171875, -1.274688720703125, -1.1678466796875, -1.061004638671875, -0.95416259765625, -0.847320556640625, -0.740478515625, -0.633636474609375, -0.52679443359375, -0.419952392578125, -0.3131103515625, -0.206268310546875, -0.09942626953125, 0.007415771484375, 0.1142578125, 0.221099853515625, 0.32794189453125, 0.434783935546875, 0.5416259765625, 0.648468017578125, 0.75531005859375, 0.862152099609375, 0.968994140625, 1.075836181640625, 1.18267822265625, 1.289520263671875, 1.3963623046875, 1.503204345703125, 1.61004638671875, 1.716888427734375, 1.82373046875, 1.930572509765625, 2.03741455078125, 2.144256591796875, 2.2510986328125, 2.357940673828125, 2.46478271484375, 2.571624755859375, 2.678466796875, 2.785308837890625, 2.89215087890625, 2.998992919921875, 3.1058349609375, 3.212677001953125, 3.31951904296875, 3.426361083984375, 3.533203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 11.0, 12.0, 14.0, 34.0, 54.0, 99.0, 131.0, 147.0, 217.0, 107.0, 74.0, 51.0, 31.0, 13.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.857452392578125, -50.17935562133789, -46.501258850097656, -42.823158264160156, -39.14506530761719, -35.46696472167969, -31.788867950439453, -28.11077117919922, -24.432674407958984, -20.75457763671875, -17.076480865478516, -13.398382186889648, -9.720285415649414, -6.04218864440918, -2.3640899658203125, 1.3140068054199219, 4.992103576660156, 8.67020034790039, 12.348298072814941, 16.026395797729492, 19.704492568969727, 23.38258934020996, 27.060688018798828, 30.738784790039062, 34.4168815612793, 38.09497833251953, 41.773075103759766, 45.451171875, 49.1292724609375, 52.80736541748047, 56.48546600341797, 60.1635627746582, 63.84165954589844, 67.51976013183594, 71.1978530883789, 74.8759536743164, 78.55404663085938, 82.23214721679688, 85.91024780273438, 89.58834075927734, 93.26643371582031, 96.94453430175781, 100.62262725830078, 104.30072784423828, 107.97882080078125, 111.65692138671875, 115.33502197265625, 119.01311492919922, 122.69121551513672, 126.36931610107422, 130.0474090576172, 133.7255096435547, 137.4036102294922, 141.08169555664062, 144.75979614257812, 148.43789672851562, 152.11599731445312, 155.79409790039062, 159.47219848632812, 163.15028381347656, 166.82838439941406, 170.50648498535156, 174.18458557128906, 177.8626708984375, 181.540771484375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 10.0, 10.0, 9.0, 10.0, 12.0, 11.0, 10.0, 23.0, 20.0, 30.0, 37.0, 43.0, 34.0, 36.0, 34.0, 46.0, 40.0, 47.0, 45.0, 38.0, 50.0, 37.0, 42.0, 40.0, 37.0, 30.0, 34.0, 29.0, 27.0, 27.0, 13.0, 19.0, 10.0, 10.0, 12.0, 8.0, 6.0, 3.0, 5.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-59.016456604003906, -57.15349578857422, -55.29053497314453, -53.427574157714844, -51.56460952758789, -49.7016487121582, -47.838687896728516, -45.97572708129883, -44.112762451171875, -42.24980163574219, -40.3868408203125, -38.52388000488281, -36.66091537475586, -34.79795455932617, -32.934993743896484, -31.072032928466797, -29.20907211303711, -27.346111297607422, -25.4831485748291, -23.620187759399414, -21.757225036621094, -19.894264221191406, -18.03130340576172, -16.16834259033203, -14.305379867553711, -12.442418098449707, -10.579456329345703, -8.716495513916016, -6.853533744812012, -4.990571975708008, -3.1276111602783203, -1.2646493911743164, 0.5983085632324219, 2.4612700939178467, 4.3242316246032715, 6.187192916870117, 8.050154685974121, 9.913116455078125, 11.776077270507812, 13.639039039611816, 15.50200080871582, 17.364961624145508, 19.227924346923828, 21.090885162353516, 22.953845977783203, 24.816808700561523, 26.67976951599121, 28.54273223876953, 30.40569305419922, 32.268653869628906, 34.131614685058594, 35.99457550048828, 37.857540130615234, 39.72050094604492, 41.58346176147461, 43.4464225769043, 45.30938720703125, 47.17234802246094, 49.035308837890625, 50.89826965332031, 52.761234283447266, 54.62419509887695, 56.48715591430664, 58.35011672973633, 60.213077545166016]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 3.0, 12.0, 14.0, 38.0, 74.0, 153.0, 389.0, 1243.0, 6745.0, 576685.0, 3599508.0, 7104.0, 1346.0, 448.0, 177.0, 106.0, 69.0, 36.0, 35.0, 15.0, 12.0, 10.0, 13.0, 8.0, 6.0, 3.0, 1.0, 3.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.28125, -34.95556640625, -32.6298828125, -30.30419921875, -27.978515625, -25.65283203125, -23.3271484375, -21.00146484375, -18.67578125, -16.35009765625, -14.0244140625, -11.69873046875, -9.373046875, -7.04736328125, -4.7216796875, -2.39599609375, -0.0703125, 2.25537109375, 4.5810546875, 6.90673828125, 9.232421875, 11.55810546875, 13.8837890625, 16.20947265625, 18.53515625, 20.86083984375, 23.1865234375, 25.51220703125, 27.837890625, 30.16357421875, 32.4892578125, 34.81494140625, 37.140625, 39.46630859375, 41.7919921875, 44.11767578125, 46.443359375, 48.76904296875, 51.0947265625, 53.42041015625, 55.74609375, 58.07177734375, 60.3974609375, 62.72314453125, 65.048828125, 67.37451171875, 69.7001953125, 72.02587890625, 74.3515625, 76.67724609375, 79.0029296875, 81.32861328125, 83.654296875, 85.97998046875, 88.3056640625, 90.63134765625, 92.95703125, 95.28271484375, 97.6083984375, 99.93408203125, 102.259765625, 104.58544921875, 106.9111328125, 109.23681640625, 111.5625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 9.0, 32.0, 43.0, 70.0, 105.0, 153.0, 149.0, 136.0, 125.0, 78.0, 43.0, 31.0, 17.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.9031982421875, -2.728271484375, -2.5533447265625, -2.37841796875, -2.2034912109375, -2.028564453125, -1.8536376953125, -1.6787109375, -1.5037841796875, -1.328857421875, -1.1539306640625, -0.97900390625, -0.8040771484375, -0.629150390625, -0.4542236328125, -0.279296875, -0.1043701171875, 0.070556640625, 0.2454833984375, 0.42041015625, 0.5953369140625, 0.770263671875, 0.9451904296875, 1.1201171875, 1.2950439453125, 1.469970703125, 1.6448974609375, 1.81982421875, 1.9947509765625, 2.169677734375, 2.3446044921875, 2.51953125, 2.6944580078125, 2.869384765625, 3.0443115234375, 3.21923828125, 3.3941650390625, 3.569091796875, 3.7440185546875, 3.9189453125, 4.0938720703125, 4.268798828125, 4.4437255859375, 4.61865234375, 4.7935791015625, 4.968505859375, 5.1434326171875, 5.318359375, 5.4932861328125, 5.668212890625, 5.8431396484375, 6.01806640625, 6.1929931640625, 6.367919921875, 6.5428466796875, 6.7177734375, 6.8927001953125, 7.067626953125, 7.2425537109375, 7.41748046875, 7.5924072265625, 7.767333984375, 7.9422607421875, 8.1171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 5.0, 10.0, 22.0, 24.0, 21.0, 31.0, 39.0, 62.0, 136.0, 346.0, 2533.0, 102110.0, 4081971.0, 5839.0, 616.0, 189.0, 86.0, 61.0, 37.0, 36.0, 33.0, 23.0, 17.0, 21.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.625, -58.751953125, -54.87890625, -51.005859375, -47.1328125, -43.259765625, -39.38671875, -35.513671875, -31.640625, -27.767578125, -23.89453125, -20.021484375, -16.1484375, -12.275390625, -8.40234375, -4.529296875, -0.65625, 3.216796875, 7.08984375, 10.962890625, 14.8359375, 18.708984375, 22.58203125, 26.455078125, 30.328125, 34.201171875, 38.07421875, 41.947265625, 45.8203125, 49.693359375, 53.56640625, 57.439453125, 61.3125, 65.185546875, 69.05859375, 72.931640625, 76.8046875, 80.677734375, 84.55078125, 88.423828125, 92.296875, 96.169921875, 100.04296875, 103.916015625, 107.7890625, 111.662109375, 115.53515625, 119.408203125, 123.28125, 127.154296875, 131.02734375, 134.900390625, 138.7734375, 142.646484375, 146.51953125, 150.392578125, 154.265625, 158.138671875, 162.01171875, 165.884765625, 169.7578125, 173.630859375, 177.50390625, 181.376953125, 185.25]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 7.0, 9.0, 12.0, 26.0, 36.0, 117.0, 665.0, 2944.0, 173.0, 53.0, 10.0, 18.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -4.94891357421875, -4.4095458984375, -3.87017822265625, -3.330810546875, -2.79144287109375, -2.2520751953125, -1.71270751953125, -1.17333984375, -0.63397216796875, -0.0946044921875, 0.44476318359375, 0.984130859375, 1.52349853515625, 2.0628662109375, 2.60223388671875, 3.1416015625, 3.68096923828125, 4.2203369140625, 4.75970458984375, 5.299072265625, 5.83843994140625, 6.3778076171875, 6.91717529296875, 7.45654296875, 7.99591064453125, 8.5352783203125, 9.07464599609375, 9.614013671875, 10.15338134765625, 10.6927490234375, 11.23211669921875, 11.771484375, 12.31085205078125, 12.8502197265625, 13.38958740234375, 13.928955078125, 14.46832275390625, 15.0076904296875, 15.54705810546875, 16.08642578125, 16.62579345703125, 17.1651611328125, 17.70452880859375, 18.243896484375, 18.78326416015625, 19.3226318359375, 19.86199951171875, 20.4013671875, 20.94073486328125, 21.4801025390625, 22.01947021484375, 22.558837890625, 23.09820556640625, 23.6375732421875, 24.17694091796875, 24.71630859375, 25.25567626953125, 25.7950439453125, 26.33441162109375, 26.873779296875, 27.41314697265625, 27.9525146484375, 28.49188232421875, 29.03125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 15.0, 45.0, 186.0, 503.0, 195.0, 44.0, 12.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-234.19064331054688, -229.65040588378906, -225.1101531982422, -220.56991577148438, -216.0296630859375, -211.4894256591797, -206.94918823242188, -202.408935546875, -197.8686981201172, -193.32846069335938, -188.7882080078125, -184.2479705810547, -179.70773315429688, -175.16748046875, -170.6272430419922, -166.0869903564453, -161.5467529296875, -157.0065155029297, -152.4662628173828, -147.926025390625, -143.38577270507812, -138.8455352783203, -134.3052978515625, -129.76504516601562, -125.22480773925781, -120.68456268310547, -116.14431762695312, -111.60408020019531, -107.06383514404297, -102.52359008789062, -97.98335266113281, -93.44310760498047, -88.90287780761719, -84.36263275146484, -79.8223876953125, -75.28215026855469, -70.74190521240234, -66.20166015625, -61.66141891479492, -57.121177673339844, -52.580928802490234, -48.040687561035156, -43.50044250488281, -38.96019744873047, -34.41995620727539, -29.87971305847168, -25.33946990966797, -20.799226760864258, -16.258983612060547, -11.718740463256836, -7.178497314453125, -2.638254165649414, 1.9019889831542969, 6.442232131958008, 10.982475280761719, 15.52271842956543, 20.06296157836914, 24.60320472717285, 29.143447875976562, 33.683692932128906, 38.223934173583984, 42.76417541503906, 47.304420471191406, 51.84466552734375, 56.38490676879883]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 4.0, 9.0, 23.0, 17.0, 21.0, 27.0, 34.0, 45.0, 38.0, 74.0, 73.0, 76.0, 67.0, 76.0, 70.0, 68.0, 55.0, 54.0, 42.0, 32.0, 21.0, 19.0, 12.0, 22.0, 8.0, 6.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.779701232910156, -38.707027435302734, -37.63435363769531, -36.561683654785156, -35.489009857177734, -34.41633605957031, -33.34366226196289, -32.27098846435547, -31.198314666748047, -30.125640869140625, -29.052968978881836, -27.980295181274414, -26.907621383666992, -25.834949493408203, -24.76227569580078, -23.68960189819336, -22.61693000793457, -21.54425621032715, -20.47158432006836, -19.398910522460938, -18.326236724853516, -17.253562927246094, -16.180891036987305, -15.108217239379883, -14.035544395446777, -12.962871551513672, -11.89019775390625, -10.817524909973145, -9.744852066040039, -8.672178268432617, -7.599505424499512, -6.526832103729248, -5.454156875610352, -4.381483554840088, -3.3088104724884033, -2.2361373901367188, -1.163464069366455, -0.0907907485961914, 0.9818820953369141, 2.0545554161071777, 3.1272287368774414, 4.199902057647705, 5.272575378417969, 6.345248222351074, 7.417921543121338, 8.490594863891602, 9.563267707824707, 10.635940551757812, 11.708614349365234, 12.78128719329834, 13.853960990905762, 14.926633834838867, 15.999307632446289, 17.071979522705078, 18.1446533203125, 19.217327117919922, 20.290000915527344, 21.362674713134766, 22.435346603393555, 23.508020401000977, 24.5806941986084, 25.653366088867188, 26.72603988647461, 27.79871368408203, 28.87138557434082]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 9.0, 14.0, 18.0, 42.0, 47.0, 67.0, 104.0, 140.0, 219.0, 329.0, 610.0, 1089.0, 2120.0, 5225.0, 14762.0, 60618.0, 441717.0, 436978.0, 59697.0, 14952.0, 4955.0, 2151.0, 1036.0, 602.0, 372.0, 216.0, 125.0, 103.0, 60.0, 45.0, 27.0, 18.0, 19.0, 14.0, 8.0, 8.0, 8.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.34375, -24.526123046875, -23.70849609375, -22.890869140625, -22.0732421875, -21.255615234375, -20.43798828125, -19.620361328125, -18.802734375, -17.985107421875, -17.16748046875, -16.349853515625, -15.5322265625, -14.714599609375, -13.89697265625, -13.079345703125, -12.26171875, -11.444091796875, -10.62646484375, -9.808837890625, -8.9912109375, -8.173583984375, -7.35595703125, -6.538330078125, -5.720703125, -4.903076171875, -4.08544921875, -3.267822265625, -2.4501953125, -1.632568359375, -0.81494140625, 0.002685546875, 0.8203125, 1.637939453125, 2.45556640625, 3.273193359375, 4.0908203125, 4.908447265625, 5.72607421875, 6.543701171875, 7.361328125, 8.178955078125, 8.99658203125, 9.814208984375, 10.6318359375, 11.449462890625, 12.26708984375, 13.084716796875, 13.90234375, 14.719970703125, 15.53759765625, 16.355224609375, 17.1728515625, 17.990478515625, 18.80810546875, 19.625732421875, 20.443359375, 21.260986328125, 22.07861328125, 22.896240234375, 23.7138671875, 24.531494140625, 25.34912109375, 26.166748046875, 26.984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 8.0, 13.0, 24.0, 29.0, 30.0, 32.0, 55.0, 50.0, 73.0, 90.0, 81.0, 85.0, 86.0, 68.0, 54.0, 61.0, 46.0, 28.0, 20.0, 18.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.9737548828125, -2.871337890625, -2.7689208984375, -2.66650390625, -2.5640869140625, -2.461669921875, -2.3592529296875, -2.2568359375, -2.1544189453125, -2.052001953125, -1.9495849609375, -1.84716796875, -1.7447509765625, -1.642333984375, -1.5399169921875, -1.4375, -1.3350830078125, -1.232666015625, -1.1302490234375, -1.02783203125, -0.9254150390625, -0.822998046875, -0.7205810546875, -0.6181640625, -0.5157470703125, -0.413330078125, -0.3109130859375, -0.20849609375, -0.1060791015625, -0.003662109375, 0.0987548828125, 0.201171875, 0.3035888671875, 0.406005859375, 0.5084228515625, 0.61083984375, 0.7132568359375, 0.815673828125, 0.9180908203125, 1.0205078125, 1.1229248046875, 1.225341796875, 1.3277587890625, 1.43017578125, 1.5325927734375, 1.635009765625, 1.7374267578125, 1.83984375, 1.9422607421875, 2.044677734375, 2.1470947265625, 2.24951171875, 2.3519287109375, 2.454345703125, 2.5567626953125, 2.6591796875, 2.7615966796875, 2.864013671875, 2.9664306640625, 3.06884765625, 3.1712646484375, 3.273681640625, 3.3760986328125, 3.478515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 9.0, 9.0, 5.0, 12.0, 26.0, 24.0, 44.0, 62.0, 91.0, 128.0, 147.0, 256.0, 340.0, 517.0, 977.0, 1864.0, 4573.0, 14377.0, 56015.0, 296864.0, 524789.0, 109493.0, 24849.0, 7097.0, 2689.0, 1286.0, 645.0, 447.0, 240.0, 197.0, 144.0, 105.0, 67.0, 53.0, 31.0, 22.0, 21.0, 13.0, 11.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.357666015625, -15.77783203125, -15.197998046875, -14.6181640625, -14.038330078125, -13.45849609375, -12.878662109375, -12.298828125, -11.718994140625, -11.13916015625, -10.559326171875, -9.9794921875, -9.399658203125, -8.81982421875, -8.239990234375, -7.66015625, -7.080322265625, -6.50048828125, -5.920654296875, -5.3408203125, -4.760986328125, -4.18115234375, -3.601318359375, -3.021484375, -2.441650390625, -1.86181640625, -1.281982421875, -0.7021484375, -0.122314453125, 0.45751953125, 1.037353515625, 1.6171875, 2.197021484375, 2.77685546875, 3.356689453125, 3.9365234375, 4.516357421875, 5.09619140625, 5.676025390625, 6.255859375, 6.835693359375, 7.41552734375, 7.995361328125, 8.5751953125, 9.155029296875, 9.73486328125, 10.314697265625, 10.89453125, 11.474365234375, 12.05419921875, 12.634033203125, 13.2138671875, 13.793701171875, 14.37353515625, 14.953369140625, 15.533203125, 16.113037109375, 16.69287109375, 17.272705078125, 17.8525390625, 18.432373046875, 19.01220703125, 19.592041015625, 20.171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 6.0, 9.0, 10.0, 15.0, 13.0, 13.0, 17.0, 31.0, 26.0, 30.0, 29.0, 43.0, 37.0, 36.0, 37.0, 42.0, 36.0, 42.0, 42.0, 42.0, 44.0, 45.0, 31.0, 41.0, 30.0, 36.0, 30.0, 21.0, 22.0, 24.0, 20.0, 13.0, 14.0, 9.0, 4.0, 9.0, 11.0, 5.0, 3.0, 1.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.5390625, -9.24951171875, -8.9599609375, -8.67041015625, -8.380859375, -8.09130859375, -7.8017578125, -7.51220703125, -7.22265625, -6.93310546875, -6.6435546875, -6.35400390625, -6.064453125, -5.77490234375, -5.4853515625, -5.19580078125, -4.90625, -4.61669921875, -4.3271484375, -4.03759765625, -3.748046875, -3.45849609375, -3.1689453125, -2.87939453125, -2.58984375, -2.30029296875, -2.0107421875, -1.72119140625, -1.431640625, -1.14208984375, -0.8525390625, -0.56298828125, -0.2734375, 0.01611328125, 0.3056640625, 0.59521484375, 0.884765625, 1.17431640625, 1.4638671875, 1.75341796875, 2.04296875, 2.33251953125, 2.6220703125, 2.91162109375, 3.201171875, 3.49072265625, 3.7802734375, 4.06982421875, 4.359375, 4.64892578125, 4.9384765625, 5.22802734375, 5.517578125, 5.80712890625, 6.0966796875, 6.38623046875, 6.67578125, 6.96533203125, 7.2548828125, 7.54443359375, 7.833984375, 8.12353515625, 8.4130859375, 8.70263671875, 8.9921875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 2.0, 9.0, 7.0, 17.0, 16.0, 26.0, 33.0, 38.0, 51.0, 61.0, 98.0, 133.0, 196.0, 259.0, 328.0, 503.0, 808.0, 1255.0, 2248.0, 4199.0, 10182.0, 30827.0, 143005.0, 569961.0, 217518.0, 42182.0, 12847.0, 5089.0, 2333.0, 1404.0, 831.0, 621.0, 404.0, 271.0, 205.0, 142.0, 119.0, 89.0, 45.0, 47.0, 40.0, 35.0, 14.0, 12.0, 9.0, 6.0, 6.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-6.5234375, -6.32342529296875, -6.1234130859375, -5.92340087890625, -5.723388671875, -5.52337646484375, -5.3233642578125, -5.12335205078125, -4.92333984375, -4.72332763671875, -4.5233154296875, -4.32330322265625, -4.123291015625, -3.92327880859375, -3.7232666015625, -3.52325439453125, -3.3232421875, -3.12322998046875, -2.9232177734375, -2.72320556640625, -2.523193359375, -2.32318115234375, -2.1231689453125, -1.92315673828125, -1.72314453125, -1.52313232421875, -1.3231201171875, -1.12310791015625, -0.923095703125, -0.72308349609375, -0.5230712890625, -0.32305908203125, -0.123046875, 0.07696533203125, 0.2769775390625, 0.47698974609375, 0.677001953125, 0.87701416015625, 1.0770263671875, 1.27703857421875, 1.47705078125, 1.67706298828125, 1.8770751953125, 2.07708740234375, 2.277099609375, 2.47711181640625, 2.6771240234375, 2.87713623046875, 3.0771484375, 3.27716064453125, 3.4771728515625, 3.67718505859375, 3.877197265625, 4.07720947265625, 4.2772216796875, 4.47723388671875, 4.67724609375, 4.87725830078125, 5.0772705078125, 5.27728271484375, 5.477294921875, 5.67730712890625, 5.8773193359375, 6.07733154296875, 6.27734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 10.0, 13.0, 16.0, 28.0, 35.0, 78.0, 186.0, 287.0, 173.0, 70.0, 36.0, 18.0, 19.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021991729736328125, -0.0020802319049835205, -0.0019612908363342285, -0.0018423497676849365, -0.0017234086990356445, -0.0016044676303863525, -0.0014855265617370605, -0.0013665854930877686, -0.0012476444244384766, -0.0011287033557891846, -0.0010097622871398926, -0.0008908212184906006, -0.0007718801498413086, -0.0006529390811920166, -0.0005339980125427246, -0.0004150569438934326, -0.0002961158752441406, -0.00017717480659484863, -5.823373794555664e-05, 6.070733070373535e-05, 0.00017964839935302734, 0.00029858946800231934, 0.00041753053665161133, 0.0005364716053009033, 0.0006554126739501953, 0.0007743537425994873, 0.0008932948112487793, 0.0010122358798980713, 0.0011311769485473633, 0.0012501180171966553, 0.0013690590858459473, 0.0014880001544952393, 0.0016069412231445312, 0.0017258822917938232, 0.0018448233604431152, 0.0019637644290924072, 0.0020827054977416992, 0.002201646566390991, 0.002320587635040283, 0.002439528703689575, 0.002558469772338867, 0.002677410840988159, 0.002796351909637451, 0.002915292978286743, 0.003034234046936035, 0.003153175115585327, 0.003272116184234619, 0.003391057252883911, 0.003509998321533203, 0.003628939390182495, 0.003747880458831787, 0.003866821527481079, 0.003985762596130371, 0.004104703664779663, 0.004223644733428955, 0.004342585802078247, 0.004461526870727539, 0.004580467939376831, 0.004699409008026123, 0.004818350076675415, 0.004937291145324707, 0.005056232213973999, 0.005175173282623291, 0.005294114351272583, 0.005413055419921875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 10.0, 10.0, 17.0, 19.0, 12.0, 16.0, 31.0, 40.0, 73.0, 116.0, 260.0, 486.0, 944.0, 2216.0, 6410.0, 34482.0, 406240.0, 538656.0, 46146.0, 7692.0, 2451.0, 1081.0, 483.0, 264.0, 133.0, 78.0, 49.0, 37.0, 16.0, 21.0, 15.0, 11.0, 5.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.9453125, -10.6331787109375, -10.321044921875, -10.0089111328125, -9.69677734375, -9.3846435546875, -9.072509765625, -8.7603759765625, -8.4482421875, -8.1361083984375, -7.823974609375, -7.5118408203125, -7.19970703125, -6.8875732421875, -6.575439453125, -6.2633056640625, -5.951171875, -5.6390380859375, -5.326904296875, -5.0147705078125, -4.70263671875, -4.3905029296875, -4.078369140625, -3.7662353515625, -3.4541015625, -3.1419677734375, -2.829833984375, -2.5177001953125, -2.20556640625, -1.8934326171875, -1.581298828125, -1.2691650390625, -0.95703125, -0.6448974609375, -0.332763671875, -0.0206298828125, 0.29150390625, 0.6036376953125, 0.915771484375, 1.2279052734375, 1.5400390625, 1.8521728515625, 2.164306640625, 2.4764404296875, 2.78857421875, 3.1007080078125, 3.412841796875, 3.7249755859375, 4.037109375, 4.3492431640625, 4.661376953125, 4.9735107421875, 5.28564453125, 5.5977783203125, 5.909912109375, 6.2220458984375, 6.5341796875, 6.8463134765625, 7.158447265625, 7.4705810546875, 7.78271484375, 8.0948486328125, 8.406982421875, 8.7191162109375, 9.03125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 5.0, 13.0, 10.0, 13.0, 20.0, 28.0, 32.0, 51.0, 55.0, 74.0, 75.0, 117.0, 87.0, 91.0, 68.0, 72.0, 39.0, 39.0, 36.0, 21.0, 13.0, 10.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.453125, -5.30194091796875, -5.1507568359375, -4.99957275390625, -4.848388671875, -4.69720458984375, -4.5460205078125, -4.39483642578125, -4.24365234375, -4.09246826171875, -3.9412841796875, -3.79010009765625, -3.638916015625, -3.48773193359375, -3.3365478515625, -3.18536376953125, -3.0341796875, -2.88299560546875, -2.7318115234375, -2.58062744140625, -2.429443359375, -2.27825927734375, -2.1270751953125, -1.97589111328125, -1.82470703125, -1.67352294921875, -1.5223388671875, -1.37115478515625, -1.219970703125, -1.06878662109375, -0.9176025390625, -0.76641845703125, -0.615234375, -0.46405029296875, -0.3128662109375, -0.16168212890625, -0.010498046875, 0.14068603515625, 0.2918701171875, 0.44305419921875, 0.59423828125, 0.74542236328125, 0.8966064453125, 1.04779052734375, 1.198974609375, 1.35015869140625, 1.5013427734375, 1.65252685546875, 1.8037109375, 1.95489501953125, 2.1060791015625, 2.25726318359375, 2.408447265625, 2.55963134765625, 2.7108154296875, 2.86199951171875, 3.01318359375, 3.16436767578125, 3.3155517578125, 3.46673583984375, 3.617919921875, 3.76910400390625, 3.9202880859375, 4.07147216796875, 4.22265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 30.0, 48.0, 119.0, 251.0, 257.0, 164.0, 56.0, 42.0, 18.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.45655822753906, -130.5247039794922, -124.59284973144531, -118.66099548339844, -112.72914123535156, -106.79728698730469, -100.86544036865234, -94.93358612060547, -89.0017318725586, -83.06987762451172, -77.13802337646484, -71.2061767578125, -65.27432250976562, -59.342464447021484, -53.410614013671875, -47.478759765625, -41.546905517578125, -35.61505126953125, -29.683198928833008, -23.751346588134766, -17.81949234008789, -11.887638092041016, -5.955787658691406, -0.02393341064453125, 5.907920837402344, 11.839774131774902, 17.77162742614746, 23.703479766845703, 29.635334014892578, 35.56718826293945, 41.49903869628906, 47.43089294433594, 53.362762451171875, 59.29461669921875, 65.22647094726562, 71.1583251953125, 77.09017944335938, 83.02203369140625, 88.9538803100586, 94.88573455810547, 100.81758880615234, 106.74944305419922, 112.6812973022461, 118.61314392089844, 124.54499816894531, 130.4768524169922, 136.40870666503906, 142.34056091308594, 148.2724151611328, 154.2042694091797, 160.13612365722656, 166.06797790527344, 171.9998321533203, 177.9316864013672, 183.863525390625, 189.79537963867188, 195.72723388671875, 201.65908813476562, 207.5909423828125, 213.52279663085938, 219.45465087890625, 225.38650512695312, 231.318359375, 237.25021362304688, 243.18206787109375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 9.0, 13.0, 17.0, 30.0, 27.0, 27.0, 37.0, 37.0, 30.0, 36.0, 50.0, 53.0, 52.0, 58.0, 49.0, 49.0, 65.0, 49.0, 42.0, 36.0, 34.0, 36.0, 30.0, 16.0, 29.0, 18.0, 17.0, 14.0, 6.0, 4.0, 7.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.933692932128906, -61.603919982910156, -59.274147033691406, -56.944374084472656, -54.614601135253906, -52.284828186035156, -49.95505142211914, -47.62527847290039, -45.29550552368164, -42.96573257446289, -40.63595962524414, -38.30618667602539, -35.976409912109375, -33.646636962890625, -31.316864013671875, -28.987091064453125, -26.657318115234375, -24.327545166015625, -21.997772216796875, -19.667997360229492, -17.338224411010742, -15.008451461791992, -12.678677558898926, -10.34890365600586, -8.01913070678711, -5.689357280731201, -3.359583854675293, -1.0298104286193848, 1.2999629974365234, 3.6297359466552734, 5.95950984954834, 8.289283752441406, 10.619064331054688, 12.948837280273438, 15.278611183166504, 17.60838508605957, 19.93815803527832, 22.26793098449707, 24.597705841064453, 26.927478790283203, 29.257251739501953, 31.587024688720703, 33.91679763793945, 36.2465705871582, 38.57634735107422, 40.90612030029297, 43.23589324951172, 45.56566619873047, 47.89543914794922, 50.22521209716797, 52.55498504638672, 54.88475799560547, 57.21453094482422, 59.54430389404297, 61.874080657958984, 64.203857421875, 66.53363037109375, 68.8634033203125, 71.19317626953125, 73.52294921875, 75.85272216796875, 78.1824951171875, 80.51226806640625, 82.842041015625, 85.17181396484375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 10.0, 17.0, 20.0, 40.0, 83.0, 153.0, 335.0, 1057.0, 4139.0, 25209.0, 3962394.0, 185657.0, 10605.0, 2625.0, 827.0, 412.0, 235.0, 133.0, 71.0, 59.0, 35.0, 32.0, 27.0, 18.0, 14.0, 17.0, 7.0, 8.0, 6.0, 3.0, 1.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.734375, -26.083251953125, -24.43212890625, -22.781005859375, -21.1298828125, -19.478759765625, -17.82763671875, -16.176513671875, -14.525390625, -12.874267578125, -11.22314453125, -9.572021484375, -7.9208984375, -6.269775390625, -4.61865234375, -2.967529296875, -1.31640625, 0.334716796875, 1.98583984375, 3.636962890625, 5.2880859375, 6.939208984375, 8.59033203125, 10.241455078125, 11.892578125, 13.543701171875, 15.19482421875, 16.845947265625, 18.4970703125, 20.148193359375, 21.79931640625, 23.450439453125, 25.1015625, 26.752685546875, 28.40380859375, 30.054931640625, 31.7060546875, 33.357177734375, 35.00830078125, 36.659423828125, 38.310546875, 39.961669921875, 41.61279296875, 43.263916015625, 44.9150390625, 46.566162109375, 48.21728515625, 49.868408203125, 51.51953125, 53.170654296875, 54.82177734375, 56.472900390625, 58.1240234375, 59.775146484375, 61.42626953125, 63.077392578125, 64.728515625, 66.379638671875, 68.03076171875, 69.681884765625, 71.3330078125, 72.984130859375, 74.63525390625, 76.286376953125, 77.9375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 17.0, 38.0, 53.0, 78.0, 131.0, 139.0, 143.0, 138.0, 79.0, 66.0, 51.0, 31.0, 17.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.783721923828125, -2.60064697265625, -2.417572021484375, -2.2344970703125, -2.051422119140625, -1.86834716796875, -1.685272216796875, -1.502197265625, -1.319122314453125, -1.13604736328125, -0.952972412109375, -0.7698974609375, -0.586822509765625, -0.40374755859375, -0.220672607421875, -0.03759765625, 0.145477294921875, 0.32855224609375, 0.511627197265625, 0.6947021484375, 0.877777099609375, 1.06085205078125, 1.243927001953125, 1.427001953125, 1.610076904296875, 1.79315185546875, 1.976226806640625, 2.1593017578125, 2.342376708984375, 2.52545166015625, 2.708526611328125, 2.8916015625, 3.074676513671875, 3.25775146484375, 3.440826416015625, 3.6239013671875, 3.806976318359375, 3.99005126953125, 4.173126220703125, 4.356201171875, 4.539276123046875, 4.72235107421875, 4.905426025390625, 5.0885009765625, 5.271575927734375, 5.45465087890625, 5.637725830078125, 5.82080078125, 6.003875732421875, 6.18695068359375, 6.370025634765625, 6.5531005859375, 6.736175537109375, 6.91925048828125, 7.102325439453125, 7.285400390625, 7.468475341796875, 7.65155029296875, 7.834625244140625, 8.0177001953125, 8.200775146484375, 8.38385009765625, 8.566925048828125, 8.75]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 19.0, 39.0, 51.0, 95.0, 223.0, 511.0, 1883.0, 14378.0, 4049003.0, 120726.0, 5413.0, 1124.0, 373.0, 190.0, 88.0, 45.0, 42.0, 27.0, 15.0, 4.0, 5.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.9375, -60.048828125, -57.16015625, -54.271484375, -51.3828125, -48.494140625, -45.60546875, -42.716796875, -39.828125, -36.939453125, -34.05078125, -31.162109375, -28.2734375, -25.384765625, -22.49609375, -19.607421875, -16.71875, -13.830078125, -10.94140625, -8.052734375, -5.1640625, -2.275390625, 0.61328125, 3.501953125, 6.390625, 9.279296875, 12.16796875, 15.056640625, 17.9453125, 20.833984375, 23.72265625, 26.611328125, 29.5, 32.388671875, 35.27734375, 38.166015625, 41.0546875, 43.943359375, 46.83203125, 49.720703125, 52.609375, 55.498046875, 58.38671875, 61.275390625, 64.1640625, 67.052734375, 69.94140625, 72.830078125, 75.71875, 78.607421875, 81.49609375, 84.384765625, 87.2734375, 90.162109375, 93.05078125, 95.939453125, 98.828125, 101.716796875, 104.60546875, 107.494140625, 110.3828125, 113.271484375, 116.16015625, 119.048828125, 121.9375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 9.0, 6.0, 9.0, 16.0, 26.0, 35.0, 82.0, 168.0, 1211.0, 2137.0, 202.0, 69.0, 34.0, 32.0, 12.0, 7.0, 12.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.5037841796875, -11.937255859375, -11.3707275390625, -10.80419921875, -10.2376708984375, -9.671142578125, -9.1046142578125, -8.5380859375, -7.9715576171875, -7.405029296875, -6.8385009765625, -6.27197265625, -5.7054443359375, -5.138916015625, -4.5723876953125, -4.005859375, -3.4393310546875, -2.872802734375, -2.3062744140625, -1.73974609375, -1.1732177734375, -0.606689453125, -0.0401611328125, 0.5263671875, 1.0928955078125, 1.659423828125, 2.2259521484375, 2.79248046875, 3.3590087890625, 3.925537109375, 4.4920654296875, 5.05859375, 5.6251220703125, 6.191650390625, 6.7581787109375, 7.32470703125, 7.8912353515625, 8.457763671875, 9.0242919921875, 9.5908203125, 10.1573486328125, 10.723876953125, 11.2904052734375, 11.85693359375, 12.4234619140625, 12.989990234375, 13.5565185546875, 14.123046875, 14.6895751953125, 15.256103515625, 15.8226318359375, 16.38916015625, 16.9556884765625, 17.522216796875, 18.0887451171875, 18.6552734375, 19.2218017578125, 19.788330078125, 20.3548583984375, 20.92138671875, 21.4879150390625, 22.054443359375, 22.6209716796875, 23.1875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 10.0, 32.0, 217.0, 642.0, 99.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-359.1016540527344, -349.2215576171875, -339.3414611816406, -329.46136474609375, -319.5812683105469, -309.701171875, -299.8210754394531, -289.94097900390625, -280.0608825683594, -270.1807861328125, -260.3006896972656, -250.42059326171875, -240.54049682617188, -230.660400390625, -220.78030395507812, -210.90020751953125, -201.02011108398438, -191.1400146484375, -181.25991821289062, -171.37982177734375, -161.49972534179688, -151.61962890625, -141.73953247070312, -131.85943603515625, -121.97933959960938, -112.0992431640625, -102.21914672851562, -92.33905029296875, -82.45895385742188, -72.578857421875, -62.698760986328125, -52.81866455078125, -42.93853759765625, -33.058441162109375, -23.1783447265625, -13.298248291015625, -3.41815185546875, 6.461944580078125, 16.342041015625, 26.222137451171875, 36.10223388671875, 45.982330322265625, 55.8624267578125, 65.74252319335938, 75.62261962890625, 85.50271606445312, 95.3828125, 105.26290893554688, 115.14300537109375, 125.02310180664062, 134.9031982421875, 144.78329467773438, 154.66339111328125, 164.54348754882812, 174.423583984375, 184.30368041992188, 194.18377685546875, 204.06387329101562, 213.9439697265625, 223.82406616210938, 233.70416259765625, 243.58425903320312, 253.46435546875, 263.3444519042969, 273.22454833984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 11.0, 10.0, 24.0, 35.0, 43.0, 68.0, 67.0, 86.0, 93.0, 95.0, 113.0, 76.0, 77.0, 70.0, 42.0, 27.0, 29.0, 13.0, 9.0, 7.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.95846557617188, -62.82013702392578, -60.68181228637695, -58.54348373413086, -56.405155181884766, -54.26683044433594, -52.128501892089844, -49.99017333984375, -47.851844787597656, -45.71351623535156, -43.575191497802734, -41.43686294555664, -39.29853439331055, -37.16020965576172, -35.021881103515625, -32.88355255126953, -30.745227813720703, -28.606901168823242, -26.46857261657715, -24.330245971679688, -22.191917419433594, -20.053590774536133, -17.915264129638672, -15.776936531066895, -13.638608932495117, -11.50028133392334, -9.361953735351562, -7.223627090454102, -5.085299491882324, -2.946971893310547, -0.8086452484130859, 1.3296823501586914, 3.4680099487304688, 5.606337547302246, 7.744664669036865, 9.882991790771484, 12.021319389343262, 14.159646987915039, 16.2979736328125, 18.436302185058594, 20.574628829956055, 22.712955474853516, 24.85128402709961, 26.98961067199707, 29.12793731689453, 31.266265869140625, 33.40459442138672, 35.54291915893555, 37.68124771118164, 39.819576263427734, 41.95790100097656, 44.096229553222656, 46.23455810546875, 48.372886657714844, 50.51121139526367, 52.649539947509766, 54.787864685058594, 56.92619323730469, 59.064517974853516, 61.20284652709961, 63.3411750793457, 65.47949981689453, 67.61782836914062, 69.75615692138672, 71.89448547363281]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 5.0, 3.0, 5.0, 5.0, 8.0, 16.0, 20.0, 30.0, 46.0, 68.0, 152.0, 253.0, 604.0, 1752.0, 8429.0, 141271.0, 858582.0, 31472.0, 3909.0, 992.0, 429.0, 210.0, 115.0, 65.0, 35.0, 23.0, 17.0, 14.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -33.54150390625, -31.8017578125, -30.06201171875, -28.322265625, -26.58251953125, -24.8427734375, -23.10302734375, -21.36328125, -19.62353515625, -17.8837890625, -16.14404296875, -14.404296875, -12.66455078125, -10.9248046875, -9.18505859375, -7.4453125, -5.70556640625, -3.9658203125, -2.22607421875, -0.486328125, 1.25341796875, 2.9931640625, 4.73291015625, 6.47265625, 8.21240234375, 9.9521484375, 11.69189453125, 13.431640625, 15.17138671875, 16.9111328125, 18.65087890625, 20.390625, 22.13037109375, 23.8701171875, 25.60986328125, 27.349609375, 29.08935546875, 30.8291015625, 32.56884765625, 34.30859375, 36.04833984375, 37.7880859375, 39.52783203125, 41.267578125, 43.00732421875, 44.7470703125, 46.48681640625, 48.2265625, 49.96630859375, 51.7060546875, 53.44580078125, 55.185546875, 56.92529296875, 58.6650390625, 60.40478515625, 62.14453125, 63.88427734375, 65.6240234375, 67.36376953125, 69.103515625, 70.84326171875, 72.5830078125, 74.32275390625, 76.0625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 10.0, 14.0, 25.0, 39.0, 57.0, 96.0, 119.0, 126.0, 128.0, 116.0, 81.0, 73.0, 49.0, 33.0, 16.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.873046875, -2.705718994140625, -2.53839111328125, -2.371063232421875, -2.2037353515625, -2.036407470703125, -1.86907958984375, -1.701751708984375, -1.534423828125, -1.367095947265625, -1.19976806640625, -1.032440185546875, -0.8651123046875, -0.697784423828125, -0.53045654296875, -0.363128662109375, -0.19580078125, -0.028472900390625, 0.13885498046875, 0.306182861328125, 0.4735107421875, 0.640838623046875, 0.80816650390625, 0.975494384765625, 1.142822265625, 1.310150146484375, 1.47747802734375, 1.644805908203125, 1.8121337890625, 1.979461669921875, 2.14678955078125, 2.314117431640625, 2.4814453125, 2.648773193359375, 2.81610107421875, 2.983428955078125, 3.1507568359375, 3.318084716796875, 3.48541259765625, 3.652740478515625, 3.820068359375, 3.987396240234375, 4.15472412109375, 4.322052001953125, 4.4893798828125, 4.656707763671875, 4.82403564453125, 4.991363525390625, 5.15869140625, 5.326019287109375, 5.49334716796875, 5.660675048828125, 5.8280029296875, 5.995330810546875, 6.16265869140625, 6.329986572265625, 6.497314453125, 6.664642333984375, 6.83197021484375, 6.999298095703125, 7.1666259765625, 7.333953857421875, 7.50128173828125, 7.668609619140625, 7.8359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 6.0, 9.0, 20.0, 11.0, 26.0, 31.0, 52.0, 54.0, 97.0, 145.0, 233.0, 365.0, 654.0, 1331.0, 3103.0, 9071.0, 34316.0, 168333.0, 604668.0, 174055.0, 35820.0, 9675.0, 3301.0, 1463.0, 694.0, 351.0, 224.0, 122.0, 89.0, 65.0, 34.0, 41.0, 28.0, 16.0, 16.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.34375, -18.783203125, -18.22265625, -17.662109375, -17.1015625, -16.541015625, -15.98046875, -15.419921875, -14.859375, -14.298828125, -13.73828125, -13.177734375, -12.6171875, -12.056640625, -11.49609375, -10.935546875, -10.375, -9.814453125, -9.25390625, -8.693359375, -8.1328125, -7.572265625, -7.01171875, -6.451171875, -5.890625, -5.330078125, -4.76953125, -4.208984375, -3.6484375, -3.087890625, -2.52734375, -1.966796875, -1.40625, -0.845703125, -0.28515625, 0.275390625, 0.8359375, 1.396484375, 1.95703125, 2.517578125, 3.078125, 3.638671875, 4.19921875, 4.759765625, 5.3203125, 5.880859375, 6.44140625, 7.001953125, 7.5625, 8.123046875, 8.68359375, 9.244140625, 9.8046875, 10.365234375, 10.92578125, 11.486328125, 12.046875, 12.607421875, 13.16796875, 13.728515625, 14.2890625, 14.849609375, 15.41015625, 15.970703125, 16.53125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 3.0, 2.0, 9.0, 6.0, 5.0, 12.0, 9.0, 12.0, 15.0, 16.0, 17.0, 24.0, 22.0, 26.0, 24.0, 28.0, 33.0, 47.0, 25.0, 51.0, 35.0, 39.0, 41.0, 47.0, 35.0, 50.0, 39.0, 35.0, 40.0, 33.0, 38.0, 27.0, 35.0, 17.0, 14.0, 19.0, 14.0, 6.0, 12.0, 6.0, 10.0, 8.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.2890625, -9.98974609375, -9.6904296875, -9.39111328125, -9.091796875, -8.79248046875, -8.4931640625, -8.19384765625, -7.89453125, -7.59521484375, -7.2958984375, -6.99658203125, -6.697265625, -6.39794921875, -6.0986328125, -5.79931640625, -5.5, -5.20068359375, -4.9013671875, -4.60205078125, -4.302734375, -4.00341796875, -3.7041015625, -3.40478515625, -3.10546875, -2.80615234375, -2.5068359375, -2.20751953125, -1.908203125, -1.60888671875, -1.3095703125, -1.01025390625, -0.7109375, -0.41162109375, -0.1123046875, 0.18701171875, 0.486328125, 0.78564453125, 1.0849609375, 1.38427734375, 1.68359375, 1.98291015625, 2.2822265625, 2.58154296875, 2.880859375, 3.18017578125, 3.4794921875, 3.77880859375, 4.078125, 4.37744140625, 4.6767578125, 4.97607421875, 5.275390625, 5.57470703125, 5.8740234375, 6.17333984375, 6.47265625, 6.77197265625, 7.0712890625, 7.37060546875, 7.669921875, 7.96923828125, 8.2685546875, 8.56787109375, 8.8671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 9.0, 17.0, 13.0, 38.0, 83.0, 131.0, 311.0, 744.0, 1739.0, 4737.0, 14584.0, 75265.0, 761556.0, 157427.0, 21582.0, 6330.0, 2369.0, 894.0, 361.0, 175.0, 77.0, 47.0, 19.0, 13.0, 8.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.0089111328125, -8.572509765625, -8.1361083984375, -7.69970703125, -7.2633056640625, -6.826904296875, -6.3905029296875, -5.9541015625, -5.5177001953125, -5.081298828125, -4.6448974609375, -4.20849609375, -3.7720947265625, -3.335693359375, -2.8992919921875, -2.462890625, -2.0264892578125, -1.590087890625, -1.1536865234375, -0.71728515625, -0.2808837890625, 0.155517578125, 0.5919189453125, 1.0283203125, 1.4647216796875, 1.901123046875, 2.3375244140625, 2.77392578125, 3.2103271484375, 3.646728515625, 4.0831298828125, 4.51953125, 4.9559326171875, 5.392333984375, 5.8287353515625, 6.26513671875, 6.7015380859375, 7.137939453125, 7.5743408203125, 8.0107421875, 8.4471435546875, 8.883544921875, 9.3199462890625, 9.75634765625, 10.1927490234375, 10.629150390625, 11.0655517578125, 11.501953125, 11.9383544921875, 12.374755859375, 12.8111572265625, 13.24755859375, 13.6839599609375, 14.120361328125, 14.5567626953125, 14.9931640625, 15.4295654296875, 15.865966796875, 16.3023681640625, 16.73876953125, 17.1751708984375, 17.611572265625, 18.0479736328125, 18.484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 11.0, 4.0, 14.0, 13.0, 13.0, 30.0, 36.0, 86.0, 165.0, 269.0, 158.0, 75.0, 49.0, 23.0, 20.0, 10.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022830963134765625, -0.0021968185901641846, -0.0021105408668518066, -0.0020242631435394287, -0.0019379854202270508, -0.0018517076969146729, -0.001765429973602295, -0.001679152250289917, -0.001592874526977539, -0.0015065968036651611, -0.0014203190803527832, -0.0013340413570404053, -0.0012477636337280273, -0.0011614859104156494, -0.0010752081871032715, -0.0009889304637908936, -0.0009026527404785156, -0.0008163750171661377, -0.0007300972938537598, -0.0006438195705413818, -0.0005575418472290039, -0.000471264123916626, -0.00038498640060424805, -0.0002987086772918701, -0.0002124309539794922, -0.00012615323066711426, -3.987550735473633e-05, 4.64022159576416e-05, 0.00013267993927001953, 0.00021895766258239746, 0.0003052353858947754, 0.0003915131092071533, 0.00047779083251953125, 0.0005640685558319092, 0.0006503462791442871, 0.000736624002456665, 0.000822901725769043, 0.0009091794490814209, 0.0009954571723937988, 0.0010817348957061768, 0.0011680126190185547, 0.0012542903423309326, 0.0013405680656433105, 0.0014268457889556885, 0.0015131235122680664, 0.0015994012355804443, 0.0016856789588928223, 0.0017719566822052002, 0.0018582344055175781, 0.001944512128829956, 0.002030789852142334, 0.002117067575454712, 0.00220334529876709, 0.0022896230220794678, 0.0023759007453918457, 0.0024621784687042236, 0.0025484561920166016, 0.0026347339153289795, 0.0027210116386413574, 0.0028072893619537354, 0.0028935670852661133, 0.002979844808578491, 0.003066122531890869, 0.003152400255203247, 0.003238677978515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 11.0, 8.0, 19.0, 18.0, 32.0, 44.0, 103.0, 168.0, 304.0, 480.0, 1195.0, 3073.0, 9075.0, 35899.0, 593416.0, 364251.0, 28130.0, 7463.0, 2681.0, 1036.0, 477.0, 260.0, 128.0, 91.0, 56.0, 44.0, 20.0, 20.0, 12.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.421875, -16.9083251953125, -16.394775390625, -15.8812255859375, -15.36767578125, -14.8541259765625, -14.340576171875, -13.8270263671875, -13.3134765625, -12.7999267578125, -12.286376953125, -11.7728271484375, -11.25927734375, -10.7457275390625, -10.232177734375, -9.7186279296875, -9.205078125, -8.6915283203125, -8.177978515625, -7.6644287109375, -7.15087890625, -6.6373291015625, -6.123779296875, -5.6102294921875, -5.0966796875, -4.5831298828125, -4.069580078125, -3.5560302734375, -3.04248046875, -2.5289306640625, -2.015380859375, -1.5018310546875, -0.98828125, -0.4747314453125, 0.038818359375, 0.5523681640625, 1.06591796875, 1.5794677734375, 2.093017578125, 2.6065673828125, 3.1201171875, 3.6336669921875, 4.147216796875, 4.6607666015625, 5.17431640625, 5.6878662109375, 6.201416015625, 6.7149658203125, 7.228515625, 7.7420654296875, 8.255615234375, 8.7691650390625, 9.28271484375, 9.7962646484375, 10.309814453125, 10.8233642578125, 11.3369140625, 11.8504638671875, 12.364013671875, 12.8775634765625, 13.39111328125, 13.9046630859375, 14.418212890625, 14.9317626953125, 15.4453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 9.0, 13.0, 8.0, 21.0, 27.0, 35.0, 68.0, 76.0, 123.0, 142.0, 148.0, 102.0, 55.0, 38.0, 24.0, 15.0, 14.0, 17.0, 5.0, 10.0, 6.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8831787109375, -7.641357421875, -7.3995361328125, -7.15771484375, -6.9158935546875, -6.674072265625, -6.4322509765625, -6.1904296875, -5.9486083984375, -5.706787109375, -5.4649658203125, -5.22314453125, -4.9813232421875, -4.739501953125, -4.4976806640625, -4.255859375, -4.0140380859375, -3.772216796875, -3.5303955078125, -3.28857421875, -3.0467529296875, -2.804931640625, -2.5631103515625, -2.3212890625, -2.0794677734375, -1.837646484375, -1.5958251953125, -1.35400390625, -1.1121826171875, -0.870361328125, -0.6285400390625, -0.38671875, -0.1448974609375, 0.096923828125, 0.3387451171875, 0.58056640625, 0.8223876953125, 1.064208984375, 1.3060302734375, 1.5478515625, 1.7896728515625, 2.031494140625, 2.2733154296875, 2.51513671875, 2.7569580078125, 2.998779296875, 3.2406005859375, 3.482421875, 3.7242431640625, 3.966064453125, 4.2078857421875, 4.44970703125, 4.6915283203125, 4.933349609375, 5.1751708984375, 5.4169921875, 5.6588134765625, 5.900634765625, 6.1424560546875, 6.38427734375, 6.6260986328125, 6.867919921875, 7.1097412109375, 7.3515625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 10.0, 16.0, 54.0, 149.0, 238.0, 296.0, 148.0, 51.0, 35.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.10647583007812, -84.15635681152344, -77.20623779296875, -70.2561264038086, -63.306007385253906, -56.35588836669922, -49.4057731628418, -42.455657958984375, -35.50553894042969, -28.555421829223633, -21.605304718017578, -14.655187606811523, -7.705070495605469, -0.7549514770507812, 6.195163726806641, 13.145278930664062, 20.09539794921875, 27.045515060424805, 33.99563217163086, 40.94574737548828, 47.89586639404297, 54.845985412597656, 61.79610061645508, 68.7462158203125, 75.69633483886719, 82.64645385742188, 89.59657287597656, 96.54668426513672, 103.4968032836914, 110.4469223022461, 117.39703369140625, 124.34715270996094, 131.29727172851562, 138.2473907470703, 145.197509765625, 152.1476287841797, 159.09774780273438, 166.0478515625, 172.9979705810547, 179.94808959960938, 186.89820861816406, 193.84832763671875, 200.79844665527344, 207.74856567382812, 214.69866943359375, 221.6488037109375, 228.59890747070312, 235.5490264892578, 242.4991455078125, 249.4492645263672, 256.3993835449219, 263.3494873046875, 270.29962158203125, 277.2497253417969, 284.1998596191406, 291.14996337890625, 298.10009765625, 305.0502014160156, 312.0003356933594, 318.950439453125, 325.90057373046875, 332.8506774902344, 339.8008117675781, 346.75091552734375, 353.7010192871094]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 9.0, 6.0, 21.0, 25.0, 29.0, 37.0, 39.0, 39.0, 64.0, 60.0, 72.0, 64.0, 58.0, 66.0, 70.0, 61.0, 48.0, 43.0, 36.0, 29.0, 23.0, 23.0, 18.0, 10.0, 11.0, 10.0, 6.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.23942565917969, -77.6066665649414, -74.9738998413086, -72.34114074707031, -69.7083740234375, -67.07561492919922, -64.44285583496094, -61.81009292602539, -59.177330017089844, -56.5445671081543, -53.91180419921875, -51.27904510498047, -48.64628219604492, -46.013519287109375, -43.380760192871094, -40.74799728393555, -38.115234375, -35.48247146606445, -32.849708557128906, -30.216949462890625, -27.584186553955078, -24.95142364501953, -22.318662643432617, -19.685901641845703, -17.053138732910156, -14.420376777648926, -11.787614822387695, -9.154852867126465, -6.522090911865234, -3.889328956604004, -1.2565670013427734, 1.3761940002441406, 4.008964538574219, 6.641726493835449, 9.27448844909668, 11.90725040435791, 14.54001235961914, 17.172775268554688, 19.8055362701416, 22.438297271728516, 25.071060180664062, 27.70382308959961, 30.336584091186523, 32.96934509277344, 35.602108001708984, 38.23487091064453, 40.86763000488281, 43.50039291381836, 46.133155822753906, 48.76591873168945, 51.398681640625, 54.03144073486328, 56.66420364379883, 59.296966552734375, 61.929725646972656, 64.56248474121094, 67.19525146484375, 69.82801055908203, 72.46077728271484, 75.09353637695312, 77.72630310058594, 80.35906219482422, 82.9918212890625, 85.62458801269531, 88.2573471069336]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 16.0, 18.0, 25.0, 33.0, 56.0, 71.0, 112.0, 188.0, 345.0, 678.0, 1714.0, 4998.0, 24777.0, 3919205.0, 223939.0, 12288.0, 3153.0, 1135.0, 520.0, 321.0, 205.0, 120.0, 80.0, 63.0, 43.0, 39.0, 27.0, 27.0, 18.0, 17.0, 14.0, 4.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.46875, -30.2958984375, -29.123046875, -27.9501953125, -26.77734375, -25.6044921875, -24.431640625, -23.2587890625, -22.0859375, -20.9130859375, -19.740234375, -18.5673828125, -17.39453125, -16.2216796875, -15.048828125, -13.8759765625, -12.703125, -11.5302734375, -10.357421875, -9.1845703125, -8.01171875, -6.8388671875, -5.666015625, -4.4931640625, -3.3203125, -2.1474609375, -0.974609375, 0.1982421875, 1.37109375, 2.5439453125, 3.716796875, 4.8896484375, 6.0625, 7.2353515625, 8.408203125, 9.5810546875, 10.75390625, 11.9267578125, 13.099609375, 14.2724609375, 15.4453125, 16.6181640625, 17.791015625, 18.9638671875, 20.13671875, 21.3095703125, 22.482421875, 23.6552734375, 24.828125, 26.0009765625, 27.173828125, 28.3466796875, 29.51953125, 30.6923828125, 31.865234375, 33.0380859375, 34.2109375, 35.3837890625, 36.556640625, 37.7294921875, 38.90234375, 40.0751953125, 41.248046875, 42.4208984375, 43.59375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 15.0, 21.0, 23.0, 42.0, 42.0, 47.0, 77.0, 58.0, 86.0, 89.0, 84.0, 78.0, 69.0, 65.0, 41.0, 35.0, 36.0, 30.0, 14.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.79296875, -2.68121337890625, -2.5694580078125, -2.45770263671875, -2.345947265625, -2.23419189453125, -2.1224365234375, -2.01068115234375, -1.89892578125, -1.78717041015625, -1.6754150390625, -1.56365966796875, -1.451904296875, -1.34014892578125, -1.2283935546875, -1.11663818359375, -1.0048828125, -0.89312744140625, -0.7813720703125, -0.66961669921875, -0.557861328125, -0.44610595703125, -0.3343505859375, -0.22259521484375, -0.11083984375, 0.00091552734375, 0.1126708984375, 0.22442626953125, 0.336181640625, 0.44793701171875, 0.5596923828125, 0.67144775390625, 0.783203125, 0.89495849609375, 1.0067138671875, 1.11846923828125, 1.230224609375, 1.34197998046875, 1.4537353515625, 1.56549072265625, 1.67724609375, 1.78900146484375, 1.9007568359375, 2.01251220703125, 2.124267578125, 2.23602294921875, 2.3477783203125, 2.45953369140625, 2.5712890625, 2.68304443359375, 2.7947998046875, 2.90655517578125, 3.018310546875, 3.13006591796875, 3.2418212890625, 3.35357666015625, 3.46533203125, 3.57708740234375, 3.6888427734375, 3.80059814453125, 3.912353515625, 4.02410888671875, 4.1358642578125, 4.24761962890625, 4.359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 10.0, 15.0, 42.0, 60.0, 143.0, 350.0, 786.0, 2152.0, 6020.0, 21718.0, 280211.0, 3812606.0, 54292.0, 10368.0, 3314.0, 1270.0, 482.0, 214.0, 96.0, 39.0, 24.0, 12.0, 3.0, 6.0, 5.0, 3.0, 8.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0, -31.037353515625, -30.07470703125, -29.112060546875, -28.1494140625, -27.186767578125, -26.22412109375, -25.261474609375, -24.298828125, -23.336181640625, -22.37353515625, -21.410888671875, -20.4482421875, -19.485595703125, -18.52294921875, -17.560302734375, -16.59765625, -15.635009765625, -14.67236328125, -13.709716796875, -12.7470703125, -11.784423828125, -10.82177734375, -9.859130859375, -8.896484375, -7.933837890625, -6.97119140625, -6.008544921875, -5.0458984375, -4.083251953125, -3.12060546875, -2.157958984375, -1.1953125, -0.232666015625, 0.72998046875, 1.692626953125, 2.6552734375, 3.617919921875, 4.58056640625, 5.543212890625, 6.505859375, 7.468505859375, 8.43115234375, 9.393798828125, 10.3564453125, 11.319091796875, 12.28173828125, 13.244384765625, 14.20703125, 15.169677734375, 16.13232421875, 17.094970703125, 18.0576171875, 19.020263671875, 19.98291015625, 20.945556640625, 21.908203125, 22.870849609375, 23.83349609375, 24.796142578125, 25.7587890625, 26.721435546875, 27.68408203125, 28.646728515625, 29.609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 5.0, 4.0, 7.0, 7.0, 16.0, 21.0, 24.0, 35.0, 65.0, 116.0, 251.0, 848.0, 1898.0, 361.0, 143.0, 84.0, 49.0, 24.0, 17.0, 19.0, 10.0, 6.0, 4.0, 7.0, 6.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.98883056640625, -6.7901611328125, -6.59149169921875, -6.392822265625, -6.19415283203125, -5.9954833984375, -5.79681396484375, -5.59814453125, -5.39947509765625, -5.2008056640625, -5.00213623046875, -4.803466796875, -4.60479736328125, -4.4061279296875, -4.20745849609375, -4.0087890625, -3.81011962890625, -3.6114501953125, -3.41278076171875, -3.214111328125, -3.01544189453125, -2.8167724609375, -2.61810302734375, -2.41943359375, -2.22076416015625, -2.0220947265625, -1.82342529296875, -1.624755859375, -1.42608642578125, -1.2274169921875, -1.02874755859375, -0.830078125, -0.63140869140625, -0.4327392578125, -0.23406982421875, -0.035400390625, 0.16326904296875, 0.3619384765625, 0.56060791015625, 0.75927734375, 0.95794677734375, 1.1566162109375, 1.35528564453125, 1.553955078125, 1.75262451171875, 1.9512939453125, 2.14996337890625, 2.3486328125, 2.54730224609375, 2.7459716796875, 2.94464111328125, 3.143310546875, 3.34197998046875, 3.5406494140625, 3.73931884765625, 3.93798828125, 4.13665771484375, 4.3353271484375, 4.53399658203125, 4.732666015625, 4.93133544921875, 5.1300048828125, 5.32867431640625, 5.52734375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 12.0, 23.0, 46.0, 99.0, 181.0, 244.0, 191.0, 114.0, 51.0, 17.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.51774597167969, -68.58991241455078, -66.66207885742188, -64.73424530029297, -62.80641555786133, -60.87858200073242, -58.95075225830078, -57.022918701171875, -55.09508514404297, -53.16725158691406, -51.239418029785156, -49.311588287353516, -47.38375473022461, -45.4559211730957, -43.52809143066406, -41.600257873535156, -39.67242431640625, -37.744590759277344, -35.81675720214844, -33.8889274597168, -31.96109390258789, -30.033260345458984, -28.10542869567871, -26.177597045898438, -24.24976348876953, -22.321929931640625, -20.39409828186035, -18.466266632080078, -16.538433074951172, -14.610600471496582, -12.682767868041992, -10.754935264587402, -8.827102661132812, -6.899270057678223, -4.971437454223633, -3.043604850769043, -1.1157722473144531, 0.8120603561401367, 2.7398929595947266, 4.667725563049316, 6.595558166503906, 8.523390769958496, 10.451223373413086, 12.379055976867676, 14.306888580322266, 16.234722137451172, 18.162553787231445, 20.09038543701172, 22.018218994140625, 23.94605255126953, 25.873884201049805, 27.801715850830078, 29.729549407958984, 31.65738296508789, 33.58521270751953, 35.51304626464844, 37.440879821777344, 39.36871337890625, 41.296546936035156, 43.2243766784668, 45.1522102355957, 47.08004379272461, 49.00787353515625, 50.935707092285156, 52.86354064941406]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 10.0, 5.0, 8.0, 12.0, 12.0, 18.0, 18.0, 22.0, 20.0, 27.0, 41.0, 40.0, 42.0, 51.0, 67.0, 54.0, 53.0, 64.0, 55.0, 53.0, 46.0, 40.0, 35.0, 38.0, 33.0, 36.0, 16.0, 21.0, 16.0, 10.0, 12.0, 7.0, 11.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.39090347290039, -26.648557662963867, -25.906211853027344, -25.16386604309082, -24.421520233154297, -23.67917251586914, -22.936826705932617, -22.194480895996094, -21.45213508605957, -20.709789276123047, -19.967443466186523, -19.22509765625, -18.482749938964844, -17.74040412902832, -16.998058319091797, -16.255712509155273, -15.51336669921875, -14.771020889282227, -14.028675079345703, -13.286328315734863, -12.54398250579834, -11.801636695861816, -11.059289932250977, -10.316944122314453, -9.57459831237793, -8.832252502441406, -8.089906692504883, -7.347559928894043, -6.6052141189575195, -5.862868309020996, -5.1205220222473145, -4.378175735473633, -3.635831832885742, -2.8934857845306396, -2.151139736175537, -1.4087936878204346, -0.666447639465332, 0.07589840888977051, 0.818244457244873, 1.5605907440185547, 2.302936553955078, 3.0452826023101807, 3.787628650665283, 4.529974937438965, 5.272320747375488, 6.014666557312012, 6.757012844085693, 7.499359130859375, 8.241704940795898, 8.984050750732422, 9.726396560668945, 10.468743324279785, 11.211089134216309, 11.953434944152832, 12.695781707763672, 13.438127517700195, 14.180473327636719, 14.922819137573242, 15.665164947509766, 16.40751075744629, 17.149856567382812, 17.89220428466797, 18.634550094604492, 19.376895904541016, 20.11924171447754]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 9.0, 13.0, 21.0, 31.0, 33.0, 65.0, 81.0, 107.0, 188.0, 324.0, 516.0, 994.0, 2183.0, 6082.0, 23480.0, 156394.0, 713914.0, 115516.0, 19151.0, 5356.0, 1984.0, 897.0, 432.0, 290.0, 163.0, 103.0, 75.0, 50.0, 23.0, 25.0, 7.0, 9.0, 10.0, 10.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.109375, -24.194091796875, -23.27880859375, -22.363525390625, -21.4482421875, -20.532958984375, -19.61767578125, -18.702392578125, -17.787109375, -16.871826171875, -15.95654296875, -15.041259765625, -14.1259765625, -13.210693359375, -12.29541015625, -11.380126953125, -10.46484375, -9.549560546875, -8.63427734375, -7.718994140625, -6.8037109375, -5.888427734375, -4.97314453125, -4.057861328125, -3.142578125, -2.227294921875, -1.31201171875, -0.396728515625, 0.5185546875, 1.433837890625, 2.34912109375, 3.264404296875, 4.1796875, 5.094970703125, 6.01025390625, 6.925537109375, 7.8408203125, 8.756103515625, 9.67138671875, 10.586669921875, 11.501953125, 12.417236328125, 13.33251953125, 14.247802734375, 15.1630859375, 16.078369140625, 16.99365234375, 17.908935546875, 18.82421875, 19.739501953125, 20.65478515625, 21.570068359375, 22.4853515625, 23.400634765625, 24.31591796875, 25.231201171875, 26.146484375, 27.061767578125, 27.97705078125, 28.892333984375, 29.8076171875, 30.722900390625, 31.63818359375, 32.553466796875, 33.46875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 14.0, 16.0, 28.0, 36.0, 34.0, 61.0, 69.0, 73.0, 82.0, 99.0, 81.0, 75.0, 63.0, 53.0, 55.0, 35.0, 34.0, 18.0, 25.0, 13.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.9029541015625, -2.786376953125, -2.6697998046875, -2.55322265625, -2.4366455078125, -2.320068359375, -2.2034912109375, -2.0869140625, -1.9703369140625, -1.853759765625, -1.7371826171875, -1.62060546875, -1.5040283203125, -1.387451171875, -1.2708740234375, -1.154296875, -1.0377197265625, -0.921142578125, -0.8045654296875, -0.68798828125, -0.5714111328125, -0.454833984375, -0.3382568359375, -0.2216796875, -0.1051025390625, 0.011474609375, 0.1280517578125, 0.24462890625, 0.3612060546875, 0.477783203125, 0.5943603515625, 0.7109375, 0.8275146484375, 0.944091796875, 1.0606689453125, 1.17724609375, 1.2938232421875, 1.410400390625, 1.5269775390625, 1.6435546875, 1.7601318359375, 1.876708984375, 1.9932861328125, 2.10986328125, 2.2264404296875, 2.343017578125, 2.4595947265625, 2.576171875, 2.6927490234375, 2.809326171875, 2.9259033203125, 3.04248046875, 3.1590576171875, 3.275634765625, 3.3922119140625, 3.5087890625, 3.6253662109375, 3.741943359375, 3.8585205078125, 3.97509765625, 4.0916748046875, 4.208251953125, 4.3248291015625, 4.44140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 8.0, 10.0, 14.0, 30.0, 37.0, 47.0, 74.0, 101.0, 158.0, 220.0, 324.0, 478.0, 843.0, 1840.0, 4959.0, 17975.0, 87121.0, 499862.0, 353992.0, 59759.0, 13115.0, 3965.0, 1505.0, 716.0, 443.0, 283.0, 197.0, 149.0, 88.0, 61.0, 53.0, 32.0, 31.0, 16.0, 8.0, 16.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.03125, -16.513427734375, -15.99560546875, -15.477783203125, -14.9599609375, -14.442138671875, -13.92431640625, -13.406494140625, -12.888671875, -12.370849609375, -11.85302734375, -11.335205078125, -10.8173828125, -10.299560546875, -9.78173828125, -9.263916015625, -8.74609375, -8.228271484375, -7.71044921875, -7.192626953125, -6.6748046875, -6.156982421875, -5.63916015625, -5.121337890625, -4.603515625, -4.085693359375, -3.56787109375, -3.050048828125, -2.5322265625, -2.014404296875, -1.49658203125, -0.978759765625, -0.4609375, 0.056884765625, 0.57470703125, 1.092529296875, 1.6103515625, 2.128173828125, 2.64599609375, 3.163818359375, 3.681640625, 4.199462890625, 4.71728515625, 5.235107421875, 5.7529296875, 6.270751953125, 6.78857421875, 7.306396484375, 7.82421875, 8.342041015625, 8.85986328125, 9.377685546875, 9.8955078125, 10.413330078125, 10.93115234375, 11.448974609375, 11.966796875, 12.484619140625, 13.00244140625, 13.520263671875, 14.0380859375, 14.555908203125, 15.07373046875, 15.591552734375, 16.109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 2.0, 8.0, 17.0, 11.0, 18.0, 29.0, 27.0, 22.0, 34.0, 27.0, 35.0, 43.0, 54.0, 53.0, 37.0, 56.0, 46.0, 50.0, 35.0, 36.0, 45.0, 28.0, 46.0, 34.0, 27.0, 29.0, 22.0, 16.0, 14.0, 22.0, 15.0, 7.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.25, -9.9493408203125, -9.648681640625, -9.3480224609375, -9.04736328125, -8.7467041015625, -8.446044921875, -8.1453857421875, -7.8447265625, -7.5440673828125, -7.243408203125, -6.9427490234375, -6.64208984375, -6.3414306640625, -6.040771484375, -5.7401123046875, -5.439453125, -5.1387939453125, -4.838134765625, -4.5374755859375, -4.23681640625, -3.9361572265625, -3.635498046875, -3.3348388671875, -3.0341796875, -2.7335205078125, -2.432861328125, -2.1322021484375, -1.83154296875, -1.5308837890625, -1.230224609375, -0.9295654296875, -0.62890625, -0.3282470703125, -0.027587890625, 0.2730712890625, 0.57373046875, 0.8743896484375, 1.175048828125, 1.4757080078125, 1.7763671875, 2.0770263671875, 2.377685546875, 2.6783447265625, 2.97900390625, 3.2796630859375, 3.580322265625, 3.8809814453125, 4.181640625, 4.4822998046875, 4.782958984375, 5.0836181640625, 5.38427734375, 5.6849365234375, 5.985595703125, 6.2862548828125, 6.5869140625, 6.8875732421875, 7.188232421875, 7.4888916015625, 7.78955078125, 8.0902099609375, 8.390869140625, 8.6915283203125, 8.9921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 6.0, 4.0, 3.0, 9.0, 9.0, 7.0, 14.0, 23.0, 22.0, 58.0, 88.0, 164.0, 382.0, 982.0, 2911.0, 11505.0, 78973.0, 759440.0, 169076.0, 18386.0, 4250.0, 1233.0, 498.0, 222.0, 97.0, 60.0, 30.0, 26.0, 21.0, 10.0, 11.0, 8.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.7578125, -13.348876953125, -12.93994140625, -12.531005859375, -12.1220703125, -11.713134765625, -11.30419921875, -10.895263671875, -10.486328125, -10.077392578125, -9.66845703125, -9.259521484375, -8.8505859375, -8.441650390625, -8.03271484375, -7.623779296875, -7.21484375, -6.805908203125, -6.39697265625, -5.988037109375, -5.5791015625, -5.170166015625, -4.76123046875, -4.352294921875, -3.943359375, -3.534423828125, -3.12548828125, -2.716552734375, -2.3076171875, -1.898681640625, -1.48974609375, -1.080810546875, -0.671875, -0.262939453125, 0.14599609375, 0.554931640625, 0.9638671875, 1.372802734375, 1.78173828125, 2.190673828125, 2.599609375, 3.008544921875, 3.41748046875, 3.826416015625, 4.2353515625, 4.644287109375, 5.05322265625, 5.462158203125, 5.87109375, 6.280029296875, 6.68896484375, 7.097900390625, 7.5068359375, 7.915771484375, 8.32470703125, 8.733642578125, 9.142578125, 9.551513671875, 9.96044921875, 10.369384765625, 10.7783203125, 11.187255859375, 11.59619140625, 12.005126953125, 12.4140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 11.0, 10.0, 22.0, 22.0, 37.0, 31.0, 52.0, 59.0, 118.0, 199.0, 138.0, 82.0, 49.0, 46.0, 25.0, 20.0, 19.0, 15.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020618438720703125, -0.0019966959953308105, -0.0019315481185913086, -0.0018664002418518066, -0.0018012523651123047, -0.0017361044883728027, -0.0016709566116333008, -0.0016058087348937988, -0.0015406608581542969, -0.001475512981414795, -0.001410365104675293, -0.001345217227935791, -0.001280069351196289, -0.0012149214744567871, -0.0011497735977172852, -0.0010846257209777832, -0.0010194778442382812, -0.0009543299674987793, -0.0008891820907592773, -0.0008240342140197754, -0.0007588863372802734, -0.0006937384605407715, -0.0006285905838012695, -0.0005634427070617676, -0.0004982948303222656, -0.00043314695358276367, -0.0003679990768432617, -0.00030285120010375977, -0.0002377033233642578, -0.00017255544662475586, -0.0001074075698852539, -4.225969314575195e-05, 2.288818359375e-05, 8.803606033325195e-05, 0.0001531839370727539, 0.00021833181381225586, 0.0002834796905517578, 0.00034862756729125977, 0.0004137754440307617, 0.00047892332077026367, 0.0005440711975097656, 0.0006092190742492676, 0.0006743669509887695, 0.0007395148277282715, 0.0008046627044677734, 0.0008698105812072754, 0.0009349584579467773, 0.0010001063346862793, 0.0010652542114257812, 0.0011304020881652832, 0.0011955499649047852, 0.0012606978416442871, 0.001325845718383789, 0.001390993595123291, 0.001456141471862793, 0.001521289348602295, 0.0015864372253417969, 0.0016515851020812988, 0.0017167329788208008, 0.0017818808555603027, 0.0018470287322998047, 0.0019121766090393066, 0.0019773244857788086, 0.0020424723625183105, 0.0021076202392578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 7.0, 10.0, 13.0, 29.0, 31.0, 91.0, 169.0, 487.0, 1839.0, 16156.0, 954004.0, 70830.0, 3654.0, 699.0, 256.0, 120.0, 56.0, 26.0, 23.0, 13.0, 8.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.140625, -29.189453125, -28.23828125, -27.287109375, -26.3359375, -25.384765625, -24.43359375, -23.482421875, -22.53125, -21.580078125, -20.62890625, -19.677734375, -18.7265625, -17.775390625, -16.82421875, -15.873046875, -14.921875, -13.970703125, -13.01953125, -12.068359375, -11.1171875, -10.166015625, -9.21484375, -8.263671875, -7.3125, -6.361328125, -5.41015625, -4.458984375, -3.5078125, -2.556640625, -1.60546875, -0.654296875, 0.296875, 1.248046875, 2.19921875, 3.150390625, 4.1015625, 5.052734375, 6.00390625, 6.955078125, 7.90625, 8.857421875, 9.80859375, 10.759765625, 11.7109375, 12.662109375, 13.61328125, 14.564453125, 15.515625, 16.466796875, 17.41796875, 18.369140625, 19.3203125, 20.271484375, 21.22265625, 22.173828125, 23.125, 24.076171875, 25.02734375, 25.978515625, 26.9296875, 27.880859375, 28.83203125, 29.783203125, 30.734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 7.0, 4.0, 3.0, 12.0, 11.0, 26.0, 33.0, 76.0, 117.0, 161.0, 176.0, 137.0, 81.0, 64.0, 37.0, 16.0, 12.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-12.703125, -12.40960693359375, -12.1160888671875, -11.82257080078125, -11.529052734375, -11.23553466796875, -10.9420166015625, -10.64849853515625, -10.35498046875, -10.06146240234375, -9.7679443359375, -9.47442626953125, -9.180908203125, -8.88739013671875, -8.5938720703125, -8.30035400390625, -8.0068359375, -7.71331787109375, -7.4197998046875, -7.12628173828125, -6.832763671875, -6.53924560546875, -6.2457275390625, -5.95220947265625, -5.65869140625, -5.36517333984375, -5.0716552734375, -4.77813720703125, -4.484619140625, -4.19110107421875, -3.8975830078125, -3.60406494140625, -3.310546875, -3.01702880859375, -2.7235107421875, -2.42999267578125, -2.136474609375, -1.84295654296875, -1.5494384765625, -1.25592041015625, -0.96240234375, -0.66888427734375, -0.3753662109375, -0.08184814453125, 0.211669921875, 0.50518798828125, 0.7987060546875, 1.09222412109375, 1.3857421875, 1.67926025390625, 1.9727783203125, 2.26629638671875, 2.559814453125, 2.85333251953125, 3.1468505859375, 3.44036865234375, 3.73388671875, 4.02740478515625, 4.3209228515625, 4.61444091796875, 4.907958984375, 5.20147705078125, 5.4949951171875, 5.78851318359375, 6.08203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 23.0, 63.0, 112.0, 203.0, 270.0, 201.0, 80.0, 24.0, 15.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-251.78115844726562, -246.55262756347656, -241.3240966796875, -236.09556579589844, -230.86703491210938, -225.6385040283203, -220.40997314453125, -215.18145751953125, -209.95291137695312, -204.72438049316406, -199.495849609375, -194.26731872558594, -189.03878784179688, -183.8102569580078, -178.58172607421875, -173.35321044921875, -168.1246795654297, -162.89614868164062, -157.66761779785156, -152.4390869140625, -147.21055603027344, -141.98202514648438, -136.7534942626953, -131.52496337890625, -126.29644012451172, -121.06790924072266, -115.8393783569336, -110.61084747314453, -105.38232421875, -100.15379333496094, -94.92526245117188, -89.69673156738281, -84.46820068359375, -79.23966979980469, -74.01113891601562, -68.78260803222656, -63.554080963134766, -58.3255500793457, -53.097023010253906, -47.868492126464844, -42.63996124267578, -37.41143035888672, -32.182899475097656, -26.95437240600586, -21.725841522216797, -16.497310638427734, -11.268781661987305, -6.040252685546875, -0.8117218017578125, 4.416808128356934, 9.64533805847168, 14.873867988586426, 20.102397918701172, 25.330928802490234, 30.559457778930664, 35.787986755371094, 41.016517639160156, 46.24504852294922, 51.47357940673828, 56.70210647583008, 61.93063735961914, 67.15916442871094, 72.3876953125, 77.61622619628906, 82.84475708007812]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 5.0, 6.0, 6.0, 10.0, 13.0, 16.0, 17.0, 21.0, 26.0, 24.0, 25.0, 41.0, 20.0, 40.0, 24.0, 43.0, 39.0, 43.0, 44.0, 40.0, 36.0, 53.0, 34.0, 34.0, 47.0, 50.0, 29.0, 32.0, 33.0, 29.0, 24.0, 15.0, 13.0, 11.0, 16.0, 10.0, 5.0, 4.0, 4.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.58219528198242, -52.996856689453125, -51.411521911621094, -49.8261833190918, -48.2408447265625, -46.6555061340332, -45.070167541503906, -43.484832763671875, -41.89949417114258, -40.31415557861328, -38.72882080078125, -37.14348220825195, -35.558143615722656, -33.97280502319336, -32.38746643066406, -30.80213165283203, -29.216793060302734, -27.631454467773438, -26.046117782592773, -24.46078109741211, -22.875442504882812, -21.290103912353516, -19.70476722717285, -18.119430541992188, -16.53409194946289, -14.94875431060791, -13.36341667175293, -11.77807903289795, -10.192741394042969, -8.607403755187988, -7.022066116333008, -5.436728477478027, -3.8513870239257812, -2.266049385070801, -0.6807117462158203, 0.9046258926391602, 2.4899635314941406, 4.075301170349121, 5.660638809204102, 7.245976448059082, 8.831314086914062, 10.416651725769043, 12.001989364624023, 13.587327003479004, 15.172664642333984, 16.75800323486328, 18.343339920043945, 19.92867660522461, 21.514015197753906, 23.099353790283203, 24.684690475463867, 26.27002716064453, 27.855365753173828, 29.440704345703125, 31.02604103088379, 32.61137771606445, 34.19671630859375, 35.78205490112305, 37.367393493652344, 38.952728271484375, 40.53806686401367, 42.12340545654297, 43.708740234375, 45.2940788269043, 46.879417419433594]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 15.0, 21.0, 25.0, 39.0, 71.0, 91.0, 185.0, 377.0, 892.0, 2318.0, 8192.0, 63243.0, 4021851.0, 82838.0, 9310.0, 2528.0, 936.0, 464.0, 266.0, 163.0, 89.0, 71.0, 51.0, 61.0, 34.0, 20.0, 21.0, 18.0, 15.0, 8.0, 12.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78125, -20.60693359375, -19.4326171875, -18.25830078125, -17.083984375, -15.90966796875, -14.7353515625, -13.56103515625, -12.38671875, -11.21240234375, -10.0380859375, -8.86376953125, -7.689453125, -6.51513671875, -5.3408203125, -4.16650390625, -2.9921875, -1.81787109375, -0.6435546875, 0.53076171875, 1.705078125, 2.87939453125, 4.0537109375, 5.22802734375, 6.40234375, 7.57666015625, 8.7509765625, 9.92529296875, 11.099609375, 12.27392578125, 13.4482421875, 14.62255859375, 15.796875, 16.97119140625, 18.1455078125, 19.31982421875, 20.494140625, 21.66845703125, 22.8427734375, 24.01708984375, 25.19140625, 26.36572265625, 27.5400390625, 28.71435546875, 29.888671875, 31.06298828125, 32.2373046875, 33.41162109375, 34.5859375, 35.76025390625, 36.9345703125, 38.10888671875, 39.283203125, 40.45751953125, 41.6318359375, 42.80615234375, 43.98046875, 45.15478515625, 46.3291015625, 47.50341796875, 48.677734375, 49.85205078125, 51.0263671875, 52.20068359375, 53.375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 12.0, 16.0, 20.0, 40.0, 36.0, 51.0, 84.0, 94.0, 95.0, 113.0, 105.0, 73.0, 72.0, 50.0, 39.0, 37.0, 18.0, 19.0, 10.0, 4.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.775390625, -2.633148193359375, -2.49090576171875, -2.348663330078125, -2.2064208984375, -2.064178466796875, -1.92193603515625, -1.779693603515625, -1.637451171875, -1.495208740234375, -1.35296630859375, -1.210723876953125, -1.0684814453125, -0.926239013671875, -0.78399658203125, -0.641754150390625, -0.49951171875, -0.357269287109375, -0.21502685546875, -0.072784423828125, 0.0694580078125, 0.211700439453125, 0.35394287109375, 0.496185302734375, 0.638427734375, 0.780670166015625, 0.92291259765625, 1.065155029296875, 1.2073974609375, 1.349639892578125, 1.49188232421875, 1.634124755859375, 1.7763671875, 1.918609619140625, 2.06085205078125, 2.203094482421875, 2.3453369140625, 2.487579345703125, 2.62982177734375, 2.772064208984375, 2.914306640625, 3.056549072265625, 3.19879150390625, 3.341033935546875, 3.4832763671875, 3.625518798828125, 3.76776123046875, 3.910003662109375, 4.05224609375, 4.194488525390625, 4.33673095703125, 4.478973388671875, 4.6212158203125, 4.763458251953125, 4.90570068359375, 5.047943115234375, 5.190185546875, 5.332427978515625, 5.47467041015625, 5.616912841796875, 5.7591552734375, 5.901397705078125, 6.04364013671875, 6.185882568359375, 6.328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 5.0, 1.0, 4.0, 6.0, 13.0, 17.0, 22.0, 44.0, 85.0, 199.0, 510.0, 1398.0, 4301.0, 17936.0, 215234.0, 3866126.0, 73571.0, 10380.0, 2785.0, 956.0, 360.0, 145.0, 75.0, 40.0, 18.0, 14.0, 13.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.3125, -39.28759765625, -38.2626953125, -37.23779296875, -36.212890625, -35.18798828125, -34.1630859375, -33.13818359375, -32.11328125, -31.08837890625, -30.0634765625, -29.03857421875, -28.013671875, -26.98876953125, -25.9638671875, -24.93896484375, -23.9140625, -22.88916015625, -21.8642578125, -20.83935546875, -19.814453125, -18.78955078125, -17.7646484375, -16.73974609375, -15.71484375, -14.68994140625, -13.6650390625, -12.64013671875, -11.615234375, -10.59033203125, -9.5654296875, -8.54052734375, -7.515625, -6.49072265625, -5.4658203125, -4.44091796875, -3.416015625, -2.39111328125, -1.3662109375, -0.34130859375, 0.68359375, 1.70849609375, 2.7333984375, 3.75830078125, 4.783203125, 5.80810546875, 6.8330078125, 7.85791015625, 8.8828125, 9.90771484375, 10.9326171875, 11.95751953125, 12.982421875, 14.00732421875, 15.0322265625, 16.05712890625, 17.08203125, 18.10693359375, 19.1318359375, 20.15673828125, 21.181640625, 22.20654296875, 23.2314453125, 24.25634765625, 25.28125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 6.0, 7.0, 10.0, 13.0, 26.0, 20.0, 42.0, 69.0, 143.0, 326.0, 1538.0, 1247.0, 278.0, 135.0, 67.0, 36.0, 31.0, 20.0, 8.0, 9.0, 10.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.8314208984375, -10.530029296875, -10.2286376953125, -9.92724609375, -9.6258544921875, -9.324462890625, -9.0230712890625, -8.7216796875, -8.4202880859375, -8.118896484375, -7.8175048828125, -7.51611328125, -7.2147216796875, -6.913330078125, -6.6119384765625, -6.310546875, -6.0091552734375, -5.707763671875, -5.4063720703125, -5.10498046875, -4.8035888671875, -4.502197265625, -4.2008056640625, -3.8994140625, -3.5980224609375, -3.296630859375, -2.9952392578125, -2.69384765625, -2.3924560546875, -2.091064453125, -1.7896728515625, -1.48828125, -1.1868896484375, -0.885498046875, -0.5841064453125, -0.28271484375, 0.0186767578125, 0.320068359375, 0.6214599609375, 0.9228515625, 1.2242431640625, 1.525634765625, 1.8270263671875, 2.12841796875, 2.4298095703125, 2.731201171875, 3.0325927734375, 3.333984375, 3.6353759765625, 3.936767578125, 4.2381591796875, 4.53955078125, 4.8409423828125, 5.142333984375, 5.4437255859375, 5.7451171875, 6.0465087890625, 6.347900390625, 6.6492919921875, 6.95068359375, 7.2520751953125, 7.553466796875, 7.8548583984375, 8.15625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 11.0, 44.0, 86.0, 203.0, 337.0, 206.0, 69.0, 30.0, 15.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.18704223632812, -140.9467010498047, -137.70635986328125, -134.46603393554688, -131.22569274902344, -127.9853515625, -124.7450180053711, -121.50467681884766, -118.26434326171875, -115.02400207519531, -111.7836685180664, -108.54332733154297, -105.30299377441406, -102.06265258789062, -98.82231903076172, -95.58197784423828, -92.34164428710938, -89.10130310058594, -85.86096954345703, -82.6206283569336, -79.38029479980469, -76.13995361328125, -72.89962005615234, -69.6592788696289, -66.41893768310547, -63.1786003112793, -59.938262939453125, -56.69792556762695, -53.45758819580078, -50.217247009277344, -46.97691345214844, -43.736572265625, -40.496238708496094, -37.25590133666992, -34.01556396484375, -30.775226593017578, -27.534889221191406, -24.2945499420166, -21.05421257019043, -17.813875198364258, -14.573537826538086, -11.333200454711914, -8.092863082885742, -4.852524757385254, -1.612187385559082, 1.6281509399414062, 4.868488311767578, 8.10882568359375, 11.349163055419922, 14.589500427246094, 17.829837799072266, 21.070175170898438, 24.31051254272461, 27.550851821899414, 30.791189193725586, 34.031524658203125, 37.27186584472656, 40.512203216552734, 43.752540588378906, 46.99287796020508, 50.23321533203125, 53.47355651855469, 56.713890075683594, 59.95423126220703, 63.19456481933594]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 10.0, 10.0, 13.0, 10.0, 21.0, 22.0, 21.0, 29.0, 39.0, 26.0, 42.0, 43.0, 47.0, 43.0, 46.0, 39.0, 54.0, 41.0, 44.0, 40.0, 40.0, 30.0, 37.0, 37.0, 33.0, 31.0, 29.0, 20.0, 17.0, 21.0, 12.0, 13.0, 6.0, 7.0, 2.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.6551513671875, -27.839405059814453, -27.02366065979004, -26.207914352416992, -25.392169952392578, -24.57642364501953, -23.760677337646484, -22.944931030273438, -22.129186630249023, -21.313440322875977, -20.497695922851562, -19.681949615478516, -18.86620330810547, -18.050458908081055, -17.234712600708008, -16.418968200683594, -15.603221893310547, -14.787476539611816, -13.971731185913086, -13.155984878540039, -12.340239524841309, -11.524494171142578, -10.708747863769531, -9.8930025100708, -9.07725715637207, -8.26151180267334, -7.445765972137451, -6.6300201416015625, -5.814274787902832, -4.998529434204102, -4.182783603668213, -3.367037773132324, -2.5512924194335938, -1.7355468273162842, -0.9198012351989746, -0.10405564308166504, 0.7116899490356445, 1.527435302734375, 2.3431811332702637, 3.1589269638061523, 3.974672317504883, 4.790417671203613, 5.606163501739502, 6.421909332275391, 7.237654685974121, 8.053400039672852, 8.869146347045898, 9.684891700744629, 10.50063705444336, 11.31638240814209, 12.13212776184082, 12.947874069213867, 13.763619422912598, 14.579364776611328, 15.395111083984375, 16.210857391357422, 17.026601791381836, 17.842348098754883, 18.658092498779297, 19.473838806152344, 20.28958511352539, 21.105329513549805, 21.92107582092285, 22.736820220947266, 23.552566528320312]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 5.0, 13.0, 17.0, 18.0, 36.0, 49.0, 102.0, 142.0, 367.0, 991.0, 4146.0, 30652.0, 817591.0, 178748.0, 12353.0, 2118.0, 618.0, 264.0, 131.0, 64.0, 41.0, 16.0, 22.0, 17.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.65625, -54.1435546875, -52.630859375, -51.1181640625, -49.60546875, -48.0927734375, -46.580078125, -45.0673828125, -43.5546875, -42.0419921875, -40.529296875, -39.0166015625, -37.50390625, -35.9912109375, -34.478515625, -32.9658203125, -31.453125, -29.9404296875, -28.427734375, -26.9150390625, -25.40234375, -23.8896484375, -22.376953125, -20.8642578125, -19.3515625, -17.8388671875, -16.326171875, -14.8134765625, -13.30078125, -11.7880859375, -10.275390625, -8.7626953125, -7.25, -5.7373046875, -4.224609375, -2.7119140625, -1.19921875, 0.3134765625, 1.826171875, 3.3388671875, 4.8515625, 6.3642578125, 7.876953125, 9.3896484375, 10.90234375, 12.4150390625, 13.927734375, 15.4404296875, 16.953125, 18.4658203125, 19.978515625, 21.4912109375, 23.00390625, 24.5166015625, 26.029296875, 27.5419921875, 29.0546875, 30.5673828125, 32.080078125, 33.5927734375, 35.10546875, 36.6181640625, 38.130859375, 39.6435546875, 41.15625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 10.0, 13.0, 28.0, 48.0, 68.0, 81.0, 79.0, 110.0, 109.0, 110.0, 85.0, 62.0, 67.0, 35.0, 26.0, 30.0, 10.0, 13.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.932373046875, -2.77490234375, -2.617431640625, -2.4599609375, -2.302490234375, -2.14501953125, -1.987548828125, -1.830078125, -1.672607421875, -1.51513671875, -1.357666015625, -1.2001953125, -1.042724609375, -0.88525390625, -0.727783203125, -0.5703125, -0.412841796875, -0.25537109375, -0.097900390625, 0.0595703125, 0.217041015625, 0.37451171875, 0.531982421875, 0.689453125, 0.846923828125, 1.00439453125, 1.161865234375, 1.3193359375, 1.476806640625, 1.63427734375, 1.791748046875, 1.94921875, 2.106689453125, 2.26416015625, 2.421630859375, 2.5791015625, 2.736572265625, 2.89404296875, 3.051513671875, 3.208984375, 3.366455078125, 3.52392578125, 3.681396484375, 3.8388671875, 3.996337890625, 4.15380859375, 4.311279296875, 4.46875, 4.626220703125, 4.78369140625, 4.941162109375, 5.0986328125, 5.256103515625, 5.41357421875, 5.571044921875, 5.728515625, 5.885986328125, 6.04345703125, 6.200927734375, 6.3583984375, 6.515869140625, 6.67333984375, 6.830810546875, 6.98828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 8.0, 19.0, 31.0, 26.0, 57.0, 99.0, 178.0, 253.0, 462.0, 1060.0, 3471.0, 26705.0, 608290.0, 382462.0, 20381.0, 3066.0, 877.0, 426.0, 272.0, 139.0, 105.0, 63.0, 44.0, 20.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.15625, -37.150634765625, -36.14501953125, -35.139404296875, -34.1337890625, -33.128173828125, -32.12255859375, -31.116943359375, -30.111328125, -29.105712890625, -28.10009765625, -27.094482421875, -26.0888671875, -25.083251953125, -24.07763671875, -23.072021484375, -22.06640625, -21.060791015625, -20.05517578125, -19.049560546875, -18.0439453125, -17.038330078125, -16.03271484375, -15.027099609375, -14.021484375, -13.015869140625, -12.01025390625, -11.004638671875, -9.9990234375, -8.993408203125, -7.98779296875, -6.982177734375, -5.9765625, -4.970947265625, -3.96533203125, -2.959716796875, -1.9541015625, -0.948486328125, 0.05712890625, 1.062744140625, 2.068359375, 3.073974609375, 4.07958984375, 5.085205078125, 6.0908203125, 7.096435546875, 8.10205078125, 9.107666015625, 10.11328125, 11.118896484375, 12.12451171875, 13.130126953125, 14.1357421875, 15.141357421875, 16.14697265625, 17.152587890625, 18.158203125, 19.163818359375, 20.16943359375, 21.175048828125, 22.1806640625, 23.186279296875, 24.19189453125, 25.197509765625, 26.203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 10.0, 5.0, 10.0, 14.0, 14.0, 25.0, 35.0, 20.0, 37.0, 39.0, 37.0, 49.0, 60.0, 51.0, 64.0, 58.0, 44.0, 48.0, 58.0, 57.0, 44.0, 37.0, 26.0, 29.0, 36.0, 25.0, 15.0, 17.0, 13.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.7471923828125, -15.306884765625, -14.8665771484375, -14.42626953125, -13.9859619140625, -13.545654296875, -13.1053466796875, -12.6650390625, -12.2247314453125, -11.784423828125, -11.3441162109375, -10.90380859375, -10.4635009765625, -10.023193359375, -9.5828857421875, -9.142578125, -8.7022705078125, -8.261962890625, -7.8216552734375, -7.38134765625, -6.9410400390625, -6.500732421875, -6.0604248046875, -5.6201171875, -5.1798095703125, -4.739501953125, -4.2991943359375, -3.85888671875, -3.4185791015625, -2.978271484375, -2.5379638671875, -2.09765625, -1.6573486328125, -1.217041015625, -0.7767333984375, -0.33642578125, 0.1038818359375, 0.544189453125, 0.9844970703125, 1.4248046875, 1.8651123046875, 2.305419921875, 2.7457275390625, 3.18603515625, 3.6263427734375, 4.066650390625, 4.5069580078125, 4.947265625, 5.3875732421875, 5.827880859375, 6.2681884765625, 6.70849609375, 7.1488037109375, 7.589111328125, 8.0294189453125, 8.4697265625, 8.9100341796875, 9.350341796875, 9.7906494140625, 10.23095703125, 10.6712646484375, 11.111572265625, 11.5518798828125, 11.9921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 13.0, 21.0, 27.0, 44.0, 63.0, 100.0, 208.0, 304.0, 564.0, 1024.0, 2244.0, 6033.0, 22514.0, 184749.0, 758379.0, 54519.0, 10998.0, 3471.0, 1495.0, 740.0, 397.0, 258.0, 136.0, 86.0, 55.0, 32.0, 22.0, 17.0, 17.0, 5.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.1318359375, -12.724609375, -12.3173828125, -11.91015625, -11.5029296875, -11.095703125, -10.6884765625, -10.28125, -9.8740234375, -9.466796875, -9.0595703125, -8.65234375, -8.2451171875, -7.837890625, -7.4306640625, -7.0234375, -6.6162109375, -6.208984375, -5.8017578125, -5.39453125, -4.9873046875, -4.580078125, -4.1728515625, -3.765625, -3.3583984375, -2.951171875, -2.5439453125, -2.13671875, -1.7294921875, -1.322265625, -0.9150390625, -0.5078125, -0.1005859375, 0.306640625, 0.7138671875, 1.12109375, 1.5283203125, 1.935546875, 2.3427734375, 2.75, 3.1572265625, 3.564453125, 3.9716796875, 4.37890625, 4.7861328125, 5.193359375, 5.6005859375, 6.0078125, 6.4150390625, 6.822265625, 7.2294921875, 7.63671875, 8.0439453125, 8.451171875, 8.8583984375, 9.265625, 9.6728515625, 10.080078125, 10.4873046875, 10.89453125, 11.3017578125, 11.708984375, 12.1162109375, 12.5234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 4.0, 7.0, 11.0, 21.0, 33.0, 41.0, 57.0, 157.0, 289.0, 144.0, 58.0, 43.0, 29.0, 19.0, 21.0, 12.0, 10.0, 8.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032329559326171875, -0.0031489431858062744, -0.0030649304389953613, -0.0029809176921844482, -0.002896904945373535, -0.002812892198562622, -0.002728879451751709, -0.002644866704940796, -0.002560853958129883, -0.0024768412113189697, -0.0023928284645080566, -0.0023088157176971436, -0.0022248029708862305, -0.0021407902240753174, -0.0020567774772644043, -0.001972764730453491, -0.0018887519836425781, -0.001804739236831665, -0.001720726490020752, -0.0016367137432098389, -0.0015527009963989258, -0.0014686882495880127, -0.0013846755027770996, -0.0013006627559661865, -0.0012166500091552734, -0.0011326372623443604, -0.0010486245155334473, -0.0009646117687225342, -0.0008805990219116211, -0.000796586275100708, -0.0007125735282897949, -0.0006285607814788818, -0.0005445480346679688, -0.00046053528785705566, -0.0003765225410461426, -0.0002925097942352295, -0.0002084970474243164, -0.00012448430061340332, -4.0471553802490234e-05, 4.354119300842285e-05, 0.00012755393981933594, 0.00021156668663024902, 0.0002955794334411621, 0.0003795921802520752, 0.0004636049270629883, 0.0005476176738739014, 0.0006316304206848145, 0.0007156431674957275, 0.0007996559143066406, 0.0008836686611175537, 0.0009676814079284668, 0.0010516941547393799, 0.001135706901550293, 0.001219719648361206, 0.0013037323951721191, 0.0013877451419830322, 0.0014717578887939453, 0.0015557706356048584, 0.0016397833824157715, 0.0017237961292266846, 0.0018078088760375977, 0.0018918216228485107, 0.001975834369659424, 0.002059847116470337, 0.00214385986328125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 7.0, 11.0, 11.0, 12.0, 24.0, 29.0, 56.0, 77.0, 107.0, 232.0, 427.0, 1001.0, 2725.0, 10817.0, 95438.0, 866257.0, 59174.0, 8105.0, 2251.0, 831.0, 389.0, 210.0, 123.0, 65.0, 47.0, 28.0, 16.0, 17.0, 11.0, 15.0, 6.0, 7.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2109375, -13.6925048828125, -13.174072265625, -12.6556396484375, -12.13720703125, -11.6187744140625, -11.100341796875, -10.5819091796875, -10.0634765625, -9.5450439453125, -9.026611328125, -8.5081787109375, -7.98974609375, -7.4713134765625, -6.952880859375, -6.4344482421875, -5.916015625, -5.3975830078125, -4.879150390625, -4.3607177734375, -3.84228515625, -3.3238525390625, -2.805419921875, -2.2869873046875, -1.7685546875, -1.2501220703125, -0.731689453125, -0.2132568359375, 0.30517578125, 0.8236083984375, 1.342041015625, 1.8604736328125, 2.37890625, 2.8973388671875, 3.415771484375, 3.9342041015625, 4.45263671875, 4.9710693359375, 5.489501953125, 6.0079345703125, 6.5263671875, 7.0447998046875, 7.563232421875, 8.0816650390625, 8.60009765625, 9.1185302734375, 9.636962890625, 10.1553955078125, 10.673828125, 11.1922607421875, 11.710693359375, 12.2291259765625, 12.74755859375, 13.2659912109375, 13.784423828125, 14.3028564453125, 14.8212890625, 15.3397216796875, 15.858154296875, 16.3765869140625, 16.89501953125, 17.4134521484375, 17.931884765625, 18.4503173828125, 18.96875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 7.0, 7.0, 5.0, 16.0, 16.0, 12.0, 29.0, 35.0, 57.0, 70.0, 133.0, 167.0, 147.0, 81.0, 51.0, 49.0, 33.0, 18.0, 16.0, 10.0, 12.0, 5.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7578125, -7.512451171875, -7.26708984375, -7.021728515625, -6.7763671875, -6.531005859375, -6.28564453125, -6.040283203125, -5.794921875, -5.549560546875, -5.30419921875, -5.058837890625, -4.8134765625, -4.568115234375, -4.32275390625, -4.077392578125, -3.83203125, -3.586669921875, -3.34130859375, -3.095947265625, -2.8505859375, -2.605224609375, -2.35986328125, -2.114501953125, -1.869140625, -1.623779296875, -1.37841796875, -1.133056640625, -0.8876953125, -0.642333984375, -0.39697265625, -0.151611328125, 0.09375, 0.339111328125, 0.58447265625, 0.829833984375, 1.0751953125, 1.320556640625, 1.56591796875, 1.811279296875, 2.056640625, 2.302001953125, 2.54736328125, 2.792724609375, 3.0380859375, 3.283447265625, 3.52880859375, 3.774169921875, 4.01953125, 4.264892578125, 4.51025390625, 4.755615234375, 5.0009765625, 5.246337890625, 5.49169921875, 5.737060546875, 5.982421875, 6.227783203125, 6.47314453125, 6.718505859375, 6.9638671875, 7.209228515625, 7.45458984375, 7.699951171875, 7.9453125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 36.0, 132.0, 447.0, 297.0, 72.0, 15.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.8282775878906, -254.632568359375, -243.43685913085938, -232.24114990234375, -221.04544067382812, -209.8497314453125, -198.65402221679688, -187.45831298828125, -176.26260375976562, -165.06689453125, -153.87118530273438, -142.67547607421875, -131.47976684570312, -120.2840576171875, -109.08834838867188, -97.89263916015625, -86.69692993164062, -75.501220703125, -64.30551147460938, -53.10980224609375, -41.914093017578125, -30.7183837890625, -19.522674560546875, -8.32696533203125, 2.868743896484375, 14.064453125, 25.260162353515625, 36.45587158203125, 47.651580810546875, 58.8472900390625, 70.04299926757812, 81.23870849609375, 92.4344482421875, 103.63015747070312, 114.82586669921875, 126.02157592773438, 137.21728515625, 148.41299438476562, 159.60870361328125, 170.80441284179688, 182.0001220703125, 193.19583129882812, 204.39154052734375, 215.58724975585938, 226.782958984375, 237.97866821289062, 249.17437744140625, 260.3700866699219, 271.5657958984375, 282.7615051269531, 293.95721435546875, 305.1529235839844, 316.3486328125, 327.5443420410156, 338.74005126953125, 349.9357604980469, 361.1314697265625, 372.3271789550781, 383.52288818359375, 394.7185974121094, 405.914306640625, 417.1100158691406, 428.30572509765625, 439.5014343261719, 450.6971435546875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 7.0, 8.0, 8.0, 14.0, 14.0, 11.0, 20.0, 19.0, 30.0, 33.0, 34.0, 30.0, 36.0, 51.0, 44.0, 40.0, 51.0, 41.0, 44.0, 47.0, 25.0, 55.0, 30.0, 38.0, 43.0, 42.0, 26.0, 27.0, 23.0, 20.0, 14.0, 17.0, 9.0, 9.0, 8.0, 4.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-66.44593048095703, -64.49459838867188, -62.54326248168945, -60.59192657470703, -58.640594482421875, -56.68925857543945, -54.73792266845703, -52.786590576171875, -50.83525466918945, -48.88391876220703, -46.932586669921875, -44.98125076293945, -43.0299186706543, -41.078582763671875, -39.12725067138672, -37.1759147644043, -35.224578857421875, -33.27324295043945, -31.321910858154297, -29.370574951171875, -27.419240951538086, -25.467906951904297, -23.516572952270508, -21.56523895263672, -19.613906860351562, -17.662572860717773, -15.711237907409668, -13.759903907775879, -11.808568954467773, -9.857234954833984, -7.905900955200195, -5.95456600189209, -4.003231048583984, -2.051896572113037, -0.10056233406066895, 1.8507719039916992, 3.8021063804626465, 5.753440856933594, 7.704774856567383, 9.656109809875488, 11.607443809509277, 13.558777809143066, 15.510112762451172, 17.46144676208496, 19.41278076171875, 21.364116668701172, 23.315448760986328, 25.26678466796875, 27.21811866760254, 29.169452667236328, 31.120786666870117, 33.072120666503906, 35.02345657348633, 36.97479248046875, 38.926124572753906, 40.87746047973633, 42.828792572021484, 44.780128479003906, 46.73146057128906, 48.682796478271484, 50.63412857055664, 52.58546447753906, 54.53679656982422, 56.48813247680664, 58.43946838378906]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 6.0, 7.0, 7.0, 10.0, 8.0, 9.0, 20.0, 24.0, 45.0, 71.0, 137.0, 225.0, 451.0, 990.0, 2521.0, 7921.0, 49232.0, 3982963.0, 131268.0, 12358.0, 3305.0, 1222.0, 567.0, 267.0, 161.0, 119.0, 76.0, 69.0, 44.0, 33.0, 20.0, 21.0, 15.0, 17.0, 16.0, 16.0, 4.0, 4.0, 9.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.90625, -20.7919921875, -19.677734375, -18.5634765625, -17.44921875, -16.3349609375, -15.220703125, -14.1064453125, -12.9921875, -11.8779296875, -10.763671875, -9.6494140625, -8.53515625, -7.4208984375, -6.306640625, -5.1923828125, -4.078125, -2.9638671875, -1.849609375, -0.7353515625, 0.37890625, 1.4931640625, 2.607421875, 3.7216796875, 4.8359375, 5.9501953125, 7.064453125, 8.1787109375, 9.29296875, 10.4072265625, 11.521484375, 12.6357421875, 13.75, 14.8642578125, 15.978515625, 17.0927734375, 18.20703125, 19.3212890625, 20.435546875, 21.5498046875, 22.6640625, 23.7783203125, 24.892578125, 26.0068359375, 27.12109375, 28.2353515625, 29.349609375, 30.4638671875, 31.578125, 32.6923828125, 33.806640625, 34.9208984375, 36.03515625, 37.1494140625, 38.263671875, 39.3779296875, 40.4921875, 41.6064453125, 42.720703125, 43.8349609375, 44.94921875, 46.0634765625, 47.177734375, 48.2919921875, 49.40625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 22.0, 34.0, 47.0, 49.0, 70.0, 83.0, 75.0, 96.0, 86.0, 86.0, 80.0, 66.0, 62.0, 33.0, 31.0, 18.0, 17.0, 10.0, 5.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6171875, -3.46722412109375, -3.3172607421875, -3.16729736328125, -3.017333984375, -2.86737060546875, -2.7174072265625, -2.56744384765625, -2.41748046875, -2.26751708984375, -2.1175537109375, -1.96759033203125, -1.817626953125, -1.66766357421875, -1.5177001953125, -1.36773681640625, -1.2177734375, -1.06781005859375, -0.9178466796875, -0.76788330078125, -0.617919921875, -0.46795654296875, -0.3179931640625, -0.16802978515625, -0.01806640625, 0.13189697265625, 0.2818603515625, 0.43182373046875, 0.581787109375, 0.73175048828125, 0.8817138671875, 1.03167724609375, 1.181640625, 1.33160400390625, 1.4815673828125, 1.63153076171875, 1.781494140625, 1.93145751953125, 2.0814208984375, 2.23138427734375, 2.38134765625, 2.53131103515625, 2.6812744140625, 2.83123779296875, 2.981201171875, 3.13116455078125, 3.2811279296875, 3.43109130859375, 3.5810546875, 3.73101806640625, 3.8809814453125, 4.03094482421875, 4.180908203125, 4.33087158203125, 4.4808349609375, 4.63079833984375, 4.78076171875, 4.93072509765625, 5.0806884765625, 5.23065185546875, 5.380615234375, 5.53057861328125, 5.6805419921875, 5.83050537109375, 5.98046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 13.0, 10.0, 20.0, 25.0, 49.0, 99.0, 176.0, 453.0, 1075.0, 3153.0, 12136.0, 105333.0, 3967658.0, 88309.0, 10982.0, 2925.0, 1031.0, 406.0, 202.0, 93.0, 44.0, 32.0, 20.0, 8.0, 13.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.078125, -27.889892578125, -26.70166015625, -25.513427734375, -24.3251953125, -23.136962890625, -21.94873046875, -20.760498046875, -19.572265625, -18.384033203125, -17.19580078125, -16.007568359375, -14.8193359375, -13.631103515625, -12.44287109375, -11.254638671875, -10.06640625, -8.878173828125, -7.68994140625, -6.501708984375, -5.3134765625, -4.125244140625, -2.93701171875, -1.748779296875, -0.560546875, 0.627685546875, 1.81591796875, 3.004150390625, 4.1923828125, 5.380615234375, 6.56884765625, 7.757080078125, 8.9453125, 10.133544921875, 11.32177734375, 12.510009765625, 13.6982421875, 14.886474609375, 16.07470703125, 17.262939453125, 18.451171875, 19.639404296875, 20.82763671875, 22.015869140625, 23.2041015625, 24.392333984375, 25.58056640625, 26.768798828125, 27.95703125, 29.145263671875, 30.33349609375, 31.521728515625, 32.7099609375, 33.898193359375, 35.08642578125, 36.274658203125, 37.462890625, 38.651123046875, 39.83935546875, 41.027587890625, 42.2158203125, 43.404052734375, 44.59228515625, 45.780517578125, 46.96875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 8.0, 2.0, 7.0, 4.0, 10.0, 13.0, 8.0, 14.0, 28.0, 36.0, 70.0, 105.0, 301.0, 1647.0, 1214.0, 298.0, 131.0, 59.0, 34.0, 21.0, 17.0, 16.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.677734375, -6.38671875, -6.095703125, -5.8046875, -5.513671875, -5.22265625, -4.931640625, -4.640625, -4.349609375, -4.05859375, -3.767578125, -3.4765625, -3.185546875, -2.89453125, -2.603515625, -2.3125, -2.021484375, -1.73046875, -1.439453125, -1.1484375, -0.857421875, -0.56640625, -0.275390625, 0.015625, 0.306640625, 0.59765625, 0.888671875, 1.1796875, 1.470703125, 1.76171875, 2.052734375, 2.34375, 2.634765625, 2.92578125, 3.216796875, 3.5078125, 3.798828125, 4.08984375, 4.380859375, 4.671875, 4.962890625, 5.25390625, 5.544921875, 5.8359375, 6.126953125, 6.41796875, 6.708984375, 7.0, 7.291015625, 7.58203125, 7.873046875, 8.1640625, 8.455078125, 8.74609375, 9.037109375, 9.328125, 9.619140625, 9.91015625, 10.201171875, 10.4921875, 10.783203125, 11.07421875, 11.365234375, 11.65625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 6.0, 9.0, 15.0, 41.0, 65.0, 130.0, 243.0, 229.0, 139.0, 74.0, 27.0, 16.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.51289367675781, -81.0558853149414, -78.59886932373047, -76.14186096191406, -73.68485260009766, -71.22784423828125, -68.77082824707031, -66.3138198852539, -63.856807708740234, -61.39979553222656, -58.942787170410156, -56.485774993896484, -54.02876281738281, -51.571754455566406, -49.114742279052734, -46.65773010253906, -44.200721740722656, -41.743709564208984, -39.28670120239258, -36.829689025878906, -34.3726806640625, -31.915668487548828, -29.458656311035156, -27.001646041870117, -24.544635772705078, -22.08762550354004, -19.630615234375, -17.173603057861328, -14.716592788696289, -12.25958251953125, -9.802571296691895, -7.345560073852539, -4.888542175292969, -2.4315314292907715, 0.02547931671142578, 2.482490062713623, 4.93950080871582, 7.396511077880859, 9.853522300720215, 12.31053352355957, 14.76754379272461, 17.22455406188965, 19.681564331054688, 22.13857650756836, 24.5955867767334, 27.052597045898438, 29.50960922241211, 31.96661949157715, 34.42362976074219, 36.88064193725586, 39.337650299072266, 41.79466247558594, 44.251670837402344, 46.708683013916016, 49.16569519042969, 51.622703552246094, 54.079715728759766, 56.53672790527344, 58.993736267089844, 61.450748443603516, 63.90776062011719, 66.3647689819336, 68.82177734375, 71.27879333496094, 73.73580169677734]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 14.0, 9.0, 18.0, 13.0, 29.0, 27.0, 25.0, 44.0, 34.0, 44.0, 47.0, 50.0, 55.0, 55.0, 42.0, 58.0, 47.0, 43.0, 60.0, 26.0, 36.0, 45.0, 25.0, 18.0, 30.0, 23.0, 9.0, 5.0, 11.0, 10.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.808746337890625, -23.984798431396484, -23.160850524902344, -22.336904525756836, -21.512956619262695, -20.689008712768555, -19.865062713623047, -19.041114807128906, -18.217166900634766, -17.393218994140625, -16.569271087646484, -15.745325088500977, -14.921377182006836, -14.097429275512695, -13.273482322692871, -12.449535369873047, -11.625587463378906, -10.801639556884766, -9.977692604064941, -9.153745651245117, -8.329797744750977, -7.505850315093994, -6.681902885437012, -5.857955455780029, -5.034008026123047, -4.2100605964660645, -3.386113166809082, -2.5621657371520996, -1.7382183074951172, -0.9142708778381348, -0.09032344818115234, 0.7336239814758301, 1.5575714111328125, 2.381518840789795, 3.2054662704467773, 4.02941370010376, 4.853361129760742, 5.677308559417725, 6.501255989074707, 7.3252034187316895, 8.149150848388672, 8.973098754882812, 9.797045707702637, 10.620992660522461, 11.444940567016602, 12.268888473510742, 13.092835426330566, 13.91678237915039, 14.740730285644531, 15.564678192138672, 16.388626098632812, 17.21257209777832, 18.03652000427246, 18.8604679107666, 19.68441390991211, 20.50836181640625, 21.33230972290039, 22.15625762939453, 22.980205535888672, 23.80415153503418, 24.62809944152832, 25.45204734802246, 26.27599334716797, 27.09994125366211, 27.92388916015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 9.0, 7.0, 17.0, 12.0, 30.0, 49.0, 68.0, 168.0, 359.0, 1058.0, 4058.0, 38472.0, 922654.0, 73746.0, 5586.0, 1332.0, 455.0, 199.0, 112.0, 47.0, 29.0, 20.0, 19.0, 10.0, 11.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.84375, -45.48974609375, -44.1357421875, -42.78173828125, -41.427734375, -40.07373046875, -38.7197265625, -37.36572265625, -36.01171875, -34.65771484375, -33.3037109375, -31.94970703125, -30.595703125, -29.24169921875, -27.8876953125, -26.53369140625, -25.1796875, -23.82568359375, -22.4716796875, -21.11767578125, -19.763671875, -18.40966796875, -17.0556640625, -15.70166015625, -14.34765625, -12.99365234375, -11.6396484375, -10.28564453125, -8.931640625, -7.57763671875, -6.2236328125, -4.86962890625, -3.515625, -2.16162109375, -0.8076171875, 0.54638671875, 1.900390625, 3.25439453125, 4.6083984375, 5.96240234375, 7.31640625, 8.67041015625, 10.0244140625, 11.37841796875, 12.732421875, 14.08642578125, 15.4404296875, 16.79443359375, 18.1484375, 19.50244140625, 20.8564453125, 22.21044921875, 23.564453125, 24.91845703125, 26.2724609375, 27.62646484375, 28.98046875, 30.33447265625, 31.6884765625, 33.04248046875, 34.396484375, 35.75048828125, 37.1044921875, 38.45849609375, 39.8125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 9.0, 6.0, 2.0, 20.0, 11.0, 19.0, 28.0, 44.0, 68.0, 66.0, 61.0, 55.0, 77.0, 71.0, 71.0, 66.0, 68.0, 63.0, 41.0, 38.0, 23.0, 23.0, 25.0, 17.0, 9.0, 12.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.29595947265625, -2.1661376953125, -2.03631591796875, -1.906494140625, -1.77667236328125, -1.6468505859375, -1.51702880859375, -1.38720703125, -1.25738525390625, -1.1275634765625, -0.99774169921875, -0.867919921875, -0.73809814453125, -0.6082763671875, -0.47845458984375, -0.3486328125, -0.21881103515625, -0.0889892578125, 0.04083251953125, 0.170654296875, 0.30047607421875, 0.4302978515625, 0.56011962890625, 0.68994140625, 0.81976318359375, 0.9495849609375, 1.07940673828125, 1.209228515625, 1.33905029296875, 1.4688720703125, 1.59869384765625, 1.728515625, 1.85833740234375, 1.9881591796875, 2.11798095703125, 2.247802734375, 2.37762451171875, 2.5074462890625, 2.63726806640625, 2.76708984375, 2.89691162109375, 3.0267333984375, 3.15655517578125, 3.286376953125, 3.41619873046875, 3.5460205078125, 3.67584228515625, 3.8056640625, 3.93548583984375, 4.0653076171875, 4.19512939453125, 4.324951171875, 4.45477294921875, 4.5845947265625, 4.71441650390625, 4.84423828125, 4.97406005859375, 5.1038818359375, 5.23370361328125, 5.363525390625, 5.49334716796875, 5.6231689453125, 5.75299072265625, 5.8828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 7.0, 12.0, 11.0, 14.0, 23.0, 24.0, 38.0, 54.0, 94.0, 124.0, 247.0, 454.0, 1019.0, 2474.0, 7333.0, 26746.0, 147846.0, 746605.0, 87532.0, 18678.0, 5435.0, 1968.0, 831.0, 382.0, 228.0, 125.0, 67.0, 46.0, 32.0, 34.0, 23.0, 12.0, 7.0, 3.0, 3.0, 1.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.984375, -18.39794921875, -17.8115234375, -17.22509765625, -16.638671875, -16.05224609375, -15.4658203125, -14.87939453125, -14.29296875, -13.70654296875, -13.1201171875, -12.53369140625, -11.947265625, -11.36083984375, -10.7744140625, -10.18798828125, -9.6015625, -9.01513671875, -8.4287109375, -7.84228515625, -7.255859375, -6.66943359375, -6.0830078125, -5.49658203125, -4.91015625, -4.32373046875, -3.7373046875, -3.15087890625, -2.564453125, -1.97802734375, -1.3916015625, -0.80517578125, -0.21875, 0.36767578125, 0.9541015625, 1.54052734375, 2.126953125, 2.71337890625, 3.2998046875, 3.88623046875, 4.47265625, 5.05908203125, 5.6455078125, 6.23193359375, 6.818359375, 7.40478515625, 7.9912109375, 8.57763671875, 9.1640625, 9.75048828125, 10.3369140625, 10.92333984375, 11.509765625, 12.09619140625, 12.6826171875, 13.26904296875, 13.85546875, 14.44189453125, 15.0283203125, 15.61474609375, 16.201171875, 16.78759765625, 17.3740234375, 17.96044921875, 18.546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 9.0, 7.0, 11.0, 9.0, 18.0, 19.0, 16.0, 25.0, 29.0, 30.0, 46.0, 43.0, 41.0, 48.0, 50.0, 41.0, 30.0, 54.0, 63.0, 30.0, 38.0, 27.0, 38.0, 38.0, 41.0, 28.0, 25.0, 28.0, 14.0, 15.0, 14.0, 10.0, 12.0, 7.0, 8.0, 4.0, 10.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7734375, -12.4017333984375, -12.030029296875, -11.6583251953125, -11.28662109375, -10.9149169921875, -10.543212890625, -10.1715087890625, -9.7998046875, -9.4281005859375, -9.056396484375, -8.6846923828125, -8.31298828125, -7.9412841796875, -7.569580078125, -7.1978759765625, -6.826171875, -6.4544677734375, -6.082763671875, -5.7110595703125, -5.33935546875, -4.9676513671875, -4.595947265625, -4.2242431640625, -3.8525390625, -3.4808349609375, -3.109130859375, -2.7374267578125, -2.36572265625, -1.9940185546875, -1.622314453125, -1.2506103515625, -0.87890625, -0.5072021484375, -0.135498046875, 0.2362060546875, 0.60791015625, 0.9796142578125, 1.351318359375, 1.7230224609375, 2.0947265625, 2.4664306640625, 2.838134765625, 3.2098388671875, 3.58154296875, 3.9532470703125, 4.324951171875, 4.6966552734375, 5.068359375, 5.4400634765625, 5.811767578125, 6.1834716796875, 6.55517578125, 6.9268798828125, 7.298583984375, 7.6702880859375, 8.0419921875, 8.4136962890625, 8.785400390625, 9.1571044921875, 9.52880859375, 9.9005126953125, 10.272216796875, 10.6439208984375, 11.015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 12.0, 16.0, 26.0, 55.0, 153.0, 369.0, 981.0, 2840.0, 10825.0, 77642.0, 860227.0, 79730.0, 11142.0, 2863.0, 990.0, 383.0, 160.0, 48.0, 33.0, 18.0, 12.0, 9.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -15.7711181640625, -15.339111328125, -14.9071044921875, -14.47509765625, -14.0430908203125, -13.611083984375, -13.1790771484375, -12.7470703125, -12.3150634765625, -11.883056640625, -11.4510498046875, -11.01904296875, -10.5870361328125, -10.155029296875, -9.7230224609375, -9.291015625, -8.8590087890625, -8.427001953125, -7.9949951171875, -7.56298828125, -7.1309814453125, -6.698974609375, -6.2669677734375, -5.8349609375, -5.4029541015625, -4.970947265625, -4.5389404296875, -4.10693359375, -3.6749267578125, -3.242919921875, -2.8109130859375, -2.37890625, -1.9468994140625, -1.514892578125, -1.0828857421875, -0.65087890625, -0.2188720703125, 0.213134765625, 0.6451416015625, 1.0771484375, 1.5091552734375, 1.941162109375, 2.3731689453125, 2.80517578125, 3.2371826171875, 3.669189453125, 4.1011962890625, 4.533203125, 4.9652099609375, 5.397216796875, 5.8292236328125, 6.26123046875, 6.6932373046875, 7.125244140625, 7.5572509765625, 7.9892578125, 8.4212646484375, 8.853271484375, 9.2852783203125, 9.71728515625, 10.1492919921875, 10.581298828125, 11.0133056640625, 11.4453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 8.0, 7.0, 14.0, 10.0, 18.0, 28.0, 50.0, 135.0, 303.0, 199.0, 75.0, 51.0, 29.0, 23.0, 11.0, 12.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018768310546875, -0.001790463924407959, -0.001704096794128418, -0.001617729663848877, -0.001531362533569336, -0.001444995403289795, -0.001358628273010254, -0.0012722611427307129, -0.0011858940124511719, -0.0010995268821716309, -0.0010131597518920898, -0.0009267926216125488, -0.0008404254913330078, -0.0007540583610534668, -0.0006676912307739258, -0.0005813241004943848, -0.0004949569702148438, -0.00040858983993530273, -0.0003222227096557617, -0.0002358555793762207, -0.0001494884490966797, -6.312131881713867e-05, 2.3245811462402344e-05, 0.00010961294174194336, 0.00019598007202148438, 0.0002823472023010254, 0.0003687143325805664, 0.0004550814628601074, 0.0005414485931396484, 0.0006278157234191895, 0.0007141828536987305, 0.0008005499839782715, 0.0008869171142578125, 0.0009732842445373535, 0.0010596513748168945, 0.0011460185050964355, 0.0012323856353759766, 0.0013187527656555176, 0.0014051198959350586, 0.0014914870262145996, 0.0015778541564941406, 0.0016642212867736816, 0.0017505884170532227, 0.0018369555473327637, 0.0019233226776123047, 0.0020096898078918457, 0.0020960569381713867, 0.0021824240684509277, 0.0022687911987304688, 0.0023551583290100098, 0.0024415254592895508, 0.002527892589569092, 0.002614259719848633, 0.002700626850128174, 0.002786993980407715, 0.002873361110687256, 0.002959728240966797, 0.003046095371246338, 0.003132462501525879, 0.00321882963180542, 0.003305196762084961, 0.003391563892364502, 0.003477931022644043, 0.003564298152923584, 0.003650665283203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 16.0, 32.0, 54.0, 105.0, 205.0, 463.0, 1284.0, 4035.0, 27586.0, 808134.0, 191280.0, 11402.0, 2463.0, 830.0, 312.0, 153.0, 71.0, 40.0, 22.0, 20.0, 7.0, 2.0, 4.0, 1.0, 1.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.972412109375, -15.39794921875, -14.823486328125, -14.2490234375, -13.674560546875, -13.10009765625, -12.525634765625, -11.951171875, -11.376708984375, -10.80224609375, -10.227783203125, -9.6533203125, -9.078857421875, -8.50439453125, -7.929931640625, -7.35546875, -6.781005859375, -6.20654296875, -5.632080078125, -5.0576171875, -4.483154296875, -3.90869140625, -3.334228515625, -2.759765625, -2.185302734375, -1.61083984375, -1.036376953125, -0.4619140625, 0.112548828125, 0.68701171875, 1.261474609375, 1.8359375, 2.410400390625, 2.98486328125, 3.559326171875, 4.1337890625, 4.708251953125, 5.28271484375, 5.857177734375, 6.431640625, 7.006103515625, 7.58056640625, 8.155029296875, 8.7294921875, 9.303955078125, 9.87841796875, 10.452880859375, 11.02734375, 11.601806640625, 12.17626953125, 12.750732421875, 13.3251953125, 13.899658203125, 14.47412109375, 15.048583984375, 15.623046875, 16.197509765625, 16.77197265625, 17.346435546875, 17.9208984375, 18.495361328125, 19.06982421875, 19.644287109375, 20.21875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 13.0, 14.0, 19.0, 28.0, 32.0, 47.0, 70.0, 100.0, 158.0, 177.0, 109.0, 74.0, 48.0, 23.0, 30.0, 13.0, 8.0, 9.0, 2.0, 5.0, 1.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.54296875, -7.2421875, -6.94140625, -6.640625, -6.33984375, -6.0390625, -5.73828125, -5.4375, -5.13671875, -4.8359375, -4.53515625, -4.234375, -3.93359375, -3.6328125, -3.33203125, -3.03125, -2.73046875, -2.4296875, -2.12890625, -1.828125, -1.52734375, -1.2265625, -0.92578125, -0.625, -0.32421875, -0.0234375, 0.27734375, 0.578125, 0.87890625, 1.1796875, 1.48046875, 1.78125, 2.08203125, 2.3828125, 2.68359375, 2.984375, 3.28515625, 3.5859375, 3.88671875, 4.1875, 4.48828125, 4.7890625, 5.08984375, 5.390625, 5.69140625, 5.9921875, 6.29296875, 6.59375, 6.89453125, 7.1953125, 7.49609375, 7.796875, 8.09765625, 8.3984375, 8.69921875, 9.0, 9.30078125, 9.6015625, 9.90234375, 10.203125, 10.50390625, 10.8046875, 11.10546875, 11.40625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 17.0, 95.0, 318.0, 365.0, 156.0, 38.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.36572265625, -146.32508850097656, -137.28445434570312, -128.24380493164062, -119.20317077636719, -110.16253662109375, -101.12189483642578, -92.08125305175781, -83.04061889648438, -73.99998474121094, -64.95934295654297, -55.918704986572266, -46.87806701660156, -37.83742904663086, -28.796791076660156, -19.756153106689453, -10.71551513671875, -1.6748771667480469, 7.365760803222656, 16.40639877319336, 25.447036743164062, 34.487674713134766, 43.52831268310547, 52.56895065307617, 61.609588623046875, 70.65022277832031, 79.69086456298828, 88.73150634765625, 97.77214050292969, 106.81277465820312, 115.8534164428711, 124.89405822753906, 133.93466186523438, 142.9752960205078, 152.01593017578125, 161.05657958984375, 170.0972137451172, 179.13784790039062, 188.17849731445312, 197.21913146972656, 206.259765625, 215.30039978027344, 224.34103393554688, 233.38168334960938, 242.4223175048828, 251.46295166015625, 260.50360107421875, 269.5442199707031, 278.5848693847656, 287.6255187988281, 296.6661376953125, 305.706787109375, 314.7474365234375, 323.7880554199219, 332.8287048339844, 341.86932373046875, 350.90997314453125, 359.95062255859375, 368.9912414550781, 378.0318908691406, 387.072509765625, 396.1131591796875, 405.15380859375, 414.1944274902344, 423.2350769042969]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 13.0, 15.0, 8.0, 11.0, 19.0, 17.0, 24.0, 18.0, 21.0, 32.0, 28.0, 28.0, 40.0, 31.0, 33.0, 39.0, 40.0, 32.0, 38.0, 44.0, 47.0, 41.0, 43.0, 40.0, 28.0, 31.0, 38.0, 26.0, 24.0, 20.0, 12.0, 17.0, 12.0, 18.0, 16.0, 8.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-65.97947692871094, -64.21476745605469, -62.45005416870117, -60.68534469604492, -58.92063522338867, -57.155921936035156, -55.391212463378906, -53.626502990722656, -51.861793518066406, -50.097084045410156, -48.33237075805664, -46.56766128540039, -44.80295181274414, -43.038238525390625, -41.273529052734375, -39.508819580078125, -37.74410629272461, -35.97939682006836, -34.214683532714844, -32.449974060058594, -30.685264587402344, -28.92055320739746, -27.155841827392578, -25.391132354736328, -23.626420974731445, -21.861709594726562, -20.097000122070312, -18.33228874206543, -16.567577362060547, -14.802867889404297, -13.038156509399414, -11.273446083068848, -9.508735656738281, -7.744025230407715, -5.97931432723999, -4.214603424072266, -2.449892997741699, -0.6851825714111328, 1.07952880859375, 2.8442392349243164, 4.608949661254883, 6.373660087585449, 8.138370513916016, 9.903081893920898, 11.667792320251465, 13.432502746582031, 15.197214126586914, 16.961925506591797, 18.726634979248047, 20.49134635925293, 22.25605583190918, 24.020767211914062, 25.785476684570312, 27.550188064575195, 29.314899444580078, 31.079608917236328, 32.844322204589844, 34.609031677246094, 36.37374496459961, 38.13845443725586, 39.90316390991211, 41.667877197265625, 43.432586669921875, 45.197296142578125, 46.962005615234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 3.0, 11.0, 12.0, 7.0, 14.0, 20.0, 28.0, 38.0, 64.0, 110.0, 130.0, 226.0, 359.0, 706.0, 1251.0, 2798.0, 7124.0, 22681.0, 136239.0, 3856406.0, 132127.0, 21665.0, 6530.0, 2688.0, 1185.0, 699.0, 391.0, 221.0, 144.0, 93.0, 60.0, 56.0, 41.0, 37.0, 25.0, 15.0, 13.0, 11.0, 11.0, 11.0, 4.0, 4.0, 9.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.078125, -21.212158203125, -20.34619140625, -19.480224609375, -18.6142578125, -17.748291015625, -16.88232421875, -16.016357421875, -15.150390625, -14.284423828125, -13.41845703125, -12.552490234375, -11.6865234375, -10.820556640625, -9.95458984375, -9.088623046875, -8.22265625, -7.356689453125, -6.49072265625, -5.624755859375, -4.7587890625, -3.892822265625, -3.02685546875, -2.160888671875, -1.294921875, -0.428955078125, 0.43701171875, 1.302978515625, 2.1689453125, 3.034912109375, 3.90087890625, 4.766845703125, 5.6328125, 6.498779296875, 7.36474609375, 8.230712890625, 9.0966796875, 9.962646484375, 10.82861328125, 11.694580078125, 12.560546875, 13.426513671875, 14.29248046875, 15.158447265625, 16.0244140625, 16.890380859375, 17.75634765625, 18.622314453125, 19.48828125, 20.354248046875, 21.22021484375, 22.086181640625, 22.9521484375, 23.818115234375, 24.68408203125, 25.550048828125, 26.416015625, 27.281982421875, 28.14794921875, 29.013916015625, 29.8798828125, 30.745849609375, 31.61181640625, 32.477783203125, 33.34375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 12.0, 12.0, 21.0, 34.0, 28.0, 40.0, 54.0, 64.0, 73.0, 80.0, 79.0, 74.0, 70.0, 73.0, 62.0, 59.0, 41.0, 29.0, 22.0, 24.0, 11.0, 11.0, 10.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.263671875, -4.1171875, -3.970703125, -3.82421875, -3.677734375, -3.53125, -3.384765625, -3.23828125, -3.091796875, -2.9453125, -2.798828125, -2.65234375, -2.505859375, -2.359375, -2.212890625, -2.06640625, -1.919921875, -1.7734375, -1.626953125, -1.48046875, -1.333984375, -1.1875, -1.041015625, -0.89453125, -0.748046875, -0.6015625, -0.455078125, -0.30859375, -0.162109375, -0.015625, 0.130859375, 0.27734375, 0.423828125, 0.5703125, 0.716796875, 0.86328125, 1.009765625, 1.15625, 1.302734375, 1.44921875, 1.595703125, 1.7421875, 1.888671875, 2.03515625, 2.181640625, 2.328125, 2.474609375, 2.62109375, 2.767578125, 2.9140625, 3.060546875, 3.20703125, 3.353515625, 3.5, 3.646484375, 3.79296875, 3.939453125, 4.0859375, 4.232421875, 4.37890625, 4.525390625, 4.671875, 4.818359375, 4.96484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 13.0, 26.0, 41.0, 62.0, 109.0, 239.0, 339.0, 656.0, 1382.0, 2664.0, 6675.0, 20212.0, 97261.0, 3536046.0, 460522.0, 46759.0, 12554.0, 4664.0, 2012.0, 994.0, 453.0, 234.0, 135.0, 77.0, 39.0, 21.0, 26.0, 17.0, 8.0, 9.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0], "bins": [-36.0625, -35.15625, -34.25, -33.34375, -32.4375, -31.53125, -30.625, -29.71875, -28.8125, -27.90625, -27.0, -26.09375, -25.1875, -24.28125, -23.375, -22.46875, -21.5625, -20.65625, -19.75, -18.84375, -17.9375, -17.03125, -16.125, -15.21875, -14.3125, -13.40625, -12.5, -11.59375, -10.6875, -9.78125, -8.875, -7.96875, -7.0625, -6.15625, -5.25, -4.34375, -3.4375, -2.53125, -1.625, -0.71875, 0.1875, 1.09375, 2.0, 2.90625, 3.8125, 4.71875, 5.625, 6.53125, 7.4375, 8.34375, 9.25, 10.15625, 11.0625, 11.96875, 12.875, 13.78125, 14.6875, 15.59375, 16.5, 17.40625, 18.3125, 19.21875, 20.125, 21.03125, 21.9375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 8.0, 6.0, 12.0, 6.0, 17.0, 16.0, 21.0, 38.0, 44.0, 82.0, 95.0, 169.0, 435.0, 1893.0, 623.0, 222.0, 101.0, 66.0, 47.0, 24.0, 22.0, 24.0, 19.0, 18.0, 12.0, 6.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-9.65625, -9.412841796875, -9.16943359375, -8.926025390625, -8.6826171875, -8.439208984375, -8.19580078125, -7.952392578125, -7.708984375, -7.465576171875, -7.22216796875, -6.978759765625, -6.7353515625, -6.491943359375, -6.24853515625, -6.005126953125, -5.76171875, -5.518310546875, -5.27490234375, -5.031494140625, -4.7880859375, -4.544677734375, -4.30126953125, -4.057861328125, -3.814453125, -3.571044921875, -3.32763671875, -3.084228515625, -2.8408203125, -2.597412109375, -2.35400390625, -2.110595703125, -1.8671875, -1.623779296875, -1.38037109375, -1.136962890625, -0.8935546875, -0.650146484375, -0.40673828125, -0.163330078125, 0.080078125, 0.323486328125, 0.56689453125, 0.810302734375, 1.0537109375, 1.297119140625, 1.54052734375, 1.783935546875, 2.02734375, 2.270751953125, 2.51416015625, 2.757568359375, 3.0009765625, 3.244384765625, 3.48779296875, 3.731201171875, 3.974609375, 4.218017578125, 4.46142578125, 4.704833984375, 4.9482421875, 5.191650390625, 5.43505859375, 5.678466796875, 5.921875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 1.0, 9.0, 16.0, 40.0, 113.0, 204.0, 284.0, 200.0, 80.0, 25.0, 15.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-158.50746154785156, -155.24777221679688, -151.98806762695312, -148.72837829589844, -145.46868896484375, -142.208984375, -138.9492950439453, -135.68959045410156, -132.42990112304688, -129.1702117919922, -125.91050720214844, -122.65081787109375, -119.39112091064453, -116.13142395019531, -112.87173461914062, -109.6120376586914, -106.35234069824219, -103.09264373779297, -99.83294677734375, -96.57325744628906, -93.31356048583984, -90.05386352539062, -86.79417419433594, -83.53447723388672, -80.2747802734375, -77.01508331298828, -73.75538635253906, -70.49569702148438, -67.23600006103516, -63.97630310058594, -60.716609954833984, -57.45691680908203, -54.197227478027344, -50.937530517578125, -47.67783737182617, -44.41814422607422, -41.158447265625, -37.89875030517578, -34.63905715942383, -31.379362106323242, -28.119667053222656, -24.85997200012207, -21.600276947021484, -18.3405818939209, -15.080886840820312, -11.821191787719727, -8.56149673461914, -5.301801681518555, -2.0421066284179688, 1.2175884246826172, 4.477283477783203, 7.736978530883789, 10.996673583984375, 14.256368637084961, 17.516063690185547, 20.775758743286133, 24.03545379638672, 27.295148849487305, 30.55484390258789, 33.814537048339844, 37.07423400878906, 40.33393096923828, 43.593624114990234, 46.85331726074219, 50.113014221191406]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 9.0, 5.0, 8.0, 9.0, 14.0, 10.0, 19.0, 18.0, 13.0, 17.0, 24.0, 34.0, 25.0, 23.0, 29.0, 37.0, 35.0, 42.0, 39.0, 44.0, 39.0, 36.0, 47.0, 32.0, 30.0, 45.0, 33.0, 47.0, 27.0, 28.0, 24.0, 21.0, 18.0, 15.0, 17.0, 17.0, 9.0, 14.0, 6.0, 9.0, 9.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-26.313270568847656, -25.519046783447266, -24.724822998046875, -23.930599212646484, -23.136377334594727, -22.342153549194336, -21.547929763793945, -20.753705978393555, -19.959482192993164, -19.165258407592773, -18.371034622192383, -17.576812744140625, -16.782588958740234, -15.988365173339844, -15.194141387939453, -14.399917602539062, -13.605694770812988, -12.811470985412598, -12.017248153686523, -11.223024368286133, -10.428800582885742, -9.634576797485352, -8.840353965759277, -8.046130180358887, -7.251906871795654, -6.457683563232422, -5.663459777832031, -4.869236469268799, -4.075013160705566, -3.280789375305176, -2.4865660667419434, -1.6923422813415527, -0.8981189727783203, -0.10389548540115356, 0.6903280019760132, 1.4845514297485352, 2.2787749767303467, 3.072998523712158, 3.8672218322753906, 4.661445617675781, 5.455668926239014, 6.249892234802246, 7.044116020202637, 7.838339328765869, 8.632562637329102, 9.426786422729492, 10.221010208129883, 11.015233993530273, 11.809456825256348, 12.603680610656738, 13.397903442382812, 14.192127227783203, 14.986351013183594, 15.780574798583984, 16.574798583984375, 17.369022369384766, 18.163244247436523, 18.957468032836914, 19.751691818237305, 20.545913696289062, 21.340137481689453, 22.134361267089844, 22.928585052490234, 23.722808837890625, 24.517032623291016]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 10.0, 15.0, 19.0, 29.0, 56.0, 81.0, 141.0, 322.0, 723.0, 1706.0, 5160.0, 22439.0, 166157.0, 720343.0, 108458.0, 16080.0, 4078.0, 1487.0, 561.0, 302.0, 142.0, 80.0, 52.0, 32.0, 15.0, 18.0, 10.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.625, -26.685546875, -25.74609375, -24.806640625, -23.8671875, -22.927734375, -21.98828125, -21.048828125, -20.109375, -19.169921875, -18.23046875, -17.291015625, -16.3515625, -15.412109375, -14.47265625, -13.533203125, -12.59375, -11.654296875, -10.71484375, -9.775390625, -8.8359375, -7.896484375, -6.95703125, -6.017578125, -5.078125, -4.138671875, -3.19921875, -2.259765625, -1.3203125, -0.380859375, 0.55859375, 1.498046875, 2.4375, 3.376953125, 4.31640625, 5.255859375, 6.1953125, 7.134765625, 8.07421875, 9.013671875, 9.953125, 10.892578125, 11.83203125, 12.771484375, 13.7109375, 14.650390625, 15.58984375, 16.529296875, 17.46875, 18.408203125, 19.34765625, 20.287109375, 21.2265625, 22.166015625, 23.10546875, 24.044921875, 24.984375, 25.923828125, 26.86328125, 27.802734375, 28.7421875, 29.681640625, 30.62109375, 31.560546875, 32.5]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 10.0, 8.0, 25.0, 14.0, 26.0, 26.0, 31.0, 51.0, 37.0, 52.0, 55.0, 53.0, 55.0, 65.0, 54.0, 58.0, 53.0, 49.0, 45.0, 45.0, 33.0, 29.0, 27.0, 21.0, 21.0, 7.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4765625, -3.35186767578125, -3.2271728515625, -3.10247802734375, -2.977783203125, -2.85308837890625, -2.7283935546875, -2.60369873046875, -2.47900390625, -2.35430908203125, -2.2296142578125, -2.10491943359375, -1.980224609375, -1.85552978515625, -1.7308349609375, -1.60614013671875, -1.4814453125, -1.35675048828125, -1.2320556640625, -1.10736083984375, -0.982666015625, -0.85797119140625, -0.7332763671875, -0.60858154296875, -0.48388671875, -0.35919189453125, -0.2344970703125, -0.10980224609375, 0.014892578125, 0.13958740234375, 0.2642822265625, 0.38897705078125, 0.513671875, 0.63836669921875, 0.7630615234375, 0.88775634765625, 1.012451171875, 1.13714599609375, 1.2618408203125, 1.38653564453125, 1.51123046875, 1.63592529296875, 1.7606201171875, 1.88531494140625, 2.010009765625, 2.13470458984375, 2.2593994140625, 2.38409423828125, 2.5087890625, 2.63348388671875, 2.7581787109375, 2.88287353515625, 3.007568359375, 3.13226318359375, 3.2569580078125, 3.38165283203125, 3.50634765625, 3.63104248046875, 3.7557373046875, 3.88043212890625, 4.005126953125, 4.12982177734375, 4.2545166015625, 4.37921142578125, 4.50390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 12.0, 9.0, 11.0, 12.0, 35.0, 29.0, 47.0, 73.0, 81.0, 113.0, 140.0, 220.0, 259.0, 422.0, 627.0, 1228.0, 2863.0, 8607.0, 38012.0, 274808.0, 622198.0, 76188.0, 14407.0, 4042.0, 1622.0, 870.0, 493.0, 282.0, 199.0, 170.0, 107.0, 89.0, 78.0, 50.0, 33.0, 24.0, 17.0, 15.0, 14.0, 12.0, 11.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.0, -21.294677734375, -20.58935546875, -19.884033203125, -19.1787109375, -18.473388671875, -17.76806640625, -17.062744140625, -16.357421875, -15.652099609375, -14.94677734375, -14.241455078125, -13.5361328125, -12.830810546875, -12.12548828125, -11.420166015625, -10.71484375, -10.009521484375, -9.30419921875, -8.598876953125, -7.8935546875, -7.188232421875, -6.48291015625, -5.777587890625, -5.072265625, -4.366943359375, -3.66162109375, -2.956298828125, -2.2509765625, -1.545654296875, -0.84033203125, -0.135009765625, 0.5703125, 1.275634765625, 1.98095703125, 2.686279296875, 3.3916015625, 4.096923828125, 4.80224609375, 5.507568359375, 6.212890625, 6.918212890625, 7.62353515625, 8.328857421875, 9.0341796875, 9.739501953125, 10.44482421875, 11.150146484375, 11.85546875, 12.560791015625, 13.26611328125, 13.971435546875, 14.6767578125, 15.382080078125, 16.08740234375, 16.792724609375, 17.498046875, 18.203369140625, 18.90869140625, 19.614013671875, 20.3193359375, 21.024658203125, 21.72998046875, 22.435302734375, 23.140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 6.0, 8.0, 11.0, 5.0, 11.0, 21.0, 16.0, 33.0, 22.0, 37.0, 25.0, 34.0, 32.0, 38.0, 45.0, 34.0, 47.0, 35.0, 51.0, 46.0, 48.0, 52.0, 36.0, 37.0, 34.0, 47.0, 24.0, 22.0, 20.0, 16.0, 23.0, 15.0, 12.0, 7.0, 11.0, 2.0, 6.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.9609375, -14.486328125, -14.01171875, -13.537109375, -13.0625, -12.587890625, -12.11328125, -11.638671875, -11.1640625, -10.689453125, -10.21484375, -9.740234375, -9.265625, -8.791015625, -8.31640625, -7.841796875, -7.3671875, -6.892578125, -6.41796875, -5.943359375, -5.46875, -4.994140625, -4.51953125, -4.044921875, -3.5703125, -3.095703125, -2.62109375, -2.146484375, -1.671875, -1.197265625, -0.72265625, -0.248046875, 0.2265625, 0.701171875, 1.17578125, 1.650390625, 2.125, 2.599609375, 3.07421875, 3.548828125, 4.0234375, 4.498046875, 4.97265625, 5.447265625, 5.921875, 6.396484375, 6.87109375, 7.345703125, 7.8203125, 8.294921875, 8.76953125, 9.244140625, 9.71875, 10.193359375, 10.66796875, 11.142578125, 11.6171875, 12.091796875, 12.56640625, 13.041015625, 13.515625, 13.990234375, 14.46484375, 14.939453125, 15.4140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 12.0, 22.0, 32.0, 46.0, 86.0, 160.0, 267.0, 479.0, 1015.0, 2291.0, 7078.0, 55611.0, 884917.0, 83279.0, 8401.0, 2531.0, 1093.0, 551.0, 271.0, 167.0, 86.0, 51.0, 38.0, 24.0, 15.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.137939453125, -19.47900390625, -18.820068359375, -18.1611328125, -17.502197265625, -16.84326171875, -16.184326171875, -15.525390625, -14.866455078125, -14.20751953125, -13.548583984375, -12.8896484375, -12.230712890625, -11.57177734375, -10.912841796875, -10.25390625, -9.594970703125, -8.93603515625, -8.277099609375, -7.6181640625, -6.959228515625, -6.30029296875, -5.641357421875, -4.982421875, -4.323486328125, -3.66455078125, -3.005615234375, -2.3466796875, -1.687744140625, -1.02880859375, -0.369873046875, 0.2890625, 0.947998046875, 1.60693359375, 2.265869140625, 2.9248046875, 3.583740234375, 4.24267578125, 4.901611328125, 5.560546875, 6.219482421875, 6.87841796875, 7.537353515625, 8.1962890625, 8.855224609375, 9.51416015625, 10.173095703125, 10.83203125, 11.490966796875, 12.14990234375, 12.808837890625, 13.4677734375, 14.126708984375, 14.78564453125, 15.444580078125, 16.103515625, 16.762451171875, 17.42138671875, 18.080322265625, 18.7392578125, 19.398193359375, 20.05712890625, 20.716064453125, 21.375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 6.0, 9.0, 9.0, 22.0, 21.0, 27.0, 46.0, 68.0, 106.0, 266.0, 159.0, 74.0, 62.0, 36.0, 28.0, 16.0, 11.0, 8.0, 11.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.004116058349609375, -0.00401228666305542, -0.003908514976501465, -0.0038047432899475098, -0.0037009716033935547, -0.0035971999168395996, -0.0034934282302856445, -0.0033896565437316895, -0.0032858848571777344, -0.0031821131706237793, -0.0030783414840698242, -0.002974569797515869, -0.002870798110961914, -0.002767026424407959, -0.002663254737854004, -0.002559483051300049, -0.0024557113647460938, -0.0023519396781921387, -0.0022481679916381836, -0.0021443963050842285, -0.0020406246185302734, -0.0019368529319763184, -0.0018330812454223633, -0.0017293095588684082, -0.0016255378723144531, -0.001521766185760498, -0.001417994499206543, -0.0013142228126525879, -0.0012104511260986328, -0.0011066794395446777, -0.0010029077529907227, -0.0008991360664367676, -0.0007953643798828125, -0.0006915926933288574, -0.0005878210067749023, -0.00048404932022094727, -0.0003802776336669922, -0.0002765059471130371, -0.00017273426055908203, -6.896257400512695e-05, 3.4809112548828125e-05, 0.0001385807991027832, 0.00024235248565673828, 0.00034612417221069336, 0.00044989585876464844, 0.0005536675453186035, 0.0006574392318725586, 0.0007612109184265137, 0.0008649826049804688, 0.0009687542915344238, 0.001072525978088379, 0.001176297664642334, 0.001280069351196289, 0.0013838410377502441, 0.0014876127243041992, 0.0015913844108581543, 0.0016951560974121094, 0.0017989277839660645, 0.0019026994705200195, 0.0020064711570739746, 0.0021102428436279297, 0.0022140145301818848, 0.00231778621673584, 0.002421557903289795, 0.00252532958984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 4.0, 5.0, 4.0, 3.0, 4.0, 6.0, 13.0, 10.0, 12.0, 32.0, 44.0, 50.0, 73.0, 149.0, 223.0, 385.0, 936.0, 2092.0, 7596.0, 65829.0, 904816.0, 55399.0, 7018.0, 2041.0, 794.0, 417.0, 197.0, 117.0, 92.0, 55.0, 26.0, 24.0, 17.0, 17.0, 8.0, 10.0, 9.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-24.0625, -23.321533203125, -22.58056640625, -21.839599609375, -21.0986328125, -20.357666015625, -19.61669921875, -18.875732421875, -18.134765625, -17.393798828125, -16.65283203125, -15.911865234375, -15.1708984375, -14.429931640625, -13.68896484375, -12.947998046875, -12.20703125, -11.466064453125, -10.72509765625, -9.984130859375, -9.2431640625, -8.502197265625, -7.76123046875, -7.020263671875, -6.279296875, -5.538330078125, -4.79736328125, -4.056396484375, -3.3154296875, -2.574462890625, -1.83349609375, -1.092529296875, -0.3515625, 0.389404296875, 1.13037109375, 1.871337890625, 2.6123046875, 3.353271484375, 4.09423828125, 4.835205078125, 5.576171875, 6.317138671875, 7.05810546875, 7.799072265625, 8.5400390625, 9.281005859375, 10.02197265625, 10.762939453125, 11.50390625, 12.244873046875, 12.98583984375, 13.726806640625, 14.4677734375, 15.208740234375, 15.94970703125, 16.690673828125, 17.431640625, 18.172607421875, 18.91357421875, 19.654541015625, 20.3955078125, 21.136474609375, 21.87744140625, 22.618408203125, 23.359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 5.0, 10.0, 15.0, 31.0, 44.0, 54.0, 75.0, 137.0, 150.0, 150.0, 124.0, 78.0, 43.0, 22.0, 20.0, 11.0, 5.0, 2.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3984375, -14.9130859375, -14.427734375, -13.9423828125, -13.45703125, -12.9716796875, -12.486328125, -12.0009765625, -11.515625, -11.0302734375, -10.544921875, -10.0595703125, -9.57421875, -9.0888671875, -8.603515625, -8.1181640625, -7.6328125, -7.1474609375, -6.662109375, -6.1767578125, -5.69140625, -5.2060546875, -4.720703125, -4.2353515625, -3.75, -3.2646484375, -2.779296875, -2.2939453125, -1.80859375, -1.3232421875, -0.837890625, -0.3525390625, 0.1328125, 0.6181640625, 1.103515625, 1.5888671875, 2.07421875, 2.5595703125, 3.044921875, 3.5302734375, 4.015625, 4.5009765625, 4.986328125, 5.4716796875, 5.95703125, 6.4423828125, 6.927734375, 7.4130859375, 7.8984375, 8.3837890625, 8.869140625, 9.3544921875, 9.83984375, 10.3251953125, 10.810546875, 11.2958984375, 11.78125, 12.2666015625, 12.751953125, 13.2373046875, 13.72265625, 14.2080078125, 14.693359375, 15.1787109375, 15.6640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 10.0, 45.0, 123.0, 283.0, 339.0, 149.0, 38.0, 11.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-393.5204772949219, -382.62493896484375, -371.7294006347656, -360.8338623046875, -349.9383544921875, -339.0428161621094, -328.14727783203125, -317.2517395019531, -306.356201171875, -295.4606628417969, -284.56512451171875, -273.66961669921875, -262.7740783691406, -251.8785400390625, -240.98300170898438, -230.08746337890625, -219.19195556640625, -208.29641723632812, -197.40089416503906, -186.50535583496094, -175.60983276367188, -164.71429443359375, -153.81875610351562, -142.9232177734375, -132.02769470214844, -121.13216400146484, -110.23663330078125, -99.34109497070312, -88.44556427001953, -77.55003356933594, -66.65449523925781, -55.75896453857422, -44.863433837890625, -33.96790313720703, -23.072368621826172, -12.176834106445312, -1.2813034057617188, 9.614227294921875, 20.509765625, 31.405296325683594, 42.30082702636719, 53.19635772705078, 64.09188842773438, 74.9874267578125, 85.8829574584961, 96.77848815917969, 107.67402648925781, 118.5695571899414, 129.465087890625, 140.36062622070312, 151.2561492919922, 162.1516876220703, 173.04721069335938, 183.9427490234375, 194.83828735351562, 205.73382568359375, 216.6293487548828, 227.52488708496094, 238.42041015625, 249.31594848632812, 260.21148681640625, 271.10699462890625, 282.0025634765625, 292.8980712890625, 303.7936096191406]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 12.0, 7.0, 15.0, 14.0, 17.0, 17.0, 30.0, 25.0, 28.0, 38.0, 40.0, 31.0, 37.0, 43.0, 44.0, 34.0, 44.0, 48.0, 35.0, 38.0, 40.0, 34.0, 45.0, 32.0, 36.0, 34.0, 23.0, 24.0, 23.0, 22.0, 15.0, 11.0, 11.0, 4.0, 9.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.71678924560547, -84.1964340209961, -81.67607116699219, -79.15571594238281, -76.6353530883789, -74.11499786376953, -71.59463500976562, -69.07427978515625, -66.55392456054688, -64.0335693359375, -61.513206481933594, -58.99284744262695, -56.47248840332031, -53.95213317871094, -51.4317741394043, -48.911415100097656, -46.39105224609375, -43.87069320678711, -41.35033416748047, -38.82997512817383, -36.30961608886719, -33.78926086425781, -31.268901824951172, -28.74854278564453, -26.22818374633789, -23.70782470703125, -21.18746566772461, -18.6671085357666, -16.14674949645996, -13.62639045715332, -11.106032371520996, -8.585674285888672, -6.0653076171875, -3.5449490547180176, -1.0245904922485352, 1.4957680702209473, 4.01612663269043, 6.53648567199707, 9.056843757629395, 11.577201843261719, 14.09756088256836, 16.617919921875, 19.13827896118164, 21.65863609313965, 24.17899513244629, 26.69935417175293, 29.219711303710938, 31.740070343017578, 34.26042938232422, 36.78078842163086, 39.3011474609375, 41.82150650024414, 44.34186553955078, 46.862220764160156, 49.3825798034668, 51.90293884277344, 54.42329788208008, 56.94365692138672, 59.46401596069336, 61.984375, 64.50473022460938, 67.02509307861328, 69.54544830322266, 72.06581115722656, 74.58616638183594]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 6.0, 12.0, 23.0, 20.0, 28.0, 38.0, 63.0, 77.0, 128.0, 182.0, 330.0, 519.0, 918.0, 1789.0, 3560.0, 8122.0, 25933.0, 234676.0, 3811051.0, 80110.0, 15824.0, 5536.0, 2421.0, 1155.0, 654.0, 357.0, 206.0, 143.0, 121.0, 68.0, 45.0, 43.0, 27.0, 14.0, 22.0, 14.0, 10.0, 8.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703125, -21.806396484375, -20.90966796875, -20.012939453125, -19.1162109375, -18.219482421875, -17.32275390625, -16.426025390625, -15.529296875, -14.632568359375, -13.73583984375, -12.839111328125, -11.9423828125, -11.045654296875, -10.14892578125, -9.252197265625, -8.35546875, -7.458740234375, -6.56201171875, -5.665283203125, -4.7685546875, -3.871826171875, -2.97509765625, -2.078369140625, -1.181640625, -0.284912109375, 0.61181640625, 1.508544921875, 2.4052734375, 3.302001953125, 4.19873046875, 5.095458984375, 5.9921875, 6.888916015625, 7.78564453125, 8.682373046875, 9.5791015625, 10.475830078125, 11.37255859375, 12.269287109375, 13.166015625, 14.062744140625, 14.95947265625, 15.856201171875, 16.7529296875, 17.649658203125, 18.54638671875, 19.443115234375, 20.33984375, 21.236572265625, 22.13330078125, 23.030029296875, 23.9267578125, 24.823486328125, 25.72021484375, 26.616943359375, 27.513671875, 28.410400390625, 29.30712890625, 30.203857421875, 31.1005859375, 31.997314453125, 32.89404296875, 33.790771484375, 34.6875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 7.0, 11.0, 4.0, 15.0, 12.0, 22.0, 26.0, 33.0, 46.0, 35.0, 44.0, 46.0, 54.0, 56.0, 61.0, 67.0, 61.0, 62.0, 52.0, 57.0, 43.0, 39.0, 30.0, 25.0, 23.0, 14.0, 14.0, 11.0, 14.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.97821044921875, -3.8431396484375, -3.70806884765625, -3.572998046875, -3.43792724609375, -3.3028564453125, -3.16778564453125, -3.03271484375, -2.89764404296875, -2.7625732421875, -2.62750244140625, -2.492431640625, -2.35736083984375, -2.2222900390625, -2.08721923828125, -1.9521484375, -1.81707763671875, -1.6820068359375, -1.54693603515625, -1.411865234375, -1.27679443359375, -1.1417236328125, -1.00665283203125, -0.87158203125, -0.73651123046875, -0.6014404296875, -0.46636962890625, -0.331298828125, -0.19622802734375, -0.0611572265625, 0.07391357421875, 0.208984375, 0.34405517578125, 0.4791259765625, 0.61419677734375, 0.749267578125, 0.88433837890625, 1.0194091796875, 1.15447998046875, 1.28955078125, 1.42462158203125, 1.5596923828125, 1.69476318359375, 1.829833984375, 1.96490478515625, 2.0999755859375, 2.23504638671875, 2.3701171875, 2.50518798828125, 2.6402587890625, 2.77532958984375, 2.910400390625, 3.04547119140625, 3.1805419921875, 3.31561279296875, 3.45068359375, 3.58575439453125, 3.7208251953125, 3.85589599609375, 3.990966796875, 4.12603759765625, 4.2611083984375, 4.39617919921875, 4.53125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 7.0, 8.0, 5.0, 23.0, 23.0, 39.0, 73.0, 114.0, 249.0, 558.0, 1311.0, 3246.0, 9387.0, 34881.0, 241103.0, 3665056.0, 193627.0, 30757.0, 8504.0, 3008.0, 1234.0, 533.0, 236.0, 123.0, 86.0, 37.0, 21.0, 12.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.6875, -27.830078125, -26.97265625, -26.115234375, -25.2578125, -24.400390625, -23.54296875, -22.685546875, -21.828125, -20.970703125, -20.11328125, -19.255859375, -18.3984375, -17.541015625, -16.68359375, -15.826171875, -14.96875, -14.111328125, -13.25390625, -12.396484375, -11.5390625, -10.681640625, -9.82421875, -8.966796875, -8.109375, -7.251953125, -6.39453125, -5.537109375, -4.6796875, -3.822265625, -2.96484375, -2.107421875, -1.25, -0.392578125, 0.46484375, 1.322265625, 2.1796875, 3.037109375, 3.89453125, 4.751953125, 5.609375, 6.466796875, 7.32421875, 8.181640625, 9.0390625, 9.896484375, 10.75390625, 11.611328125, 12.46875, 13.326171875, 14.18359375, 15.041015625, 15.8984375, 16.755859375, 17.61328125, 18.470703125, 19.328125, 20.185546875, 21.04296875, 21.900390625, 22.7578125, 23.615234375, 24.47265625, 25.330078125, 26.1875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 7.0, 3.0, 9.0, 6.0, 6.0, 14.0, 12.0, 14.0, 23.0, 25.0, 45.0, 59.0, 95.0, 157.0, 282.0, 752.0, 1547.0, 442.0, 207.0, 104.0, 68.0, 44.0, 42.0, 20.0, 17.0, 20.0, 10.0, 5.0, 9.0, 6.0, 4.0, 5.0, 1.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.109375, -8.8179931640625, -8.526611328125, -8.2352294921875, -7.94384765625, -7.6524658203125, -7.361083984375, -7.0697021484375, -6.7783203125, -6.4869384765625, -6.195556640625, -5.9041748046875, -5.61279296875, -5.3214111328125, -5.030029296875, -4.7386474609375, -4.447265625, -4.1558837890625, -3.864501953125, -3.5731201171875, -3.28173828125, -2.9903564453125, -2.698974609375, -2.4075927734375, -2.1162109375, -1.8248291015625, -1.533447265625, -1.2420654296875, -0.95068359375, -0.6593017578125, -0.367919921875, -0.0765380859375, 0.21484375, 0.5062255859375, 0.797607421875, 1.0889892578125, 1.38037109375, 1.6717529296875, 1.963134765625, 2.2545166015625, 2.5458984375, 2.8372802734375, 3.128662109375, 3.4200439453125, 3.71142578125, 4.0028076171875, 4.294189453125, 4.5855712890625, 4.876953125, 5.1683349609375, 5.459716796875, 5.7510986328125, 6.04248046875, 6.3338623046875, 6.625244140625, 6.9166259765625, 7.2080078125, 7.4993896484375, 7.790771484375, 8.0821533203125, 8.37353515625, 8.6649169921875, 8.956298828125, 9.2476806640625, 9.5390625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 18.0, 55.0, 117.0, 226.0, 295.0, 167.0, 73.0, 28.0, 11.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-164.75221252441406, -160.42298889160156, -156.09376525878906, -151.76454162597656, -147.43533325195312, -143.10610961914062, -138.77688598632812, -134.44766235351562, -130.11843872070312, -125.78921508789062, -121.45999145507812, -117.13077545166016, -112.80155181884766, -108.47232818603516, -104.14311218261719, -99.81388854980469, -95.48466491699219, -91.15544128417969, -86.82621765136719, -82.49700164794922, -78.16777801513672, -73.83855438232422, -69.50933837890625, -65.18011474609375, -60.85089111328125, -56.52166748046875, -52.192447662353516, -47.86322784423828, -43.53400421142578, -39.20478057861328, -34.87556076049805, -30.54633903503418, -26.21710205078125, -21.887880325317383, -17.558658599853516, -13.229436874389648, -8.900215148925781, -4.570993423461914, -0.24177169799804688, 4.08745002746582, 8.416671752929688, 12.745893478393555, 17.075115203857422, 21.40433692932129, 25.733558654785156, 30.062780380249023, 34.39200210571289, 38.721221923828125, 43.050445556640625, 47.379669189453125, 51.70888900756836, 56.038108825683594, 60.367332458496094, 64.6965560913086, 69.02577209472656, 73.35499572753906, 77.68421936035156, 82.01344299316406, 86.34266662597656, 90.67188262939453, 95.00110626220703, 99.33032989501953, 103.6595458984375, 107.98876953125, 112.3179931640625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 7.0, 6.0, 22.0, 11.0, 8.0, 11.0, 24.0, 21.0, 38.0, 22.0, 35.0, 28.0, 45.0, 40.0, 34.0, 67.0, 48.0, 55.0, 49.0, 49.0, 46.0, 45.0, 33.0, 41.0, 24.0, 26.0, 30.0, 25.0, 17.0, 16.0, 15.0, 12.0, 7.0, 5.0, 4.0, 3.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.372947692871094, -33.1755256652832, -31.978105545043945, -30.780683517456055, -29.583261489868164, -28.385841369628906, -27.188419342041016, -25.990997314453125, -24.793575286865234, -23.596153259277344, -22.398733139038086, -21.201311111450195, -20.003889083862305, -18.806468963623047, -17.609046936035156, -16.411624908447266, -15.214204788208008, -14.016783714294434, -12.819361686706543, -11.621940612792969, -10.424518585205078, -9.227097511291504, -8.02967643737793, -6.832254409790039, -5.634833335876465, -4.437411785125732, -3.239990472793579, -2.042569160461426, -0.8451476097106934, 0.35227394104003906, 1.5496950149536133, 2.747117042541504, 3.944538116455078, 5.1419596672058105, 6.339381217956543, 7.536802291870117, 8.734224319458008, 9.931645393371582, 11.129066467285156, 12.326488494873047, 13.523909568786621, 14.721330642700195, 15.918752670288086, 17.116172790527344, 18.313594818115234, 19.511016845703125, 20.708438873291016, 21.905860900878906, 23.103281021118164, 24.300703048706055, 25.498123168945312, 26.695545196533203, 27.892967224121094, 29.090389251708984, 30.287809371948242, 31.485231399536133, 32.68265151977539, 33.88007354736328, 35.07749557495117, 36.27491760253906, 37.47233581542969, 38.66975784301758, 39.86717987060547, 41.06460189819336, 42.26202392578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 11.0, 14.0, 19.0, 43.0, 101.0, 159.0, 293.0, 663.0, 1550.0, 3993.0, 13255.0, 56859.0, 317737.0, 518581.0, 103848.0, 21572.0, 5960.0, 2096.0, 898.0, 407.0, 201.0, 120.0, 57.0, 36.0, 22.0, 20.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.132080078125, -15.40478515625, -14.677490234375, -13.9501953125, -13.222900390625, -12.49560546875, -11.768310546875, -11.041015625, -10.313720703125, -9.58642578125, -8.859130859375, -8.1318359375, -7.404541015625, -6.67724609375, -5.949951171875, -5.22265625, -4.495361328125, -3.76806640625, -3.040771484375, -2.3134765625, -1.586181640625, -0.85888671875, -0.131591796875, 0.595703125, 1.322998046875, 2.05029296875, 2.777587890625, 3.5048828125, 4.232177734375, 4.95947265625, 5.686767578125, 6.4140625, 7.141357421875, 7.86865234375, 8.595947265625, 9.3232421875, 10.050537109375, 10.77783203125, 11.505126953125, 12.232421875, 12.959716796875, 13.68701171875, 14.414306640625, 15.1416015625, 15.868896484375, 16.59619140625, 17.323486328125, 18.05078125, 18.778076171875, 19.50537109375, 20.232666015625, 20.9599609375, 21.687255859375, 22.41455078125, 23.141845703125, 23.869140625, 24.596435546875, 25.32373046875, 26.051025390625, 26.7783203125, 27.505615234375, 28.23291015625, 28.960205078125, 29.6875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 11.0, 1.0, 9.0, 9.0, 9.0, 15.0, 16.0, 13.0, 17.0, 17.0, 21.0, 24.0, 24.0, 40.0, 38.0, 35.0, 31.0, 35.0, 39.0, 50.0, 44.0, 44.0, 50.0, 46.0, 42.0, 49.0, 37.0, 42.0, 21.0, 31.0, 36.0, 20.0, 14.0, 7.0, 13.0, 8.0, 11.0, 10.0, 4.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.5, -3.38262939453125, -3.2652587890625, -3.14788818359375, -3.030517578125, -2.91314697265625, -2.7957763671875, -2.67840576171875, -2.56103515625, -2.44366455078125, -2.3262939453125, -2.20892333984375, -2.091552734375, -1.97418212890625, -1.8568115234375, -1.73944091796875, -1.6220703125, -1.50469970703125, -1.3873291015625, -1.26995849609375, -1.152587890625, -1.03521728515625, -0.9178466796875, -0.80047607421875, -0.68310546875, -0.56573486328125, -0.4483642578125, -0.33099365234375, -0.213623046875, -0.09625244140625, 0.0211181640625, 0.13848876953125, 0.255859375, 0.37322998046875, 0.4906005859375, 0.60797119140625, 0.725341796875, 0.84271240234375, 0.9600830078125, 1.07745361328125, 1.19482421875, 1.31219482421875, 1.4295654296875, 1.54693603515625, 1.664306640625, 1.78167724609375, 1.8990478515625, 2.01641845703125, 2.1337890625, 2.25115966796875, 2.3685302734375, 2.48590087890625, 2.603271484375, 2.72064208984375, 2.8380126953125, 2.95538330078125, 3.07275390625, 3.19012451171875, 3.3074951171875, 3.42486572265625, 3.542236328125, 3.65960693359375, 3.7769775390625, 3.89434814453125, 4.01171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 2.0, 15.0, 9.0, 18.0, 24.0, 34.0, 48.0, 74.0, 76.0, 138.0, 168.0, 232.0, 333.0, 506.0, 804.0, 1676.0, 4023.0, 14459.0, 78215.0, 544590.0, 340310.0, 46670.0, 9714.0, 2941.0, 1285.0, 706.0, 434.0, 301.0, 199.0, 161.0, 105.0, 86.0, 65.0, 26.0, 33.0, 23.0, 20.0, 8.0, 11.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.875, -23.1484375, -22.421875, -21.6953125, -20.96875, -20.2421875, -19.515625, -18.7890625, -18.0625, -17.3359375, -16.609375, -15.8828125, -15.15625, -14.4296875, -13.703125, -12.9765625, -12.25, -11.5234375, -10.796875, -10.0703125, -9.34375, -8.6171875, -7.890625, -7.1640625, -6.4375, -5.7109375, -4.984375, -4.2578125, -3.53125, -2.8046875, -2.078125, -1.3515625, -0.625, 0.1015625, 0.828125, 1.5546875, 2.28125, 3.0078125, 3.734375, 4.4609375, 5.1875, 5.9140625, 6.640625, 7.3671875, 8.09375, 8.8203125, 9.546875, 10.2734375, 11.0, 11.7265625, 12.453125, 13.1796875, 13.90625, 14.6328125, 15.359375, 16.0859375, 16.8125, 17.5390625, 18.265625, 18.9921875, 19.71875, 20.4453125, 21.171875, 21.8984375, 22.625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 6.0, 3.0, 9.0, 8.0, 9.0, 20.0, 25.0, 29.0, 31.0, 34.0, 39.0, 43.0, 42.0, 37.0, 45.0, 55.0, 54.0, 44.0, 58.0, 41.0, 50.0, 44.0, 45.0, 31.0, 34.0, 31.0, 22.0, 18.0, 24.0, 16.0, 12.0, 5.0, 7.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.618408203125, -18.95556640625, -18.292724609375, -17.6298828125, -16.967041015625, -16.30419921875, -15.641357421875, -14.978515625, -14.315673828125, -13.65283203125, -12.989990234375, -12.3271484375, -11.664306640625, -11.00146484375, -10.338623046875, -9.67578125, -9.012939453125, -8.35009765625, -7.687255859375, -7.0244140625, -6.361572265625, -5.69873046875, -5.035888671875, -4.373046875, -3.710205078125, -3.04736328125, -2.384521484375, -1.7216796875, -1.058837890625, -0.39599609375, 0.266845703125, 0.9296875, 1.592529296875, 2.25537109375, 2.918212890625, 3.5810546875, 4.243896484375, 4.90673828125, 5.569580078125, 6.232421875, 6.895263671875, 7.55810546875, 8.220947265625, 8.8837890625, 9.546630859375, 10.20947265625, 10.872314453125, 11.53515625, 12.197998046875, 12.86083984375, 13.523681640625, 14.1865234375, 14.849365234375, 15.51220703125, 16.175048828125, 16.837890625, 17.500732421875, 18.16357421875, 18.826416015625, 19.4892578125, 20.152099609375, 20.81494140625, 21.477783203125, 22.140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 1.0, 12.0, 12.0, 13.0, 18.0, 33.0, 43.0, 62.0, 93.0, 170.0, 277.0, 505.0, 1107.0, 2300.0, 6077.0, 23196.0, 194566.0, 722909.0, 75817.0, 13496.0, 4318.0, 1665.0, 818.0, 422.0, 221.0, 135.0, 80.0, 57.0, 41.0, 16.0, 22.0, 8.0, 8.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.609375, -17.064453125, -16.51953125, -15.974609375, -15.4296875, -14.884765625, -14.33984375, -13.794921875, -13.25, -12.705078125, -12.16015625, -11.615234375, -11.0703125, -10.525390625, -9.98046875, -9.435546875, -8.890625, -8.345703125, -7.80078125, -7.255859375, -6.7109375, -6.166015625, -5.62109375, -5.076171875, -4.53125, -3.986328125, -3.44140625, -2.896484375, -2.3515625, -1.806640625, -1.26171875, -0.716796875, -0.171875, 0.373046875, 0.91796875, 1.462890625, 2.0078125, 2.552734375, 3.09765625, 3.642578125, 4.1875, 4.732421875, 5.27734375, 5.822265625, 6.3671875, 6.912109375, 7.45703125, 8.001953125, 8.546875, 9.091796875, 9.63671875, 10.181640625, 10.7265625, 11.271484375, 11.81640625, 12.361328125, 12.90625, 13.451171875, 13.99609375, 14.541015625, 15.0859375, 15.630859375, 16.17578125, 16.720703125, 17.265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 13.0, 10.0, 18.0, 39.0, 66.0, 92.0, 140.0, 188.0, 155.0, 99.0, 53.0, 45.0, 27.0, 15.0, 9.0, 10.0, 2.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00209808349609375, -0.001984834671020508, -0.0018715858459472656, -0.0017583370208740234, -0.0016450881958007812, -0.001531839370727539, -0.0014185905456542969, -0.0013053417205810547, -0.0011920928955078125, -0.0010788440704345703, -0.0009655952453613281, -0.0008523464202880859, -0.0007390975952148438, -0.0006258487701416016, -0.0005125999450683594, -0.0003993511199951172, -0.000286102294921875, -0.0001728534698486328, -5.9604644775390625e-05, 5.364418029785156e-05, 0.00016689300537109375, 0.00028014183044433594, 0.0003933906555175781, 0.0005066394805908203, 0.0006198883056640625, 0.0007331371307373047, 0.0008463859558105469, 0.0009596347808837891, 0.0010728836059570312, 0.0011861324310302734, 0.0012993812561035156, 0.0014126300811767578, 0.00152587890625, 0.0016391277313232422, 0.0017523765563964844, 0.0018656253814697266, 0.0019788742065429688, 0.002092123031616211, 0.002205371856689453, 0.0023186206817626953, 0.0024318695068359375, 0.0025451183319091797, 0.002658367156982422, 0.002771615982055664, 0.0028848648071289062, 0.0029981136322021484, 0.0031113624572753906, 0.003224611282348633, 0.003337860107421875, 0.003451108932495117, 0.0035643577575683594, 0.0036776065826416016, 0.0037908554077148438, 0.003904104232788086, 0.004017353057861328, 0.00413060188293457, 0.0042438507080078125, 0.004357099533081055, 0.004470348358154297, 0.004583597183227539, 0.004696846008300781, 0.0048100948333740234, 0.004923343658447266, 0.005036592483520508, 0.00514984130859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 5.0, 11.0, 11.0, 8.0, 22.0, 32.0, 32.0, 40.0, 105.0, 128.0, 193.0, 400.0, 959.0, 2597.0, 10687.0, 106468.0, 863205.0, 52390.0, 7526.0, 2094.0, 739.0, 332.0, 200.0, 121.0, 63.0, 52.0, 38.0, 26.0, 24.0, 8.0, 10.0, 5.0, 9.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.5, -23.666259765625, -22.83251953125, -21.998779296875, -21.1650390625, -20.331298828125, -19.49755859375, -18.663818359375, -17.830078125, -16.996337890625, -16.16259765625, -15.328857421875, -14.4951171875, -13.661376953125, -12.82763671875, -11.993896484375, -11.16015625, -10.326416015625, -9.49267578125, -8.658935546875, -7.8251953125, -6.991455078125, -6.15771484375, -5.323974609375, -4.490234375, -3.656494140625, -2.82275390625, -1.989013671875, -1.1552734375, -0.321533203125, 0.51220703125, 1.345947265625, 2.1796875, 3.013427734375, 3.84716796875, 4.680908203125, 5.5146484375, 6.348388671875, 7.18212890625, 8.015869140625, 8.849609375, 9.683349609375, 10.51708984375, 11.350830078125, 12.1845703125, 13.018310546875, 13.85205078125, 14.685791015625, 15.51953125, 16.353271484375, 17.18701171875, 18.020751953125, 18.8544921875, 19.688232421875, 20.52197265625, 21.355712890625, 22.189453125, 23.023193359375, 23.85693359375, 24.690673828125, 25.5244140625, 26.358154296875, 27.19189453125, 28.025634765625, 28.859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 10.0, 10.0, 12.0, 17.0, 26.0, 48.0, 59.0, 99.0, 126.0, 184.0, 137.0, 99.0, 47.0, 39.0, 19.0, 13.0, 20.0, 8.0, 4.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.2269287109375, -19.656982421875, -19.0870361328125, -18.51708984375, -17.9471435546875, -17.377197265625, -16.8072509765625, -16.2373046875, -15.6673583984375, -15.097412109375, -14.5274658203125, -13.95751953125, -13.3875732421875, -12.817626953125, -12.2476806640625, -11.677734375, -11.1077880859375, -10.537841796875, -9.9678955078125, -9.39794921875, -8.8280029296875, -8.258056640625, -7.6881103515625, -7.1181640625, -6.5482177734375, -5.978271484375, -5.4083251953125, -4.83837890625, -4.2684326171875, -3.698486328125, -3.1285400390625, -2.55859375, -1.9886474609375, -1.418701171875, -0.8487548828125, -0.27880859375, 0.2911376953125, 0.861083984375, 1.4310302734375, 2.0009765625, 2.5709228515625, 3.140869140625, 3.7108154296875, 4.28076171875, 4.8507080078125, 5.420654296875, 5.9906005859375, 6.560546875, 7.1304931640625, 7.700439453125, 8.2703857421875, 8.84033203125, 9.4102783203125, 9.980224609375, 10.5501708984375, 11.1201171875, 11.6900634765625, 12.260009765625, 12.8299560546875, 13.39990234375, 13.9698486328125, 14.539794921875, 15.1097412109375, 15.6796875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 22.0, 104.0, 273.0, 354.0, 173.0, 50.0, 12.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-504.19976806640625, -490.9960632324219, -477.7923278808594, -464.588623046875, -451.3849182128906, -438.1811828613281, -424.97747802734375, -411.77374267578125, -398.5700378417969, -385.3663330078125, -372.16259765625, -358.9588928222656, -345.75518798828125, -332.55145263671875, -319.3477478027344, -306.14404296875, -292.9403076171875, -279.7366027832031, -266.5328674316406, -253.32916259765625, -240.1254425048828, -226.92172241210938, -213.718017578125, -200.51429748535156, -187.31060791015625, -174.1068878173828, -160.90318298339844, -147.699462890625, -134.49574279785156, -121.29203033447266, -108.08831787109375, -94.88459777832031, -81.68087768554688, -68.47716522216797, -55.27344512939453, -42.069732666015625, -28.866016387939453, -15.662300109863281, -2.458587646484375, 10.745132446289062, 23.94884490966797, 37.15256118774414, 50.35627746582031, 63.55998992919922, 76.76370239257812, 89.96742248535156, 103.17113494873047, 116.3748550415039, 129.5785675048828, 142.78228759765625, 155.98599243164062, 169.18971252441406, 182.3934326171875, 195.59713745117188, 208.8008575439453, 222.00457763671875, 235.20828247070312, 248.41200256347656, 261.61572265625, 274.8194274902344, 288.02313232421875, 301.22686767578125, 314.4305725097656, 327.63427734375, 340.8380126953125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 8.0, 9.0, 14.0, 12.0, 17.0, 10.0, 20.0, 32.0, 28.0, 30.0, 35.0, 36.0, 36.0, 44.0, 43.0, 48.0, 46.0, 45.0, 47.0, 50.0, 47.0, 49.0, 33.0, 34.0, 42.0, 36.0, 26.0, 25.0, 22.0, 15.0, 13.0, 6.0, 11.0, 12.0, 11.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-117.52378845214844, -114.04743957519531, -110.57109832763672, -107.09475708007812, -103.618408203125, -100.14205932617188, -96.66571807861328, -93.18937683105469, -89.71302795410156, -86.23667907714844, -82.76033782958984, -79.28399658203125, -75.80764770507812, -72.331298828125, -68.8549575805664, -65.37861633300781, -61.90226745605469, -58.42592239379883, -54.94957733154297, -51.47323226928711, -47.99688720703125, -44.52054214477539, -41.04419708251953, -37.56785202026367, -34.09150695800781, -30.615161895751953, -27.138816833496094, -23.662471771240234, -20.186126708984375, -16.709781646728516, -13.233436584472656, -9.757091522216797, -6.2807464599609375, -2.804401397705078, 0.6719436645507812, 4.148288726806641, 7.6246337890625, 11.10097885131836, 14.577323913574219, 18.053668975830078, 21.530014038085938, 25.006359100341797, 28.482704162597656, 31.959049224853516, 35.435394287109375, 38.911739349365234, 42.388084411621094, 45.86442947387695, 49.34077453613281, 52.81711959838867, 56.29346466064453, 59.76980972290039, 63.24615478515625, 66.72250366210938, 70.19884490966797, 73.67518615722656, 77.15153503417969, 80.62788391113281, 84.1042251586914, 87.58056640625, 91.05691528320312, 94.53326416015625, 98.00960540771484, 101.48594665527344, 104.96229553222656]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 9.0, 14.0, 15.0, 39.0, 27.0, 54.0, 79.0, 117.0, 187.0, 362.0, 616.0, 1186.0, 2414.0, 6418.0, 72820.0, 4087851.0, 14794.0, 3741.0, 1602.0, 827.0, 414.0, 222.0, 152.0, 82.0, 57.0, 46.0, 30.0, 19.0, 15.0, 14.0, 15.0, 10.0, 2.0, 5.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.85400390625, -32.4580078125, -31.06201171875, -29.666015625, -28.27001953125, -26.8740234375, -25.47802734375, -24.08203125, -22.68603515625, -21.2900390625, -19.89404296875, -18.498046875, -17.10205078125, -15.7060546875, -14.31005859375, -12.9140625, -11.51806640625, -10.1220703125, -8.72607421875, -7.330078125, -5.93408203125, -4.5380859375, -3.14208984375, -1.74609375, -0.35009765625, 1.0458984375, 2.44189453125, 3.837890625, 5.23388671875, 6.6298828125, 8.02587890625, 9.421875, 10.81787109375, 12.2138671875, 13.60986328125, 15.005859375, 16.40185546875, 17.7978515625, 19.19384765625, 20.58984375, 21.98583984375, 23.3818359375, 24.77783203125, 26.173828125, 27.56982421875, 28.9658203125, 30.36181640625, 31.7578125, 33.15380859375, 34.5498046875, 35.94580078125, 37.341796875, 38.73779296875, 40.1337890625, 41.52978515625, 42.92578125, 44.32177734375, 45.7177734375, 47.11376953125, 48.509765625, 49.90576171875, 51.3017578125, 52.69775390625, 54.09375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 11.0, 14.0, 15.0, 14.0, 18.0, 34.0, 29.0, 32.0, 31.0, 45.0, 34.0, 47.0, 49.0, 47.0, 48.0, 42.0, 44.0, 47.0, 51.0, 41.0, 45.0, 33.0, 40.0, 31.0, 31.0, 25.0, 18.0, 11.0, 4.0, 7.0, 10.0, 9.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.401123046875, -4.25537109375, -4.109619140625, -3.9638671875, -3.818115234375, -3.67236328125, -3.526611328125, -3.380859375, -3.235107421875, -3.08935546875, -2.943603515625, -2.7978515625, -2.652099609375, -2.50634765625, -2.360595703125, -2.21484375, -2.069091796875, -1.92333984375, -1.777587890625, -1.6318359375, -1.486083984375, -1.34033203125, -1.194580078125, -1.048828125, -0.903076171875, -0.75732421875, -0.611572265625, -0.4658203125, -0.320068359375, -0.17431640625, -0.028564453125, 0.1171875, 0.262939453125, 0.40869140625, 0.554443359375, 0.7001953125, 0.845947265625, 0.99169921875, 1.137451171875, 1.283203125, 1.428955078125, 1.57470703125, 1.720458984375, 1.8662109375, 2.011962890625, 2.15771484375, 2.303466796875, 2.44921875, 2.594970703125, 2.74072265625, 2.886474609375, 3.0322265625, 3.177978515625, 3.32373046875, 3.469482421875, 3.615234375, 3.760986328125, 3.90673828125, 4.052490234375, 4.1982421875, 4.343994140625, 4.48974609375, 4.635498046875, 4.78125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 9.0, 15.0, 15.0, 31.0, 33.0, 66.0, 185.0, 408.0, 1262.0, 4735.0, 44119.0, 4119980.0, 18872.0, 3049.0, 884.0, 286.0, 110.0, 70.0, 52.0, 36.0, 22.0, 14.0, 13.0, 9.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.71875, -45.58447265625, -43.4501953125, -41.31591796875, -39.181640625, -37.04736328125, -34.9130859375, -32.77880859375, -30.64453125, -28.51025390625, -26.3759765625, -24.24169921875, -22.107421875, -19.97314453125, -17.8388671875, -15.70458984375, -13.5703125, -11.43603515625, -9.3017578125, -7.16748046875, -5.033203125, -2.89892578125, -0.7646484375, 1.36962890625, 3.50390625, 5.63818359375, 7.7724609375, 9.90673828125, 12.041015625, 14.17529296875, 16.3095703125, 18.44384765625, 20.578125, 22.71240234375, 24.8466796875, 26.98095703125, 29.115234375, 31.24951171875, 33.3837890625, 35.51806640625, 37.65234375, 39.78662109375, 41.9208984375, 44.05517578125, 46.189453125, 48.32373046875, 50.4580078125, 52.59228515625, 54.7265625, 56.86083984375, 58.9951171875, 61.12939453125, 63.263671875, 65.39794921875, 67.5322265625, 69.66650390625, 71.80078125, 73.93505859375, 76.0693359375, 78.20361328125, 80.337890625, 82.47216796875, 84.6064453125, 86.74072265625, 88.875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 5.0, 12.0, 11.0, 14.0, 46.0, 116.0, 3581.0, 207.0, 41.0, 16.0, 14.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.58984375, -5.25384521484375, -4.9178466796875, -4.58184814453125, -4.245849609375, -3.90985107421875, -3.5738525390625, -3.23785400390625, -2.90185546875, -2.56585693359375, -2.2298583984375, -1.89385986328125, -1.557861328125, -1.22186279296875, -0.8858642578125, -0.54986572265625, -0.2138671875, 0.12213134765625, 0.4581298828125, 0.79412841796875, 1.130126953125, 1.46612548828125, 1.8021240234375, 2.13812255859375, 2.47412109375, 2.81011962890625, 3.1461181640625, 3.48211669921875, 3.818115234375, 4.15411376953125, 4.4901123046875, 4.82611083984375, 5.162109375, 5.49810791015625, 5.8341064453125, 6.17010498046875, 6.506103515625, 6.84210205078125, 7.1781005859375, 7.51409912109375, 7.85009765625, 8.18609619140625, 8.5220947265625, 8.85809326171875, 9.194091796875, 9.53009033203125, 9.8660888671875, 10.20208740234375, 10.5380859375, 10.87408447265625, 11.2100830078125, 11.54608154296875, 11.882080078125, 12.21807861328125, 12.5540771484375, 12.89007568359375, 13.22607421875, 13.56207275390625, 13.8980712890625, 14.23406982421875, 14.570068359375, 14.90606689453125, 15.2420654296875, 15.57806396484375, 15.9140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 13.0, 11.0, 37.0, 61.0, 162.0, 201.0, 214.0, 176.0, 80.0, 29.0, 11.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.744178771972656, -59.430084228515625, -58.115989685058594, -56.80189514160156, -55.48780059814453, -54.1737060546875, -52.85961151123047, -51.54551696777344, -50.231422424316406, -48.917327880859375, -47.603233337402344, -46.28913879394531, -44.97504425048828, -43.66094970703125, -42.34685516357422, -41.03276062011719, -39.718666076660156, -38.404571533203125, -37.090476989746094, -35.77638244628906, -34.46228790283203, -33.148193359375, -31.83409881591797, -30.520004272460938, -29.205913543701172, -27.89181900024414, -26.57772445678711, -25.263629913330078, -23.949535369873047, -22.635440826416016, -21.321346282958984, -20.007251739501953, -18.693157196044922, -17.37906265258789, -16.06496810913086, -14.750873565673828, -13.436779022216797, -12.122684478759766, -10.80859088897705, -9.49449634552002, -8.180401802062988, -6.866307258605957, -5.552212715148926, -4.238118648529053, -2.9240241050720215, -1.6099295616149902, -0.2958354949951172, 1.018259048461914, 2.3323535919189453, 3.6464481353759766, 4.960542678833008, 6.274636745452881, 7.588731288909912, 8.902826309204102, 10.216919898986816, 11.531014442443848, 12.845108985900879, 14.15920352935791, 15.473298072814941, 16.787391662597656, 18.101486206054688, 19.41558074951172, 20.72967529296875, 22.04376983642578, 23.357864379882812]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 10.0, 6.0, 7.0, 12.0, 6.0, 14.0, 17.0, 17.0, 16.0, 21.0, 19.0, 30.0, 32.0, 26.0, 40.0, 35.0, 35.0, 40.0, 24.0, 37.0, 41.0, 30.0, 42.0, 42.0, 42.0, 35.0, 28.0, 33.0, 31.0, 33.0, 19.0, 24.0, 23.0, 27.0, 21.0, 9.0, 20.0, 4.0, 8.0, 4.0, 14.0, 6.0, 4.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.126870155334473, -10.776680946350098, -10.426491737365723, -10.076302528381348, -9.726114273071289, -9.375925064086914, -9.025735855102539, -8.675546646118164, -8.325357437133789, -7.975168228149414, -7.624979019165039, -7.274790287017822, -6.924601078033447, -6.574411869049072, -6.2242231369018555, -5.8740339279174805, -5.5238447189331055, -5.1736555099487305, -4.8234663009643555, -4.473277568817139, -4.123088359832764, -3.7728991508483887, -3.4227101802825928, -3.072521209716797, -2.722332000732422, -2.372142791748047, -2.021953821182251, -1.6717647314071655, -1.32157564163208, -0.9713865518569946, -0.6211974620819092, -0.2710084915161133, 0.07917976379394531, 0.42936885356903076, 0.7795579433441162, 1.1297470331192017, 1.479936122894287, 1.8301252126693726, 2.180314302444458, 2.530503273010254, 2.880692481994629, 3.230881690979004, 3.5810706615448, 3.9312596321105957, 4.281448841094971, 4.631638050079346, 4.9818267822265625, 5.3320159912109375, 5.6822052001953125, 6.0323944091796875, 6.3825836181640625, 6.732772350311279, 7.082961559295654, 7.433150768280029, 7.783339500427246, 8.133528709411621, 8.483717918395996, 8.833907127380371, 9.184096336364746, 9.534285545349121, 9.88447380065918, 10.234663009643555, 10.58485221862793, 10.935041427612305, 11.28523063659668]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 2.0, 11.0, 10.0, 18.0, 20.0, 24.0, 42.0, 32.0, 76.0, 75.0, 154.0, 170.0, 312.0, 568.0, 997.0, 1843.0, 4154.0, 8932.0, 21053.0, 52341.0, 136463.0, 300434.0, 297971.0, 133417.0, 51384.0, 20835.0, 8764.0, 3973.0, 1912.0, 992.0, 590.0, 352.0, 198.0, 104.0, 91.0, 58.0, 52.0, 31.0, 24.0, 19.0, 13.0, 11.0, 11.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.7265625, -11.37109375, -11.015625, -10.66015625, -10.3046875, -9.94921875, -9.59375, -9.23828125, -8.8828125, -8.52734375, -8.171875, -7.81640625, -7.4609375, -7.10546875, -6.75, -6.39453125, -6.0390625, -5.68359375, -5.328125, -4.97265625, -4.6171875, -4.26171875, -3.90625, -3.55078125, -3.1953125, -2.83984375, -2.484375, -2.12890625, -1.7734375, -1.41796875, -1.0625, -0.70703125, -0.3515625, 0.00390625, 0.359375, 0.71484375, 1.0703125, 1.42578125, 1.78125, 2.13671875, 2.4921875, 2.84765625, 3.203125, 3.55859375, 3.9140625, 4.26953125, 4.625, 4.98046875, 5.3359375, 5.69140625, 6.046875, 6.40234375, 6.7578125, 7.11328125, 7.46875, 7.82421875, 8.1796875, 8.53515625, 8.890625, 9.24609375, 9.6015625, 9.95703125, 10.3125, 10.66796875, 11.0234375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 9.0, 9.0, 10.0, 14.0, 16.0, 18.0, 21.0, 21.0, 25.0, 32.0, 29.0, 41.0, 36.0, 32.0, 30.0, 43.0, 43.0, 45.0, 36.0, 47.0, 41.0, 34.0, 42.0, 31.0, 28.0, 29.0, 38.0, 34.0, 24.0, 14.0, 19.0, 18.0, 8.0, 11.0, 12.0, 13.0, 4.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.453125, -4.314208984375, -4.17529296875, -4.036376953125, -3.8974609375, -3.758544921875, -3.61962890625, -3.480712890625, -3.341796875, -3.202880859375, -3.06396484375, -2.925048828125, -2.7861328125, -2.647216796875, -2.50830078125, -2.369384765625, -2.23046875, -2.091552734375, -1.95263671875, -1.813720703125, -1.6748046875, -1.535888671875, -1.39697265625, -1.258056640625, -1.119140625, -0.980224609375, -0.84130859375, -0.702392578125, -0.5634765625, -0.424560546875, -0.28564453125, -0.146728515625, -0.0078125, 0.131103515625, 0.27001953125, 0.408935546875, 0.5478515625, 0.686767578125, 0.82568359375, 0.964599609375, 1.103515625, 1.242431640625, 1.38134765625, 1.520263671875, 1.6591796875, 1.798095703125, 1.93701171875, 2.075927734375, 2.21484375, 2.353759765625, 2.49267578125, 2.631591796875, 2.7705078125, 2.909423828125, 3.04833984375, 3.187255859375, 3.326171875, 3.465087890625, 3.60400390625, 3.742919921875, 3.8818359375, 4.020751953125, 4.15966796875, 4.298583984375, 4.4375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 10.0, 10.0, 14.0, 13.0, 29.0, 48.0, 54.0, 74.0, 92.0, 198.0, 285.0, 425.0, 821.0, 1574.0, 5122.0, 37537.0, 568998.0, 399501.0, 26445.0, 4038.0, 1367.0, 752.0, 399.0, 248.0, 160.0, 100.0, 74.0, 59.0, 25.0, 22.0, 22.0, 6.0, 8.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.5625, -32.6015625, -31.640625, -30.6796875, -29.71875, -28.7578125, -27.796875, -26.8359375, -25.875, -24.9140625, -23.953125, -22.9921875, -22.03125, -21.0703125, -20.109375, -19.1484375, -18.1875, -17.2265625, -16.265625, -15.3046875, -14.34375, -13.3828125, -12.421875, -11.4609375, -10.5, -9.5390625, -8.578125, -7.6171875, -6.65625, -5.6953125, -4.734375, -3.7734375, -2.8125, -1.8515625, -0.890625, 0.0703125, 1.03125, 1.9921875, 2.953125, 3.9140625, 4.875, 5.8359375, 6.796875, 7.7578125, 8.71875, 9.6796875, 10.640625, 11.6015625, 12.5625, 13.5234375, 14.484375, 15.4453125, 16.40625, 17.3671875, 18.328125, 19.2890625, 20.25, 21.2109375, 22.171875, 23.1328125, 24.09375, 25.0546875, 26.015625, 26.9765625, 27.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 1.0, 4.0, 4.0, 9.0, 10.0, 14.0, 15.0, 11.0, 10.0, 23.0, 23.0, 28.0, 27.0, 34.0, 37.0, 45.0, 42.0, 48.0, 31.0, 38.0, 56.0, 50.0, 40.0, 33.0, 37.0, 41.0, 24.0, 36.0, 40.0, 31.0, 25.0, 21.0, 17.0, 17.0, 12.0, 8.0, 8.0, 10.0, 5.0, 15.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.359375, -20.656005859375, -19.95263671875, -19.249267578125, -18.5458984375, -17.842529296875, -17.13916015625, -16.435791015625, -15.732421875, -15.029052734375, -14.32568359375, -13.622314453125, -12.9189453125, -12.215576171875, -11.51220703125, -10.808837890625, -10.10546875, -9.402099609375, -8.69873046875, -7.995361328125, -7.2919921875, -6.588623046875, -5.88525390625, -5.181884765625, -4.478515625, -3.775146484375, -3.07177734375, -2.368408203125, -1.6650390625, -0.961669921875, -0.25830078125, 0.445068359375, 1.1484375, 1.851806640625, 2.55517578125, 3.258544921875, 3.9619140625, 4.665283203125, 5.36865234375, 6.072021484375, 6.775390625, 7.478759765625, 8.18212890625, 8.885498046875, 9.5888671875, 10.292236328125, 10.99560546875, 11.698974609375, 12.40234375, 13.105712890625, 13.80908203125, 14.512451171875, 15.2158203125, 15.919189453125, 16.62255859375, 17.325927734375, 18.029296875, 18.732666015625, 19.43603515625, 20.139404296875, 20.8427734375, 21.546142578125, 22.24951171875, 22.952880859375, 23.65625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 20.0, 9.0, 21.0, 20.0, 38.0, 53.0, 87.0, 147.0, 223.0, 375.0, 751.0, 1800.0, 4226.0, 13813.0, 66549.0, 506947.0, 384446.0, 50591.0, 11492.0, 3724.0, 1563.0, 718.0, 385.0, 189.0, 118.0, 89.0, 44.0, 30.0, 21.0, 10.0, 8.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.136474609375, -7.79638671875, -7.456298828125, -7.1162109375, -6.776123046875, -6.43603515625, -6.095947265625, -5.755859375, -5.415771484375, -5.07568359375, -4.735595703125, -4.3955078125, -4.055419921875, -3.71533203125, -3.375244140625, -3.03515625, -2.695068359375, -2.35498046875, -2.014892578125, -1.6748046875, -1.334716796875, -0.99462890625, -0.654541015625, -0.314453125, 0.025634765625, 0.36572265625, 0.705810546875, 1.0458984375, 1.385986328125, 1.72607421875, 2.066162109375, 2.40625, 2.746337890625, 3.08642578125, 3.426513671875, 3.7666015625, 4.106689453125, 4.44677734375, 4.786865234375, 5.126953125, 5.467041015625, 5.80712890625, 6.147216796875, 6.4873046875, 6.827392578125, 7.16748046875, 7.507568359375, 7.84765625, 8.187744140625, 8.52783203125, 8.867919921875, 9.2080078125, 9.548095703125, 9.88818359375, 10.228271484375, 10.568359375, 10.908447265625, 11.24853515625, 11.588623046875, 11.9287109375, 12.268798828125, 12.60888671875, 12.948974609375, 13.2890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 7.0, 12.0, 15.0, 17.0, 29.0, 42.0, 58.0, 87.0, 134.0, 134.0, 129.0, 94.0, 73.0, 45.0, 37.0, 14.0, 20.0, 9.0, 6.0, 5.0, 3.0, 5.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0027446746826171875, -0.0026677846908569336, -0.0025908946990966797, -0.0025140047073364258, -0.002437114715576172, -0.002360224723815918, -0.002283334732055664, -0.00220644474029541, -0.0021295547485351562, -0.0020526647567749023, -0.0019757747650146484, -0.0018988847732543945, -0.0018219947814941406, -0.0017451047897338867, -0.0016682147979736328, -0.001591324806213379, -0.001514434814453125, -0.001437544822692871, -0.0013606548309326172, -0.0012837648391723633, -0.0012068748474121094, -0.0011299848556518555, -0.0010530948638916016, -0.0009762048721313477, -0.0008993148803710938, -0.0008224248886108398, -0.0007455348968505859, -0.000668644905090332, -0.0005917549133300781, -0.0005148649215698242, -0.0004379749298095703, -0.0003610849380493164, -0.0002841949462890625, -0.0002073049545288086, -0.0001304149627685547, -5.352497100830078e-05, 2.3365020751953125e-05, 0.00010025501251220703, 0.00017714500427246094, 0.00025403499603271484, 0.00033092498779296875, 0.00040781497955322266, 0.00048470497131347656, 0.0005615949630737305, 0.0006384849548339844, 0.0007153749465942383, 0.0007922649383544922, 0.0008691549301147461, 0.000946044921875, 0.001022934913635254, 0.0010998249053955078, 0.0011767148971557617, 0.0012536048889160156, 0.0013304948806762695, 0.0014073848724365234, 0.0014842748641967773, 0.0015611648559570312, 0.0016380548477172852, 0.001714944839477539, 0.001791834831237793, 0.0018687248229980469, 0.0019456148147583008, 0.0020225048065185547, 0.0020993947982788086, 0.0021762847900390625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 8.0, 9.0, 10.0, 18.0, 25.0, 17.0, 38.0, 67.0, 74.0, 150.0, 267.0, 517.0, 1158.0, 2782.0, 10275.0, 70520.0, 697499.0, 234529.0, 22523.0, 4760.0, 1626.0, 724.0, 354.0, 218.0, 107.0, 81.0, 46.0, 35.0, 28.0, 22.0, 16.0, 18.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-14.25, -13.8009033203125, -13.351806640625, -12.9027099609375, -12.45361328125, -12.0045166015625, -11.555419921875, -11.1063232421875, -10.6572265625, -10.2081298828125, -9.759033203125, -9.3099365234375, -8.86083984375, -8.4117431640625, -7.962646484375, -7.5135498046875, -7.064453125, -6.6153564453125, -6.166259765625, -5.7171630859375, -5.26806640625, -4.8189697265625, -4.369873046875, -3.9207763671875, -3.4716796875, -3.0225830078125, -2.573486328125, -2.1243896484375, -1.67529296875, -1.2261962890625, -0.777099609375, -0.3280029296875, 0.12109375, 0.5701904296875, 1.019287109375, 1.4683837890625, 1.91748046875, 2.3665771484375, 2.815673828125, 3.2647705078125, 3.7138671875, 4.1629638671875, 4.612060546875, 5.0611572265625, 5.51025390625, 5.9593505859375, 6.408447265625, 6.8575439453125, 7.306640625, 7.7557373046875, 8.204833984375, 8.6539306640625, 9.10302734375, 9.5521240234375, 10.001220703125, 10.4503173828125, 10.8994140625, 11.3485107421875, 11.797607421875, 12.2467041015625, 12.69580078125, 13.1448974609375, 13.593994140625, 14.0430908203125, 14.4921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 6.0, 8.0, 14.0, 11.0, 7.0, 15.0, 27.0, 24.0, 38.0, 53.0, 61.0, 83.0, 102.0, 104.0, 99.0, 76.0, 67.0, 63.0, 26.0, 31.0, 17.0, 18.0, 7.0, 8.0, 8.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.969482421875, -10.64990234375, -10.330322265625, -10.0107421875, -9.691162109375, -9.37158203125, -9.052001953125, -8.732421875, -8.412841796875, -8.09326171875, -7.773681640625, -7.4541015625, -7.134521484375, -6.81494140625, -6.495361328125, -6.17578125, -5.856201171875, -5.53662109375, -5.217041015625, -4.8974609375, -4.577880859375, -4.25830078125, -3.938720703125, -3.619140625, -3.299560546875, -2.97998046875, -2.660400390625, -2.3408203125, -2.021240234375, -1.70166015625, -1.382080078125, -1.0625, -0.742919921875, -0.42333984375, -0.103759765625, 0.2158203125, 0.535400390625, 0.85498046875, 1.174560546875, 1.494140625, 1.813720703125, 2.13330078125, 2.452880859375, 2.7724609375, 3.092041015625, 3.41162109375, 3.731201171875, 4.05078125, 4.370361328125, 4.68994140625, 5.009521484375, 5.3291015625, 5.648681640625, 5.96826171875, 6.287841796875, 6.607421875, 6.927001953125, 7.24658203125, 7.566162109375, 7.8857421875, 8.205322265625, 8.52490234375, 8.844482421875, 9.1640625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 24.0, 86.0, 179.0, 271.0, 204.0, 139.0, 58.0, 18.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-461.7149658203125, -452.2321472167969, -442.7492980957031, -433.2664794921875, -423.78363037109375, -414.3008117675781, -404.8179626464844, -395.33514404296875, -385.852294921875, -376.3694763183594, -366.8866271972656, -357.40380859375, -347.92095947265625, -338.4381408691406, -328.9552917480469, -319.47247314453125, -309.9896545410156, -300.5068359375, -291.02398681640625, -281.5411682128906, -272.0583190917969, -262.57550048828125, -253.09266662597656, -243.60983276367188, -234.1269989013672, -224.6441650390625, -215.1613311767578, -205.67849731445312, -196.1956787109375, -186.71282958984375, -177.23001098632812, -167.74717712402344, -158.26431274414062, -148.78147888183594, -139.29864501953125, -129.81581115722656, -120.3329849243164, -110.85015106201172, -101.36732482910156, -91.88449096679688, -82.40165710449219, -72.9188232421875, -63.43599319458008, -53.953163146972656, -44.47032928466797, -34.98749542236328, -25.50466537475586, -16.021835327148438, -6.53900146484375, 2.9438304901123047, 12.42666244506836, 21.909494400024414, 31.39232635498047, 40.875160217285156, 50.35799026489258, 59.8408203125, 69.32365417480469, 78.80648803710938, 88.28932189941406, 97.77214813232422, 107.2549819946289, 116.7378158569336, 126.22064208984375, 135.70347595214844, 145.18630981445312]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 3.0, 8.0, 10.0, 6.0, 9.0, 15.0, 22.0, 15.0, 24.0, 29.0, 33.0, 39.0, 37.0, 35.0, 40.0, 38.0, 45.0, 55.0, 58.0, 59.0, 50.0, 45.0, 34.0, 35.0, 25.0, 37.0, 31.0, 29.0, 19.0, 17.0, 19.0, 15.0, 11.0, 8.0, 9.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.01101684570312, -120.0135498046875, -116.01608276367188, -112.01861572265625, -108.02114868164062, -104.023681640625, -100.02621459960938, -96.02875518798828, -92.03128814697266, -88.03382110595703, -84.0363540649414, -80.03888702392578, -76.04141998291016, -72.04396057128906, -68.04649353027344, -64.04902648925781, -60.05155563354492, -56.0540885925293, -52.05662155151367, -48.05915832519531, -44.06169128417969, -40.06422424316406, -36.06675720214844, -32.06929016113281, -28.07182502746582, -24.074357986450195, -20.076892852783203, -16.079425811767578, -12.08195972442627, -8.084493637084961, -4.087026596069336, -0.08956146240234375, 3.9079055786132812, 7.90537166595459, 11.902837753295898, 15.900304794311523, 19.897769927978516, 23.89523696899414, 27.892704010009766, 31.890169143676758, 35.88763427734375, 39.885101318359375, 43.882568359375, 47.880035400390625, 51.877498626708984, 55.87496566772461, 59.872432708740234, 63.869895935058594, 67.86737060546875, 71.86483764648438, 75.8623046875, 79.85977172851562, 83.85723876953125, 87.85470581054688, 91.8521728515625, 95.8496322631836, 99.84709930419922, 103.84456634521484, 107.84203338623047, 111.8395004272461, 115.83696746826172, 119.83442687988281, 123.83189392089844, 127.82936096191406, 131.8268280029297]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 12.0, 10.0, 19.0, 31.0, 38.0, 58.0, 111.0, 187.0, 341.0, 866.0, 2171.0, 7764.0, 125956.0, 4038512.0, 13347.0, 2822.0, 1034.0, 440.0, 218.0, 122.0, 74.0, 32.0, 29.0, 29.0, 16.0, 6.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.46875, -32.97998046875, -31.4912109375, -30.00244140625, -28.513671875, -27.02490234375, -25.5361328125, -24.04736328125, -22.55859375, -21.06982421875, -19.5810546875, -18.09228515625, -16.603515625, -15.11474609375, -13.6259765625, -12.13720703125, -10.6484375, -9.15966796875, -7.6708984375, -6.18212890625, -4.693359375, -3.20458984375, -1.7158203125, -0.22705078125, 1.26171875, 2.75048828125, 4.2392578125, 5.72802734375, 7.216796875, 8.70556640625, 10.1943359375, 11.68310546875, 13.171875, 14.66064453125, 16.1494140625, 17.63818359375, 19.126953125, 20.61572265625, 22.1044921875, 23.59326171875, 25.08203125, 26.57080078125, 28.0595703125, 29.54833984375, 31.037109375, 32.52587890625, 34.0146484375, 35.50341796875, 36.9921875, 38.48095703125, 39.9697265625, 41.45849609375, 42.947265625, 44.43603515625, 45.9248046875, 47.41357421875, 48.90234375, 50.39111328125, 51.8798828125, 53.36865234375, 54.857421875, 56.34619140625, 57.8349609375, 59.32373046875, 60.8125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 5.0, 4.0, 7.0, 4.0, 7.0, 6.0, 17.0, 8.0, 15.0, 20.0, 17.0, 17.0, 19.0, 24.0, 26.0, 42.0, 40.0, 35.0, 27.0, 38.0, 50.0, 36.0, 52.0, 54.0, 48.0, 39.0, 37.0, 35.0, 41.0, 35.0, 16.0, 37.0, 16.0, 21.0, 22.0, 10.0, 13.0, 14.0, 9.0, 4.0, 10.0, 3.0, 4.0, 5.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.51580810546875, -4.3714599609375, -4.22711181640625, -4.082763671875, -3.93841552734375, -3.7940673828125, -3.64971923828125, -3.50537109375, -3.36102294921875, -3.2166748046875, -3.07232666015625, -2.927978515625, -2.78363037109375, -2.6392822265625, -2.49493408203125, -2.3505859375, -2.20623779296875, -2.0618896484375, -1.91754150390625, -1.773193359375, -1.62884521484375, -1.4844970703125, -1.34014892578125, -1.19580078125, -1.05145263671875, -0.9071044921875, -0.76275634765625, -0.618408203125, -0.47406005859375, -0.3297119140625, -0.18536376953125, -0.041015625, 0.10333251953125, 0.2476806640625, 0.39202880859375, 0.536376953125, 0.68072509765625, 0.8250732421875, 0.96942138671875, 1.11376953125, 1.25811767578125, 1.4024658203125, 1.54681396484375, 1.691162109375, 1.83551025390625, 1.9798583984375, 2.12420654296875, 2.2685546875, 2.41290283203125, 2.5572509765625, 2.70159912109375, 2.845947265625, 2.99029541015625, 3.1346435546875, 3.27899169921875, 3.42333984375, 3.56768798828125, 3.7120361328125, 3.85638427734375, 4.000732421875, 4.14508056640625, 4.2894287109375, 4.43377685546875, 4.578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 15.0, 17.0, 16.0, 27.0, 37.0, 63.0, 67.0, 86.0, 113.0, 183.0, 291.0, 418.0, 613.0, 948.0, 1612.0, 3074.0, 6764.0, 20253.0, 144601.0, 3941990.0, 50097.0, 12277.0, 4836.0, 2257.0, 1227.0, 751.0, 481.0, 334.0, 239.0, 163.0, 107.0, 87.0, 70.0, 43.0, 33.0, 21.0, 13.0, 12.0, 8.0, 7.0, 2.0, 2.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.359375, -23.580810546875, -22.80224609375, -22.023681640625, -21.2451171875, -20.466552734375, -19.68798828125, -18.909423828125, -18.130859375, -17.352294921875, -16.57373046875, -15.795166015625, -15.0166015625, -14.238037109375, -13.45947265625, -12.680908203125, -11.90234375, -11.123779296875, -10.34521484375, -9.566650390625, -8.7880859375, -8.009521484375, -7.23095703125, -6.452392578125, -5.673828125, -4.895263671875, -4.11669921875, -3.338134765625, -2.5595703125, -1.781005859375, -1.00244140625, -0.223876953125, 0.5546875, 1.333251953125, 2.11181640625, 2.890380859375, 3.6689453125, 4.447509765625, 5.22607421875, 6.004638671875, 6.783203125, 7.561767578125, 8.34033203125, 9.118896484375, 9.8974609375, 10.676025390625, 11.45458984375, 12.233154296875, 13.01171875, 13.790283203125, 14.56884765625, 15.347412109375, 16.1259765625, 16.904541015625, 17.68310546875, 18.461669921875, 19.240234375, 20.018798828125, 20.79736328125, 21.575927734375, 22.3544921875, 23.133056640625, 23.91162109375, 24.690185546875, 25.46875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 7.0, 11.0, 23.0, 25.0, 48.0, 142.0, 3264.0, 348.0, 83.0, 32.0, 23.0, 12.0, 13.0, 4.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.12109375, -5.90777587890625, -5.6944580078125, -5.48114013671875, -5.267822265625, -5.05450439453125, -4.8411865234375, -4.62786865234375, -4.41455078125, -4.20123291015625, -3.9879150390625, -3.77459716796875, -3.561279296875, -3.34796142578125, -3.1346435546875, -2.92132568359375, -2.7080078125, -2.49468994140625, -2.2813720703125, -2.06805419921875, -1.854736328125, -1.64141845703125, -1.4281005859375, -1.21478271484375, -1.00146484375, -0.78814697265625, -0.5748291015625, -0.36151123046875, -0.148193359375, 0.06512451171875, 0.2784423828125, 0.49176025390625, 0.705078125, 0.91839599609375, 1.1317138671875, 1.34503173828125, 1.558349609375, 1.77166748046875, 1.9849853515625, 2.19830322265625, 2.41162109375, 2.62493896484375, 2.8382568359375, 3.05157470703125, 3.264892578125, 3.47821044921875, 3.6915283203125, 3.90484619140625, 4.1181640625, 4.33148193359375, 4.5447998046875, 4.75811767578125, 4.971435546875, 5.18475341796875, 5.3980712890625, 5.61138916015625, 5.82470703125, 6.03802490234375, 6.2513427734375, 6.46466064453125, 6.677978515625, 6.89129638671875, 7.1046142578125, 7.31793212890625, 7.53125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 3.0, 17.0, 24.0, 34.0, 58.0, 108.0, 149.0, 127.0, 169.0, 120.0, 68.0, 51.0, 29.0, 15.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.560340881347656, -23.466367721557617, -22.37239646911621, -21.278423309326172, -20.184452056884766, -19.090478897094727, -17.996505737304688, -16.90253448486328, -15.808561325073242, -14.71458911895752, -13.620616912841797, -12.526643753051758, -11.432671546936035, -10.338699340820312, -9.244726181030273, -8.15075397491455, -7.056781768798828, -5.9628095626831055, -4.868836879730225, -3.774864435195923, -2.680891990661621, -1.5869197845458984, -0.4929471015930176, 0.6010255813598633, 1.694997787475586, 2.7889702320098877, 3.8829426765441895, 4.97691535949707, 6.070887565612793, 7.164859771728516, 8.258832931518555, 9.352805137634277, 10.446773529052734, 11.540745735168457, 12.63471794128418, 13.728691101074219, 14.822663307189941, 15.916635513305664, 17.010608673095703, 18.10457992553711, 19.19855308532715, 20.292526245117188, 21.386497497558594, 22.480470657348633, 23.574443817138672, 24.668415069580078, 25.762388229370117, 26.856361389160156, 27.950332641601562, 29.0443058013916, 30.138277053833008, 31.232250213623047, 32.32622146606445, 33.420196533203125, 34.51416778564453, 35.60813903808594, 36.702110290527344, 37.79608154296875, 38.89005661010742, 39.98402786254883, 41.077999114990234, 42.171974182128906, 43.26594543457031, 44.35991668701172, 45.45389175415039]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 6.0, 8.0, 16.0, 7.0, 8.0, 12.0, 17.0, 17.0, 30.0, 23.0, 28.0, 37.0, 35.0, 44.0, 47.0, 39.0, 47.0, 39.0, 48.0, 49.0, 46.0, 48.0, 44.0, 39.0, 39.0, 33.0, 27.0, 34.0, 16.0, 17.0, 19.0, 16.0, 15.0, 8.0, 8.0, 7.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.37681770324707, -12.932601928710938, -12.488386154174805, -12.044171333312988, -11.599955558776855, -11.155739784240723, -10.711524963378906, -10.267309188842773, -9.82309341430664, -9.378877639770508, -8.934661865234375, -8.490447044372559, -8.046231269836426, -7.602015495300293, -7.157800197601318, -6.713584899902344, -6.269369125366211, -5.825153350830078, -5.3809380531311035, -4.936722755432129, -4.492506980895996, -4.048291206359863, -3.6040759086608887, -3.159860372543335, -2.7156448364257812, -2.2714293003082275, -1.8272137641906738, -1.3829982280731201, -0.9387826919555664, -0.4945671558380127, -0.050351619720458984, 0.3938639163970947, 0.8380794525146484, 1.2822949886322021, 1.7265105247497559, 2.1707260608673096, 2.6149415969848633, 3.059157133102417, 3.5033726692199707, 3.9475882053375244, 4.391803741455078, 4.836019515991211, 5.2802348136901855, 5.72445011138916, 6.168665885925293, 6.612881660461426, 7.0570969581604, 7.501312255859375, 7.945528030395508, 8.38974380493164, 8.833959579467773, 9.27817440032959, 9.722390174865723, 10.166605949401855, 10.610820770263672, 11.055036544799805, 11.499252319335938, 11.94346809387207, 12.387683868408203, 12.83189868927002, 13.276114463806152, 13.720330238342285, 14.164545059204102, 14.608760833740234, 15.052976608276367]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 3.0, 6.0, 16.0, 15.0, 28.0, 34.0, 47.0, 63.0, 98.0, 120.0, 189.0, 314.0, 497.0, 731.0, 1229.0, 2090.0, 3845.0, 7052.0, 13469.0, 27292.0, 58475.0, 129171.0, 246994.0, 268409.0, 152052.0, 69785.0, 32069.0, 15840.0, 7882.0, 4392.0, 2450.0, 1457.0, 863.0, 506.0, 330.0, 239.0, 156.0, 114.0, 74.0, 48.0, 33.0, 19.0, 11.0, 9.0, 14.0, 6.0, 3.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.6640625, -9.3721923828125, -9.080322265625, -8.7884521484375, -8.49658203125, -8.2047119140625, -7.912841796875, -7.6209716796875, -7.3291015625, -7.0372314453125, -6.745361328125, -6.4534912109375, -6.16162109375, -5.8697509765625, -5.577880859375, -5.2860107421875, -4.994140625, -4.7022705078125, -4.410400390625, -4.1185302734375, -3.82666015625, -3.5347900390625, -3.242919921875, -2.9510498046875, -2.6591796875, -2.3673095703125, -2.075439453125, -1.7835693359375, -1.49169921875, -1.1998291015625, -0.907958984375, -0.6160888671875, -0.32421875, -0.0323486328125, 0.259521484375, 0.5513916015625, 0.84326171875, 1.1351318359375, 1.427001953125, 1.7188720703125, 2.0107421875, 2.3026123046875, 2.594482421875, 2.8863525390625, 3.17822265625, 3.4700927734375, 3.761962890625, 4.0538330078125, 4.345703125, 4.6375732421875, 4.929443359375, 5.2213134765625, 5.51318359375, 5.8050537109375, 6.096923828125, 6.3887939453125, 6.6806640625, 6.9725341796875, 7.264404296875, 7.5562744140625, 7.84814453125, 8.1400146484375, 8.431884765625, 8.7237548828125, 9.015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 4.0, 7.0, 7.0, 5.0, 11.0, 12.0, 13.0, 16.0, 22.0, 17.0, 17.0, 23.0, 33.0, 28.0, 45.0, 33.0, 33.0, 40.0, 47.0, 57.0, 52.0, 40.0, 45.0, 37.0, 43.0, 37.0, 30.0, 32.0, 28.0, 34.0, 24.0, 20.0, 14.0, 15.0, 18.0, 8.0, 9.0, 9.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.04296875, -4.881591796875, -4.72021484375, -4.558837890625, -4.3974609375, -4.236083984375, -4.07470703125, -3.913330078125, -3.751953125, -3.590576171875, -3.42919921875, -3.267822265625, -3.1064453125, -2.945068359375, -2.78369140625, -2.622314453125, -2.4609375, -2.299560546875, -2.13818359375, -1.976806640625, -1.8154296875, -1.654052734375, -1.49267578125, -1.331298828125, -1.169921875, -1.008544921875, -0.84716796875, -0.685791015625, -0.5244140625, -0.363037109375, -0.20166015625, -0.040283203125, 0.12109375, 0.282470703125, 0.44384765625, 0.605224609375, 0.7666015625, 0.927978515625, 1.08935546875, 1.250732421875, 1.412109375, 1.573486328125, 1.73486328125, 1.896240234375, 2.0576171875, 2.218994140625, 2.38037109375, 2.541748046875, 2.703125, 2.864501953125, 3.02587890625, 3.187255859375, 3.3486328125, 3.510009765625, 3.67138671875, 3.832763671875, 3.994140625, 4.155517578125, 4.31689453125, 4.478271484375, 4.6396484375, 4.801025390625, 4.96240234375, 5.123779296875, 5.28515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 16.0, 22.0, 23.0, 37.0, 49.0, 85.0, 143.0, 164.0, 301.0, 425.0, 745.0, 1315.0, 3333.0, 15176.0, 214558.0, 747843.0, 52954.0, 6730.0, 2064.0, 952.0, 540.0, 343.0, 249.0, 172.0, 94.0, 57.0, 43.0, 35.0, 15.0, 21.0, 12.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.625, -27.67919921875, -26.7333984375, -25.78759765625, -24.841796875, -23.89599609375, -22.9501953125, -22.00439453125, -21.05859375, -20.11279296875, -19.1669921875, -18.22119140625, -17.275390625, -16.32958984375, -15.3837890625, -14.43798828125, -13.4921875, -12.54638671875, -11.6005859375, -10.65478515625, -9.708984375, -8.76318359375, -7.8173828125, -6.87158203125, -5.92578125, -4.97998046875, -4.0341796875, -3.08837890625, -2.142578125, -1.19677734375, -0.2509765625, 0.69482421875, 1.640625, 2.58642578125, 3.5322265625, 4.47802734375, 5.423828125, 6.36962890625, 7.3154296875, 8.26123046875, 9.20703125, 10.15283203125, 11.0986328125, 12.04443359375, 12.990234375, 13.93603515625, 14.8818359375, 15.82763671875, 16.7734375, 17.71923828125, 18.6650390625, 19.61083984375, 20.556640625, 21.50244140625, 22.4482421875, 23.39404296875, 24.33984375, 25.28564453125, 26.2314453125, 27.17724609375, 28.123046875, 29.06884765625, 30.0146484375, 30.96044921875, 31.90625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 9.0, 11.0, 7.0, 9.0, 11.0, 9.0, 20.0, 33.0, 32.0, 22.0, 21.0, 39.0, 37.0, 48.0, 49.0, 57.0, 43.0, 52.0, 55.0, 58.0, 47.0, 34.0, 39.0, 42.0, 37.0, 17.0, 23.0, 16.0, 22.0, 17.0, 12.0, 17.0, 14.0, 6.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.026611328125, -20.20947265625, -19.392333984375, -18.5751953125, -17.758056640625, -16.94091796875, -16.123779296875, -15.306640625, -14.489501953125, -13.67236328125, -12.855224609375, -12.0380859375, -11.220947265625, -10.40380859375, -9.586669921875, -8.76953125, -7.952392578125, -7.13525390625, -6.318115234375, -5.5009765625, -4.683837890625, -3.86669921875, -3.049560546875, -2.232421875, -1.415283203125, -0.59814453125, 0.218994140625, 1.0361328125, 1.853271484375, 2.67041015625, 3.487548828125, 4.3046875, 5.121826171875, 5.93896484375, 6.756103515625, 7.5732421875, 8.390380859375, 9.20751953125, 10.024658203125, 10.841796875, 11.658935546875, 12.47607421875, 13.293212890625, 14.1103515625, 14.927490234375, 15.74462890625, 16.561767578125, 17.37890625, 18.196044921875, 19.01318359375, 19.830322265625, 20.6474609375, 21.464599609375, 22.28173828125, 23.098876953125, 23.916015625, 24.733154296875, 25.55029296875, 26.367431640625, 27.1845703125, 28.001708984375, 28.81884765625, 29.635986328125, 30.453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 12.0, 9.0, 16.0, 18.0, 25.0, 55.0, 84.0, 124.0, 242.0, 469.0, 1299.0, 4529.0, 32139.0, 665961.0, 321364.0, 17093.0, 3156.0, 987.0, 399.0, 214.0, 102.0, 68.0, 54.0, 33.0, 24.0, 11.0, 10.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.9453125, -14.476318359375, -14.00732421875, -13.538330078125, -13.0693359375, -12.600341796875, -12.13134765625, -11.662353515625, -11.193359375, -10.724365234375, -10.25537109375, -9.786376953125, -9.3173828125, -8.848388671875, -8.37939453125, -7.910400390625, -7.44140625, -6.972412109375, -6.50341796875, -6.034423828125, -5.5654296875, -5.096435546875, -4.62744140625, -4.158447265625, -3.689453125, -3.220458984375, -2.75146484375, -2.282470703125, -1.8134765625, -1.344482421875, -0.87548828125, -0.406494140625, 0.0625, 0.531494140625, 1.00048828125, 1.469482421875, 1.9384765625, 2.407470703125, 2.87646484375, 3.345458984375, 3.814453125, 4.283447265625, 4.75244140625, 5.221435546875, 5.6904296875, 6.159423828125, 6.62841796875, 7.097412109375, 7.56640625, 8.035400390625, 8.50439453125, 8.973388671875, 9.4423828125, 9.911376953125, 10.38037109375, 10.849365234375, 11.318359375, 11.787353515625, 12.25634765625, 12.725341796875, 13.1943359375, 13.663330078125, 14.13232421875, 14.601318359375, 15.0703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 12.0, 5.0, 13.0, 15.0, 15.0, 15.0, 32.0, 33.0, 44.0, 54.0, 54.0, 72.0, 95.0, 103.0, 88.0, 75.0, 60.0, 32.0, 39.0, 33.0, 23.0, 13.0, 15.0, 11.0, 10.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015249252319335938, -0.0014764368534088135, -0.0014279484748840332, -0.001379460096359253, -0.0013309717178344727, -0.0012824833393096924, -0.0012339949607849121, -0.0011855065822601318, -0.0011370182037353516, -0.0010885298252105713, -0.001040041446685791, -0.0009915530681610107, -0.0009430646896362305, -0.0008945763111114502, -0.0008460879325866699, -0.0007975995540618896, -0.0007491111755371094, -0.0007006227970123291, -0.0006521344184875488, -0.0006036460399627686, -0.0005551576614379883, -0.000506669282913208, -0.00045818090438842773, -0.00040969252586364746, -0.0003612041473388672, -0.0003127157688140869, -0.00026422739028930664, -0.00021573901176452637, -0.0001672506332397461, -0.00011876225471496582, -7.027387619018555e-05, -2.1785497665405273e-05, 2.6702880859375e-05, 7.519125938415527e-05, 0.00012367963790893555, 0.00017216801643371582, 0.0002206563949584961, 0.00026914477348327637, 0.00031763315200805664, 0.0003661215305328369, 0.0004146099090576172, 0.00046309828758239746, 0.0005115866661071777, 0.000560075044631958, 0.0006085634231567383, 0.0006570518016815186, 0.0007055401802062988, 0.0007540285587310791, 0.0008025169372558594, 0.0008510053157806396, 0.0008994936943054199, 0.0009479820728302002, 0.0009964704513549805, 0.0010449588298797607, 0.001093447208404541, 0.0011419355869293213, 0.0011904239654541016, 0.0012389123439788818, 0.0012874007225036621, 0.0013358891010284424, 0.0013843774795532227, 0.001432865858078003, 0.0014813542366027832, 0.0015298426151275635, 0.0015783309936523438]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 17.0, 17.0, 36.0, 72.0, 148.0, 374.0, 1153.0, 4917.0, 82477.0, 925163.0, 29718.0, 3125.0, 798.0, 262.0, 122.0, 69.0, 32.0, 14.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5, -24.779052734375, -24.05810546875, -23.337158203125, -22.6162109375, -21.895263671875, -21.17431640625, -20.453369140625, -19.732421875, -19.011474609375, -18.29052734375, -17.569580078125, -16.8486328125, -16.127685546875, -15.40673828125, -14.685791015625, -13.96484375, -13.243896484375, -12.52294921875, -11.802001953125, -11.0810546875, -10.360107421875, -9.63916015625, -8.918212890625, -8.197265625, -7.476318359375, -6.75537109375, -6.034423828125, -5.3134765625, -4.592529296875, -3.87158203125, -3.150634765625, -2.4296875, -1.708740234375, -0.98779296875, -0.266845703125, 0.4541015625, 1.175048828125, 1.89599609375, 2.616943359375, 3.337890625, 4.058837890625, 4.77978515625, 5.500732421875, 6.2216796875, 6.942626953125, 7.66357421875, 8.384521484375, 9.10546875, 9.826416015625, 10.54736328125, 11.268310546875, 11.9892578125, 12.710205078125, 13.43115234375, 14.152099609375, 14.873046875, 15.593994140625, 16.31494140625, 17.035888671875, 17.7568359375, 18.477783203125, 19.19873046875, 19.919677734375, 20.640625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 5.0, 19.0, 22.0, 36.0, 71.0, 75.0, 108.0, 107.0, 129.0, 114.0, 96.0, 55.0, 50.0, 31.0, 23.0, 13.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.4095458984375, -10.053466796875, -9.6973876953125, -9.34130859375, -8.9852294921875, -8.629150390625, -8.2730712890625, -7.9169921875, -7.5609130859375, -7.204833984375, -6.8487548828125, -6.49267578125, -6.1365966796875, -5.780517578125, -5.4244384765625, -5.068359375, -4.7122802734375, -4.356201171875, -4.0001220703125, -3.64404296875, -3.2879638671875, -2.931884765625, -2.5758056640625, -2.2197265625, -1.8636474609375, -1.507568359375, -1.1514892578125, -0.79541015625, -0.4393310546875, -0.083251953125, 0.2728271484375, 0.62890625, 0.9849853515625, 1.341064453125, 1.6971435546875, 2.05322265625, 2.4093017578125, 2.765380859375, 3.1214599609375, 3.4775390625, 3.8336181640625, 4.189697265625, 4.5457763671875, 4.90185546875, 5.2579345703125, 5.614013671875, 5.9700927734375, 6.326171875, 6.6822509765625, 7.038330078125, 7.3944091796875, 7.75048828125, 8.1065673828125, 8.462646484375, 8.8187255859375, 9.1748046875, 9.5308837890625, 9.886962890625, 10.2430419921875, 10.59912109375, 10.9552001953125, 11.311279296875, 11.6673583984375, 12.0234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 12.0, 17.0, 33.0, 49.0, 63.0, 90.0, 111.0, 130.0, 109.0, 107.0, 86.0, 63.0, 44.0, 19.0, 12.0, 15.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.72756958007812, -106.51575469970703, -102.30393981933594, -98.09213256835938, -93.88031768798828, -89.66850280761719, -85.4566879272461, -81.244873046875, -77.03306579589844, -72.82125091552734, -68.60943603515625, -64.39762878417969, -60.185813903808594, -55.9739990234375, -51.762184143066406, -47.55036926269531, -43.33855438232422, -39.126739501953125, -34.9149284362793, -30.703113555908203, -26.491300582885742, -22.27948760986328, -18.067672729492188, -13.855859756469727, -9.644046783447266, -5.4322333335876465, -1.2204198837280273, 2.99139404296875, 7.203207015991211, 11.415019989013672, 15.626834869384766, 19.838647842407227, 24.050460815429688, 28.26227378845215, 32.47408676147461, 36.6859016418457, 40.89771270751953, 45.109527587890625, 49.32134246826172, 53.53315734863281, 57.74496841430664, 61.956783294677734, 66.16859436035156, 70.38040924072266, 74.59222412109375, 78.80403137207031, 83.01585388183594, 87.2276611328125, 91.4394760131836, 95.65129089355469, 99.86310577392578, 104.07492065429688, 108.28672790527344, 112.49854278564453, 116.71035766601562, 120.92217254638672, 125.13398742675781, 129.34579467773438, 133.5576171875, 137.76942443847656, 141.9812469482422, 146.19305419921875, 150.40487670898438, 154.61668395996094, 158.8284912109375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 16.0, 20.0, 23.0, 35.0, 26.0, 33.0, 38.0, 43.0, 49.0, 66.0, 57.0, 72.0, 56.0, 44.0, 45.0, 77.0, 44.0, 53.0, 32.0, 29.0, 25.0, 22.0, 18.0, 18.0, 7.0, 10.0, 10.0, 4.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-167.992431640625, -163.5846405029297, -159.1768341064453, -154.76904296875, -150.3612518310547, -145.95346069335938, -141.545654296875, -137.1378631591797, -132.73007202148438, -128.32228088378906, -123.91448211669922, -119.50668334960938, -115.09889221191406, -110.69109344482422, -106.28329467773438, -101.87550354003906, -97.46770477294922, -93.05990600585938, -88.65211486816406, -84.24431610107422, -79.8365249633789, -75.42872619628906, -71.02093505859375, -66.6131362915039, -62.20534133911133, -57.79754638671875, -53.38975143432617, -48.981956481933594, -44.57415771484375, -40.16636657714844, -35.758567810058594, -31.350772857666016, -26.942977905273438, -22.53518295288086, -18.12738800048828, -13.71959114074707, -9.311796188354492, -4.904001235961914, -0.4962043762207031, 3.911590576171875, 8.319385528564453, 12.727180480957031, 17.13497543334961, 21.54277229309082, 25.9505672454834, 30.358362197875977, 34.76615905761719, 39.173954010009766, 43.581748962402344, 47.98954391479492, 52.3973388671875, 56.805137634277344, 61.212928771972656, 65.6207275390625, 70.02851867675781, 74.43631744384766, 78.8441162109375, 83.25191497802734, 87.65970611572266, 92.0675048828125, 96.47529602050781, 100.88309478759766, 105.2908935546875, 109.69868469238281, 114.10647583007812]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 4.0, 10.0, 23.0, 26.0, 46.0, 83.0, 132.0, 184.0, 333.0, 645.0, 1491.0, 4406.0, 27482.0, 4132717.0, 20358.0, 3724.0, 1228.0, 577.0, 350.0, 156.0, 120.0, 58.0, 40.0, 26.0, 16.0, 10.0, 6.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.140625, -29.812255859375, -28.48388671875, -27.155517578125, -25.8271484375, -24.498779296875, -23.17041015625, -21.842041015625, -20.513671875, -19.185302734375, -17.85693359375, -16.528564453125, -15.2001953125, -13.871826171875, -12.54345703125, -11.215087890625, -9.88671875, -8.558349609375, -7.22998046875, -5.901611328125, -4.5732421875, -3.244873046875, -1.91650390625, -0.588134765625, 0.740234375, 2.068603515625, 3.39697265625, 4.725341796875, 6.0537109375, 7.382080078125, 8.71044921875, 10.038818359375, 11.3671875, 12.695556640625, 14.02392578125, 15.352294921875, 16.6806640625, 18.009033203125, 19.33740234375, 20.665771484375, 21.994140625, 23.322509765625, 24.65087890625, 25.979248046875, 27.3076171875, 28.635986328125, 29.96435546875, 31.292724609375, 32.62109375, 33.949462890625, 35.27783203125, 36.606201171875, 37.9345703125, 39.262939453125, 40.59130859375, 41.919677734375, 43.248046875, 44.576416015625, 45.90478515625, 47.233154296875, 48.5615234375, 49.889892578125, 51.21826171875, 52.546630859375, 53.875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 16.0, 24.0, 23.0, 27.0, 33.0, 33.0, 52.0, 59.0, 56.0, 78.0, 65.0, 64.0, 61.0, 77.0, 62.0, 51.0, 59.0, 31.0, 26.0, 19.0, 25.0, 16.0, 8.0, 8.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.18438720703125, -9.9234619140625, -9.66253662109375, -9.401611328125, -9.14068603515625, -8.8797607421875, -8.61883544921875, -8.35791015625, -8.09698486328125, -7.8360595703125, -7.57513427734375, -7.314208984375, -7.05328369140625, -6.7923583984375, -6.53143310546875, -6.2705078125, -6.00958251953125, -5.7486572265625, -5.48773193359375, -5.226806640625, -4.96588134765625, -4.7049560546875, -4.44403076171875, -4.18310546875, -3.92218017578125, -3.6612548828125, -3.40032958984375, -3.139404296875, -2.87847900390625, -2.6175537109375, -2.35662841796875, -2.095703125, -1.83477783203125, -1.5738525390625, -1.31292724609375, -1.052001953125, -0.79107666015625, -0.5301513671875, -0.26922607421875, -0.00830078125, 0.25262451171875, 0.5135498046875, 0.77447509765625, 1.035400390625, 1.29632568359375, 1.5572509765625, 1.81817626953125, 2.0791015625, 2.34002685546875, 2.6009521484375, 2.86187744140625, 3.122802734375, 3.38372802734375, 3.6446533203125, 3.90557861328125, 4.16650390625, 4.42742919921875, 4.6883544921875, 4.94927978515625, 5.210205078125, 5.47113037109375, 5.7320556640625, 5.99298095703125, 6.25390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 11.0, 8.0, 9.0, 17.0, 20.0, 30.0, 49.0, 56.0, 67.0, 97.0, 145.0, 243.0, 422.0, 747.0, 1423.0, 3113.0, 8590.0, 46788.0, 4081135.0, 37392.0, 7810.0, 2967.0, 1317.0, 721.0, 407.0, 239.0, 147.0, 96.0, 68.0, 48.0, 33.0, 23.0, 11.0, 6.0, 12.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-35.21875, -34.252685546875, -33.28662109375, -32.320556640625, -31.3544921875, -30.388427734375, -29.42236328125, -28.456298828125, -27.490234375, -26.524169921875, -25.55810546875, -24.592041015625, -23.6259765625, -22.659912109375, -21.69384765625, -20.727783203125, -19.76171875, -18.795654296875, -17.82958984375, -16.863525390625, -15.8974609375, -14.931396484375, -13.96533203125, -12.999267578125, -12.033203125, -11.067138671875, -10.10107421875, -9.135009765625, -8.1689453125, -7.202880859375, -6.23681640625, -5.270751953125, -4.3046875, -3.338623046875, -2.37255859375, -1.406494140625, -0.4404296875, 0.525634765625, 1.49169921875, 2.457763671875, 3.423828125, 4.389892578125, 5.35595703125, 6.322021484375, 7.2880859375, 8.254150390625, 9.22021484375, 10.186279296875, 11.15234375, 12.118408203125, 13.08447265625, 14.050537109375, 15.0166015625, 15.982666015625, 16.94873046875, 17.914794921875, 18.880859375, 19.846923828125, 20.81298828125, 21.779052734375, 22.7451171875, 23.711181640625, 24.67724609375, 25.643310546875, 26.609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 11.0, 9.0, 14.0, 32.0, 71.0, 3314.0, 497.0, 55.0, 25.0, 15.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0390625, -7.808837890625, -7.57861328125, -7.348388671875, -7.1181640625, -6.887939453125, -6.65771484375, -6.427490234375, -6.197265625, -5.967041015625, -5.73681640625, -5.506591796875, -5.2763671875, -5.046142578125, -4.81591796875, -4.585693359375, -4.35546875, -4.125244140625, -3.89501953125, -3.664794921875, -3.4345703125, -3.204345703125, -2.97412109375, -2.743896484375, -2.513671875, -2.283447265625, -2.05322265625, -1.822998046875, -1.5927734375, -1.362548828125, -1.13232421875, -0.902099609375, -0.671875, -0.441650390625, -0.21142578125, 0.018798828125, 0.2490234375, 0.479248046875, 0.70947265625, 0.939697265625, 1.169921875, 1.400146484375, 1.63037109375, 1.860595703125, 2.0908203125, 2.321044921875, 2.55126953125, 2.781494140625, 3.01171875, 3.241943359375, 3.47216796875, 3.702392578125, 3.9326171875, 4.162841796875, 4.39306640625, 4.623291015625, 4.853515625, 5.083740234375, 5.31396484375, 5.544189453125, 5.7744140625, 6.004638671875, 6.23486328125, 6.465087890625, 6.6953125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 18.0, 34.0, 96.0, 173.0, 260.0, 208.0, 115.0, 53.0, 19.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.346656799316406, -44.00086975097656, -42.65507888793945, -41.30929183959961, -39.963504791259766, -38.617713928222656, -37.27192687988281, -35.92613983154297, -34.58034896850586, -33.234561920166016, -31.88877296447754, -30.542984008789062, -29.197195053100586, -27.85140609741211, -26.505619049072266, -25.15983009338379, -23.814043045043945, -22.46825408935547, -21.122467041015625, -19.77667808532715, -18.430889129638672, -17.085102081298828, -15.739313125610352, -14.393524169921875, -13.047736167907715, -11.701948165893555, -10.356159210205078, -9.010371208190918, -7.6645827293396, -6.318794250488281, -4.973006248474121, -3.6272172927856445, -2.2814292907714844, -0.9356409311294556, 0.41014742851257324, 1.7559356689453125, 3.101724147796631, 4.447512626647949, 5.793300628662109, 7.139089584350586, 8.484877586364746, 9.830665588378906, 11.176454544067383, 12.522242546081543, 13.868030548095703, 15.21381950378418, 16.559608459472656, 17.9053955078125, 19.251184463500977, 20.596973419189453, 21.942760467529297, 23.288549423217773, 24.63433837890625, 25.980125427246094, 27.32591438293457, 28.671703338623047, 30.01749038696289, 31.363279342651367, 32.709068298339844, 34.05485534667969, 35.40064239501953, 36.74643325805664, 38.092220306396484, 39.438011169433594, 40.78379821777344]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 13.0, 21.0, 23.0, 15.0, 21.0, 33.0, 20.0, 30.0, 33.0, 33.0, 40.0, 33.0, 44.0, 42.0, 46.0, 61.0, 56.0, 47.0, 46.0, 39.0, 37.0, 40.0, 35.0, 29.0, 23.0, 14.0, 31.0, 11.0, 10.0, 12.0, 10.0, 13.0, 9.0, 4.0, 1.0, 6.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.789824485778809, -9.4209623336792, -9.052099227905273, -8.683237075805664, -8.314373970031738, -7.945511817932129, -7.576649188995361, -7.207786560058594, -6.838924407958984, -6.470061779022217, -6.101199150085449, -5.73233699798584, -5.363474369049072, -4.994611740112305, -4.625749111175537, -4.2568864822387695, -3.888023853302002, -3.5191612243652344, -3.150298833847046, -2.7814362049102783, -2.41257381439209, -2.0437111854553223, -1.6748485565185547, -1.3059861660003662, -0.9371235370635986, -0.5682610273361206, -0.1993984580039978, 0.169464111328125, 0.538326621055603, 0.907189130783081, 1.2760517597198486, 1.644914150238037, 2.0137767791748047, 2.3826394081115723, 2.7515017986297607, 3.1203644275665283, 3.489226818084717, 3.8580894470214844, 4.226952075958252, 4.5958147048950195, 4.964676856994629, 5.3335394859313965, 5.702402114868164, 6.071264266967773, 6.440126895904541, 6.808989524841309, 7.177852153778076, 7.546714782714844, 7.915577411651611, 8.284440040588379, 8.653302192687988, 9.022165298461914, 9.391027450561523, 9.759889602661133, 10.128752708435059, 10.497614860534668, 10.866477966308594, 11.235340118408203, 11.604203224182129, 11.973065376281738, 12.341928482055664, 12.710790634155273, 13.079652786254883, 13.448515892028809, 13.817378044128418]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 2.0, 11.0, 9.0, 35.0, 31.0, 62.0, 86.0, 151.0, 260.0, 469.0, 912.0, 1787.0, 3955.0, 8872.0, 22663.0, 62718.0, 185529.0, 401461.0, 232586.0, 79379.0, 27801.0, 10688.0, 4587.0, 2138.0, 1059.0, 543.0, 317.0, 148.0, 95.0, 72.0, 41.0, 15.0, 18.0, 8.0, 11.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.22509765625, -9.8095703125, -9.39404296875, -8.978515625, -8.56298828125, -8.1474609375, -7.73193359375, -7.31640625, -6.90087890625, -6.4853515625, -6.06982421875, -5.654296875, -5.23876953125, -4.8232421875, -4.40771484375, -3.9921875, -3.57666015625, -3.1611328125, -2.74560546875, -2.330078125, -1.91455078125, -1.4990234375, -1.08349609375, -0.66796875, -0.25244140625, 0.1630859375, 0.57861328125, 0.994140625, 1.40966796875, 1.8251953125, 2.24072265625, 2.65625, 3.07177734375, 3.4873046875, 3.90283203125, 4.318359375, 4.73388671875, 5.1494140625, 5.56494140625, 5.98046875, 6.39599609375, 6.8115234375, 7.22705078125, 7.642578125, 8.05810546875, 8.4736328125, 8.88916015625, 9.3046875, 9.72021484375, 10.1357421875, 10.55126953125, 10.966796875, 11.38232421875, 11.7978515625, 12.21337890625, 12.62890625, 13.04443359375, 13.4599609375, 13.87548828125, 14.291015625, 14.70654296875, 15.1220703125, 15.53759765625, 15.953125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 6.0, 9.0, 24.0, 25.0, 20.0, 33.0, 35.0, 29.0, 51.0, 48.0, 46.0, 62.0, 51.0, 69.0, 62.0, 58.0, 60.0, 39.0, 59.0, 33.0, 36.0, 32.0, 21.0, 15.0, 21.0, 13.0, 5.0, 7.0, 5.0, 9.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.8515625, -9.6187744140625, -9.385986328125, -9.1531982421875, -8.92041015625, -8.6876220703125, -8.454833984375, -8.2220458984375, -7.9892578125, -7.7564697265625, -7.523681640625, -7.2908935546875, -7.05810546875, -6.8253173828125, -6.592529296875, -6.3597412109375, -6.126953125, -5.8941650390625, -5.661376953125, -5.4285888671875, -5.19580078125, -4.9630126953125, -4.730224609375, -4.4974365234375, -4.2646484375, -4.0318603515625, -3.799072265625, -3.5662841796875, -3.33349609375, -3.1007080078125, -2.867919921875, -2.6351318359375, -2.40234375, -2.1695556640625, -1.936767578125, -1.7039794921875, -1.47119140625, -1.2384033203125, -1.005615234375, -0.7728271484375, -0.5400390625, -0.3072509765625, -0.074462890625, 0.1583251953125, 0.39111328125, 0.6239013671875, 0.856689453125, 1.0894775390625, 1.322265625, 1.5550537109375, 1.787841796875, 2.0206298828125, 2.25341796875, 2.4862060546875, 2.718994140625, 2.9517822265625, 3.1845703125, 3.4173583984375, 3.650146484375, 3.8829345703125, 4.11572265625, 4.3485107421875, 4.581298828125, 4.8140869140625, 5.046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 12.0, 11.0, 23.0, 32.0, 38.0, 48.0, 92.0, 124.0, 168.0, 296.0, 477.0, 770.0, 1393.0, 4161.0, 31604.0, 701292.0, 287810.0, 14457.0, 2693.0, 1244.0, 620.0, 400.0, 256.0, 180.0, 118.0, 74.0, 51.0, 32.0, 29.0, 7.0, 13.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.171875, -29.224365234375, -28.27685546875, -27.329345703125, -26.3818359375, -25.434326171875, -24.48681640625, -23.539306640625, -22.591796875, -21.644287109375, -20.69677734375, -19.749267578125, -18.8017578125, -17.854248046875, -16.90673828125, -15.959228515625, -15.01171875, -14.064208984375, -13.11669921875, -12.169189453125, -11.2216796875, -10.274169921875, -9.32666015625, -8.379150390625, -7.431640625, -6.484130859375, -5.53662109375, -4.589111328125, -3.6416015625, -2.694091796875, -1.74658203125, -0.799072265625, 0.1484375, 1.095947265625, 2.04345703125, 2.990966796875, 3.9384765625, 4.885986328125, 5.83349609375, 6.781005859375, 7.728515625, 8.676025390625, 9.62353515625, 10.571044921875, 11.5185546875, 12.466064453125, 13.41357421875, 14.361083984375, 15.30859375, 16.256103515625, 17.20361328125, 18.151123046875, 19.0986328125, 20.046142578125, 20.99365234375, 21.941162109375, 22.888671875, 23.836181640625, 24.78369140625, 25.731201171875, 26.6787109375, 27.626220703125, 28.57373046875, 29.521240234375, 30.46875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 15.0, 13.0, 20.0, 6.0, 16.0, 19.0, 26.0, 32.0, 34.0, 45.0, 52.0, 55.0, 48.0, 55.0, 46.0, 65.0, 50.0, 50.0, 53.0, 45.0, 35.0, 29.0, 38.0, 29.0, 31.0, 19.0, 25.0, 10.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -27.11083984375, -26.2060546875, -25.30126953125, -24.396484375, -23.49169921875, -22.5869140625, -21.68212890625, -20.77734375, -19.87255859375, -18.9677734375, -18.06298828125, -17.158203125, -16.25341796875, -15.3486328125, -14.44384765625, -13.5390625, -12.63427734375, -11.7294921875, -10.82470703125, -9.919921875, -9.01513671875, -8.1103515625, -7.20556640625, -6.30078125, -5.39599609375, -4.4912109375, -3.58642578125, -2.681640625, -1.77685546875, -0.8720703125, 0.03271484375, 0.9375, 1.84228515625, 2.7470703125, 3.65185546875, 4.556640625, 5.46142578125, 6.3662109375, 7.27099609375, 8.17578125, 9.08056640625, 9.9853515625, 10.89013671875, 11.794921875, 12.69970703125, 13.6044921875, 14.50927734375, 15.4140625, 16.31884765625, 17.2236328125, 18.12841796875, 19.033203125, 19.93798828125, 20.8427734375, 21.74755859375, 22.65234375, 23.55712890625, 24.4619140625, 25.36669921875, 26.271484375, 27.17626953125, 28.0810546875, 28.98583984375, 29.890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 7.0, 13.0, 23.0, 15.0, 31.0, 55.0, 56.0, 106.0, 197.0, 409.0, 829.0, 2259.0, 7819.0, 67669.0, 871324.0, 84772.0, 8737.0, 2378.0, 910.0, 381.0, 197.0, 126.0, 59.0, 45.0, 33.0, 25.0, 9.0, 13.0, 11.0, 9.0, 6.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-21.203125, -20.6064453125, -20.009765625, -19.4130859375, -18.81640625, -18.2197265625, -17.623046875, -17.0263671875, -16.4296875, -15.8330078125, -15.236328125, -14.6396484375, -14.04296875, -13.4462890625, -12.849609375, -12.2529296875, -11.65625, -11.0595703125, -10.462890625, -9.8662109375, -9.26953125, -8.6728515625, -8.076171875, -7.4794921875, -6.8828125, -6.2861328125, -5.689453125, -5.0927734375, -4.49609375, -3.8994140625, -3.302734375, -2.7060546875, -2.109375, -1.5126953125, -0.916015625, -0.3193359375, 0.27734375, 0.8740234375, 1.470703125, 2.0673828125, 2.6640625, 3.2607421875, 3.857421875, 4.4541015625, 5.05078125, 5.6474609375, 6.244140625, 6.8408203125, 7.4375, 8.0341796875, 8.630859375, 9.2275390625, 9.82421875, 10.4208984375, 11.017578125, 11.6142578125, 12.2109375, 12.8076171875, 13.404296875, 14.0009765625, 14.59765625, 15.1943359375, 15.791015625, 16.3876953125, 16.984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 14.0, 15.0, 21.0, 36.0, 44.0, 49.0, 103.0, 145.0, 171.0, 129.0, 85.0, 44.0, 34.0, 26.0, 9.0, 16.0, 9.0, 5.0, 7.0, 3.0, 2.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00353240966796875, -0.003422945737838745, -0.0033134818077087402, -0.0032040178775787354, -0.0030945539474487305, -0.0029850900173187256, -0.0028756260871887207, -0.002766162157058716, -0.002656698226928711, -0.002547234296798706, -0.002437770366668701, -0.0023283064365386963, -0.0022188425064086914, -0.0021093785762786865, -0.0019999146461486816, -0.0018904507160186768, -0.0017809867858886719, -0.001671522855758667, -0.0015620589256286621, -0.0014525949954986572, -0.0013431310653686523, -0.0012336671352386475, -0.0011242032051086426, -0.0010147392749786377, -0.0009052753448486328, -0.0007958114147186279, -0.000686347484588623, -0.0005768835544586182, -0.0004674196243286133, -0.0003579556941986084, -0.0002484917640686035, -0.00013902783393859863, -2.956390380859375e-05, 7.990002632141113e-05, 0.00018936395645141602, 0.0002988278865814209, 0.0004082918167114258, 0.0005177557468414307, 0.0006272196769714355, 0.0007366836071014404, 0.0008461475372314453, 0.0009556114673614502, 0.001065075397491455, 0.00117453932762146, 0.0012840032577514648, 0.0013934671878814697, 0.0015029311180114746, 0.0016123950481414795, 0.0017218589782714844, 0.0018313229084014893, 0.0019407868385314941, 0.002050250768661499, 0.002159714698791504, 0.002269178628921509, 0.0023786425590515137, 0.0024881064891815186, 0.0025975704193115234, 0.0027070343494415283, 0.002816498279571533, 0.002925962209701538, 0.003035426139831543, 0.003144890069961548, 0.0032543540000915527, 0.0033638179302215576, 0.0034732818603515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 22.0, 18.0, 28.0, 36.0, 53.0, 107.0, 164.0, 316.0, 777.0, 2232.0, 13773.0, 532749.0, 481361.0, 13255.0, 2223.0, 722.0, 314.0, 147.0, 93.0, 55.0, 29.0, 19.0, 19.0, 10.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-29.328125, -28.575927734375, -27.82373046875, -27.071533203125, -26.3193359375, -25.567138671875, -24.81494140625, -24.062744140625, -23.310546875, -22.558349609375, -21.80615234375, -21.053955078125, -20.3017578125, -19.549560546875, -18.79736328125, -18.045166015625, -17.29296875, -16.540771484375, -15.78857421875, -15.036376953125, -14.2841796875, -13.531982421875, -12.77978515625, -12.027587890625, -11.275390625, -10.523193359375, -9.77099609375, -9.018798828125, -8.2666015625, -7.514404296875, -6.76220703125, -6.010009765625, -5.2578125, -4.505615234375, -3.75341796875, -3.001220703125, -2.2490234375, -1.496826171875, -0.74462890625, 0.007568359375, 0.759765625, 1.511962890625, 2.26416015625, 3.016357421875, 3.7685546875, 4.520751953125, 5.27294921875, 6.025146484375, 6.77734375, 7.529541015625, 8.28173828125, 9.033935546875, 9.7861328125, 10.538330078125, 11.29052734375, 12.042724609375, 12.794921875, 13.547119140625, 14.29931640625, 15.051513671875, 15.8037109375, 16.555908203125, 17.30810546875, 18.060302734375, 18.8125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 4.0, 4.0, 7.0, 7.0, 6.0, 18.0, 22.0, 30.0, 39.0, 57.0, 52.0, 94.0, 88.0, 89.0, 104.0, 90.0, 61.0, 49.0, 50.0, 37.0, 30.0, 10.0, 10.0, 9.0, 6.0, 2.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.524658203125, -7.14306640625, -6.761474609375, -6.3798828125, -5.998291015625, -5.61669921875, -5.235107421875, -4.853515625, -4.471923828125, -4.09033203125, -3.708740234375, -3.3271484375, -2.945556640625, -2.56396484375, -2.182373046875, -1.80078125, -1.419189453125, -1.03759765625, -0.656005859375, -0.2744140625, 0.107177734375, 0.48876953125, 0.870361328125, 1.251953125, 1.633544921875, 2.01513671875, 2.396728515625, 2.7783203125, 3.159912109375, 3.54150390625, 3.923095703125, 4.3046875, 4.686279296875, 5.06787109375, 5.449462890625, 5.8310546875, 6.212646484375, 6.59423828125, 6.975830078125, 7.357421875, 7.739013671875, 8.12060546875, 8.502197265625, 8.8837890625, 9.265380859375, 9.64697265625, 10.028564453125, 10.41015625, 10.791748046875, 11.17333984375, 11.554931640625, 11.9365234375, 12.318115234375, 12.69970703125, 13.081298828125, 13.462890625, 13.844482421875, 14.22607421875, 14.607666015625, 14.9892578125, 15.370849609375, 15.75244140625, 16.134033203125, 16.515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 66.0, 332.0, 445.0, 108.0, 22.0, 12.0, 1.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-358.9692687988281, -341.81597900390625, -324.66265869140625, -307.5093688964844, -290.3560485839844, -273.2027587890625, -256.0494384765625, -238.89614868164062, -221.7428436279297, -204.58953857421875, -187.4362335205078, -170.28292846679688, -153.129638671875, -135.976318359375, -118.82302856445312, -101.66972351074219, -84.51641845703125, -67.36311340332031, -50.20981216430664, -33.05651092529297, -15.903205871582031, 1.2500991821289062, 18.403396606445312, 35.55670166015625, 52.71000671386719, 69.86331176757812, 87.01661682128906, 104.16991424560547, 121.3232192993164, 138.47653198242188, 155.62982177734375, 172.7831268310547, 189.93646240234375, 207.0897674560547, 224.24307250976562, 241.3963623046875, 258.5496826171875, 275.7029724121094, 292.85626220703125, 310.00958251953125, 327.16290283203125, 344.3161926269531, 361.4695129394531, 378.622802734375, 395.776123046875, 412.9294128417969, 430.08270263671875, 447.23602294921875, 464.3893127441406, 481.5426025390625, 498.6959228515625, 515.8492431640625, 533.0025024414062, 550.1558227539062, 567.3091430664062, 584.46240234375, 601.61572265625, 618.76904296875, 635.9223022460938, 653.0756225585938, 670.2289428710938, 687.3822631835938, 704.5355224609375, 721.6888427734375, 738.8421630859375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 4.0, 12.0, 9.0, 21.0, 14.0, 21.0, 25.0, 18.0, 31.0, 41.0, 39.0, 43.0, 37.0, 41.0, 50.0, 48.0, 43.0, 55.0, 54.0, 43.0, 36.0, 39.0, 34.0, 36.0, 30.0, 23.0, 15.0, 29.0, 20.0, 13.0, 15.0, 9.0, 12.0, 8.0, 9.0, 1.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.45306396484375, -92.89010620117188, -89.3271484375, -85.76419830322266, -82.20124053955078, -78.6382827758789, -75.07533264160156, -71.51237487792969, -67.94941711425781, -64.38645935058594, -60.82350540161133, -57.26055145263672, -53.697593688964844, -50.13463592529297, -46.57168197631836, -43.00872802734375, -39.445770263671875, -35.8828125, -32.31985855102539, -28.75690269470215, -25.193946838378906, -21.630990982055664, -18.068035125732422, -14.50507926940918, -10.942123413085938, -7.379167556762695, -3.816211700439453, -0.25325584411621094, 3.3097000122070312, 6.872655868530273, 10.435611724853516, 13.998567581176758, 17.5615234375, 21.124479293823242, 24.687435150146484, 28.250391006469727, 31.81334686279297, 35.376304626464844, 38.93925857543945, 42.50221252441406, 46.06517028808594, 49.62812805175781, 53.19108200073242, 56.75403594970703, 60.316993713378906, 63.87995147705078, 67.44290161132812, 71.005859375, 74.56881713867188, 78.13177490234375, 81.69473266601562, 85.25768280029297, 88.82064056396484, 92.38359832763672, 95.94654846191406, 99.50950622558594, 103.07246398925781, 106.63542175292969, 110.19837951660156, 113.7613296508789, 117.32428741455078, 120.88724517822266, 124.4501953125, 128.01315307617188, 131.57611083984375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 7.0, 14.0, 26.0, 31.0, 41.0, 89.0, 129.0, 224.0, 424.0, 973.0, 2262.0, 6981.0, 60152.0, 4088988.0, 25769.0, 4949.0, 1657.0, 694.0, 354.0, 200.0, 103.0, 71.0, 44.0, 23.0, 19.0, 6.0, 11.0, 17.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -23.85205078125, -22.7353515625, -21.61865234375, -20.501953125, -19.38525390625, -18.2685546875, -17.15185546875, -16.03515625, -14.91845703125, -13.8017578125, -12.68505859375, -11.568359375, -10.45166015625, -9.3349609375, -8.21826171875, -7.1015625, -5.98486328125, -4.8681640625, -3.75146484375, -2.634765625, -1.51806640625, -0.4013671875, 0.71533203125, 1.83203125, 2.94873046875, 4.0654296875, 5.18212890625, 6.298828125, 7.41552734375, 8.5322265625, 9.64892578125, 10.765625, 11.88232421875, 12.9990234375, 14.11572265625, 15.232421875, 16.34912109375, 17.4658203125, 18.58251953125, 19.69921875, 20.81591796875, 21.9326171875, 23.04931640625, 24.166015625, 25.28271484375, 26.3994140625, 27.51611328125, 28.6328125, 29.74951171875, 30.8662109375, 31.98291015625, 33.099609375, 34.21630859375, 35.3330078125, 36.44970703125, 37.56640625, 38.68310546875, 39.7998046875, 40.91650390625, 42.033203125, 43.14990234375, 44.2666015625, 45.38330078125, 46.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 5.0, 7.0, 7.0, 5.0, 12.0, 17.0, 17.0, 24.0, 24.0, 38.0, 29.0, 40.0, 62.0, 41.0, 44.0, 62.0, 55.0, 45.0, 66.0, 50.0, 48.0, 36.0, 45.0, 44.0, 26.0, 31.0, 21.0, 20.0, 11.0, 17.0, 12.0, 10.0, 4.0, 5.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.3359375, -7.13250732421875, -6.9290771484375, -6.72564697265625, -6.522216796875, -6.31878662109375, -6.1153564453125, -5.91192626953125, -5.70849609375, -5.50506591796875, -5.3016357421875, -5.09820556640625, -4.894775390625, -4.69134521484375, -4.4879150390625, -4.28448486328125, -4.0810546875, -3.87762451171875, -3.6741943359375, -3.47076416015625, -3.267333984375, -3.06390380859375, -2.8604736328125, -2.65704345703125, -2.45361328125, -2.25018310546875, -2.0467529296875, -1.84332275390625, -1.639892578125, -1.43646240234375, -1.2330322265625, -1.02960205078125, -0.826171875, -0.62274169921875, -0.4193115234375, -0.21588134765625, -0.012451171875, 0.19097900390625, 0.3944091796875, 0.59783935546875, 0.80126953125, 1.00469970703125, 1.2081298828125, 1.41156005859375, 1.614990234375, 1.81842041015625, 2.0218505859375, 2.22528076171875, 2.4287109375, 2.63214111328125, 2.8355712890625, 3.03900146484375, 3.242431640625, 3.44586181640625, 3.6492919921875, 3.85272216796875, 4.05615234375, 4.25958251953125, 4.4630126953125, 4.66644287109375, 4.869873046875, 5.07330322265625, 5.2767333984375, 5.48016357421875, 5.68359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 11.0, 15.0, 32.0, 42.0, 57.0, 93.0, 163.0, 295.0, 498.0, 853.0, 1857.0, 4715.0, 22272.0, 3834854.0, 306638.0, 14847.0, 3668.0, 1554.0, 740.0, 413.0, 250.0, 143.0, 106.0, 53.0, 46.0, 23.0, 16.0, 10.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -34.240234375, -33.19921875, -32.158203125, -31.1171875, -30.076171875, -29.03515625, -27.994140625, -26.953125, -25.912109375, -24.87109375, -23.830078125, -22.7890625, -21.748046875, -20.70703125, -19.666015625, -18.625, -17.583984375, -16.54296875, -15.501953125, -14.4609375, -13.419921875, -12.37890625, -11.337890625, -10.296875, -9.255859375, -8.21484375, -7.173828125, -6.1328125, -5.091796875, -4.05078125, -3.009765625, -1.96875, -0.927734375, 0.11328125, 1.154296875, 2.1953125, 3.236328125, 4.27734375, 5.318359375, 6.359375, 7.400390625, 8.44140625, 9.482421875, 10.5234375, 11.564453125, 12.60546875, 13.646484375, 14.6875, 15.728515625, 16.76953125, 17.810546875, 18.8515625, 19.892578125, 20.93359375, 21.974609375, 23.015625, 24.056640625, 25.09765625, 26.138671875, 27.1796875, 28.220703125, 29.26171875, 30.302734375, 31.34375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 4.0, 7.0, 11.0, 17.0, 31.0, 66.0, 339.0, 3284.0, 180.0, 63.0, 30.0, 14.0, 10.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8291015625, -12.376953125, -11.9248046875, -11.47265625, -11.0205078125, -10.568359375, -10.1162109375, -9.6640625, -9.2119140625, -8.759765625, -8.3076171875, -7.85546875, -7.4033203125, -6.951171875, -6.4990234375, -6.046875, -5.5947265625, -5.142578125, -4.6904296875, -4.23828125, -3.7861328125, -3.333984375, -2.8818359375, -2.4296875, -1.9775390625, -1.525390625, -1.0732421875, -0.62109375, -0.1689453125, 0.283203125, 0.7353515625, 1.1875, 1.6396484375, 2.091796875, 2.5439453125, 2.99609375, 3.4482421875, 3.900390625, 4.3525390625, 4.8046875, 5.2568359375, 5.708984375, 6.1611328125, 6.61328125, 7.0654296875, 7.517578125, 7.9697265625, 8.421875, 8.8740234375, 9.326171875, 9.7783203125, 10.23046875, 10.6826171875, 11.134765625, 11.5869140625, 12.0390625, 12.4912109375, 12.943359375, 13.3955078125, 13.84765625, 14.2998046875, 14.751953125, 15.2041015625, 15.65625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 11.0, 26.0, 48.0, 74.0, 100.0, 160.0, 157.0, 160.0, 100.0, 68.0, 31.0, 18.0, 13.0, 11.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.750614166259766, -33.03110885620117, -31.31160545349121, -29.59210205078125, -27.872596740722656, -26.153091430664062, -24.4335880279541, -22.71408462524414, -20.994579315185547, -19.275074005126953, -17.555570602416992, -15.836066246032715, -14.116561889648438, -12.39705753326416, -10.677553176879883, -8.958048820495605, -7.238544464111328, -5.519040107727051, -3.7995357513427734, -2.080031394958496, -0.36052703857421875, 1.3589773178100586, 3.078481674194336, 4.797986030578613, 6.517490386962891, 8.236994743347168, 9.956499099731445, 11.676003456115723, 13.3955078125, 15.115012168884277, 16.834516525268555, 18.554019927978516, 20.273529052734375, 21.99303436279297, 23.71253776550293, 25.43204116821289, 27.151546478271484, 28.871051788330078, 30.59055519104004, 32.31005859375, 34.029563903808594, 35.74906921386719, 37.46857452392578, 39.18807601928711, 40.9075813293457, 42.6270866394043, 44.346588134765625, 46.06609344482422, 47.78559875488281, 49.505104064941406, 51.224609375, 52.94411087036133, 54.66361618041992, 56.383121490478516, 58.102622985839844, 59.82212829589844, 61.54163360595703, 63.261138916015625, 64.98064422607422, 66.70014953613281, 68.41964721679688, 70.13915252685547, 71.85865783691406, 73.57816314697266, 75.29766845703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 11.0, 14.0, 14.0, 13.0, 18.0, 20.0, 38.0, 38.0, 55.0, 53.0, 48.0, 64.0, 51.0, 55.0, 54.0, 60.0, 56.0, 60.0, 48.0, 35.0, 46.0, 24.0, 28.0, 23.0, 22.0, 23.0, 10.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-40.79376983642578, -39.87073516845703, -38.947696685791016, -38.024658203125, -37.10162353515625, -36.1785888671875, -35.255550384521484, -34.33251190185547, -33.40947723388672, -32.48644256591797, -31.563404083251953, -30.64036750793457, -29.717330932617188, -28.794294357299805, -27.871257781982422, -26.94822120666504, -26.025184631347656, -25.102148056030273, -24.17911148071289, -23.256074905395508, -22.333038330078125, -21.410001754760742, -20.48696517944336, -19.563928604125977, -18.640892028808594, -17.71785545349121, -16.794818878173828, -15.871782302856445, -14.948745727539062, -14.02570915222168, -13.102672576904297, -12.179636001586914, -11.256601333618164, -10.333564758300781, -9.410528182983398, -8.487491607666016, -7.564455032348633, -6.64141845703125, -5.718381881713867, -4.795345306396484, -3.8723087310791016, -2.9492721557617188, -2.026235580444336, -1.1031990051269531, -0.1801624298095703, 0.7428741455078125, 1.6659107208251953, 2.588947296142578, 3.511983871459961, 4.435020446777344, 5.358057022094727, 6.281093597412109, 7.204130172729492, 8.127166748046875, 9.050203323364258, 9.97323989868164, 10.896276473999023, 11.819313049316406, 12.742349624633789, 13.665386199951172, 14.588422775268555, 15.511459350585938, 16.43449592590332, 17.357532501220703, 18.280569076538086]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 7.0, 7.0, 7.0, 11.0, 14.0, 26.0, 32.0, 26.0, 47.0, 69.0, 95.0, 139.0, 228.0, 387.0, 575.0, 1018.0, 1723.0, 3120.0, 6090.0, 11676.0, 25310.0, 56214.0, 130951.0, 303428.0, 286269.0, 121184.0, 52501.0, 23595.0, 11009.0, 5618.0, 2918.0, 1637.0, 951.0, 561.0, 377.0, 227.0, 147.0, 115.0, 73.0, 46.0, 39.0, 24.0, 20.0, 17.0, 10.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.859375, -9.5067138671875, -9.154052734375, -8.8013916015625, -8.44873046875, -8.0960693359375, -7.743408203125, -7.3907470703125, -7.0380859375, -6.6854248046875, -6.332763671875, -5.9801025390625, -5.62744140625, -5.2747802734375, -4.922119140625, -4.5694580078125, -4.216796875, -3.8641357421875, -3.511474609375, -3.1588134765625, -2.80615234375, -2.4534912109375, -2.100830078125, -1.7481689453125, -1.3955078125, -1.0428466796875, -0.690185546875, -0.3375244140625, 0.01513671875, 0.3677978515625, 0.720458984375, 1.0731201171875, 1.42578125, 1.7784423828125, 2.131103515625, 2.4837646484375, 2.83642578125, 3.1890869140625, 3.541748046875, 3.8944091796875, 4.2470703125, 4.5997314453125, 4.952392578125, 5.3050537109375, 5.65771484375, 6.0103759765625, 6.363037109375, 6.7156982421875, 7.068359375, 7.4210205078125, 7.773681640625, 8.1263427734375, 8.47900390625, 8.8316650390625, 9.184326171875, 9.5369873046875, 9.8896484375, 10.2423095703125, 10.594970703125, 10.9476318359375, 11.30029296875, 11.6529541015625, 12.005615234375, 12.3582763671875, 12.7109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 8.0, 7.0, 7.0, 10.0, 8.0, 16.0, 20.0, 17.0, 28.0, 30.0, 22.0, 31.0, 48.0, 36.0, 40.0, 48.0, 56.0, 48.0, 59.0, 38.0, 45.0, 51.0, 48.0, 27.0, 27.0, 37.0, 32.0, 20.0, 19.0, 22.0, 16.0, 12.0, 11.0, 10.0, 9.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-7.23828125, -7.04840087890625, -6.8585205078125, -6.66864013671875, -6.478759765625, -6.28887939453125, -6.0989990234375, -5.90911865234375, -5.71923828125, -5.52935791015625, -5.3394775390625, -5.14959716796875, -4.959716796875, -4.76983642578125, -4.5799560546875, -4.39007568359375, -4.2001953125, -4.01031494140625, -3.8204345703125, -3.63055419921875, -3.440673828125, -3.25079345703125, -3.0609130859375, -2.87103271484375, -2.68115234375, -2.49127197265625, -2.3013916015625, -2.11151123046875, -1.921630859375, -1.73175048828125, -1.5418701171875, -1.35198974609375, -1.162109375, -0.97222900390625, -0.7823486328125, -0.59246826171875, -0.402587890625, -0.21270751953125, -0.0228271484375, 0.16705322265625, 0.35693359375, 0.54681396484375, 0.7366943359375, 0.92657470703125, 1.116455078125, 1.30633544921875, 1.4962158203125, 1.68609619140625, 1.8759765625, 2.06585693359375, 2.2557373046875, 2.44561767578125, 2.635498046875, 2.82537841796875, 3.0152587890625, 3.20513916015625, 3.39501953125, 3.58489990234375, 3.7747802734375, 3.96466064453125, 4.154541015625, 4.34442138671875, 4.5343017578125, 4.72418212890625, 4.9140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 10.0, 19.0, 39.0, 47.0, 99.0, 235.0, 503.0, 1305.0, 5082.0, 201065.0, 826197.0, 10802.0, 1894.0, 665.0, 259.0, 143.0, 78.0, 32.0, 23.0, 16.0, 8.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.6875, -69.80859375, -67.9296875, -66.05078125, -64.171875, -62.29296875, -60.4140625, -58.53515625, -56.65625, -54.77734375, -52.8984375, -51.01953125, -49.140625, -47.26171875, -45.3828125, -43.50390625, -41.625, -39.74609375, -37.8671875, -35.98828125, -34.109375, -32.23046875, -30.3515625, -28.47265625, -26.59375, -24.71484375, -22.8359375, -20.95703125, -19.078125, -17.19921875, -15.3203125, -13.44140625, -11.5625, -9.68359375, -7.8046875, -5.92578125, -4.046875, -2.16796875, -0.2890625, 1.58984375, 3.46875, 5.34765625, 7.2265625, 9.10546875, 10.984375, 12.86328125, 14.7421875, 16.62109375, 18.5, 20.37890625, 22.2578125, 24.13671875, 26.015625, 27.89453125, 29.7734375, 31.65234375, 33.53125, 35.41015625, 37.2890625, 39.16796875, 41.046875, 42.92578125, 44.8046875, 46.68359375, 48.5625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 3.0, 10.0, 10.0, 8.0, 14.0, 13.0, 16.0, 27.0, 30.0, 26.0, 29.0, 30.0, 35.0, 36.0, 42.0, 51.0, 41.0, 52.0, 36.0, 52.0, 45.0, 32.0, 44.0, 35.0, 32.0, 33.0, 24.0, 30.0, 17.0, 17.0, 15.0, 25.0, 18.0, 13.0, 12.0, 5.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.0, -22.237548828125, -21.47509765625, -20.712646484375, -19.9501953125, -19.187744140625, -18.42529296875, -17.662841796875, -16.900390625, -16.137939453125, -15.37548828125, -14.613037109375, -13.8505859375, -13.088134765625, -12.32568359375, -11.563232421875, -10.80078125, -10.038330078125, -9.27587890625, -8.513427734375, -7.7509765625, -6.988525390625, -6.22607421875, -5.463623046875, -4.701171875, -3.938720703125, -3.17626953125, -2.413818359375, -1.6513671875, -0.888916015625, -0.12646484375, 0.635986328125, 1.3984375, 2.160888671875, 2.92333984375, 3.685791015625, 4.4482421875, 5.210693359375, 5.97314453125, 6.735595703125, 7.498046875, 8.260498046875, 9.02294921875, 9.785400390625, 10.5478515625, 11.310302734375, 12.07275390625, 12.835205078125, 13.59765625, 14.360107421875, 15.12255859375, 15.885009765625, 16.6474609375, 17.409912109375, 18.17236328125, 18.934814453125, 19.697265625, 20.459716796875, 21.22216796875, 21.984619140625, 22.7470703125, 23.509521484375, 24.27197265625, 25.034423828125, 25.796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 7.0, 12.0, 16.0, 27.0, 29.0, 27.0, 59.0, 62.0, 89.0, 140.0, 242.0, 355.0, 678.0, 1312.0, 3133.0, 8866.0, 33510.0, 176159.0, 635583.0, 145969.0, 28906.0, 7708.0, 2730.0, 1255.0, 604.0, 362.0, 225.0, 143.0, 91.0, 75.0, 49.0, 32.0, 29.0, 14.0, 16.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.618896484375, -6.38623046875, -6.153564453125, -5.9208984375, -5.688232421875, -5.45556640625, -5.222900390625, -4.990234375, -4.757568359375, -4.52490234375, -4.292236328125, -4.0595703125, -3.826904296875, -3.59423828125, -3.361572265625, -3.12890625, -2.896240234375, -2.66357421875, -2.430908203125, -2.1982421875, -1.965576171875, -1.73291015625, -1.500244140625, -1.267578125, -1.034912109375, -0.80224609375, -0.569580078125, -0.3369140625, -0.104248046875, 0.12841796875, 0.361083984375, 0.59375, 0.826416015625, 1.05908203125, 1.291748046875, 1.5244140625, 1.757080078125, 1.98974609375, 2.222412109375, 2.455078125, 2.687744140625, 2.92041015625, 3.153076171875, 3.3857421875, 3.618408203125, 3.85107421875, 4.083740234375, 4.31640625, 4.549072265625, 4.78173828125, 5.014404296875, 5.2470703125, 5.479736328125, 5.71240234375, 5.945068359375, 6.177734375, 6.410400390625, 6.64306640625, 6.875732421875, 7.1083984375, 7.341064453125, 7.57373046875, 7.806396484375, 8.0390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 5.0, 7.0, 13.0, 7.0, 17.0, 15.0, 20.0, 24.0, 25.0, 22.0, 30.0, 39.0, 59.0, 96.0, 120.0, 107.0, 61.0, 57.0, 45.0, 40.0, 26.0, 25.0, 20.0, 22.0, 14.0, 12.0, 7.0, 10.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0014467239379882812, -0.0013994574546813965, -0.0013521909713745117, -0.001304924488067627, -0.0012576580047607422, -0.0012103915214538574, -0.0011631250381469727, -0.0011158585548400879, -0.0010685920715332031, -0.0010213255882263184, -0.0009740591049194336, -0.0009267926216125488, -0.0008795261383056641, -0.0008322596549987793, -0.0007849931716918945, -0.0007377266883850098, -0.000690460205078125, -0.0006431937217712402, -0.0005959272384643555, -0.0005486607551574707, -0.0005013942718505859, -0.00045412778854370117, -0.0004068613052368164, -0.00035959482192993164, -0.0003123283386230469, -0.0002650618553161621, -0.00021779537200927734, -0.00017052888870239258, -0.0001232624053955078, -7.599592208862305e-05, -2.872943878173828e-05, 1.8537044525146484e-05, 6.580352783203125e-05, 0.00011307001113891602, 0.00016033649444580078, 0.00020760297775268555, 0.0002548694610595703, 0.0003021359443664551, 0.00034940242767333984, 0.0003966689109802246, 0.0004439353942871094, 0.0004912018775939941, 0.0005384683609008789, 0.0005857348442077637, 0.0006330013275146484, 0.0006802678108215332, 0.000727534294128418, 0.0007748007774353027, 0.0008220672607421875, 0.0008693337440490723, 0.000916600227355957, 0.0009638667106628418, 0.0010111331939697266, 0.0010583996772766113, 0.001105666160583496, 0.0011529326438903809, 0.0012001991271972656, 0.0012474656105041504, 0.0012947320938110352, 0.00134199857711792, 0.0013892650604248047, 0.0014365315437316895, 0.0014837980270385742, 0.001531064510345459, 0.0015783309936523438]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 2.0, 12.0, 8.0, 19.0, 28.0, 18.0, 41.0, 61.0, 107.0, 142.0, 213.0, 370.0, 722.0, 1453.0, 3505.0, 11528.0, 60709.0, 520840.0, 386925.0, 46439.0, 9505.0, 3061.0, 1229.0, 651.0, 349.0, 203.0, 132.0, 89.0, 52.0, 40.0, 29.0, 19.0, 8.0, 14.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.32305908203125, -7.0406494140625, -6.75823974609375, -6.475830078125, -6.19342041015625, -5.9110107421875, -5.62860107421875, -5.34619140625, -5.06378173828125, -4.7813720703125, -4.49896240234375, -4.216552734375, -3.93414306640625, -3.6517333984375, -3.36932373046875, -3.0869140625, -2.80450439453125, -2.5220947265625, -2.23968505859375, -1.957275390625, -1.67486572265625, -1.3924560546875, -1.11004638671875, -0.82763671875, -0.54522705078125, -0.2628173828125, 0.01959228515625, 0.302001953125, 0.58441162109375, 0.8668212890625, 1.14923095703125, 1.431640625, 1.71405029296875, 1.9964599609375, 2.27886962890625, 2.561279296875, 2.84368896484375, 3.1260986328125, 3.40850830078125, 3.69091796875, 3.97332763671875, 4.2557373046875, 4.53814697265625, 4.820556640625, 5.10296630859375, 5.3853759765625, 5.66778564453125, 5.9501953125, 6.23260498046875, 6.5150146484375, 6.79742431640625, 7.079833984375, 7.36224365234375, 7.6446533203125, 7.92706298828125, 8.20947265625, 8.49188232421875, 8.7742919921875, 9.05670166015625, 9.339111328125, 9.62152099609375, 9.9039306640625, 10.18634033203125, 10.46875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 3.0, 5.0, 9.0, 13.0, 22.0, 17.0, 19.0, 23.0, 40.0, 56.0, 69.0, 75.0, 82.0, 107.0, 89.0, 64.0, 66.0, 60.0, 52.0, 30.0, 30.0, 12.0, 11.0, 12.0, 6.0, 9.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.390625, -10.11981201171875, -9.8489990234375, -9.57818603515625, -9.307373046875, -9.03656005859375, -8.7657470703125, -8.49493408203125, -8.22412109375, -7.95330810546875, -7.6824951171875, -7.41168212890625, -7.140869140625, -6.87005615234375, -6.5992431640625, -6.32843017578125, -6.0576171875, -5.78680419921875, -5.5159912109375, -5.24517822265625, -4.974365234375, -4.70355224609375, -4.4327392578125, -4.16192626953125, -3.89111328125, -3.62030029296875, -3.3494873046875, -3.07867431640625, -2.807861328125, -2.53704833984375, -2.2662353515625, -1.99542236328125, -1.724609375, -1.45379638671875, -1.1829833984375, -0.91217041015625, -0.641357421875, -0.37054443359375, -0.0997314453125, 0.17108154296875, 0.44189453125, 0.71270751953125, 0.9835205078125, 1.25433349609375, 1.525146484375, 1.79595947265625, 2.0667724609375, 2.33758544921875, 2.6083984375, 2.87921142578125, 3.1500244140625, 3.42083740234375, 3.691650390625, 3.96246337890625, 4.2332763671875, 4.50408935546875, 4.77490234375, 5.04571533203125, 5.3165283203125, 5.58734130859375, 5.858154296875, 6.12896728515625, 6.3997802734375, 6.67059326171875, 6.94140625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 13.0, 6.0, 30.0, 66.0, 130.0, 171.0, 209.0, 158.0, 102.0, 54.0, 28.0, 11.0, 11.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.96824645996094, -137.1471405029297, -130.3260498046875, -123.50494384765625, -116.683837890625, -109.86273956298828, -103.04164123535156, -96.22053527832031, -89.3994369506836, -82.57833862304688, -75.75723266601562, -68.9361343383789, -62.11503219604492, -55.29393005371094, -48.47283172607422, -41.651729583740234, -34.83062744140625, -28.009525299072266, -21.188425064086914, -14.367324829101562, -7.546222686767578, -0.7251205444335938, 6.095977783203125, 12.91707992553711, 19.738182067871094, 26.559284210205078, 33.38038635253906, 40.20148468017578, 47.022586822509766, 53.84368896484375, 60.66478729248047, 67.48588562011719, 74.30697631835938, 81.1280746459961, 87.94918060302734, 94.77027893066406, 101.59138488769531, 108.41248321533203, 115.23358154296875, 122.0546875, 128.87579345703125, 135.6968994140625, 142.5179901123047, 149.33909606933594, 156.1602020263672, 162.98129272460938, 169.80239868164062, 176.62350463867188, 183.44459533691406, 190.2657012939453, 197.0867919921875, 203.90789794921875, 210.72900390625, 217.55010986328125, 224.37120056152344, 231.1923065185547, 238.01339721679688, 244.83450317382812, 251.6555938720703, 258.4766845703125, 265.29779052734375, 272.118896484375, 278.94000244140625, 285.7611083984375, 292.58221435546875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 10.0, 5.0, 10.0, 4.0, 14.0, 8.0, 19.0, 18.0, 21.0, 23.0, 36.0, 34.0, 37.0, 40.0, 39.0, 45.0, 52.0, 61.0, 46.0, 43.0, 55.0, 32.0, 52.0, 26.0, 37.0, 46.0, 26.0, 28.0, 15.0, 19.0, 17.0, 21.0, 19.0, 6.0, 12.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-111.12625122070312, -107.6392822265625, -104.1523208618164, -100.66535186767578, -97.17839050292969, -93.69142150878906, -90.20445251464844, -86.71749114990234, -83.23052978515625, -79.74356079101562, -76.25659942626953, -72.7696304321289, -69.28266906738281, -65.79570007324219, -62.30873489379883, -58.82176971435547, -55.334800720214844, -51.847835540771484, -48.360870361328125, -44.8739013671875, -41.386940002441406, -37.89997100830078, -34.41300582885742, -30.926040649414062, -27.439075469970703, -23.952110290527344, -20.465145111083984, -16.978178024291992, -13.491212844848633, -10.004247665405273, -6.517280578613281, -3.030315399169922, 0.4566497802734375, 3.943615436553955, 7.430581092834473, 10.917547225952148, 14.404512405395508, 17.891477584838867, 21.37844467163086, 24.86540985107422, 28.352375030517578, 31.839340209960938, 35.3263053894043, 38.813270568847656, 42.30023956298828, 45.787200927734375, 49.274169921875, 52.76113510131836, 56.24810028076172, 59.73506546020508, 63.22203063964844, 66.70899963378906, 70.19596099853516, 73.68292999267578, 77.16989135742188, 80.6568603515625, 84.14382934570312, 87.63079833984375, 91.11775970458984, 94.60472869873047, 98.09169006347656, 101.57865905761719, 105.06562805175781, 108.5525894165039, 112.03955078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 4.0, 7.0, 10.0, 16.0, 31.0, 58.0, 133.0, 225.0, 631.0, 1656.0, 4123.0, 12882.0, 52485.0, 614603.0, 3320923.0, 149619.0, 24894.0, 7361.0, 2554.0, 1031.0, 440.0, 257.0, 121.0, 75.0, 43.0, 27.0, 26.0, 9.0, 12.0, 16.0, 5.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.71875, -11.16796875, -10.6171875, -10.06640625, -9.515625, -8.96484375, -8.4140625, -7.86328125, -7.3125, -6.76171875, -6.2109375, -5.66015625, -5.109375, -4.55859375, -4.0078125, -3.45703125, -2.90625, -2.35546875, -1.8046875, -1.25390625, -0.703125, -0.15234375, 0.3984375, 0.94921875, 1.5, 2.05078125, 2.6015625, 3.15234375, 3.703125, 4.25390625, 4.8046875, 5.35546875, 5.90625, 6.45703125, 7.0078125, 7.55859375, 8.109375, 8.66015625, 9.2109375, 9.76171875, 10.3125, 10.86328125, 11.4140625, 11.96484375, 12.515625, 13.06640625, 13.6171875, 14.16796875, 14.71875, 15.26953125, 15.8203125, 16.37109375, 16.921875, 17.47265625, 18.0234375, 18.57421875, 19.125, 19.67578125, 20.2265625, 20.77734375, 21.328125, 21.87890625, 22.4296875, 22.98046875, 23.53125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 5.0, 9.0, 7.0, 14.0, 17.0, 15.0, 14.0, 36.0, 25.0, 30.0, 41.0, 32.0, 38.0, 49.0, 38.0, 59.0, 52.0, 56.0, 44.0, 54.0, 49.0, 46.0, 39.0, 34.0, 20.0, 22.0, 24.0, 25.0, 15.0, 15.0, 16.0, 12.0, 6.0, 11.0, 5.0, 6.0, 3.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.9300537109375, -4.742919921875, -4.5557861328125, -4.36865234375, -4.1815185546875, -3.994384765625, -3.8072509765625, -3.6201171875, -3.4329833984375, -3.245849609375, -3.0587158203125, -2.87158203125, -2.6844482421875, -2.497314453125, -2.3101806640625, -2.123046875, -1.9359130859375, -1.748779296875, -1.5616455078125, -1.37451171875, -1.1873779296875, -1.000244140625, -0.8131103515625, -0.6259765625, -0.4388427734375, -0.251708984375, -0.0645751953125, 0.12255859375, 0.3096923828125, 0.496826171875, 0.6839599609375, 0.87109375, 1.0582275390625, 1.245361328125, 1.4324951171875, 1.61962890625, 1.8067626953125, 1.993896484375, 2.1810302734375, 2.3681640625, 2.5552978515625, 2.742431640625, 2.9295654296875, 3.11669921875, 3.3038330078125, 3.490966796875, 3.6781005859375, 3.865234375, 4.0523681640625, 4.239501953125, 4.4266357421875, 4.61376953125, 4.8009033203125, 4.988037109375, 5.1751708984375, 5.3623046875, 5.5494384765625, 5.736572265625, 5.9237060546875, 6.11083984375, 6.2979736328125, 6.485107421875, 6.6722412109375, 6.859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 8.0, 12.0, 24.0, 33.0, 48.0, 79.0, 148.0, 299.0, 670.0, 1884.0, 7260.0, 42347.0, 1402489.0, 2676920.0, 50607.0, 8146.0, 1939.0, 676.0, 301.0, 130.0, 92.0, 55.0, 29.0, 20.0, 19.0, 11.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-37.625, -36.685546875, -35.74609375, -34.806640625, -33.8671875, -32.927734375, -31.98828125, -31.048828125, -30.109375, -29.169921875, -28.23046875, -27.291015625, -26.3515625, -25.412109375, -24.47265625, -23.533203125, -22.59375, -21.654296875, -20.71484375, -19.775390625, -18.8359375, -17.896484375, -16.95703125, -16.017578125, -15.078125, -14.138671875, -13.19921875, -12.259765625, -11.3203125, -10.380859375, -9.44140625, -8.501953125, -7.5625, -6.623046875, -5.68359375, -4.744140625, -3.8046875, -2.865234375, -1.92578125, -0.986328125, -0.046875, 0.892578125, 1.83203125, 2.771484375, 3.7109375, 4.650390625, 5.58984375, 6.529296875, 7.46875, 8.408203125, 9.34765625, 10.287109375, 11.2265625, 12.166015625, 13.10546875, 14.044921875, 14.984375, 15.923828125, 16.86328125, 17.802734375, 18.7421875, 19.681640625, 20.62109375, 21.560546875, 22.5]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 9.0, 9.0, 20.0, 27.0, 39.0, 32.0, 55.0, 55.0, 102.0, 153.0, 230.0, 538.0, 1007.0, 836.0, 388.0, 193.0, 104.0, 69.0, 45.0, 31.0, 25.0, 18.0, 16.0, 11.0, 10.0, 8.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.796875, -19.228515625, -18.66015625, -18.091796875, -17.5234375, -16.955078125, -16.38671875, -15.818359375, -15.25, -14.681640625, -14.11328125, -13.544921875, -12.9765625, -12.408203125, -11.83984375, -11.271484375, -10.703125, -10.134765625, -9.56640625, -8.998046875, -8.4296875, -7.861328125, -7.29296875, -6.724609375, -6.15625, -5.587890625, -5.01953125, -4.451171875, -3.8828125, -3.314453125, -2.74609375, -2.177734375, -1.609375, -1.041015625, -0.47265625, 0.095703125, 0.6640625, 1.232421875, 1.80078125, 2.369140625, 2.9375, 3.505859375, 4.07421875, 4.642578125, 5.2109375, 5.779296875, 6.34765625, 6.916015625, 7.484375, 8.052734375, 8.62109375, 9.189453125, 9.7578125, 10.326171875, 10.89453125, 11.462890625, 12.03125, 12.599609375, 13.16796875, 13.736328125, 14.3046875, 14.873046875, 15.44140625, 16.009765625, 16.578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 7.0, 9.0, 7.0, 17.0, 22.0, 27.0, 42.0, 67.0, 102.0, 105.0, 128.0, 123.0, 98.0, 90.0, 46.0, 31.0, 26.0, 13.0, 6.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.15533447265625, -149.0448455810547, -144.93435668945312, -140.8238525390625, -136.71336364746094, -132.60287475585938, -128.4923858642578, -124.38188934326172, -120.27139282226562, -116.16090393066406, -112.05040740966797, -107.9399185180664, -103.82942199707031, -99.71893310546875, -95.60844421386719, -91.4979476928711, -87.38745880126953, -83.27696990966797, -79.16647338867188, -75.05598449707031, -70.94548797607422, -66.83499908447266, -62.72450637817383, -58.614013671875, -54.50352096557617, -50.393028259277344, -46.282535552978516, -42.17204284667969, -38.061553955078125, -33.95105743408203, -29.84056854248047, -25.73007583618164, -21.619583129882812, -17.509090423583984, -13.398598670959473, -9.288106918334961, -5.177614212036133, -1.0671215057373047, 3.0433692932128906, 7.153861999511719, 11.264354705810547, 15.374847412109375, 19.485340118408203, 23.5958309173584, 27.706323623657227, 31.816816329956055, 35.92730712890625, 40.03779983520508, 44.148292541503906, 48.258785247802734, 52.36927795410156, 56.479766845703125, 60.59026336669922, 64.70075225830078, 68.81124877929688, 72.92173767089844, 77.0322265625, 81.14271545410156, 85.25321197509766, 89.36370086669922, 93.47419738769531, 97.58468627929688, 101.69517517089844, 105.80567169189453, 109.91616821289062]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 6.0, 7.0, 12.0, 11.0, 15.0, 24.0, 30.0, 16.0, 33.0, 36.0, 37.0, 41.0, 35.0, 42.0, 41.0, 50.0, 41.0, 50.0, 43.0, 49.0, 46.0, 31.0, 43.0, 34.0, 36.0, 39.0, 37.0, 16.0, 14.0, 22.0, 16.0, 8.0, 8.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.00660705566406, -79.22114562988281, -76.43567657470703, -73.65020751953125, -70.86474609375, -68.07928466796875, -65.29381561279297, -62.50835037231445, -59.72288513183594, -56.93741989135742, -54.151954650878906, -51.36648941040039, -48.581024169921875, -45.79555892944336, -43.010093688964844, -40.22462844848633, -37.43916320800781, -34.6536979675293, -31.86823272705078, -29.082767486572266, -26.29730224609375, -23.511837005615234, -20.72637176513672, -17.940906524658203, -15.155441284179688, -12.369976043701172, -9.584510803222656, -6.799045562744141, -4.013580322265625, -1.2281150817871094, 1.5573501586914062, 4.342815399169922, 7.128288269042969, 9.913753509521484, 12.69921875, 15.484683990478516, 18.27014923095703, 21.055614471435547, 23.841079711914062, 26.626544952392578, 29.412010192871094, 32.19747543334961, 34.982940673828125, 37.76840591430664, 40.553871154785156, 43.33933639526367, 46.12480163574219, 48.9102668762207, 51.69573211669922, 54.481197357177734, 57.26666259765625, 60.052127838134766, 62.83759307861328, 65.62306213378906, 68.40852355957031, 71.19398498535156, 73.97945404052734, 76.76492309570312, 79.55038452148438, 82.33584594726562, 85.1213150024414, 87.90678405761719, 90.69224548339844, 93.47770690917969, 96.26317596435547]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 12.0, 11.0, 10.0, 22.0, 22.0, 38.0, 60.0, 86.0, 125.0, 206.0, 367.0, 615.0, 1158.0, 2021.0, 3787.0, 7603.0, 16255.0, 37948.0, 100637.0, 332335.0, 360078.0, 110050.0, 40694.0, 17304.0, 8146.0, 4035.0, 2143.0, 1148.0, 637.0, 411.0, 219.0, 129.0, 79.0, 52.0, 32.0, 19.0, 18.0, 8.0, 8.0, 6.0, 5.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.03125, -11.6021728515625, -11.173095703125, -10.7440185546875, -10.31494140625, -9.8858642578125, -9.456787109375, -9.0277099609375, -8.5986328125, -8.1695556640625, -7.740478515625, -7.3114013671875, -6.88232421875, -6.4532470703125, -6.024169921875, -5.5950927734375, -5.166015625, -4.7369384765625, -4.307861328125, -3.8787841796875, -3.44970703125, -3.0206298828125, -2.591552734375, -2.1624755859375, -1.7333984375, -1.3043212890625, -0.875244140625, -0.4461669921875, -0.01708984375, 0.4119873046875, 0.841064453125, 1.2701416015625, 1.69921875, 2.1282958984375, 2.557373046875, 2.9864501953125, 3.41552734375, 3.8446044921875, 4.273681640625, 4.7027587890625, 5.1318359375, 5.5609130859375, 5.989990234375, 6.4190673828125, 6.84814453125, 7.2772216796875, 7.706298828125, 8.1353759765625, 8.564453125, 8.9935302734375, 9.422607421875, 9.8516845703125, 10.28076171875, 10.7098388671875, 11.138916015625, 11.5679931640625, 11.9970703125, 12.4261474609375, 12.855224609375, 13.2843017578125, 13.71337890625, 14.1424560546875, 14.571533203125, 15.0006103515625, 15.4296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 10.0, 11.0, 4.0, 12.0, 12.0, 13.0, 19.0, 17.0, 20.0, 26.0, 29.0, 26.0, 35.0, 36.0, 45.0, 30.0, 38.0, 46.0, 41.0, 38.0, 52.0, 48.0, 43.0, 30.0, 46.0, 29.0, 31.0, 37.0, 20.0, 25.0, 20.0, 20.0, 20.0, 13.0, 13.0, 10.0, 7.0, 5.0, 6.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.1171875, -4.94384765625, -4.7705078125, -4.59716796875, -4.423828125, -4.25048828125, -4.0771484375, -3.90380859375, -3.73046875, -3.55712890625, -3.3837890625, -3.21044921875, -3.037109375, -2.86376953125, -2.6904296875, -2.51708984375, -2.34375, -2.17041015625, -1.9970703125, -1.82373046875, -1.650390625, -1.47705078125, -1.3037109375, -1.13037109375, -0.95703125, -0.78369140625, -0.6103515625, -0.43701171875, -0.263671875, -0.09033203125, 0.0830078125, 0.25634765625, 0.4296875, 0.60302734375, 0.7763671875, 0.94970703125, 1.123046875, 1.29638671875, 1.4697265625, 1.64306640625, 1.81640625, 1.98974609375, 2.1630859375, 2.33642578125, 2.509765625, 2.68310546875, 2.8564453125, 3.02978515625, 3.203125, 3.37646484375, 3.5498046875, 3.72314453125, 3.896484375, 4.06982421875, 4.2431640625, 4.41650390625, 4.58984375, 4.76318359375, 4.9365234375, 5.10986328125, 5.283203125, 5.45654296875, 5.6298828125, 5.80322265625, 5.9765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 9.0, 15.0, 19.0, 36.0, 44.0, 67.0, 110.0, 214.0, 408.0, 788.0, 1856.0, 6984.0, 133018.0, 877410.0, 22030.0, 3232.0, 1112.0, 490.0, 281.0, 149.0, 84.0, 63.0, 27.0, 30.0, 13.0, 19.0, 10.0, 2.0, 5.0, 2.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.59375, -52.95166015625, -51.3095703125, -49.66748046875, -48.025390625, -46.38330078125, -44.7412109375, -43.09912109375, -41.45703125, -39.81494140625, -38.1728515625, -36.53076171875, -34.888671875, -33.24658203125, -31.6044921875, -29.96240234375, -28.3203125, -26.67822265625, -25.0361328125, -23.39404296875, -21.751953125, -20.10986328125, -18.4677734375, -16.82568359375, -15.18359375, -13.54150390625, -11.8994140625, -10.25732421875, -8.615234375, -6.97314453125, -5.3310546875, -3.68896484375, -2.046875, -0.40478515625, 1.2373046875, 2.87939453125, 4.521484375, 6.16357421875, 7.8056640625, 9.44775390625, 11.08984375, 12.73193359375, 14.3740234375, 16.01611328125, 17.658203125, 19.30029296875, 20.9423828125, 22.58447265625, 24.2265625, 25.86865234375, 27.5107421875, 29.15283203125, 30.794921875, 32.43701171875, 34.0791015625, 35.72119140625, 37.36328125, 39.00537109375, 40.6474609375, 42.28955078125, 43.931640625, 45.57373046875, 47.2158203125, 48.85791015625, 50.5]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 9.0, 7.0, 6.0, 11.0, 23.0, 32.0, 22.0, 35.0, 36.0, 47.0, 71.0, 67.0, 58.0, 60.0, 76.0, 65.0, 52.0, 55.0, 45.0, 45.0, 34.0, 35.0, 21.0, 26.0, 15.0, 12.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.40625, -39.16796875, -37.9296875, -36.69140625, -35.453125, -34.21484375, -32.9765625, -31.73828125, -30.5, -29.26171875, -28.0234375, -26.78515625, -25.546875, -24.30859375, -23.0703125, -21.83203125, -20.59375, -19.35546875, -18.1171875, -16.87890625, -15.640625, -14.40234375, -13.1640625, -11.92578125, -10.6875, -9.44921875, -8.2109375, -6.97265625, -5.734375, -4.49609375, -3.2578125, -2.01953125, -0.78125, 0.45703125, 1.6953125, 2.93359375, 4.171875, 5.41015625, 6.6484375, 7.88671875, 9.125, 10.36328125, 11.6015625, 12.83984375, 14.078125, 15.31640625, 16.5546875, 17.79296875, 19.03125, 20.26953125, 21.5078125, 22.74609375, 23.984375, 25.22265625, 26.4609375, 27.69921875, 28.9375, 30.17578125, 31.4140625, 32.65234375, 33.890625, 35.12890625, 36.3671875, 37.60546875, 38.84375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 1.0, 6.0, 8.0, 12.0, 12.0, 12.0, 30.0, 39.0, 75.0, 87.0, 157.0, 277.0, 522.0, 992.0, 2627.0, 7977.0, 36839.0, 382794.0, 558003.0, 43851.0, 8998.0, 2807.0, 1092.0, 533.0, 290.0, 177.0, 120.0, 61.0, 37.0, 29.0, 20.0, 20.0, 14.0, 15.0, 3.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.7813720703125, -9.390869140625, -9.0003662109375, -8.60986328125, -8.2193603515625, -7.828857421875, -7.4383544921875, -7.0478515625, -6.6573486328125, -6.266845703125, -5.8763427734375, -5.48583984375, -5.0953369140625, -4.704833984375, -4.3143310546875, -3.923828125, -3.5333251953125, -3.142822265625, -2.7523193359375, -2.36181640625, -1.9713134765625, -1.580810546875, -1.1903076171875, -0.7998046875, -0.4093017578125, -0.018798828125, 0.3717041015625, 0.76220703125, 1.1527099609375, 1.543212890625, 1.9337158203125, 2.32421875, 2.7147216796875, 3.105224609375, 3.4957275390625, 3.88623046875, 4.2767333984375, 4.667236328125, 5.0577392578125, 5.4482421875, 5.8387451171875, 6.229248046875, 6.6197509765625, 7.01025390625, 7.4007568359375, 7.791259765625, 8.1817626953125, 8.572265625, 8.9627685546875, 9.353271484375, 9.7437744140625, 10.13427734375, 10.5247802734375, 10.915283203125, 11.3057861328125, 11.6962890625, 12.0867919921875, 12.477294921875, 12.8677978515625, 13.25830078125, 13.6488037109375, 14.039306640625, 14.4298095703125, 14.8203125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 10.0, 8.0, 8.0, 12.0, 13.0, 25.0, 35.0, 41.0, 76.0, 115.0, 189.0, 143.0, 88.0, 73.0, 43.0, 26.0, 32.0, 12.0, 15.0, 14.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023059844970703125, -0.0022094249725341797, -0.002112865447998047, -0.002016305923461914, -0.0019197463989257812, -0.0018231868743896484, -0.0017266273498535156, -0.0016300678253173828, -0.00153350830078125, -0.0014369487762451172, -0.0013403892517089844, -0.0012438297271728516, -0.0011472702026367188, -0.001050710678100586, -0.0009541511535644531, -0.0008575916290283203, -0.0007610321044921875, -0.0006644725799560547, -0.0005679130554199219, -0.00047135353088378906, -0.00037479400634765625, -0.00027823448181152344, -0.00018167495727539062, -8.511543273925781e-05, 1.1444091796875e-05, 0.00010800361633300781, 0.00020456314086914062, 0.00030112266540527344, 0.00039768218994140625, 0.0004942417144775391, 0.0005908012390136719, 0.0006873607635498047, 0.0007839202880859375, 0.0008804798126220703, 0.0009770393371582031, 0.001073598861694336, 0.0011701583862304688, 0.0012667179107666016, 0.0013632774353027344, 0.0014598369598388672, 0.001556396484375, 0.0016529560089111328, 0.0017495155334472656, 0.0018460750579833984, 0.0019426345825195312, 0.002039194107055664, 0.002135753631591797, 0.0022323131561279297, 0.0023288726806640625, 0.0024254322052001953, 0.002521991729736328, 0.002618551254272461, 0.0027151107788085938, 0.0028116703033447266, 0.0029082298278808594, 0.003004789352416992, 0.003101348876953125, 0.003197908401489258, 0.0032944679260253906, 0.0033910274505615234, 0.0034875869750976562, 0.003584146499633789, 0.003680706024169922, 0.0037772655487060547, 0.0038738250732421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 5.0, 10.0, 15.0, 30.0, 54.0, 86.0, 125.0, 197.0, 388.0, 780.0, 1560.0, 4094.0, 15843.0, 136143.0, 782695.0, 88448.0, 11875.0, 3386.0, 1287.0, 646.0, 345.0, 205.0, 118.0, 67.0, 43.0, 24.0, 15.0, 18.0, 6.0, 6.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.4420166015625, -11.024658203125, -10.6072998046875, -10.18994140625, -9.7725830078125, -9.355224609375, -8.9378662109375, -8.5205078125, -8.1031494140625, -7.685791015625, -7.2684326171875, -6.85107421875, -6.4337158203125, -6.016357421875, -5.5989990234375, -5.181640625, -4.7642822265625, -4.346923828125, -3.9295654296875, -3.51220703125, -3.0948486328125, -2.677490234375, -2.2601318359375, -1.8427734375, -1.4254150390625, -1.008056640625, -0.5906982421875, -0.17333984375, 0.2440185546875, 0.661376953125, 1.0787353515625, 1.49609375, 1.9134521484375, 2.330810546875, 2.7481689453125, 3.16552734375, 3.5828857421875, 4.000244140625, 4.4176025390625, 4.8349609375, 5.2523193359375, 5.669677734375, 6.0870361328125, 6.50439453125, 6.9217529296875, 7.339111328125, 7.7564697265625, 8.173828125, 8.5911865234375, 9.008544921875, 9.4259033203125, 9.84326171875, 10.2606201171875, 10.677978515625, 11.0953369140625, 11.5126953125, 11.9300537109375, 12.347412109375, 12.7647705078125, 13.18212890625, 13.5994873046875, 14.016845703125, 14.4342041015625, 14.8515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 5.0, 7.0, 11.0, 8.0, 19.0, 22.0, 17.0, 22.0, 35.0, 39.0, 49.0, 68.0, 78.0, 81.0, 78.0, 76.0, 71.0, 51.0, 40.0, 41.0, 36.0, 20.0, 29.0, 22.0, 13.0, 10.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-10.078125, -9.80987548828125, -9.5416259765625, -9.27337646484375, -9.005126953125, -8.73687744140625, -8.4686279296875, -8.20037841796875, -7.93212890625, -7.66387939453125, -7.3956298828125, -7.12738037109375, -6.859130859375, -6.59088134765625, -6.3226318359375, -6.05438232421875, -5.7861328125, -5.51788330078125, -5.2496337890625, -4.98138427734375, -4.713134765625, -4.44488525390625, -4.1766357421875, -3.90838623046875, -3.64013671875, -3.37188720703125, -3.1036376953125, -2.83538818359375, -2.567138671875, -2.29888916015625, -2.0306396484375, -1.76239013671875, -1.494140625, -1.22589111328125, -0.9576416015625, -0.68939208984375, -0.421142578125, -0.15289306640625, 0.1153564453125, 0.38360595703125, 0.65185546875, 0.92010498046875, 1.1883544921875, 1.45660400390625, 1.724853515625, 1.99310302734375, 2.2613525390625, 2.52960205078125, 2.7978515625, 3.06610107421875, 3.3343505859375, 3.60260009765625, 3.870849609375, 4.13909912109375, 4.4073486328125, 4.67559814453125, 4.94384765625, 5.21209716796875, 5.4803466796875, 5.74859619140625, 6.016845703125, 6.28509521484375, 6.5533447265625, 6.82159423828125, 7.08984375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 14.0, 34.0, 71.0, 170.0, 251.0, 205.0, 122.0, 70.0, 27.0, 9.0, 8.0, 9.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.012451171875, -164.0671844482422, -156.12191772460938, -148.17665100097656, -140.23138427734375, -132.28611755371094, -124.34085845947266, -116.39559173583984, -108.45032501220703, -100.50505828857422, -92.5597915649414, -84.61453247070312, -76.66926574707031, -68.7239990234375, -60.77873229980469, -52.833465576171875, -44.88819885253906, -36.94293212890625, -28.99766731262207, -21.05240249633789, -13.107135772705078, -5.161869049072266, 2.7833938598632812, 10.728660583496094, 18.673927307128906, 26.61919403076172, 34.56446075439453, 42.50972366333008, 50.45499038696289, 58.4002571105957, 66.34552001953125, 74.29078674316406, 82.23605346679688, 90.18132019042969, 98.1265869140625, 106.07185363769531, 114.01712036132812, 121.96238708496094, 129.90765380859375, 137.8529052734375, 145.79818725585938, 153.7434539794922, 161.688720703125, 169.6339874267578, 177.57925415039062, 185.52452087402344, 193.46978759765625, 201.4150390625, 209.3603057861328, 217.30557250976562, 225.25083923339844, 233.19610595703125, 241.14137268066406, 249.08663940429688, 257.0318908691406, 264.9771728515625, 272.92242431640625, 280.86767578125, 288.8129577636719, 296.7582092285156, 304.7034912109375, 312.64874267578125, 320.5940246582031, 328.5392761230469, 336.48455810546875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 10.0, 13.0, 34.0, 28.0, 48.0, 67.0, 56.0, 81.0, 84.0, 90.0, 105.0, 88.0, 76.0, 56.0, 37.0, 47.0, 24.0, 17.0, 13.0, 9.0, 13.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.60174560546875, -271.27587890625, -264.9499816894531, -258.6241149902344, -252.2982177734375, -245.9723358154297, -239.64645385742188, -233.32057189941406, -226.99468994140625, -220.66880798339844, -214.34292602539062, -208.0170440673828, -201.691162109375, -195.3652801513672, -189.03939819335938, -182.71351623535156, -176.38763427734375, -170.06175231933594, -163.73587036132812, -157.4099884033203, -151.0841064453125, -144.7582244873047, -138.43234252929688, -132.10646057128906, -125.78059387207031, -119.4547119140625, -113.12882995605469, -106.80294799804688, -100.47706604003906, -94.15118408203125, -87.82530212402344, -81.49942016601562, -75.17353820800781, -68.84765625, -62.52177429199219, -56.195892333984375, -49.87001037597656, -43.54412841796875, -37.2182502746582, -30.89236831665039, -24.566486358642578, -18.240604400634766, -11.91472339630127, -5.588842391967773, 0.7370395660400391, 7.062921524047852, 13.388801574707031, 19.714683532714844, 26.040565490722656, 32.36644744873047, 38.69232940673828, 45.018211364746094, 51.344093322753906, 57.66997528076172, 63.995853424072266, 70.32173156738281, 76.64761352539062, 82.97349548339844, 89.29937744140625, 95.62525939941406, 101.95114135742188, 108.27702331542969, 114.6029052734375, 120.92878723144531, 127.25466918945312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 8.0, 21.0, 28.0, 26.0, 58.0, 79.0, 160.0, 372.0, 3180.0, 4138655.0, 50116.0, 975.0, 263.0, 127.0, 62.0, 46.0, 32.0, 11.0, 14.0, 10.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4375, -85.4658203125, -82.494140625, -79.5224609375, -76.55078125, -73.5791015625, -70.607421875, -67.6357421875, -64.6640625, -61.6923828125, -58.720703125, -55.7490234375, -52.77734375, -49.8056640625, -46.833984375, -43.8623046875, -40.890625, -37.9189453125, -34.947265625, -31.9755859375, -29.00390625, -26.0322265625, -23.060546875, -20.0888671875, -17.1171875, -14.1455078125, -11.173828125, -8.2021484375, -5.23046875, -2.2587890625, 0.712890625, 3.6845703125, 6.65625, 9.6279296875, 12.599609375, 15.5712890625, 18.54296875, 21.5146484375, 24.486328125, 27.4580078125, 30.4296875, 33.4013671875, 36.373046875, 39.3447265625, 42.31640625, 45.2880859375, 48.259765625, 51.2314453125, 54.203125, 57.1748046875, 60.146484375, 63.1181640625, 66.08984375, 69.0615234375, 72.033203125, 75.0048828125, 77.9765625, 80.9482421875, 83.919921875, 86.8916015625, 89.86328125, 92.8349609375, 95.806640625, 98.7783203125, 101.75]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 13.0, 12.0, 35.0, 35.0, 48.0, 49.0, 64.0, 101.0, 108.0, 94.0, 101.0, 95.0, 66.0, 44.0, 32.0, 37.0, 27.0, 11.0, 14.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-17.671875, -17.29791259765625, -16.9239501953125, -16.54998779296875, -16.176025390625, -15.80206298828125, -15.4281005859375, -15.05413818359375, -14.68017578125, -14.30621337890625, -13.9322509765625, -13.55828857421875, -13.184326171875, -12.81036376953125, -12.4364013671875, -12.06243896484375, -11.6884765625, -11.31451416015625, -10.9405517578125, -10.56658935546875, -10.192626953125, -9.81866455078125, -9.4447021484375, -9.07073974609375, -8.69677734375, -8.32281494140625, -7.9488525390625, -7.57489013671875, -7.200927734375, -6.82696533203125, -6.4530029296875, -6.07904052734375, -5.705078125, -5.33111572265625, -4.9571533203125, -4.58319091796875, -4.209228515625, -3.83526611328125, -3.4613037109375, -3.08734130859375, -2.71337890625, -2.33941650390625, -1.9654541015625, -1.59149169921875, -1.217529296875, -0.84356689453125, -0.4696044921875, -0.09564208984375, 0.2783203125, 0.65228271484375, 1.0262451171875, 1.40020751953125, 1.774169921875, 2.14813232421875, 2.5220947265625, 2.89605712890625, 3.27001953125, 3.64398193359375, 4.0179443359375, 4.39190673828125, 4.765869140625, 5.13983154296875, 5.5137939453125, 5.88775634765625, 6.26171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 13.0, 20.0, 33.0, 46.0, 82.0, 130.0, 244.0, 488.0, 943.0, 2491.0, 7939.0, 35727.0, 354748.0, 3592214.0, 165713.0, 23646.0, 5918.0, 1976.0, 817.0, 432.0, 279.0, 150.0, 94.0, 51.0, 35.0, 14.0, 6.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-27.28125, -26.55126953125, -25.8212890625, -25.09130859375, -24.361328125, -23.63134765625, -22.9013671875, -22.17138671875, -21.44140625, -20.71142578125, -19.9814453125, -19.25146484375, -18.521484375, -17.79150390625, -17.0615234375, -16.33154296875, -15.6015625, -14.87158203125, -14.1416015625, -13.41162109375, -12.681640625, -11.95166015625, -11.2216796875, -10.49169921875, -9.76171875, -9.03173828125, -8.3017578125, -7.57177734375, -6.841796875, -6.11181640625, -5.3818359375, -4.65185546875, -3.921875, -3.19189453125, -2.4619140625, -1.73193359375, -1.001953125, -0.27197265625, 0.4580078125, 1.18798828125, 1.91796875, 2.64794921875, 3.3779296875, 4.10791015625, 4.837890625, 5.56787109375, 6.2978515625, 7.02783203125, 7.7578125, 8.48779296875, 9.2177734375, 9.94775390625, 10.677734375, 11.40771484375, 12.1376953125, 12.86767578125, 13.59765625, 14.32763671875, 15.0576171875, 15.78759765625, 16.517578125, 17.24755859375, 17.9775390625, 18.70751953125, 19.4375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 13.0, 5.0, 22.0, 17.0, 31.0, 35.0, 56.0, 93.0, 140.0, 285.0, 671.0, 1081.0, 753.0, 342.0, 180.0, 113.0, 64.0, 45.0, 27.0, 24.0, 18.0, 7.0, 6.0, 8.0, 6.0, 7.0, 9.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.109375, -15.50439453125, -14.8994140625, -14.29443359375, -13.689453125, -13.08447265625, -12.4794921875, -11.87451171875, -11.26953125, -10.66455078125, -10.0595703125, -9.45458984375, -8.849609375, -8.24462890625, -7.6396484375, -7.03466796875, -6.4296875, -5.82470703125, -5.2197265625, -4.61474609375, -4.009765625, -3.40478515625, -2.7998046875, -2.19482421875, -1.58984375, -0.98486328125, -0.3798828125, 0.22509765625, 0.830078125, 1.43505859375, 2.0400390625, 2.64501953125, 3.25, 3.85498046875, 4.4599609375, 5.06494140625, 5.669921875, 6.27490234375, 6.8798828125, 7.48486328125, 8.08984375, 8.69482421875, 9.2998046875, 9.90478515625, 10.509765625, 11.11474609375, 11.7197265625, 12.32470703125, 12.9296875, 13.53466796875, 14.1396484375, 14.74462890625, 15.349609375, 15.95458984375, 16.5595703125, 17.16455078125, 17.76953125, 18.37451171875, 18.9794921875, 19.58447265625, 20.189453125, 20.79443359375, 21.3994140625, 22.00439453125, 22.609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 5.0, 15.0, 13.0, 27.0, 63.0, 111.0, 165.0, 169.0, 173.0, 101.0, 59.0, 40.0, 18.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.11575317382812, -87.31382751464844, -82.51190948486328, -77.7099838256836, -72.90806579589844, -68.10614013671875, -63.30421447753906, -58.50229263305664, -53.70037078857422, -48.8984489440918, -44.096527099609375, -39.29460144042969, -34.492679595947266, -29.690757751464844, -24.88883399963379, -20.086910247802734, -15.284988403320312, -10.483065605163574, -5.681142807006836, -0.8792200088500977, 3.9227027893066406, 8.724624633789062, 13.526548385620117, 18.328472137451172, 23.130393981933594, 27.932315826416016, 32.73423767089844, 37.536163330078125, 42.33808517456055, 47.14000701904297, 51.941932678222656, 56.74385452270508, 61.54576110839844, 66.34768676757812, 71.14960479736328, 75.95153045654297, 80.75344848632812, 85.55537414550781, 90.3572998046875, 95.15922546386719, 99.96114349365234, 104.76306915283203, 109.56498718261719, 114.36691284179688, 119.16883850097656, 123.97075653076172, 128.77267456054688, 133.57460021972656, 138.37652587890625, 143.17845153808594, 147.98037719726562, 152.78228759765625, 157.58421325683594, 162.38613891601562, 167.1880645751953, 171.989990234375, 176.79190063476562, 181.5938262939453, 186.395751953125, 191.19766235351562, 195.9995880126953, 200.801513671875, 205.6034393310547, 210.40536499023438, 215.20729064941406]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 5.0, 6.0, 11.0, 7.0, 13.0, 15.0, 20.0, 14.0, 32.0, 16.0, 29.0, 34.0, 34.0, 39.0, 49.0, 53.0, 36.0, 50.0, 50.0, 50.0, 47.0, 58.0, 37.0, 37.0, 32.0, 28.0, 21.0, 38.0, 14.0, 21.0, 22.0, 17.0, 14.0, 10.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-84.90214538574219, -82.56751251220703, -80.2328872680664, -77.89825439453125, -75.5636215209961, -73.22898864746094, -70.89436340332031, -68.55973052978516, -66.22509765625, -63.89046859741211, -61.55583572387695, -59.22120666503906, -56.886573791503906, -54.551944732666016, -52.217315673828125, -49.88268280029297, -47.548057556152344, -45.21342849731445, -42.8787956237793, -40.544166564941406, -38.20953369140625, -35.87490463256836, -33.54027557373047, -31.205644607543945, -28.871013641357422, -26.5363826751709, -24.201751708984375, -21.867122650146484, -19.53249168395996, -17.197860717773438, -14.86323070526123, -12.528600692749023, -10.193977355957031, -7.859346866607666, -5.524716377258301, -3.1900858879089355, -0.8554553985595703, 1.4791755676269531, 3.81380558013916, 6.148435592651367, 8.48306655883789, 10.817697525024414, 13.152327537536621, 15.486957550048828, 17.82158851623535, 20.156219482421875, 22.490848541259766, 24.82547950744629, 27.160110473632812, 29.494741439819336, 31.82937240600586, 34.16400146484375, 36.498634338378906, 38.8332633972168, 41.16789245605469, 43.502525329589844, 45.837154388427734, 48.171783447265625, 50.50641632080078, 52.84104537963867, 55.17567443847656, 57.51030731201172, 59.84493637084961, 62.1795654296875, 64.51419830322266]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 5.0, 5.0, 12.0, 20.0, 27.0, 41.0, 64.0, 70.0, 124.0, 210.0, 432.0, 700.0, 1387.0, 2519.0, 5203.0, 11623.0, 27868.0, 77856.0, 284882.0, 438859.0, 125123.0, 40714.0, 16319.0, 7230.0, 3297.0, 1743.0, 912.0, 534.0, 296.0, 162.0, 119.0, 73.0, 41.0, 36.0, 13.0, 12.0, 4.0, 4.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-14.9375, -14.487548828125, -14.03759765625, -13.587646484375, -13.1376953125, -12.687744140625, -12.23779296875, -11.787841796875, -11.337890625, -10.887939453125, -10.43798828125, -9.988037109375, -9.5380859375, -9.088134765625, -8.63818359375, -8.188232421875, -7.73828125, -7.288330078125, -6.83837890625, -6.388427734375, -5.9384765625, -5.488525390625, -5.03857421875, -4.588623046875, -4.138671875, -3.688720703125, -3.23876953125, -2.788818359375, -2.3388671875, -1.888916015625, -1.43896484375, -0.989013671875, -0.5390625, -0.089111328125, 0.36083984375, 0.810791015625, 1.2607421875, 1.710693359375, 2.16064453125, 2.610595703125, 3.060546875, 3.510498046875, 3.96044921875, 4.410400390625, 4.8603515625, 5.310302734375, 5.76025390625, 6.210205078125, 6.66015625, 7.110107421875, 7.56005859375, 8.010009765625, 8.4599609375, 8.909912109375, 9.35986328125, 9.809814453125, 10.259765625, 10.709716796875, 11.15966796875, 11.609619140625, 12.0595703125, 12.509521484375, 12.95947265625, 13.409423828125, 13.859375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 9.0, 9.0, 16.0, 24.0, 21.0, 40.0, 44.0, 51.0, 72.0, 76.0, 79.0, 87.0, 80.0, 85.0, 80.0, 64.0, 53.0, 31.0, 28.0, 23.0, 16.0, 8.0, 11.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-17.21875, -16.85772705078125, -16.4967041015625, -16.13568115234375, -15.774658203125, -15.41363525390625, -15.0526123046875, -14.69158935546875, -14.33056640625, -13.96954345703125, -13.6085205078125, -13.24749755859375, -12.886474609375, -12.52545166015625, -12.1644287109375, -11.80340576171875, -11.4423828125, -11.08135986328125, -10.7203369140625, -10.35931396484375, -9.998291015625, -9.63726806640625, -9.2762451171875, -8.91522216796875, -8.55419921875, -8.19317626953125, -7.8321533203125, -7.47113037109375, -7.110107421875, -6.74908447265625, -6.3880615234375, -6.02703857421875, -5.666015625, -5.30499267578125, -4.9439697265625, -4.58294677734375, -4.221923828125, -3.86090087890625, -3.4998779296875, -3.13885498046875, -2.77783203125, -2.41680908203125, -2.0557861328125, -1.69476318359375, -1.333740234375, -0.97271728515625, -0.6116943359375, -0.25067138671875, 0.1103515625, 0.47137451171875, 0.8323974609375, 1.19342041015625, 1.554443359375, 1.91546630859375, 2.2764892578125, 2.63751220703125, 2.99853515625, 3.35955810546875, 3.7205810546875, 4.08160400390625, 4.442626953125, 4.80364990234375, 5.1646728515625, 5.52569580078125, 5.88671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 13.0, 14.0, 27.0, 32.0, 60.0, 46.0, 89.0, 105.0, 152.0, 202.0, 306.0, 446.0, 636.0, 1121.0, 2095.0, 4599.0, 12014.0, 40959.0, 225080.0, 634104.0, 89692.0, 21871.0, 7452.0, 3236.0, 1548.0, 793.0, 617.0, 335.0, 256.0, 167.0, 130.0, 76.0, 67.0, 46.0, 34.0, 31.0, 19.0, 14.0, 11.0, 9.0, 7.0, 7.0, 1.0, 5.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-20.390625, -19.758544921875, -19.12646484375, -18.494384765625, -17.8623046875, -17.230224609375, -16.59814453125, -15.966064453125, -15.333984375, -14.701904296875, -14.06982421875, -13.437744140625, -12.8056640625, -12.173583984375, -11.54150390625, -10.909423828125, -10.27734375, -9.645263671875, -9.01318359375, -8.381103515625, -7.7490234375, -7.116943359375, -6.48486328125, -5.852783203125, -5.220703125, -4.588623046875, -3.95654296875, -3.324462890625, -2.6923828125, -2.060302734375, -1.42822265625, -0.796142578125, -0.1640625, 0.468017578125, 1.10009765625, 1.732177734375, 2.3642578125, 2.996337890625, 3.62841796875, 4.260498046875, 4.892578125, 5.524658203125, 6.15673828125, 6.788818359375, 7.4208984375, 8.052978515625, 8.68505859375, 9.317138671875, 9.94921875, 10.581298828125, 11.21337890625, 11.845458984375, 12.4775390625, 13.109619140625, 13.74169921875, 14.373779296875, 15.005859375, 15.637939453125, 16.27001953125, 16.902099609375, 17.5341796875, 18.166259765625, 18.79833984375, 19.430419921875, 20.0625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 3.0, 5.0, 9.0, 19.0, 25.0, 33.0, 40.0, 48.0, 68.0, 66.0, 84.0, 91.0, 74.0, 87.0, 71.0, 63.0, 56.0, 52.0, 32.0, 28.0, 9.0, 16.0, 7.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-48.96875, -47.52978515625, -46.0908203125, -44.65185546875, -43.212890625, -41.77392578125, -40.3349609375, -38.89599609375, -37.45703125, -36.01806640625, -34.5791015625, -33.14013671875, -31.701171875, -30.26220703125, -28.8232421875, -27.38427734375, -25.9453125, -24.50634765625, -23.0673828125, -21.62841796875, -20.189453125, -18.75048828125, -17.3115234375, -15.87255859375, -14.43359375, -12.99462890625, -11.5556640625, -10.11669921875, -8.677734375, -7.23876953125, -5.7998046875, -4.36083984375, -2.921875, -1.48291015625, -0.0439453125, 1.39501953125, 2.833984375, 4.27294921875, 5.7119140625, 7.15087890625, 8.58984375, 10.02880859375, 11.4677734375, 12.90673828125, 14.345703125, 15.78466796875, 17.2236328125, 18.66259765625, 20.1015625, 21.54052734375, 22.9794921875, 24.41845703125, 25.857421875, 27.29638671875, 28.7353515625, 30.17431640625, 31.61328125, 33.05224609375, 34.4912109375, 35.93017578125, 37.369140625, 38.80810546875, 40.2470703125, 41.68603515625, 43.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 4.0, 1.0, 4.0, 10.0, 9.0, 23.0, 34.0, 71.0, 173.0, 426.0, 1586.0, 11577.0, 287313.0, 723429.0, 20582.0, 2377.0, 560.0, 197.0, 62.0, 43.0, 24.0, 12.0, 10.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.078125, -23.372314453125, -22.66650390625, -21.960693359375, -21.2548828125, -20.549072265625, -19.84326171875, -19.137451171875, -18.431640625, -17.725830078125, -17.02001953125, -16.314208984375, -15.6083984375, -14.902587890625, -14.19677734375, -13.490966796875, -12.78515625, -12.079345703125, -11.37353515625, -10.667724609375, -9.9619140625, -9.256103515625, -8.55029296875, -7.844482421875, -7.138671875, -6.432861328125, -5.72705078125, -5.021240234375, -4.3154296875, -3.609619140625, -2.90380859375, -2.197998046875, -1.4921875, -0.786376953125, -0.08056640625, 0.625244140625, 1.3310546875, 2.036865234375, 2.74267578125, 3.448486328125, 4.154296875, 4.860107421875, 5.56591796875, 6.271728515625, 6.9775390625, 7.683349609375, 8.38916015625, 9.094970703125, 9.80078125, 10.506591796875, 11.21240234375, 11.918212890625, 12.6240234375, 13.329833984375, 14.03564453125, 14.741455078125, 15.447265625, 16.153076171875, 16.85888671875, 17.564697265625, 18.2705078125, 18.976318359375, 19.68212890625, 20.387939453125, 21.09375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 16.0, 27.0, 34.0, 43.0, 90.0, 134.0, 223.0, 154.0, 98.0, 49.0, 32.0, 27.0, 12.0, 14.0, 9.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00469970703125, -0.004571288824081421, -0.004442870616912842, -0.004314452409744263, -0.004186034202575684, -0.0040576159954071045, -0.003929197788238525, -0.0038007795810699463, -0.003672361373901367, -0.003543943166732788, -0.003415524959564209, -0.00328710675239563, -0.0031586885452270508, -0.0030302703380584717, -0.0029018521308898926, -0.0027734339237213135, -0.0026450157165527344, -0.0025165975093841553, -0.002388179302215576, -0.002259761095046997, -0.002131342887878418, -0.002002924680709839, -0.0018745064735412598, -0.0017460882663726807, -0.0016176700592041016, -0.0014892518520355225, -0.0013608336448669434, -0.0012324154376983643, -0.0011039972305297852, -0.0009755790233612061, -0.000847160816192627, -0.0007187426090240479, -0.0005903244018554688, -0.00046190619468688965, -0.00033348798751831055, -0.00020506978034973145, -7.665157318115234e-05, 5.176663398742676e-05, 0.00018018484115600586, 0.00030860304832458496, 0.00043702125549316406, 0.0005654394626617432, 0.0006938576698303223, 0.0008222758769989014, 0.0009506940841674805, 0.0010791122913360596, 0.0012075304985046387, 0.0013359487056732178, 0.0014643669128417969, 0.001592785120010376, 0.001721203327178955, 0.0018496215343475342, 0.0019780397415161133, 0.0021064579486846924, 0.0022348761558532715, 0.0023632943630218506, 0.0024917125701904297, 0.002620130777359009, 0.002748548984527588, 0.002876967191696167, 0.003005385398864746, 0.003133803606033325, 0.0032622218132019043, 0.0033906400203704834, 0.0035190582275390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 4.0, 10.0, 17.0, 22.0, 36.0, 56.0, 71.0, 133.0, 212.0, 444.0, 892.0, 2234.0, 6499.0, 26668.0, 191066.0, 697337.0, 98740.0, 16273.0, 4588.0, 1669.0, 730.0, 365.0, 182.0, 88.0, 50.0, 43.0, 36.0, 17.0, 22.0, 10.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.95458984375, -11.5732421875, -11.19189453125, -10.810546875, -10.42919921875, -10.0478515625, -9.66650390625, -9.28515625, -8.90380859375, -8.5224609375, -8.14111328125, -7.759765625, -7.37841796875, -6.9970703125, -6.61572265625, -6.234375, -5.85302734375, -5.4716796875, -5.09033203125, -4.708984375, -4.32763671875, -3.9462890625, -3.56494140625, -3.18359375, -2.80224609375, -2.4208984375, -2.03955078125, -1.658203125, -1.27685546875, -0.8955078125, -0.51416015625, -0.1328125, 0.24853515625, 0.6298828125, 1.01123046875, 1.392578125, 1.77392578125, 2.1552734375, 2.53662109375, 2.91796875, 3.29931640625, 3.6806640625, 4.06201171875, 4.443359375, 4.82470703125, 5.2060546875, 5.58740234375, 5.96875, 6.35009765625, 6.7314453125, 7.11279296875, 7.494140625, 7.87548828125, 8.2568359375, 8.63818359375, 9.01953125, 9.40087890625, 9.7822265625, 10.16357421875, 10.544921875, 10.92626953125, 11.3076171875, 11.68896484375, 12.0703125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 5.0, 11.0, 13.0, 16.0, 22.0, 22.0, 31.0, 43.0, 49.0, 60.0, 70.0, 85.0, 111.0, 74.0, 76.0, 59.0, 52.0, 40.0, 37.0, 26.0, 19.0, 17.0, 15.0, 11.0, 3.0, 7.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.79931640625, -8.4814453125, -8.16357421875, -7.845703125, -7.52783203125, -7.2099609375, -6.89208984375, -6.57421875, -6.25634765625, -5.9384765625, -5.62060546875, -5.302734375, -4.98486328125, -4.6669921875, -4.34912109375, -4.03125, -3.71337890625, -3.3955078125, -3.07763671875, -2.759765625, -2.44189453125, -2.1240234375, -1.80615234375, -1.48828125, -1.17041015625, -0.8525390625, -0.53466796875, -0.216796875, 0.10107421875, 0.4189453125, 0.73681640625, 1.0546875, 1.37255859375, 1.6904296875, 2.00830078125, 2.326171875, 2.64404296875, 2.9619140625, 3.27978515625, 3.59765625, 3.91552734375, 4.2333984375, 4.55126953125, 4.869140625, 5.18701171875, 5.5048828125, 5.82275390625, 6.140625, 6.45849609375, 6.7763671875, 7.09423828125, 7.412109375, 7.72998046875, 8.0478515625, 8.36572265625, 8.68359375, 9.00146484375, 9.3193359375, 9.63720703125, 9.955078125, 10.27294921875, 10.5908203125, 10.90869140625, 11.2265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 6.0, 3.0, 11.0, 32.0, 75.0, 183.0, 292.0, 210.0, 107.0, 45.0, 18.0, 11.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-352.0806884765625, -342.9710388183594, -333.8614196777344, -324.75177001953125, -315.6421203613281, -306.532470703125, -297.4228515625, -288.3132019042969, -279.20355224609375, -270.0939025878906, -260.9842834472656, -251.8746337890625, -242.76498413085938, -233.6553497314453, -224.54571533203125, -215.43606567382812, -206.32643127441406, -197.216796875, -188.10714721679688, -178.9975128173828, -169.8878631591797, -160.77822875976562, -151.6685791015625, -142.55894470214844, -133.44931030273438, -124.33966827392578, -115.23002624511719, -106.12039184570312, -97.0107421875, -87.90110778808594, -78.79146575927734, -69.68182373046875, -60.57218933105469, -51.462547302246094, -42.3529052734375, -33.24326705932617, -24.133625030517578, -15.023983001708984, -5.914344787597656, 3.1952972412109375, 12.304939270019531, 21.414581298828125, 30.524221420288086, 39.63386154174805, 48.74350357055664, 57.853145599365234, 66.96278381347656, 76.07242584228516, 85.18206787109375, 94.29170989990234, 103.40135192871094, 112.510986328125, 121.62063598632812, 130.7302703857422, 139.83990478515625, 148.94955444335938, 158.0592041015625, 167.16883850097656, 176.2784881591797, 185.38812255859375, 194.49777221679688, 203.60740661621094, 212.717041015625, 221.82669067382812, 230.9363250732422]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 12.0, 7.0, 11.0, 27.0, 36.0, 44.0, 41.0, 64.0, 100.0, 119.0, 132.0, 106.0, 79.0, 57.0, 43.0, 46.0, 30.0, 17.0, 18.0, 11.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.8934326171875, -101.80403900146484, -94.71464538574219, -87.62525939941406, -80.53585815429688, -73.44647216796875, -66.3570785522461, -59.26768493652344, -52.17829132080078, -45.088897705078125, -37.99950408935547, -30.910114288330078, -23.820720672607422, -16.731327056884766, -9.641937255859375, -2.5525436401367188, 4.5368499755859375, 11.626242637634277, 18.715635299682617, 25.80502700805664, 32.8944206237793, 39.98381423950195, 47.073204040527344, 54.16259765625, 61.251991271972656, 68.34138488769531, 75.43077850341797, 82.52017211914062, 89.60955810546875, 96.69895935058594, 103.78834533691406, 110.87773895263672, 117.96713256835938, 125.05652618408203, 132.1459197998047, 139.2353057861328, 146.32470703125, 153.41409301757812, 160.50347900390625, 167.59288024902344, 174.68228149414062, 181.77166748046875, 188.86106872558594, 195.95045471191406, 203.03985595703125, 210.12924194335938, 217.2186279296875, 224.3080291748047, 231.3974151611328, 238.48680114746094, 245.57620239257812, 252.66558837890625, 259.7549743652344, 266.8443908691406, 273.93377685546875, 281.0231628417969, 288.112548828125, 295.2019348144531, 302.29132080078125, 309.3807373046875, 316.4701232910156, 323.55950927734375, 330.6488952636719, 337.73828125, 344.82769775390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 7.0, 12.0, 16.0, 19.0, 22.0, 38.0, 60.0, 97.0, 171.0, 272.0, 473.0, 931.0, 1782.0, 4143.0, 10379.0, 32087.0, 149412.0, 1674794.0, 2082712.0, 185322.0, 33025.0, 10185.0, 3855.0, 1738.0, 969.0, 533.0, 364.0, 248.0, 139.0, 131.0, 90.0, 71.0, 36.0, 30.0, 31.0, 26.0, 18.0, 6.0, 13.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.4453125, -11.022216796875, -10.59912109375, -10.176025390625, -9.7529296875, -9.329833984375, -8.90673828125, -8.483642578125, -8.060546875, -7.637451171875, -7.21435546875, -6.791259765625, -6.3681640625, -5.945068359375, -5.52197265625, -5.098876953125, -4.67578125, -4.252685546875, -3.82958984375, -3.406494140625, -2.9833984375, -2.560302734375, -2.13720703125, -1.714111328125, -1.291015625, -0.867919921875, -0.44482421875, -0.021728515625, 0.4013671875, 0.824462890625, 1.24755859375, 1.670654296875, 2.09375, 2.516845703125, 2.93994140625, 3.363037109375, 3.7861328125, 4.209228515625, 4.63232421875, 5.055419921875, 5.478515625, 5.901611328125, 6.32470703125, 6.747802734375, 7.1708984375, 7.593994140625, 8.01708984375, 8.440185546875, 8.86328125, 9.286376953125, 9.70947265625, 10.132568359375, 10.5556640625, 10.978759765625, 11.40185546875, 11.824951171875, 12.248046875, 12.671142578125, 13.09423828125, 13.517333984375, 13.9404296875, 14.363525390625, 14.78662109375, 15.209716796875, 15.6328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 9.0, 7.0, 13.0, 18.0, 24.0, 31.0, 56.0, 78.0, 98.0, 96.0, 118.0, 90.0, 83.0, 95.0, 60.0, 44.0, 28.0, 33.0, 16.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -4.9764404296875, -4.554443359375, -4.1324462890625, -3.71044921875, -3.2884521484375, -2.866455078125, -2.4444580078125, -2.0224609375, -1.6004638671875, -1.178466796875, -0.7564697265625, -0.33447265625, 0.0875244140625, 0.509521484375, 0.9315185546875, 1.353515625, 1.7755126953125, 2.197509765625, 2.6195068359375, 3.04150390625, 3.4635009765625, 3.885498046875, 4.3074951171875, 4.7294921875, 5.1514892578125, 5.573486328125, 5.9954833984375, 6.41748046875, 6.8394775390625, 7.261474609375, 7.6834716796875, 8.10546875, 8.5274658203125, 8.949462890625, 9.3714599609375, 9.79345703125, 10.2154541015625, 10.637451171875, 11.0594482421875, 11.4814453125, 11.9034423828125, 12.325439453125, 12.7474365234375, 13.16943359375, 13.5914306640625, 14.013427734375, 14.4354248046875, 14.857421875, 15.2794189453125, 15.701416015625, 16.1234130859375, 16.54541015625, 16.9674072265625, 17.389404296875, 17.8114013671875, 18.2333984375, 18.6553955078125, 19.077392578125, 19.4993896484375, 19.92138671875, 20.3433837890625, 20.765380859375, 21.1873779296875, 21.609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 15.0, 18.0, 24.0, 44.0, 55.0, 110.0, 189.0, 330.0, 666.0, 1602.0, 4994.0, 20181.0, 128784.0, 2821410.0, 1123450.0, 72054.0, 13926.0, 3744.0, 1387.0, 579.0, 297.0, 142.0, 84.0, 70.0, 39.0, 21.0, 24.0, 8.0, 10.0, 13.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.75, -21.021728515625, -20.29345703125, -19.565185546875, -18.8369140625, -18.108642578125, -17.38037109375, -16.652099609375, -15.923828125, -15.195556640625, -14.46728515625, -13.739013671875, -13.0107421875, -12.282470703125, -11.55419921875, -10.825927734375, -10.09765625, -9.369384765625, -8.64111328125, -7.912841796875, -7.1845703125, -6.456298828125, -5.72802734375, -4.999755859375, -4.271484375, -3.543212890625, -2.81494140625, -2.086669921875, -1.3583984375, -0.630126953125, 0.09814453125, 0.826416015625, 1.5546875, 2.282958984375, 3.01123046875, 3.739501953125, 4.4677734375, 5.196044921875, 5.92431640625, 6.652587890625, 7.380859375, 8.109130859375, 8.83740234375, 9.565673828125, 10.2939453125, 11.022216796875, 11.75048828125, 12.478759765625, 13.20703125, 13.935302734375, 14.66357421875, 15.391845703125, 16.1201171875, 16.848388671875, 17.57666015625, 18.304931640625, 19.033203125, 19.761474609375, 20.48974609375, 21.218017578125, 21.9462890625, 22.674560546875, 23.40283203125, 24.131103515625, 24.859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 7.0, 5.0, 9.0, 16.0, 20.0, 26.0, 45.0, 58.0, 82.0, 151.0, 222.0, 368.0, 635.0, 887.0, 611.0, 360.0, 195.0, 116.0, 79.0, 48.0, 40.0, 28.0, 16.0, 15.0, 5.0, 4.0, 10.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.609375, -24.885986328125, -24.16259765625, -23.439208984375, -22.7158203125, -21.992431640625, -21.26904296875, -20.545654296875, -19.822265625, -19.098876953125, -18.37548828125, -17.652099609375, -16.9287109375, -16.205322265625, -15.48193359375, -14.758544921875, -14.03515625, -13.311767578125, -12.58837890625, -11.864990234375, -11.1416015625, -10.418212890625, -9.69482421875, -8.971435546875, -8.248046875, -7.524658203125, -6.80126953125, -6.077880859375, -5.3544921875, -4.631103515625, -3.90771484375, -3.184326171875, -2.4609375, -1.737548828125, -1.01416015625, -0.290771484375, 0.4326171875, 1.156005859375, 1.87939453125, 2.602783203125, 3.326171875, 4.049560546875, 4.77294921875, 5.496337890625, 6.2197265625, 6.943115234375, 7.66650390625, 8.389892578125, 9.11328125, 9.836669921875, 10.56005859375, 11.283447265625, 12.0068359375, 12.730224609375, 13.45361328125, 14.177001953125, 14.900390625, 15.623779296875, 16.34716796875, 17.070556640625, 17.7939453125, 18.517333984375, 19.24072265625, 19.964111328125, 20.6875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 8.0, 17.0, 60.0, 278.0, 388.0, 184.0, 39.0, 15.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-324.2515869140625, -309.0975341796875, -293.9434814453125, -278.7894287109375, -263.6353759765625, -248.4813232421875, -233.32728576660156, -218.17323303222656, -203.01918029785156, -187.86512756347656, -172.71107482910156, -157.55703735351562, -142.40298461914062, -127.2489242553711, -112.09487915039062, -96.94082641601562, -81.78677368164062, -66.63272094726562, -51.47867202758789, -36.324623107910156, -21.170570373535156, -6.016517639160156, 9.137527465820312, 24.291580200195312, 39.44563293457031, 54.59968566894531, 69.75373840332031, 84.90778350830078, 100.06183624267578, 115.21588897705078, 130.36993408203125, 145.52398681640625, 160.67803955078125, 175.83209228515625, 190.98614501953125, 206.14019775390625, 221.29425048828125, 236.44830322265625, 251.6023406982422, 266.75640869140625, 281.91046142578125, 297.06451416015625, 312.21856689453125, 327.37261962890625, 342.52667236328125, 357.68072509765625, 372.83477783203125, 387.98883056640625, 403.1428527832031, 418.2969055175781, 433.4509582519531, 448.6050109863281, 463.7590637207031, 478.9131164550781, 494.067138671875, 509.22119140625, 524.375244140625, 539.529296875, 554.683349609375, 569.83740234375, 584.991455078125, 600.1455078125, 615.299560546875, 630.45361328125, 645.607666015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 1.0, 11.0, 4.0, 11.0, 3.0, 21.0, 23.0, 37.0, 33.0, 41.0, 43.0, 47.0, 63.0, 67.0, 66.0, 71.0, 75.0, 64.0, 77.0, 54.0, 45.0, 41.0, 37.0, 16.0, 18.0, 14.0, 9.0, 6.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.87799072265625, -136.82595825195312, -132.77392578125, -128.72190856933594, -124.66987609863281, -120.61784362792969, -116.56581115722656, -112.51377868652344, -108.46175384521484, -104.40972137451172, -100.35769653320312, -96.3056640625, -92.25363159179688, -88.20160675048828, -84.14957427978516, -80.09754943847656, -76.04551696777344, -71.99348449707031, -67.94145965576172, -63.889427185058594, -59.837398529052734, -55.785369873046875, -51.73333740234375, -47.68130874633789, -43.62928009033203, -39.57725143432617, -35.52522277832031, -31.473190307617188, -27.421161651611328, -23.36913299560547, -19.317102432250977, -15.265071868896484, -11.213058471679688, -7.161028861999512, -3.108999252319336, 0.9430303573608398, 4.995059967041016, 9.047088623046875, 13.099119186401367, 17.15114974975586, 21.20317840576172, 25.255207061767578, 29.30723762512207, 33.35926818847656, 37.41129684448242, 41.46332550048828, 45.515357971191406, 49.567386627197266, 53.619415283203125, 57.671443939208984, 61.723472595214844, 65.77550506591797, 69.82752990722656, 73.87956237792969, 77.93159484863281, 81.98362731933594, 86.03565216064453, 90.08768463134766, 94.13970947265625, 98.19174194335938, 102.2437744140625, 106.2957992553711, 110.34783172607422, 114.39985656738281, 118.45188903808594]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 3.0, 5.0, 15.0, 16.0, 21.0, 21.0, 28.0, 52.0, 74.0, 126.0, 180.0, 261.0, 432.0, 737.0, 1216.0, 2246.0, 4022.0, 7798.0, 15430.0, 31445.0, 67071.0, 155921.0, 337894.0, 237668.0, 97155.0, 44030.0, 21348.0, 10786.0, 5532.0, 2946.0, 1597.0, 957.0, 567.0, 342.0, 202.0, 129.0, 78.0, 69.0, 45.0, 30.0, 11.0, 19.0, 10.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.59375, -10.2374267578125, -9.881103515625, -9.5247802734375, -9.16845703125, -8.8121337890625, -8.455810546875, -8.0994873046875, -7.7431640625, -7.3868408203125, -7.030517578125, -6.6741943359375, -6.31787109375, -5.9615478515625, -5.605224609375, -5.2489013671875, -4.892578125, -4.5362548828125, -4.179931640625, -3.8236083984375, -3.46728515625, -3.1109619140625, -2.754638671875, -2.3983154296875, -2.0419921875, -1.6856689453125, -1.329345703125, -0.9730224609375, -0.61669921875, -0.2603759765625, 0.095947265625, 0.4522705078125, 0.80859375, 1.1649169921875, 1.521240234375, 1.8775634765625, 2.23388671875, 2.5902099609375, 2.946533203125, 3.3028564453125, 3.6591796875, 4.0155029296875, 4.371826171875, 4.7281494140625, 5.08447265625, 5.4407958984375, 5.797119140625, 6.1534423828125, 6.509765625, 6.8660888671875, 7.222412109375, 7.5787353515625, 7.93505859375, 8.2913818359375, 8.647705078125, 9.0040283203125, 9.3603515625, 9.7166748046875, 10.072998046875, 10.4293212890625, 10.78564453125, 11.1419677734375, 11.498291015625, 11.8546142578125, 12.2109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 3.0, 10.0, 7.0, 11.0, 16.0, 26.0, 20.0, 34.0, 22.0, 28.0, 33.0, 56.0, 41.0, 48.0, 61.0, 50.0, 52.0, 60.0, 54.0, 56.0, 39.0, 41.0, 40.0, 40.0, 34.0, 35.0, 15.0, 17.0, 13.0, 10.0, 13.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.078125, -7.84283447265625, -7.6075439453125, -7.37225341796875, -7.136962890625, -6.90167236328125, -6.6663818359375, -6.43109130859375, -6.19580078125, -5.96051025390625, -5.7252197265625, -5.48992919921875, -5.254638671875, -5.01934814453125, -4.7840576171875, -4.54876708984375, -4.3134765625, -4.07818603515625, -3.8428955078125, -3.60760498046875, -3.372314453125, -3.13702392578125, -2.9017333984375, -2.66644287109375, -2.43115234375, -2.19586181640625, -1.9605712890625, -1.72528076171875, -1.489990234375, -1.25469970703125, -1.0194091796875, -0.78411865234375, -0.548828125, -0.31353759765625, -0.0782470703125, 0.15704345703125, 0.392333984375, 0.62762451171875, 0.8629150390625, 1.09820556640625, 1.33349609375, 1.56878662109375, 1.8040771484375, 2.03936767578125, 2.274658203125, 2.50994873046875, 2.7452392578125, 2.98052978515625, 3.2158203125, 3.45111083984375, 3.6864013671875, 3.92169189453125, 4.156982421875, 4.39227294921875, 4.6275634765625, 4.86285400390625, 5.09814453125, 5.33343505859375, 5.5687255859375, 5.80401611328125, 6.039306640625, 6.27459716796875, 6.5098876953125, 6.74517822265625, 6.98046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 7.0, 15.0, 11.0, 10.0, 14.0, 23.0, 28.0, 44.0, 61.0, 64.0, 104.0, 126.0, 176.0, 252.0, 328.0, 479.0, 668.0, 961.0, 1507.0, 2530.0, 4837.0, 11402.0, 37371.0, 168863.0, 643023.0, 125025.0, 29805.0, 9608.0, 4298.0, 2220.0, 1471.0, 911.0, 623.0, 465.0, 329.0, 211.0, 153.0, 115.0, 95.0, 73.0, 63.0, 38.0, 28.0, 31.0, 22.0, 12.0, 14.0, 9.0, 6.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0], "bins": [-18.3125, -17.66796875, -17.0234375, -16.37890625, -15.734375, -15.08984375, -14.4453125, -13.80078125, -13.15625, -12.51171875, -11.8671875, -11.22265625, -10.578125, -9.93359375, -9.2890625, -8.64453125, -8.0, -7.35546875, -6.7109375, -6.06640625, -5.421875, -4.77734375, -4.1328125, -3.48828125, -2.84375, -2.19921875, -1.5546875, -0.91015625, -0.265625, 0.37890625, 1.0234375, 1.66796875, 2.3125, 2.95703125, 3.6015625, 4.24609375, 4.890625, 5.53515625, 6.1796875, 6.82421875, 7.46875, 8.11328125, 8.7578125, 9.40234375, 10.046875, 10.69140625, 11.3359375, 11.98046875, 12.625, 13.26953125, 13.9140625, 14.55859375, 15.203125, 15.84765625, 16.4921875, 17.13671875, 17.78125, 18.42578125, 19.0703125, 19.71484375, 20.359375, 21.00390625, 21.6484375, 22.29296875, 22.9375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 4.0, 8.0, 4.0, 11.0, 5.0, 13.0, 14.0, 10.0, 24.0, 25.0, 31.0, 33.0, 35.0, 36.0, 38.0, 37.0, 51.0, 44.0, 48.0, 32.0, 56.0, 39.0, 39.0, 41.0, 40.0, 31.0, 31.0, 36.0, 19.0, 18.0, 25.0, 18.0, 17.0, 18.0, 11.0, 14.0, 7.0, 8.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.734375, -23.89404296875, -23.0537109375, -22.21337890625, -21.373046875, -20.53271484375, -19.6923828125, -18.85205078125, -18.01171875, -17.17138671875, -16.3310546875, -15.49072265625, -14.650390625, -13.81005859375, -12.9697265625, -12.12939453125, -11.2890625, -10.44873046875, -9.6083984375, -8.76806640625, -7.927734375, -7.08740234375, -6.2470703125, -5.40673828125, -4.56640625, -3.72607421875, -2.8857421875, -2.04541015625, -1.205078125, -0.36474609375, 0.4755859375, 1.31591796875, 2.15625, 2.99658203125, 3.8369140625, 4.67724609375, 5.517578125, 6.35791015625, 7.1982421875, 8.03857421875, 8.87890625, 9.71923828125, 10.5595703125, 11.39990234375, 12.240234375, 13.08056640625, 13.9208984375, 14.76123046875, 15.6015625, 16.44189453125, 17.2822265625, 18.12255859375, 18.962890625, 19.80322265625, 20.6435546875, 21.48388671875, 22.32421875, 23.16455078125, 24.0048828125, 24.84521484375, 25.685546875, 26.52587890625, 27.3662109375, 28.20654296875, 29.046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 3.0, 5.0, 11.0, 17.0, 15.0, 24.0, 46.0, 74.0, 106.0, 164.0, 310.0, 637.0, 1684.0, 5201.0, 23015.0, 163452.0, 754732.0, 79470.0, 13687.0, 3489.0, 1179.0, 550.0, 256.0, 148.0, 89.0, 62.0, 43.0, 24.0, 14.0, 15.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.140625, -13.7164306640625, -13.292236328125, -12.8680419921875, -12.44384765625, -12.0196533203125, -11.595458984375, -11.1712646484375, -10.7470703125, -10.3228759765625, -9.898681640625, -9.4744873046875, -9.05029296875, -8.6260986328125, -8.201904296875, -7.7777099609375, -7.353515625, -6.9293212890625, -6.505126953125, -6.0809326171875, -5.65673828125, -5.2325439453125, -4.808349609375, -4.3841552734375, -3.9599609375, -3.5357666015625, -3.111572265625, -2.6873779296875, -2.26318359375, -1.8389892578125, -1.414794921875, -0.9906005859375, -0.56640625, -0.1422119140625, 0.281982421875, 0.7061767578125, 1.13037109375, 1.5545654296875, 1.978759765625, 2.4029541015625, 2.8271484375, 3.2513427734375, 3.675537109375, 4.0997314453125, 4.52392578125, 4.9481201171875, 5.372314453125, 5.7965087890625, 6.220703125, 6.6448974609375, 7.069091796875, 7.4932861328125, 7.91748046875, 8.3416748046875, 8.765869140625, 9.1900634765625, 9.6142578125, 10.0384521484375, 10.462646484375, 10.8868408203125, 11.31103515625, 11.7352294921875, 12.159423828125, 12.5836181640625, 13.0078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 3.0, 8.0, 14.0, 17.0, 33.0, 52.0, 60.0, 111.0, 207.0, 170.0, 93.0, 63.0, 43.0, 38.0, 21.0, 13.0, 16.0, 12.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00588226318359375, -0.005734622478485107, -0.005586981773376465, -0.005439341068267822, -0.00529170036315918, -0.005144059658050537, -0.0049964189529418945, -0.004848778247833252, -0.004701137542724609, -0.004553496837615967, -0.004405856132507324, -0.004258215427398682, -0.004110574722290039, -0.0039629340171813965, -0.003815293312072754, -0.0036676526069641113, -0.0035200119018554688, -0.003372371196746826, -0.0032247304916381836, -0.003077089786529541, -0.0029294490814208984, -0.002781808376312256, -0.0026341676712036133, -0.0024865269660949707, -0.002338886260986328, -0.0021912455558776855, -0.002043604850769043, -0.0018959641456604004, -0.0017483234405517578, -0.0016006827354431152, -0.0014530420303344727, -0.00130540132522583, -0.0011577606201171875, -0.001010119915008545, -0.0008624792098999023, -0.0007148385047912598, -0.0005671977996826172, -0.0004195570945739746, -0.00027191638946533203, -0.00012427568435668945, 2.3365020751953125e-05, 0.0001710057258605957, 0.0003186464309692383, 0.00046628713607788086, 0.0006139278411865234, 0.000761568546295166, 0.0009092092514038086, 0.0010568499565124512, 0.0012044906616210938, 0.0013521313667297363, 0.001499772071838379, 0.0016474127769470215, 0.001795053482055664, 0.0019426941871643066, 0.0020903348922729492, 0.002237975597381592, 0.0023856163024902344, 0.002533257007598877, 0.0026808977127075195, 0.002828538417816162, 0.0029761791229248047, 0.0031238198280334473, 0.00327146053314209, 0.0034191012382507324, 0.003566741943359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 4.0, 4.0, 11.0, 7.0, 11.0, 10.0, 15.0, 15.0, 48.0, 36.0, 68.0, 123.0, 184.0, 386.0, 676.0, 1482.0, 3330.0, 8685.0, 29345.0, 172808.0, 713412.0, 88010.0, 18605.0, 6327.0, 2448.0, 1116.0, 605.0, 290.0, 168.0, 107.0, 70.0, 36.0, 28.0, 22.0, 11.0, 16.0, 10.0, 9.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.609375, -11.213623046875, -10.81787109375, -10.422119140625, -10.0263671875, -9.630615234375, -9.23486328125, -8.839111328125, -8.443359375, -8.047607421875, -7.65185546875, -7.256103515625, -6.8603515625, -6.464599609375, -6.06884765625, -5.673095703125, -5.27734375, -4.881591796875, -4.48583984375, -4.090087890625, -3.6943359375, -3.298583984375, -2.90283203125, -2.507080078125, -2.111328125, -1.715576171875, -1.31982421875, -0.924072265625, -0.5283203125, -0.132568359375, 0.26318359375, 0.658935546875, 1.0546875, 1.450439453125, 1.84619140625, 2.241943359375, 2.6376953125, 3.033447265625, 3.42919921875, 3.824951171875, 4.220703125, 4.616455078125, 5.01220703125, 5.407958984375, 5.8037109375, 6.199462890625, 6.59521484375, 6.990966796875, 7.38671875, 7.782470703125, 8.17822265625, 8.573974609375, 8.9697265625, 9.365478515625, 9.76123046875, 10.156982421875, 10.552734375, 10.948486328125, 11.34423828125, 11.739990234375, 12.1357421875, 12.531494140625, 12.92724609375, 13.322998046875, 13.71875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 11.0, 12.0, 16.0, 6.0, 22.0, 31.0, 22.0, 35.0, 57.0, 71.0, 72.0, 101.0, 122.0, 101.0, 60.0, 53.0, 48.0, 28.0, 23.0, 17.0, 14.0, 14.0, 6.0, 8.0, 13.0, 4.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.272216796875, -9.91943359375, -9.566650390625, -9.2138671875, -8.861083984375, -8.50830078125, -8.155517578125, -7.802734375, -7.449951171875, -7.09716796875, -6.744384765625, -6.3916015625, -6.038818359375, -5.68603515625, -5.333251953125, -4.98046875, -4.627685546875, -4.27490234375, -3.922119140625, -3.5693359375, -3.216552734375, -2.86376953125, -2.510986328125, -2.158203125, -1.805419921875, -1.45263671875, -1.099853515625, -0.7470703125, -0.394287109375, -0.04150390625, 0.311279296875, 0.6640625, 1.016845703125, 1.36962890625, 1.722412109375, 2.0751953125, 2.427978515625, 2.78076171875, 3.133544921875, 3.486328125, 3.839111328125, 4.19189453125, 4.544677734375, 4.8974609375, 5.250244140625, 5.60302734375, 5.955810546875, 6.30859375, 6.661376953125, 7.01416015625, 7.366943359375, 7.7197265625, 8.072509765625, 8.42529296875, 8.778076171875, 9.130859375, 9.483642578125, 9.83642578125, 10.189208984375, 10.5419921875, 10.894775390625, 11.24755859375, 11.600341796875, 11.953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 11.0, 22.0, 52.0, 146.0, 275.0, 247.0, 133.0, 49.0, 22.0, 12.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.92996215820312, -241.960205078125, -232.99044799804688, -224.02069091796875, -215.05093383789062, -206.0811767578125, -197.1114044189453, -188.1416473388672, -179.17189025878906, -170.20213317871094, -161.2323760986328, -152.2626190185547, -143.2928466796875, -134.32308959960938, -125.35333251953125, -116.38357543945312, -107.413818359375, -98.44406127929688, -89.47430419921875, -80.5045394897461, -71.53478240966797, -62.565025329589844, -53.59526443481445, -44.62550354003906, -35.65574645996094, -26.68598747253418, -17.716228485107422, -8.746469497680664, 0.22328948974609375, 9.193046569824219, 18.16280746459961, 27.132568359375, 36.10235595703125, 45.072113037109375, 54.041873931884766, 63.011634826660156, 71.98139190673828, 80.9511489868164, 89.92091369628906, 98.89067077636719, 107.86042785644531, 116.83018493652344, 125.79994201660156, 134.7696990966797, 143.73947143554688, 152.709228515625, 161.67898559570312, 170.64874267578125, 179.61849975585938, 188.5882568359375, 197.55801391601562, 206.52777099609375, 215.49752807617188, 224.46728515625, 233.4370574951172, 242.4068145751953, 251.37657165527344, 260.3463439941406, 269.31610107421875, 278.2858581542969, 287.255615234375, 296.2253723144531, 305.19512939453125, 314.1648864746094, 323.1346435546875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 8.0, 14.0, 22.0, 13.0, 19.0, 20.0, 28.0, 22.0, 22.0, 32.0, 29.0, 36.0, 41.0, 59.0, 50.0, 72.0, 56.0, 41.0, 25.0, 52.0, 38.0, 34.0, 19.0, 39.0, 27.0, 20.0, 20.0, 24.0, 13.0, 12.0, 14.0, 12.0, 11.0, 6.0, 6.0, 4.0, 2.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-95.28793334960938, -92.28878021240234, -89.28962707519531, -86.29048156738281, -83.29132843017578, -80.29217529296875, -77.29302215576172, -74.29386901855469, -71.29472351074219, -68.29557037353516, -65.29641723632812, -62.29726791381836, -59.298118591308594, -56.29896545410156, -53.29981231689453, -50.3006591796875, -47.30150604248047, -44.30235290527344, -41.30320358276367, -38.30405044555664, -35.304901123046875, -32.305747985839844, -29.306594848632812, -26.307443618774414, -23.308292388916016, -20.309141159057617, -17.30998992919922, -14.310836791992188, -11.311685562133789, -8.31253433227539, -5.313381195068359, -2.314229965209961, 0.6849212646484375, 3.684072971343994, 6.683224678039551, 9.682376861572266, 12.681528091430664, 15.680679321289062, 18.679832458496094, 21.678983688354492, 24.67813491821289, 27.67728614807129, 30.676437377929688, 33.67559051513672, 36.67474365234375, 39.673892974853516, 42.67304611206055, 45.67219543457031, 48.671348571777344, 51.670501708984375, 54.66965103149414, 57.66880416870117, 60.66795349121094, 63.66710662841797, 66.666259765625, 69.66541290283203, 72.66456604003906, 75.6637191772461, 78.66287231445312, 81.66201782226562, 84.66117095947266, 87.66032409667969, 90.65947723388672, 93.65863037109375, 96.65777587890625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 13.0, 15.0, 21.0, 31.0, 58.0, 95.0, 186.0, 382.0, 774.0, 1655.0, 4216.0, 13910.0, 84568.0, 2537779.0, 1478428.0, 55027.0, 10386.0, 3442.0, 1472.0, 722.0, 397.0, 233.0, 144.0, 96.0, 61.0, 57.0, 37.0, 19.0, 17.0, 17.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-23.953125, -23.26708984375, -22.5810546875, -21.89501953125, -21.208984375, -20.52294921875, -19.8369140625, -19.15087890625, -18.46484375, -17.77880859375, -17.0927734375, -16.40673828125, -15.720703125, -15.03466796875, -14.3486328125, -13.66259765625, -12.9765625, -12.29052734375, -11.6044921875, -10.91845703125, -10.232421875, -9.54638671875, -8.8603515625, -8.17431640625, -7.48828125, -6.80224609375, -6.1162109375, -5.43017578125, -4.744140625, -4.05810546875, -3.3720703125, -2.68603515625, -2.0, -1.31396484375, -0.6279296875, 0.05810546875, 0.744140625, 1.43017578125, 2.1162109375, 2.80224609375, 3.48828125, 4.17431640625, 4.8603515625, 5.54638671875, 6.232421875, 6.91845703125, 7.6044921875, 8.29052734375, 8.9765625, 9.66259765625, 10.3486328125, 11.03466796875, 11.720703125, 12.40673828125, 13.0927734375, 13.77880859375, 14.46484375, 15.15087890625, 15.8369140625, 16.52294921875, 17.208984375, 17.89501953125, 18.5810546875, 19.26708984375, 19.953125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 7.0, 10.0, 6.0, 9.0, 19.0, 10.0, 26.0, 28.0, 23.0, 35.0, 33.0, 51.0, 41.0, 50.0, 49.0, 47.0, 48.0, 42.0, 51.0, 47.0, 57.0, 32.0, 29.0, 32.0, 32.0, 27.0, 30.0, 28.0, 17.0, 15.0, 17.0, 11.0, 10.0, 10.0, 2.0, 7.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.61431884765625, -6.4083251953125, -6.20233154296875, -5.996337890625, -5.79034423828125, -5.5843505859375, -5.37835693359375, -5.17236328125, -4.96636962890625, -4.7603759765625, -4.55438232421875, -4.348388671875, -4.14239501953125, -3.9364013671875, -3.73040771484375, -3.5244140625, -3.31842041015625, -3.1124267578125, -2.90643310546875, -2.700439453125, -2.49444580078125, -2.2884521484375, -2.08245849609375, -1.87646484375, -1.67047119140625, -1.4644775390625, -1.25848388671875, -1.052490234375, -0.84649658203125, -0.6405029296875, -0.43450927734375, -0.228515625, -0.02252197265625, 0.1834716796875, 0.38946533203125, 0.595458984375, 0.80145263671875, 1.0074462890625, 1.21343994140625, 1.41943359375, 1.62542724609375, 1.8314208984375, 2.03741455078125, 2.243408203125, 2.44940185546875, 2.6553955078125, 2.86138916015625, 3.0673828125, 3.27337646484375, 3.4793701171875, 3.68536376953125, 3.891357421875, 4.09735107421875, 4.3033447265625, 4.50933837890625, 4.71533203125, 4.92132568359375, 5.1273193359375, 5.33331298828125, 5.539306640625, 5.74530029296875, 5.9512939453125, 6.15728759765625, 6.36328125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 15.0, 15.0, 19.0, 23.0, 42.0, 66.0, 78.0, 157.0, 287.0, 538.0, 1033.0, 2413.0, 6349.0, 21339.0, 110078.0, 2089277.0, 1828988.0, 103764.0, 20088.0, 5736.0, 2083.0, 871.0, 407.0, 230.0, 129.0, 90.0, 45.0, 32.0, 31.0, 18.0, 11.0, 11.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.8212890625, -16.173828125, -15.5263671875, -14.87890625, -14.2314453125, -13.583984375, -12.9365234375, -12.2890625, -11.6416015625, -10.994140625, -10.3466796875, -9.69921875, -9.0517578125, -8.404296875, -7.7568359375, -7.109375, -6.4619140625, -5.814453125, -5.1669921875, -4.51953125, -3.8720703125, -3.224609375, -2.5771484375, -1.9296875, -1.2822265625, -0.634765625, 0.0126953125, 0.66015625, 1.3076171875, 1.955078125, 2.6025390625, 3.25, 3.8974609375, 4.544921875, 5.1923828125, 5.83984375, 6.4873046875, 7.134765625, 7.7822265625, 8.4296875, 9.0771484375, 9.724609375, 10.3720703125, 11.01953125, 11.6669921875, 12.314453125, 12.9619140625, 13.609375, 14.2568359375, 14.904296875, 15.5517578125, 16.19921875, 16.8466796875, 17.494140625, 18.1416015625, 18.7890625, 19.4365234375, 20.083984375, 20.7314453125, 21.37890625, 22.0263671875, 22.673828125, 23.3212890625, 23.96875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 6.0, 4.0, 4.0, 4.0, 2.0, 5.0, 7.0, 10.0, 15.0, 15.0, 14.0, 25.0, 41.0, 42.0, 86.0, 83.0, 169.0, 252.0, 373.0, 568.0, 694.0, 558.0, 361.0, 232.0, 128.0, 78.0, 76.0, 54.0, 44.0, 29.0, 26.0, 16.0, 13.0, 11.0, 7.0, 7.0, 8.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.278564453125, -16.72900390625, -16.179443359375, -15.6298828125, -15.080322265625, -14.53076171875, -13.981201171875, -13.431640625, -12.882080078125, -12.33251953125, -11.782958984375, -11.2333984375, -10.683837890625, -10.13427734375, -9.584716796875, -9.03515625, -8.485595703125, -7.93603515625, -7.386474609375, -6.8369140625, -6.287353515625, -5.73779296875, -5.188232421875, -4.638671875, -4.089111328125, -3.53955078125, -2.989990234375, -2.4404296875, -1.890869140625, -1.34130859375, -0.791748046875, -0.2421875, 0.307373046875, 0.85693359375, 1.406494140625, 1.9560546875, 2.505615234375, 3.05517578125, 3.604736328125, 4.154296875, 4.703857421875, 5.25341796875, 5.802978515625, 6.3525390625, 6.902099609375, 7.45166015625, 8.001220703125, 8.55078125, 9.100341796875, 9.64990234375, 10.199462890625, 10.7490234375, 11.298583984375, 11.84814453125, 12.397705078125, 12.947265625, 13.496826171875, 14.04638671875, 14.595947265625, 15.1455078125, 15.695068359375, 16.24462890625, 16.794189453125, 17.34375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 1.0, 3.0, 7.0, 16.0, 24.0, 47.0, 106.0, 210.0, 279.0, 167.0, 71.0, 40.0, 10.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-316.7023010253906, -307.9582214355469, -299.2141418457031, -290.4700622558594, -281.7259826660156, -272.9819030761719, -264.2378234863281, -255.49374389648438, -246.74966430664062, -238.00558471679688, -229.26150512695312, -220.51742553710938, -211.77334594726562, -203.02926635742188, -194.28518676757812, -185.54110717773438, -176.7970428466797, -168.05296325683594, -159.3088836669922, -150.56480407714844, -141.8207244873047, -133.07664489746094, -124.33257293701172, -115.58849334716797, -106.84441375732422, -98.10033416748047, -89.35625457763672, -80.6121826171875, -71.86810302734375, -63.124019622802734, -54.37994384765625, -45.6358642578125, -36.89178466796875, -28.147705078125, -19.403627395629883, -10.659549713134766, -1.9154701232910156, 6.828609466552734, 15.572685241699219, 24.31676483154297, 33.06084442138672, 41.80492401123047, 50.54900360107422, 59.2930793762207, 68.03715515136719, 76.78123474121094, 85.52531433105469, 94.26939392089844, 103.01347351074219, 111.75755310058594, 120.50163269042969, 129.24571228027344, 137.9897918701172, 146.73387145996094, 155.47793579101562, 164.22201538085938, 172.96609497070312, 181.71017456054688, 190.45425415039062, 199.19833374023438, 207.94241333007812, 216.68649291992188, 225.43057250976562, 234.17465209960938, 242.91873168945312]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 6.0, 15.0, 14.0, 13.0, 8.0, 18.0, 21.0, 20.0, 18.0, 21.0, 29.0, 50.0, 59.0, 42.0, 48.0, 50.0, 49.0, 56.0, 55.0, 56.0, 39.0, 48.0, 34.0, 31.0, 27.0, 20.0, 25.0, 21.0, 19.0, 22.0, 18.0, 9.0, 6.0, 9.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.36774444580078, -70.4909896850586, -67.61422729492188, -64.73747253417969, -61.8607177734375, -58.98396301269531, -56.10720443725586, -53.230445861816406, -50.35369110107422, -47.47693634033203, -44.60017776489258, -41.723419189453125, -38.84666442871094, -35.96990966796875, -33.0931510925293, -30.216394424438477, -27.339637756347656, -24.462881088256836, -21.586124420166016, -18.709367752075195, -15.832611083984375, -12.955854415893555, -10.079097747802734, -7.202341079711914, -4.325584411621094, -1.4488277435302734, 1.4279289245605469, 4.304685592651367, 7.1814422607421875, 10.058198928833008, 12.934955596923828, 15.811712265014648, 18.68846893310547, 21.56522560119629, 24.44198226928711, 27.31873893737793, 30.19549560546875, 33.07225036621094, 35.94900894165039, 38.825767517089844, 41.70252227783203, 44.57927703857422, 47.45603561401367, 50.332794189453125, 53.20954895019531, 56.0863037109375, 58.96306228637695, 61.839820861816406, 64.7165756225586, 67.59333038330078, 70.4700927734375, 73.34684753417969, 76.22360229492188, 79.10035705566406, 81.97711181640625, 84.85387420654297, 87.73062896728516, 90.60738372802734, 93.48414611816406, 96.36090087890625, 99.23765563964844, 102.11441040039062, 104.99116516113281, 107.86792755126953, 110.74468231201172]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 9.0, 18.0, 19.0, 27.0, 36.0, 66.0, 105.0, 123.0, 205.0, 280.0, 433.0, 711.0, 1145.0, 2044.0, 3719.0, 7606.0, 16236.0, 40755.0, 124650.0, 412762.0, 297799.0, 84000.0, 29846.0, 12484.0, 5861.0, 3128.0, 1728.0, 1003.0, 591.0, 397.0, 218.0, 170.0, 105.0, 87.0, 52.0, 26.0, 26.0, 22.0, 12.0, 20.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.90625, -13.440185546875, -12.97412109375, -12.508056640625, -12.0419921875, -11.575927734375, -11.10986328125, -10.643798828125, -10.177734375, -9.711669921875, -9.24560546875, -8.779541015625, -8.3134765625, -7.847412109375, -7.38134765625, -6.915283203125, -6.44921875, -5.983154296875, -5.51708984375, -5.051025390625, -4.5849609375, -4.118896484375, -3.65283203125, -3.186767578125, -2.720703125, -2.254638671875, -1.78857421875, -1.322509765625, -0.8564453125, -0.390380859375, 0.07568359375, 0.541748046875, 1.0078125, 1.473876953125, 1.93994140625, 2.406005859375, 2.8720703125, 3.338134765625, 3.80419921875, 4.270263671875, 4.736328125, 5.202392578125, 5.66845703125, 6.134521484375, 6.6005859375, 7.066650390625, 7.53271484375, 7.998779296875, 8.46484375, 8.930908203125, 9.39697265625, 9.863037109375, 10.3291015625, 10.795166015625, 11.26123046875, 11.727294921875, 12.193359375, 12.659423828125, 13.12548828125, 13.591552734375, 14.0576171875, 14.523681640625, 14.98974609375, 15.455810546875, 15.921875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 5.0, 7.0, 6.0, 11.0, 13.0, 20.0, 28.0, 23.0, 26.0, 40.0, 33.0, 44.0, 44.0, 48.0, 46.0, 53.0, 53.0, 47.0, 48.0, 49.0, 55.0, 41.0, 42.0, 34.0, 43.0, 15.0, 23.0, 14.0, 11.0, 13.0, 16.0, 9.0, 5.0, 10.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.96484375, -7.74896240234375, -7.5330810546875, -7.31719970703125, -7.101318359375, -6.88543701171875, -6.6695556640625, -6.45367431640625, -6.23779296875, -6.02191162109375, -5.8060302734375, -5.59014892578125, -5.374267578125, -5.15838623046875, -4.9425048828125, -4.72662353515625, -4.5107421875, -4.29486083984375, -4.0789794921875, -3.86309814453125, -3.647216796875, -3.43133544921875, -3.2154541015625, -2.99957275390625, -2.78369140625, -2.56781005859375, -2.3519287109375, -2.13604736328125, -1.920166015625, -1.70428466796875, -1.4884033203125, -1.27252197265625, -1.056640625, -0.84075927734375, -0.6248779296875, -0.40899658203125, -0.193115234375, 0.02276611328125, 0.2386474609375, 0.45452880859375, 0.67041015625, 0.88629150390625, 1.1021728515625, 1.31805419921875, 1.533935546875, 1.74981689453125, 1.9656982421875, 2.18157958984375, 2.3974609375, 2.61334228515625, 2.8292236328125, 3.04510498046875, 3.260986328125, 3.47686767578125, 3.6927490234375, 3.90863037109375, 4.12451171875, 4.34039306640625, 4.5562744140625, 4.77215576171875, 4.988037109375, 5.20391845703125, 5.4197998046875, 5.63568115234375, 5.8515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 7.0, 30.0, 26.0, 40.0, 43.0, 74.0, 114.0, 152.0, 217.0, 349.0, 562.0, 1002.0, 1903.0, 4724.0, 15409.0, 81011.0, 752393.0, 154999.0, 23563.0, 6412.0, 2464.0, 1169.0, 666.0, 390.0, 243.0, 167.0, 131.0, 83.0, 50.0, 39.0, 33.0, 19.0, 10.0, 14.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.15625, -25.27392578125, -24.3916015625, -23.50927734375, -22.626953125, -21.74462890625, -20.8623046875, -19.97998046875, -19.09765625, -18.21533203125, -17.3330078125, -16.45068359375, -15.568359375, -14.68603515625, -13.8037109375, -12.92138671875, -12.0390625, -11.15673828125, -10.2744140625, -9.39208984375, -8.509765625, -7.62744140625, -6.7451171875, -5.86279296875, -4.98046875, -4.09814453125, -3.2158203125, -2.33349609375, -1.451171875, -0.56884765625, 0.3134765625, 1.19580078125, 2.078125, 2.96044921875, 3.8427734375, 4.72509765625, 5.607421875, 6.48974609375, 7.3720703125, 8.25439453125, 9.13671875, 10.01904296875, 10.9013671875, 11.78369140625, 12.666015625, 13.54833984375, 14.4306640625, 15.31298828125, 16.1953125, 17.07763671875, 17.9599609375, 18.84228515625, 19.724609375, 20.60693359375, 21.4892578125, 22.37158203125, 23.25390625, 24.13623046875, 25.0185546875, 25.90087890625, 26.783203125, 27.66552734375, 28.5478515625, 29.43017578125, 30.3125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 6.0, 10.0, 10.0, 12.0, 13.0, 12.0, 17.0, 23.0, 25.0, 18.0, 29.0, 38.0, 29.0, 36.0, 38.0, 52.0, 38.0, 47.0, 49.0, 50.0, 51.0, 43.0, 48.0, 36.0, 35.0, 29.0, 30.0, 26.0, 20.0, 19.0, 24.0, 22.0, 11.0, 14.0, 7.0, 8.0, 4.0, 3.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-26.15625, -25.40185546875, -24.6474609375, -23.89306640625, -23.138671875, -22.38427734375, -21.6298828125, -20.87548828125, -20.12109375, -19.36669921875, -18.6123046875, -17.85791015625, -17.103515625, -16.34912109375, -15.5947265625, -14.84033203125, -14.0859375, -13.33154296875, -12.5771484375, -11.82275390625, -11.068359375, -10.31396484375, -9.5595703125, -8.80517578125, -8.05078125, -7.29638671875, -6.5419921875, -5.78759765625, -5.033203125, -4.27880859375, -3.5244140625, -2.77001953125, -2.015625, -1.26123046875, -0.5068359375, 0.24755859375, 1.001953125, 1.75634765625, 2.5107421875, 3.26513671875, 4.01953125, 4.77392578125, 5.5283203125, 6.28271484375, 7.037109375, 7.79150390625, 8.5458984375, 9.30029296875, 10.0546875, 10.80908203125, 11.5634765625, 12.31787109375, 13.072265625, 13.82666015625, 14.5810546875, 15.33544921875, 16.08984375, 16.84423828125, 17.5986328125, 18.35302734375, 19.107421875, 19.86181640625, 20.6162109375, 21.37060546875, 22.125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 12.0, 13.0, 20.0, 33.0, 40.0, 52.0, 91.0, 159.0, 280.0, 543.0, 1142.0, 2641.0, 7940.0, 31761.0, 207904.0, 691927.0, 79889.0, 15890.0, 4713.0, 1810.0, 729.0, 353.0, 193.0, 136.0, 78.0, 66.0, 33.0, 27.0, 17.0, 13.0, 13.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -8.933349609375, -8.59326171875, -8.253173828125, -7.9130859375, -7.572998046875, -7.23291015625, -6.892822265625, -6.552734375, -6.212646484375, -5.87255859375, -5.532470703125, -5.1923828125, -4.852294921875, -4.51220703125, -4.172119140625, -3.83203125, -3.491943359375, -3.15185546875, -2.811767578125, -2.4716796875, -2.131591796875, -1.79150390625, -1.451416015625, -1.111328125, -0.771240234375, -0.43115234375, -0.091064453125, 0.2490234375, 0.589111328125, 0.92919921875, 1.269287109375, 1.609375, 1.949462890625, 2.28955078125, 2.629638671875, 2.9697265625, 3.309814453125, 3.64990234375, 3.989990234375, 4.330078125, 4.670166015625, 5.01025390625, 5.350341796875, 5.6904296875, 6.030517578125, 6.37060546875, 6.710693359375, 7.05078125, 7.390869140625, 7.73095703125, 8.071044921875, 8.4111328125, 8.751220703125, 9.09130859375, 9.431396484375, 9.771484375, 10.111572265625, 10.45166015625, 10.791748046875, 11.1318359375, 11.471923828125, 11.81201171875, 12.152099609375, 12.4921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 5.0, 5.0, 13.0, 12.0, 10.0, 16.0, 23.0, 26.0, 22.0, 62.0, 75.0, 111.0, 144.0, 131.0, 84.0, 57.0, 42.0, 29.0, 31.0, 25.0, 19.0, 7.0, 13.0, 10.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002742767333984375, -0.002653568983078003, -0.002564370632171631, -0.002475172281265259, -0.0023859739303588867, -0.0022967755794525146, -0.0022075772285461426, -0.0021183788776397705, -0.0020291805267333984, -0.0019399821758270264, -0.0018507838249206543, -0.0017615854740142822, -0.0016723871231079102, -0.001583188772201538, -0.001493990421295166, -0.001404792070388794, -0.0013155937194824219, -0.0012263953685760498, -0.0011371970176696777, -0.0010479986667633057, -0.0009588003158569336, -0.0008696019649505615, -0.0007804036140441895, -0.0006912052631378174, -0.0006020069122314453, -0.0005128085613250732, -0.00042361021041870117, -0.0003344118595123291, -0.00024521350860595703, -0.00015601515769958496, -6.681680679321289e-05, 2.238154411315918e-05, 0.00011157989501953125, 0.00020077824592590332, 0.0002899765968322754, 0.00037917494773864746, 0.00046837329864501953, 0.0005575716495513916, 0.0006467700004577637, 0.0007359683513641357, 0.0008251667022705078, 0.0009143650531768799, 0.001003563404083252, 0.001092761754989624, 0.001181960105895996, 0.0012711584568023682, 0.0013603568077087402, 0.0014495551586151123, 0.0015387535095214844, 0.0016279518604278564, 0.0017171502113342285, 0.0018063485622406006, 0.0018955469131469727, 0.0019847452640533447, 0.002073943614959717, 0.002163141965866089, 0.002252340316772461, 0.002341538667678833, 0.002430737018585205, 0.002519935369491577, 0.0026091337203979492, 0.0026983320713043213, 0.0027875304222106934, 0.0028767287731170654, 0.0029659271240234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 9.0, 10.0, 13.0, 10.0, 15.0, 29.0, 41.0, 62.0, 99.0, 129.0, 199.0, 326.0, 486.0, 787.0, 1489.0, 2741.0, 5801.0, 14489.0, 45261.0, 231511.0, 618639.0, 86501.0, 22788.0, 8578.0, 3845.0, 1882.0, 1058.0, 618.0, 379.0, 232.0, 164.0, 90.0, 71.0, 42.0, 30.0, 25.0, 18.0, 15.0, 13.0, 11.0, 6.0, 9.0, 6.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.1015625, -7.8243408203125, -7.547119140625, -7.2698974609375, -6.99267578125, -6.7154541015625, -6.438232421875, -6.1610107421875, -5.8837890625, -5.6065673828125, -5.329345703125, -5.0521240234375, -4.77490234375, -4.4976806640625, -4.220458984375, -3.9432373046875, -3.666015625, -3.3887939453125, -3.111572265625, -2.8343505859375, -2.55712890625, -2.2799072265625, -2.002685546875, -1.7254638671875, -1.4482421875, -1.1710205078125, -0.893798828125, -0.6165771484375, -0.33935546875, -0.0621337890625, 0.215087890625, 0.4923095703125, 0.76953125, 1.0467529296875, 1.323974609375, 1.6011962890625, 1.87841796875, 2.1556396484375, 2.432861328125, 2.7100830078125, 2.9873046875, 3.2645263671875, 3.541748046875, 3.8189697265625, 4.09619140625, 4.3734130859375, 4.650634765625, 4.9278564453125, 5.205078125, 5.4822998046875, 5.759521484375, 6.0367431640625, 6.31396484375, 6.5911865234375, 6.868408203125, 7.1456298828125, 7.4228515625, 7.7000732421875, 7.977294921875, 8.2545166015625, 8.53173828125, 8.8089599609375, 9.086181640625, 9.3634033203125, 9.640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 4.0, 10.0, 4.0, 14.0, 21.0, 17.0, 39.0, 25.0, 68.0, 68.0, 101.0, 114.0, 135.0, 111.0, 70.0, 55.0, 35.0, 19.0, 15.0, 16.0, 13.0, 12.0, 14.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8671875, -12.5098876953125, -12.152587890625, -11.7952880859375, -11.43798828125, -11.0806884765625, -10.723388671875, -10.3660888671875, -10.0087890625, -9.6514892578125, -9.294189453125, -8.9368896484375, -8.57958984375, -8.2222900390625, -7.864990234375, -7.5076904296875, -7.150390625, -6.7930908203125, -6.435791015625, -6.0784912109375, -5.72119140625, -5.3638916015625, -5.006591796875, -4.6492919921875, -4.2919921875, -3.9346923828125, -3.577392578125, -3.2200927734375, -2.86279296875, -2.5054931640625, -2.148193359375, -1.7908935546875, -1.43359375, -1.0762939453125, -0.718994140625, -0.3616943359375, -0.00439453125, 0.3529052734375, 0.710205078125, 1.0675048828125, 1.4248046875, 1.7821044921875, 2.139404296875, 2.4967041015625, 2.85400390625, 3.2113037109375, 3.568603515625, 3.9259033203125, 4.283203125, 4.6405029296875, 4.997802734375, 5.3551025390625, 5.71240234375, 6.0697021484375, 6.427001953125, 6.7843017578125, 7.1416015625, 7.4989013671875, 7.856201171875, 8.2135009765625, 8.57080078125, 8.9281005859375, 9.285400390625, 9.6427001953125, 10.0]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 11.0, 8.0, 18.0, 55.0, 111.0, 160.0, 305.0, 178.0, 80.0, 43.0, 11.0, 4.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.28143310546875, -243.08099365234375, -234.8805694580078, -226.6801300048828, -218.47970581054688, -210.27926635742188, -202.07882690429688, -193.87838745117188, -185.67796325683594, -177.47752380371094, -169.277099609375, -161.07666015625, -152.876220703125, -144.67579650878906, -136.47535705566406, -128.27493286132812, -120.07449340820312, -111.87406158447266, -103.67362976074219, -95.47319030761719, -87.27275848388672, -79.07232666015625, -70.87188720703125, -62.67145538330078, -54.47102355957031, -46.270591735839844, -38.07015609741211, -29.869722366333008, -21.669288635253906, -13.468856811523438, -5.268421173095703, 2.9320144653320312, 11.132415771484375, 19.332849502563477, 27.533283233642578, 35.73371887207031, 43.93415069580078, 52.13458251953125, 60.335018157958984, 68.53545379638672, 76.73588562011719, 84.93631744384766, 93.13674926757812, 101.33718872070312, 109.5376205444336, 117.73805236816406, 125.93849182128906, 134.138916015625, 142.33935546875, 150.539794921875, 158.74021911621094, 166.94065856933594, 175.14108276367188, 183.34152221679688, 191.54196166992188, 199.74240112304688, 207.9428253173828, 216.1432647705078, 224.34368896484375, 232.54412841796875, 240.74456787109375, 248.9449920654297, 257.1454162597656, 265.3458557128906, 273.5462951660156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 13.0, 6.0, 11.0, 7.0, 10.0, 17.0, 18.0, 20.0, 32.0, 24.0, 24.0, 28.0, 30.0, 34.0, 52.0, 57.0, 65.0, 49.0, 69.0, 53.0, 56.0, 47.0, 33.0, 23.0, 27.0, 26.0, 22.0, 20.0, 20.0, 16.0, 13.0, 12.0, 6.0, 13.0, 5.0, 5.0, 7.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.75105285644531, -90.76712036132812, -87.78318786621094, -84.79924774169922, -81.81531524658203, -78.83138275146484, -75.84744262695312, -72.86351013183594, -69.87957763671875, -66.89564514160156, -63.91170883178711, -60.927772521972656, -57.94384002685547, -54.95990753173828, -51.97597122192383, -48.992034912109375, -46.00810241699219, -43.024169921875, -40.04023361206055, -37.056297302246094, -34.072364807128906, -31.088430404663086, -28.104496002197266, -25.120561599731445, -22.136627197265625, -19.152692794799805, -16.168758392333984, -13.184823989868164, -10.200889587402344, -7.216955184936523, -4.233020782470703, -1.2490863800048828, 1.7348556518554688, 4.718790054321289, 7.702724456787109, 10.68665885925293, 13.67059326171875, 16.65452766418457, 19.63846206665039, 22.62239646911621, 25.60633087158203, 28.59026527404785, 31.574199676513672, 34.558135986328125, 37.54206848144531, 40.5260009765625, 43.50993728637695, 46.493873596191406, 49.477806091308594, 52.46173858642578, 55.445674896240234, 58.42961120605469, 61.413543701171875, 64.39747619628906, 67.38140869140625, 70.36534881591797, 73.34928131103516, 76.33321380615234, 79.31715393066406, 82.30108642578125, 85.28501892089844, 88.26895141601562, 91.25288391113281, 94.23682403564453, 97.22075653076172]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 9.0, 7.0, 13.0, 22.0, 24.0, 39.0, 64.0, 94.0, 142.0, 275.0, 444.0, 777.0, 1436.0, 3022.0, 7209.0, 21462.0, 92102.0, 1092890.0, 2665248.0, 251477.0, 37318.0, 11222.0, 4261.0, 2005.0, 1054.0, 604.0, 372.0, 213.0, 131.0, 93.0, 77.0, 42.0, 30.0, 25.0, 13.0, 17.0, 9.0, 6.0, 13.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.2421875, -11.8084716796875, -11.374755859375, -10.9410400390625, -10.50732421875, -10.0736083984375, -9.639892578125, -9.2061767578125, -8.7724609375, -8.3387451171875, -7.905029296875, -7.4713134765625, -7.03759765625, -6.6038818359375, -6.170166015625, -5.7364501953125, -5.302734375, -4.8690185546875, -4.435302734375, -4.0015869140625, -3.56787109375, -3.1341552734375, -2.700439453125, -2.2667236328125, -1.8330078125, -1.3992919921875, -0.965576171875, -0.5318603515625, -0.09814453125, 0.3355712890625, 0.769287109375, 1.2030029296875, 1.63671875, 2.0704345703125, 2.504150390625, 2.9378662109375, 3.37158203125, 3.8052978515625, 4.239013671875, 4.6727294921875, 5.1064453125, 5.5401611328125, 5.973876953125, 6.4075927734375, 6.84130859375, 7.2750244140625, 7.708740234375, 8.1424560546875, 8.576171875, 9.0098876953125, 9.443603515625, 9.8773193359375, 10.31103515625, 10.7447509765625, 11.178466796875, 11.6121826171875, 12.0458984375, 12.4796142578125, 12.913330078125, 13.3470458984375, 13.78076171875, 14.2144775390625, 14.648193359375, 15.0819091796875, 15.515625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 11.0, 18.0, 19.0, 17.0, 33.0, 41.0, 55.0, 53.0, 49.0, 62.0, 69.0, 67.0, 77.0, 42.0, 68.0, 45.0, 47.0, 40.0, 41.0, 30.0, 32.0, 15.0, 11.0, 18.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.484375, -11.21612548828125, -10.9478759765625, -10.67962646484375, -10.411376953125, -10.14312744140625, -9.8748779296875, -9.60662841796875, -9.33837890625, -9.07012939453125, -8.8018798828125, -8.53363037109375, -8.265380859375, -7.99713134765625, -7.7288818359375, -7.46063232421875, -7.1923828125, -6.92413330078125, -6.6558837890625, -6.38763427734375, -6.119384765625, -5.85113525390625, -5.5828857421875, -5.31463623046875, -5.04638671875, -4.77813720703125, -4.5098876953125, -4.24163818359375, -3.973388671875, -3.70513916015625, -3.4368896484375, -3.16864013671875, -2.900390625, -2.63214111328125, -2.3638916015625, -2.09564208984375, -1.827392578125, -1.55914306640625, -1.2908935546875, -1.02264404296875, -0.75439453125, -0.48614501953125, -0.2178955078125, 0.05035400390625, 0.318603515625, 0.58685302734375, 0.8551025390625, 1.12335205078125, 1.3916015625, 1.65985107421875, 1.9281005859375, 2.19635009765625, 2.464599609375, 2.73284912109375, 3.0010986328125, 3.26934814453125, 3.53759765625, 3.80584716796875, 4.0740966796875, 4.34234619140625, 4.610595703125, 4.87884521484375, 5.1470947265625, 5.41534423828125, 5.68359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 11.0, 14.0, 20.0, 28.0, 29.0, 56.0, 58.0, 116.0, 159.0, 220.0, 379.0, 558.0, 1241.0, 3479.0, 16735.0, 372233.0, 3732154.0, 56523.0, 6524.0, 1775.0, 724.0, 452.0, 276.0, 180.0, 114.0, 69.0, 44.0, 28.0, 21.0, 13.0, 14.0, 5.0, 6.0, 10.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.9375, -29.75927734375, -28.5810546875, -27.40283203125, -26.224609375, -25.04638671875, -23.8681640625, -22.68994140625, -21.51171875, -20.33349609375, -19.1552734375, -17.97705078125, -16.798828125, -15.62060546875, -14.4423828125, -13.26416015625, -12.0859375, -10.90771484375, -9.7294921875, -8.55126953125, -7.373046875, -6.19482421875, -5.0166015625, -3.83837890625, -2.66015625, -1.48193359375, -0.3037109375, 0.87451171875, 2.052734375, 3.23095703125, 4.4091796875, 5.58740234375, 6.765625, 7.94384765625, 9.1220703125, 10.30029296875, 11.478515625, 12.65673828125, 13.8349609375, 15.01318359375, 16.19140625, 17.36962890625, 18.5478515625, 19.72607421875, 20.904296875, 22.08251953125, 23.2607421875, 24.43896484375, 25.6171875, 26.79541015625, 27.9736328125, 29.15185546875, 30.330078125, 31.50830078125, 32.6865234375, 33.86474609375, 35.04296875, 36.22119140625, 37.3994140625, 38.57763671875, 39.755859375, 40.93408203125, 42.1123046875, 43.29052734375, 44.46875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 7.0, 7.0, 15.0, 17.0, 23.0, 48.0, 109.0, 250.0, 710.0, 1382.0, 883.0, 335.0, 129.0, 70.0, 38.0, 21.0, 11.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.74658203125, -34.6181640625, -33.48974609375, -32.361328125, -31.23291015625, -30.1044921875, -28.97607421875, -27.84765625, -26.71923828125, -25.5908203125, -24.46240234375, -23.333984375, -22.20556640625, -21.0771484375, -19.94873046875, -18.8203125, -17.69189453125, -16.5634765625, -15.43505859375, -14.306640625, -13.17822265625, -12.0498046875, -10.92138671875, -9.79296875, -8.66455078125, -7.5361328125, -6.40771484375, -5.279296875, -4.15087890625, -3.0224609375, -1.89404296875, -0.765625, 0.36279296875, 1.4912109375, 2.61962890625, 3.748046875, 4.87646484375, 6.0048828125, 7.13330078125, 8.26171875, 9.39013671875, 10.5185546875, 11.64697265625, 12.775390625, 13.90380859375, 15.0322265625, 16.16064453125, 17.2890625, 18.41748046875, 19.5458984375, 20.67431640625, 21.802734375, 22.93115234375, 24.0595703125, 25.18798828125, 26.31640625, 27.44482421875, 28.5732421875, 29.70166015625, 30.830078125, 31.95849609375, 33.0869140625, 34.21533203125, 35.34375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 5.0, 8.0, 20.0, 83.0, 303.0, 418.0, 108.0, 43.0, 10.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-851.09033203125, -833.4228515625, -815.7554321289062, -798.0880126953125, -780.4205322265625, -762.7530517578125, -745.0856323242188, -727.418212890625, -709.750732421875, -692.083251953125, -674.4158325195312, -656.7484130859375, -639.0809326171875, -621.4134521484375, -603.7460327148438, -586.07861328125, -568.4111328125, -550.74365234375, -533.0762329101562, -515.4088134765625, -497.7413330078125, -480.0738830566406, -462.40643310546875, -444.7389831542969, -427.071533203125, -409.4040832519531, -391.73663330078125, -374.0691833496094, -356.4017333984375, -338.7342834472656, -321.06683349609375, -303.3993835449219, -285.73187255859375, -268.0644226074219, -250.39697265625, -232.72952270507812, -215.06207275390625, -197.39462280273438, -179.7271728515625, -162.05972290039062, -144.39227294921875, -126.72482299804688, -109.057373046875, -91.38992309570312, -73.72247314453125, -56.055023193359375, -38.3875732421875, -20.720123291015625, -3.05267333984375, 14.614776611328125, 32.2822265625, 49.949676513671875, 67.61712646484375, 85.28457641601562, 102.9520263671875, 120.61947631835938, 138.28692626953125, 155.95437622070312, 173.621826171875, 191.28927612304688, 208.95672607421875, 226.62417602539062, 244.2916259765625, 261.9590759277344, 279.62652587890625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 6.0, 11.0, 15.0, 14.0, 20.0, 21.0, 37.0, 51.0, 51.0, 52.0, 59.0, 63.0, 60.0, 78.0, 48.0, 71.0, 52.0, 45.0, 55.0, 43.0, 38.0, 20.0, 14.0, 24.0, 13.0, 11.0, 4.0, 5.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-140.09962463378906, -136.37442016601562, -132.64923095703125, -128.9240264892578, -125.1988296508789, -121.4736328125, -117.74842834472656, -114.02323150634766, -110.29803466796875, -106.57283782958984, -102.84764099121094, -99.1224365234375, -95.3972396850586, -91.67204284667969, -87.94683837890625, -84.22164154052734, -80.49644470214844, -76.77124786376953, -73.04605102539062, -69.32084655761719, -65.59564971923828, -61.870452880859375, -58.1452522277832, -54.42005157470703, -50.694854736328125, -46.96965789794922, -43.24445724487305, -39.519256591796875, -35.79405975341797, -32.06886291503906, -28.34366226196289, -24.61846351623535, -20.893272399902344, -17.168073654174805, -13.442874908447266, -9.717676162719727, -5.9924774169921875, -2.2672786712646484, 1.4579200744628906, 5.18311882019043, 8.908317565917969, 12.633516311645508, 16.358715057373047, 20.083913803100586, 23.809112548828125, 27.534311294555664, 31.259510040283203, 34.984710693359375, 38.70990753173828, 42.43510437011719, 46.16030502319336, 49.88550567626953, 53.61070251464844, 57.335899353027344, 61.061100006103516, 64.78630065917969, 68.5114974975586, 72.2366943359375, 75.96189880371094, 79.68709564208984, 83.41229248046875, 87.13748931884766, 90.86268615722656, 94.587890625, 98.3130874633789]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 15.0, 17.0, 35.0, 35.0, 73.0, 102.0, 137.0, 250.0, 422.0, 734.0, 1210.0, 2374.0, 4538.0, 10208.0, 30788.0, 127049.0, 451899.0, 312010.0, 72082.0, 19502.0, 7180.0, 3384.0, 1827.0, 1041.0, 600.0, 368.0, 254.0, 132.0, 69.0, 63.0, 46.0, 30.0, 15.0, 13.0, 11.0, 4.0, 6.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6796875, -12.2237548828125, -11.767822265625, -11.3118896484375, -10.85595703125, -10.4000244140625, -9.944091796875, -9.4881591796875, -9.0322265625, -8.5762939453125, -8.120361328125, -7.6644287109375, -7.20849609375, -6.7525634765625, -6.296630859375, -5.8406982421875, -5.384765625, -4.9288330078125, -4.472900390625, -4.0169677734375, -3.56103515625, -3.1051025390625, -2.649169921875, -2.1932373046875, -1.7373046875, -1.2813720703125, -0.825439453125, -0.3695068359375, 0.08642578125, 0.5423583984375, 0.998291015625, 1.4542236328125, 1.91015625, 2.3660888671875, 2.822021484375, 3.2779541015625, 3.73388671875, 4.1898193359375, 4.645751953125, 5.1016845703125, 5.5576171875, 6.0135498046875, 6.469482421875, 6.9254150390625, 7.38134765625, 7.8372802734375, 8.293212890625, 8.7491455078125, 9.205078125, 9.6610107421875, 10.116943359375, 10.5728759765625, 11.02880859375, 11.4847412109375, 11.940673828125, 12.3966064453125, 12.8525390625, 13.3084716796875, 13.764404296875, 14.2203369140625, 14.67626953125, 15.1322021484375, 15.588134765625, 16.0440673828125, 16.5]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 20.0, 10.0, 13.0, 17.0, 26.0, 23.0, 34.0, 34.0, 26.0, 56.0, 55.0, 46.0, 43.0, 71.0, 67.0, 70.0, 54.0, 46.0, 36.0, 50.0, 31.0, 39.0, 27.0, 25.0, 13.0, 14.0, 14.0, 6.0, 11.0, 11.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.8828125, -10.60675048828125, -10.3306884765625, -10.05462646484375, -9.778564453125, -9.50250244140625, -9.2264404296875, -8.95037841796875, -8.67431640625, -8.39825439453125, -8.1221923828125, -7.84613037109375, -7.570068359375, -7.29400634765625, -7.0179443359375, -6.74188232421875, -6.4658203125, -6.18975830078125, -5.9136962890625, -5.63763427734375, -5.361572265625, -5.08551025390625, -4.8094482421875, -4.53338623046875, -4.25732421875, -3.98126220703125, -3.7052001953125, -3.42913818359375, -3.153076171875, -2.87701416015625, -2.6009521484375, -2.32489013671875, -2.048828125, -1.77276611328125, -1.4967041015625, -1.22064208984375, -0.944580078125, -0.66851806640625, -0.3924560546875, -0.11639404296875, 0.15966796875, 0.43572998046875, 0.7117919921875, 0.98785400390625, 1.263916015625, 1.53997802734375, 1.8160400390625, 2.09210205078125, 2.3681640625, 2.64422607421875, 2.9202880859375, 3.19635009765625, 3.472412109375, 3.74847412109375, 4.0245361328125, 4.30059814453125, 4.57666015625, 4.85272216796875, 5.1287841796875, 5.40484619140625, 5.680908203125, 5.95697021484375, 6.2330322265625, 6.50909423828125, 6.78515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 7.0, 15.0, 13.0, 17.0, 23.0, 40.0, 53.0, 96.0, 164.0, 258.0, 453.0, 794.0, 1654.0, 4108.0, 15669.0, 171139.0, 779121.0, 60621.0, 8697.0, 2840.0, 1254.0, 647.0, 326.0, 205.0, 127.0, 83.0, 40.0, 32.0, 26.0, 10.0, 4.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.953125, -30.051025390625, -29.14892578125, -28.246826171875, -27.3447265625, -26.442626953125, -25.54052734375, -24.638427734375, -23.736328125, -22.834228515625, -21.93212890625, -21.030029296875, -20.1279296875, -19.225830078125, -18.32373046875, -17.421630859375, -16.51953125, -15.617431640625, -14.71533203125, -13.813232421875, -12.9111328125, -12.009033203125, -11.10693359375, -10.204833984375, -9.302734375, -8.400634765625, -7.49853515625, -6.596435546875, -5.6943359375, -4.792236328125, -3.89013671875, -2.988037109375, -2.0859375, -1.183837890625, -0.28173828125, 0.620361328125, 1.5224609375, 2.424560546875, 3.32666015625, 4.228759765625, 5.130859375, 6.032958984375, 6.93505859375, 7.837158203125, 8.7392578125, 9.641357421875, 10.54345703125, 11.445556640625, 12.34765625, 13.249755859375, 14.15185546875, 15.053955078125, 15.9560546875, 16.858154296875, 17.76025390625, 18.662353515625, 19.564453125, 20.466552734375, 21.36865234375, 22.270751953125, 23.1728515625, 24.074951171875, 24.97705078125, 25.879150390625, 26.78125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 2.0, 9.0, 9.0, 5.0, 9.0, 14.0, 10.0, 20.0, 14.0, 18.0, 18.0, 25.0, 28.0, 37.0, 41.0, 36.0, 37.0, 32.0, 45.0, 46.0, 45.0, 46.0, 46.0, 50.0, 43.0, 33.0, 40.0, 36.0, 36.0, 18.0, 23.0, 19.0, 15.0, 16.0, 18.0, 10.0, 7.0, 4.0, 10.0, 11.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.828125, -24.04833984375, -23.2685546875, -22.48876953125, -21.708984375, -20.92919921875, -20.1494140625, -19.36962890625, -18.58984375, -17.81005859375, -17.0302734375, -16.25048828125, -15.470703125, -14.69091796875, -13.9111328125, -13.13134765625, -12.3515625, -11.57177734375, -10.7919921875, -10.01220703125, -9.232421875, -8.45263671875, -7.6728515625, -6.89306640625, -6.11328125, -5.33349609375, -4.5537109375, -3.77392578125, -2.994140625, -2.21435546875, -1.4345703125, -0.65478515625, 0.125, 0.90478515625, 1.6845703125, 2.46435546875, 3.244140625, 4.02392578125, 4.8037109375, 5.58349609375, 6.36328125, 7.14306640625, 7.9228515625, 8.70263671875, 9.482421875, 10.26220703125, 11.0419921875, 11.82177734375, 12.6015625, 13.38134765625, 14.1611328125, 14.94091796875, 15.720703125, 16.50048828125, 17.2802734375, 18.06005859375, 18.83984375, 19.61962890625, 20.3994140625, 21.17919921875, 21.958984375, 22.73876953125, 23.5185546875, 24.29833984375, 25.078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 1.0, 3.0, 5.0, 14.0, 15.0, 12.0, 40.0, 44.0, 66.0, 84.0, 143.0, 208.0, 407.0, 777.0, 1543.0, 3673.0, 9126.0, 25606.0, 85708.0, 505131.0, 303824.0, 74922.0, 22656.0, 8150.0, 3288.0, 1477.0, 662.0, 372.0, 214.0, 118.0, 79.0, 45.0, 30.0, 27.0, 20.0, 13.0, 12.0, 9.0, 8.0, 3.0, 8.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-7.28125, -7.08416748046875, -6.8870849609375, -6.69000244140625, -6.492919921875, -6.29583740234375, -6.0987548828125, -5.90167236328125, -5.70458984375, -5.50750732421875, -5.3104248046875, -5.11334228515625, -4.916259765625, -4.71917724609375, -4.5220947265625, -4.32501220703125, -4.1279296875, -3.93084716796875, -3.7337646484375, -3.53668212890625, -3.339599609375, -3.14251708984375, -2.9454345703125, -2.74835205078125, -2.55126953125, -2.35418701171875, -2.1571044921875, -1.96002197265625, -1.762939453125, -1.56585693359375, -1.3687744140625, -1.17169189453125, -0.974609375, -0.77752685546875, -0.5804443359375, -0.38336181640625, -0.186279296875, 0.01080322265625, 0.2078857421875, 0.40496826171875, 0.60205078125, 0.79913330078125, 0.9962158203125, 1.19329833984375, 1.390380859375, 1.58746337890625, 1.7845458984375, 1.98162841796875, 2.1787109375, 2.37579345703125, 2.5728759765625, 2.76995849609375, 2.967041015625, 3.16412353515625, 3.3612060546875, 3.55828857421875, 3.75537109375, 3.95245361328125, 4.1495361328125, 4.34661865234375, 4.543701171875, 4.74078369140625, 4.9378662109375, 5.13494873046875, 5.33203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 0.0, 5.0, 5.0, 6.0, 5.0, 14.0, 13.0, 11.0, 16.0, 25.0, 29.0, 34.0, 66.0, 61.0, 89.0, 122.0, 88.0, 106.0, 74.0, 51.0, 43.0, 23.0, 26.0, 25.0, 13.0, 11.0, 8.0, 6.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0018520355224609375, -0.001794382929801941, -0.0017367303371429443, -0.0016790777444839478, -0.0016214251518249512, -0.0015637725591659546, -0.001506119966506958, -0.0014484673738479614, -0.0013908147811889648, -0.0013331621885299683, -0.0012755095958709717, -0.001217857003211975, -0.0011602044105529785, -0.001102551817893982, -0.0010448992252349854, -0.0009872466325759888, -0.0009295940399169922, -0.0008719414472579956, -0.000814288854598999, -0.0007566362619400024, -0.0006989836692810059, -0.0006413310766220093, -0.0005836784839630127, -0.0005260258913040161, -0.00046837329864501953, -0.00041072070598602295, -0.00035306811332702637, -0.0002954155206680298, -0.0002377629280090332, -0.00018011033535003662, -0.00012245774269104004, -6.480515003204346e-05, -7.152557373046875e-06, 5.050003528594971e-05, 0.00010815262794494629, 0.00016580522060394287, 0.00022345781326293945, 0.00028111040592193604, 0.0003387629985809326, 0.0003964155912399292, 0.0004540681838989258, 0.0005117207765579224, 0.0005693733692169189, 0.0006270259618759155, 0.0006846785545349121, 0.0007423311471939087, 0.0007999837398529053, 0.0008576363325119019, 0.0009152889251708984, 0.000972941517829895, 0.0010305941104888916, 0.0010882467031478882, 0.0011458992958068848, 0.0012035518884658813, 0.001261204481124878, 0.0013188570737838745, 0.001376509666442871, 0.0014341622591018677, 0.0014918148517608643, 0.0015494674444198608, 0.0016071200370788574, 0.001664772629737854, 0.0017224252223968506, 0.0017800778150558472, 0.0018377304077148438]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 6.0, 1.0, 10.0, 12.0, 14.0, 24.0, 39.0, 52.0, 79.0, 120.0, 207.0, 322.0, 604.0, 1215.0, 2732.0, 6870.0, 20414.0, 75193.0, 485284.0, 352691.0, 71536.0, 19458.0, 6453.0, 2625.0, 1132.0, 577.0, 306.0, 208.0, 120.0, 77.0, 58.0, 48.0, 24.0, 18.0, 5.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1953125, -6.955322265625, -6.71533203125, -6.475341796875, -6.2353515625, -5.995361328125, -5.75537109375, -5.515380859375, -5.275390625, -5.035400390625, -4.79541015625, -4.555419921875, -4.3154296875, -4.075439453125, -3.83544921875, -3.595458984375, -3.35546875, -3.115478515625, -2.87548828125, -2.635498046875, -2.3955078125, -2.155517578125, -1.91552734375, -1.675537109375, -1.435546875, -1.195556640625, -0.95556640625, -0.715576171875, -0.4755859375, -0.235595703125, 0.00439453125, 0.244384765625, 0.484375, 0.724365234375, 0.96435546875, 1.204345703125, 1.4443359375, 1.684326171875, 1.92431640625, 2.164306640625, 2.404296875, 2.644287109375, 2.88427734375, 3.124267578125, 3.3642578125, 3.604248046875, 3.84423828125, 4.084228515625, 4.32421875, 4.564208984375, 4.80419921875, 5.044189453125, 5.2841796875, 5.524169921875, 5.76416015625, 6.004150390625, 6.244140625, 6.484130859375, 6.72412109375, 6.964111328125, 7.2041015625, 7.444091796875, 7.68408203125, 7.924072265625, 8.1640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 9.0, 15.0, 24.0, 26.0, 44.0, 51.0, 69.0, 65.0, 93.0, 105.0, 131.0, 78.0, 66.0, 44.0, 40.0, 27.0, 27.0, 12.0, 16.0, 10.0, 8.0, 13.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.62890625, -6.36297607421875, -6.0970458984375, -5.83111572265625, -5.565185546875, -5.29925537109375, -5.0333251953125, -4.76739501953125, -4.50146484375, -4.23553466796875, -3.9696044921875, -3.70367431640625, -3.437744140625, -3.17181396484375, -2.9058837890625, -2.63995361328125, -2.3740234375, -2.10809326171875, -1.8421630859375, -1.57623291015625, -1.310302734375, -1.04437255859375, -0.7784423828125, -0.51251220703125, -0.24658203125, 0.01934814453125, 0.2852783203125, 0.55120849609375, 0.817138671875, 1.08306884765625, 1.3489990234375, 1.61492919921875, 1.880859375, 2.14678955078125, 2.4127197265625, 2.67864990234375, 2.944580078125, 3.21051025390625, 3.4764404296875, 3.74237060546875, 4.00830078125, 4.27423095703125, 4.5401611328125, 4.80609130859375, 5.072021484375, 5.33795166015625, 5.6038818359375, 5.86981201171875, 6.1357421875, 6.40167236328125, 6.6676025390625, 6.93353271484375, 7.199462890625, 7.46539306640625, 7.7313232421875, 7.99725341796875, 8.26318359375, 8.52911376953125, 8.7950439453125, 9.06097412109375, 9.326904296875, 9.59283447265625, 9.8587646484375, 10.12469482421875, 10.390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 12.0, 26.0, 58.0, 145.0, 348.0, 198.0, 110.0, 53.0, 20.0, 16.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-142.0369873046875, -134.0119171142578, -125.98684692382812, -117.9617691040039, -109.93669891357422, -101.91162872314453, -93.88655090332031, -85.86148071289062, -77.83641052246094, -69.81134033203125, -61.7862663269043, -53.761192321777344, -45.736122131347656, -37.71105194091797, -29.685977935791016, -21.660903930664062, -13.635833740234375, -5.610761642456055, 2.4143104553222656, 10.439382553100586, 18.464454650878906, 26.489524841308594, 34.51459884643555, 42.5396728515625, 50.56474304199219, 58.589813232421875, 66.61488342285156, 74.63996124267578, 82.66503143310547, 90.69010162353516, 98.71517944335938, 106.74024963378906, 114.76531982421875, 122.79039001464844, 130.81546020507812, 138.8405303955078, 146.8656005859375, 154.89068603515625, 162.91575622558594, 170.94082641601562, 178.9658966064453, 186.990966796875, 195.0160369873047, 203.04110717773438, 211.06619262695312, 219.09124755859375, 227.1163330078125, 235.1414031982422, 243.16647338867188, 251.19154357910156, 259.21661376953125, 267.24169921875, 275.2667541503906, 283.2918395996094, 291.31689453125, 299.34197998046875, 307.3670654296875, 315.39215087890625, 323.4172058105469, 331.4422912597656, 339.46734619140625, 347.492431640625, 355.5174865722656, 363.5425720214844, 371.567626953125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 7.0, 3.0, 5.0, 4.0, 13.0, 6.0, 10.0, 11.0, 23.0, 26.0, 20.0, 31.0, 30.0, 26.0, 26.0, 27.0, 42.0, 59.0, 87.0, 86.0, 85.0, 52.0, 45.0, 33.0, 32.0, 26.0, 29.0, 27.0, 21.0, 22.0, 18.0, 13.0, 10.0, 17.0, 5.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.36698913574219, -122.80669403076172, -119.24639129638672, -115.68609619140625, -112.12579345703125, -108.56549835205078, -105.00520324707031, -101.44490051269531, -97.88459777832031, -94.32430267333984, -90.76399993896484, -87.20370483398438, -83.64340209960938, -80.0831069946289, -76.52281188964844, -72.96250915527344, -69.40221405029297, -65.8419189453125, -62.2816162109375, -58.72132110595703, -55.16101837158203, -51.60072326660156, -48.04042434692383, -44.480125427246094, -40.91982650756836, -37.359527587890625, -33.79922866821289, -30.23893165588379, -26.678632736206055, -23.11833381652832, -19.55803680419922, -15.997737884521484, -12.43743896484375, -8.877140045166016, -5.316842079162598, -1.7565441131591797, 1.8037548065185547, 5.364053726196289, 8.92435073852539, 12.484649658203125, 16.04494857788086, 19.605247497558594, 23.165546417236328, 26.72584342956543, 30.286142349243164, 33.84644317626953, 37.40673828125, 40.967037200927734, 44.52733612060547, 48.0876350402832, 51.64793395996094, 55.208229064941406, 58.768531799316406, 62.328826904296875, 65.88912963867188, 69.44942474365234, 73.00971984863281, 76.57001495361328, 80.13031768798828, 83.69061279296875, 87.25091552734375, 90.81121063232422, 94.37150573730469, 97.93180847167969, 101.49211120605469]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 9.0, 5.0, 10.0, 10.0, 23.0, 39.0, 69.0, 99.0, 144.0, 225.0, 343.0, 651.0, 1160.0, 2242.0, 4838.0, 12692.0, 46995.0, 330864.0, 2557547.0, 1090939.0, 109236.0, 21619.0, 7328.0, 3208.0, 1532.0, 932.0, 473.0, 346.0, 202.0, 155.0, 103.0, 63.0, 46.0, 23.0, 24.0, 20.0, 21.0, 13.0, 4.0, 11.0, 5.0, 2.0, 7.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.8819580078125, -9.482666015625, -9.0833740234375, -8.68408203125, -8.2847900390625, -7.885498046875, -7.4862060546875, -7.0869140625, -6.6876220703125, -6.288330078125, -5.8890380859375, -5.48974609375, -5.0904541015625, -4.691162109375, -4.2918701171875, -3.892578125, -3.4932861328125, -3.093994140625, -2.6947021484375, -2.29541015625, -1.8961181640625, -1.496826171875, -1.0975341796875, -0.6982421875, -0.2989501953125, 0.100341796875, 0.4996337890625, 0.89892578125, 1.2982177734375, 1.697509765625, 2.0968017578125, 2.49609375, 2.8953857421875, 3.294677734375, 3.6939697265625, 4.09326171875, 4.4925537109375, 4.891845703125, 5.2911376953125, 5.6904296875, 6.0897216796875, 6.489013671875, 6.8883056640625, 7.28759765625, 7.6868896484375, 8.086181640625, 8.4854736328125, 8.884765625, 9.2840576171875, 9.683349609375, 10.0826416015625, 10.48193359375, 10.8812255859375, 11.280517578125, 11.6798095703125, 12.0791015625, 12.4783935546875, 12.877685546875, 13.2769775390625, 13.67626953125, 14.0755615234375, 14.474853515625, 14.8741455078125, 15.2734375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 13.0, 11.0, 18.0, 15.0, 24.0, 29.0, 23.0, 49.0, 47.0, 47.0, 45.0, 42.0, 65.0, 54.0, 47.0, 53.0, 38.0, 63.0, 40.0, 37.0, 35.0, 36.0, 32.0, 20.0, 23.0, 18.0, 12.0, 16.0, 8.0, 8.0, 9.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.6796875, -9.4195556640625, -9.159423828125, -8.8992919921875, -8.63916015625, -8.3790283203125, -8.118896484375, -7.8587646484375, -7.5986328125, -7.3385009765625, -7.078369140625, -6.8182373046875, -6.55810546875, -6.2979736328125, -6.037841796875, -5.7777099609375, -5.517578125, -5.2574462890625, -4.997314453125, -4.7371826171875, -4.47705078125, -4.2169189453125, -3.956787109375, -3.6966552734375, -3.4365234375, -3.1763916015625, -2.916259765625, -2.6561279296875, -2.39599609375, -2.1358642578125, -1.875732421875, -1.6156005859375, -1.35546875, -1.0953369140625, -0.835205078125, -0.5750732421875, -0.31494140625, -0.0548095703125, 0.205322265625, 0.4654541015625, 0.7255859375, 0.9857177734375, 1.245849609375, 1.5059814453125, 1.76611328125, 2.0262451171875, 2.286376953125, 2.5465087890625, 2.806640625, 3.0667724609375, 3.326904296875, 3.5870361328125, 3.84716796875, 4.1072998046875, 4.367431640625, 4.6275634765625, 4.8876953125, 5.1478271484375, 5.407958984375, 5.6680908203125, 5.92822265625, 6.1883544921875, 6.448486328125, 6.7086181640625, 6.96875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 10.0, 11.0, 25.0, 56.0, 139.0, 334.0, 1509.0, 53512.0, 4130764.0, 6796.0, 728.0, 219.0, 86.0, 46.0, 32.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.5, -86.2197265625, -82.939453125, -79.6591796875, -76.37890625, -73.0986328125, -69.818359375, -66.5380859375, -63.2578125, -59.9775390625, -56.697265625, -53.4169921875, -50.13671875, -46.8564453125, -43.576171875, -40.2958984375, -37.015625, -33.7353515625, -30.455078125, -27.1748046875, -23.89453125, -20.6142578125, -17.333984375, -14.0537109375, -10.7734375, -7.4931640625, -4.212890625, -0.9326171875, 2.34765625, 5.6279296875, 8.908203125, 12.1884765625, 15.46875, 18.7490234375, 22.029296875, 25.3095703125, 28.58984375, 31.8701171875, 35.150390625, 38.4306640625, 41.7109375, 44.9912109375, 48.271484375, 51.5517578125, 54.83203125, 58.1123046875, 61.392578125, 64.6728515625, 67.953125, 71.2333984375, 74.513671875, 77.7939453125, 81.07421875, 84.3544921875, 87.634765625, 90.9150390625, 94.1953125, 97.4755859375, 100.755859375, 104.0361328125, 107.31640625, 110.5966796875, 113.876953125, 117.1572265625, 120.4375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 15.0, 26.0, 65.0, 179.0, 586.0, 1775.0, 958.0, 278.0, 103.0, 42.0, 19.0, 11.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -31.80810546875, -30.2724609375, -28.73681640625, -27.201171875, -25.66552734375, -24.1298828125, -22.59423828125, -21.05859375, -19.52294921875, -17.9873046875, -16.45166015625, -14.916015625, -13.38037109375, -11.8447265625, -10.30908203125, -8.7734375, -7.23779296875, -5.7021484375, -4.16650390625, -2.630859375, -1.09521484375, 0.4404296875, 1.97607421875, 3.51171875, 5.04736328125, 6.5830078125, 8.11865234375, 9.654296875, 11.18994140625, 12.7255859375, 14.26123046875, 15.796875, 17.33251953125, 18.8681640625, 20.40380859375, 21.939453125, 23.47509765625, 25.0107421875, 26.54638671875, 28.08203125, 29.61767578125, 31.1533203125, 32.68896484375, 34.224609375, 35.76025390625, 37.2958984375, 38.83154296875, 40.3671875, 41.90283203125, 43.4384765625, 44.97412109375, 46.509765625, 48.04541015625, 49.5810546875, 51.11669921875, 52.65234375, 54.18798828125, 55.7236328125, 57.25927734375, 58.794921875, 60.33056640625, 61.8662109375, 63.40185546875, 64.9375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 11.0, 15.0, 53.0, 100.0, 196.0, 244.0, 174.0, 102.0, 57.0, 20.0, 8.0, 9.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-349.3370361328125, -339.99755859375, -330.6580810546875, -321.318603515625, -311.9791259765625, -302.6396484375, -293.3001708984375, -283.960693359375, -274.6212158203125, -265.28173828125, -255.9422607421875, -246.602783203125, -237.2633056640625, -227.923828125, -218.58436584472656, -209.24488830566406, -199.90542602539062, -190.56594848632812, -181.22647094726562, -171.88699340820312, -162.54751586914062, -153.20803833007812, -143.8685760498047, -134.5290985107422, -125.18962097167969, -115.85014343261719, -106.51066589355469, -97.17119598388672, -87.83171844482422, -78.49224090576172, -69.15277099609375, -59.81329345703125, -50.47381591796875, -41.13433837890625, -31.794864654541016, -22.45538902282715, -13.115913391113281, -3.7764358520507812, 5.563037872314453, 14.902511596679688, 24.241989135742188, 33.58146667480469, 42.92094039916992, 52.260414123535156, 61.599891662597656, 70.93936920166016, 80.27883911132812, 89.61831665039062, 98.95779418945312, 108.29727172851562, 117.63674926757812, 126.9762191772461, 136.31570434570312, 145.65518188476562, 154.99464416503906, 164.33412170410156, 173.67359924316406, 183.01307678222656, 192.35255432128906, 201.69203186035156, 211.031494140625, 220.3709716796875, 229.71044921875, 239.0499267578125, 248.389404296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 4.0, 2.0, 6.0, 12.0, 9.0, 18.0, 16.0, 20.0, 21.0, 31.0, 39.0, 50.0, 40.0, 45.0, 57.0, 43.0, 56.0, 69.0, 78.0, 55.0, 43.0, 42.0, 38.0, 35.0, 22.0, 27.0, 18.0, 16.0, 25.0, 14.0, 13.0, 15.0, 3.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.00552368164062, -98.64037322998047, -95.27522277832031, -91.91007995605469, -88.54492950439453, -85.17977905273438, -81.81463623046875, -78.4494857788086, -75.08433532714844, -71.71918487548828, -68.35403442382812, -64.9888916015625, -61.623741149902344, -58.25859069824219, -54.8934440612793, -51.528297424316406, -48.16314697265625, -44.797996520996094, -41.4328498840332, -38.06770324707031, -34.702552795410156, -31.337404251098633, -27.97225570678711, -24.607107162475586, -21.241958618164062, -17.87681007385254, -14.511661529541016, -11.146512985229492, -7.781364440917969, -4.416215896606445, -1.0510673522949219, 2.3140811920166016, 5.679237365722656, 9.04438591003418, 12.409534454345703, 15.774682998657227, 19.13983154296875, 22.504980087280273, 25.870128631591797, 29.23527717590332, 32.600425720214844, 35.965576171875, 39.33072280883789, 42.69586944580078, 46.06101989746094, 49.426170349121094, 52.791316986083984, 56.156463623046875, 59.52161407470703, 62.88676452636719, 66.25190734863281, 69.61705780029297, 72.98220825195312, 76.34735870361328, 79.71250915527344, 83.07765197753906, 86.44280242919922, 89.80795288085938, 93.173095703125, 96.53824615478516, 99.90339660644531, 103.26854705810547, 106.63369750976562, 109.99884033203125, 113.3639907836914]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 5.0, 12.0, 9.0, 19.0, 31.0, 56.0, 67.0, 107.0, 161.0, 220.0, 341.0, 493.0, 860.0, 1345.0, 2411.0, 4449.0, 8939.0, 19820.0, 47093.0, 123198.0, 316406.0, 314597.0, 121677.0, 47141.0, 19606.0, 8987.0, 4520.0, 2341.0, 1343.0, 794.0, 493.0, 338.0, 214.0, 132.0, 79.0, 81.0, 52.0, 28.0, 24.0, 17.0, 13.0, 10.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0], "bins": [-10.1796875, -9.8802490234375, -9.580810546875, -9.2813720703125, -8.98193359375, -8.6824951171875, -8.383056640625, -8.0836181640625, -7.7841796875, -7.4847412109375, -7.185302734375, -6.8858642578125, -6.58642578125, -6.2869873046875, -5.987548828125, -5.6881103515625, -5.388671875, -5.0892333984375, -4.789794921875, -4.4903564453125, -4.19091796875, -3.8914794921875, -3.592041015625, -3.2926025390625, -2.9931640625, -2.6937255859375, -2.394287109375, -2.0948486328125, -1.79541015625, -1.4959716796875, -1.196533203125, -0.8970947265625, -0.59765625, -0.2982177734375, 0.001220703125, 0.3006591796875, 0.60009765625, 0.8995361328125, 1.198974609375, 1.4984130859375, 1.7978515625, 2.0972900390625, 2.396728515625, 2.6961669921875, 2.99560546875, 3.2950439453125, 3.594482421875, 3.8939208984375, 4.193359375, 4.4927978515625, 4.792236328125, 5.0916748046875, 5.39111328125, 5.6905517578125, 5.989990234375, 6.2894287109375, 6.5888671875, 6.8883056640625, 7.187744140625, 7.4871826171875, 7.78662109375, 8.0860595703125, 8.385498046875, 8.6849365234375, 8.984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 12.0, 13.0, 27.0, 21.0, 24.0, 23.0, 30.0, 42.0, 58.0, 38.0, 44.0, 60.0, 66.0, 61.0, 51.0, 61.0, 51.0, 43.0, 45.0, 48.0, 34.0, 28.0, 18.0, 19.0, 21.0, 13.0, 11.0, 3.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.3040771484375, -10.983154296875, -10.6622314453125, -10.34130859375, -10.0203857421875, -9.699462890625, -9.3785400390625, -9.0576171875, -8.7366943359375, -8.415771484375, -8.0948486328125, -7.77392578125, -7.4530029296875, -7.132080078125, -6.8111572265625, -6.490234375, -6.1693115234375, -5.848388671875, -5.5274658203125, -5.20654296875, -4.8856201171875, -4.564697265625, -4.2437744140625, -3.9228515625, -3.6019287109375, -3.281005859375, -2.9600830078125, -2.63916015625, -2.3182373046875, -1.997314453125, -1.6763916015625, -1.35546875, -1.0345458984375, -0.713623046875, -0.3927001953125, -0.07177734375, 0.2491455078125, 0.570068359375, 0.8909912109375, 1.2119140625, 1.5328369140625, 1.853759765625, 2.1746826171875, 2.49560546875, 2.8165283203125, 3.137451171875, 3.4583740234375, 3.779296875, 4.1002197265625, 4.421142578125, 4.7420654296875, 5.06298828125, 5.3839111328125, 5.704833984375, 6.0257568359375, 6.3466796875, 6.6676025390625, 6.988525390625, 7.3094482421875, 7.63037109375, 7.9512939453125, 8.272216796875, 8.5931396484375, 8.9140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 13.0, 16.0, 20.0, 43.0, 38.0, 79.0, 109.0, 226.0, 402.0, 1058.0, 3238.0, 18681.0, 286772.0, 701426.0, 29882.0, 4256.0, 1169.0, 475.0, 251.0, 137.0, 85.0, 48.0, 45.0, 14.0, 18.0, 7.0, 10.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -34.09423828125, -33.0322265625, -31.97021484375, -30.908203125, -29.84619140625, -28.7841796875, -27.72216796875, -26.66015625, -25.59814453125, -24.5361328125, -23.47412109375, -22.412109375, -21.35009765625, -20.2880859375, -19.22607421875, -18.1640625, -17.10205078125, -16.0400390625, -14.97802734375, -13.916015625, -12.85400390625, -11.7919921875, -10.72998046875, -9.66796875, -8.60595703125, -7.5439453125, -6.48193359375, -5.419921875, -4.35791015625, -3.2958984375, -2.23388671875, -1.171875, -0.10986328125, 0.9521484375, 2.01416015625, 3.076171875, 4.13818359375, 5.2001953125, 6.26220703125, 7.32421875, 8.38623046875, 9.4482421875, 10.51025390625, 11.572265625, 12.63427734375, 13.6962890625, 14.75830078125, 15.8203125, 16.88232421875, 17.9443359375, 19.00634765625, 20.068359375, 21.13037109375, 22.1923828125, 23.25439453125, 24.31640625, 25.37841796875, 26.4404296875, 27.50244140625, 28.564453125, 29.62646484375, 30.6884765625, 31.75048828125, 32.8125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 9.0, 5.0, 6.0, 14.0, 15.0, 9.0, 15.0, 25.0, 27.0, 35.0, 28.0, 38.0, 35.0, 52.0, 49.0, 56.0, 50.0, 49.0, 47.0, 39.0, 44.0, 35.0, 44.0, 43.0, 26.0, 41.0, 33.0, 25.0, 19.0, 12.0, 9.0, 9.0, 11.0, 4.0, 11.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.15625, -32.078125, -31.0, -29.921875, -28.84375, -27.765625, -26.6875, -25.609375, -24.53125, -23.453125, -22.375, -21.296875, -20.21875, -19.140625, -18.0625, -16.984375, -15.90625, -14.828125, -13.75, -12.671875, -11.59375, -10.515625, -9.4375, -8.359375, -7.28125, -6.203125, -5.125, -4.046875, -2.96875, -1.890625, -0.8125, 0.265625, 1.34375, 2.421875, 3.5, 4.578125, 5.65625, 6.734375, 7.8125, 8.890625, 9.96875, 11.046875, 12.125, 13.203125, 14.28125, 15.359375, 16.4375, 17.515625, 18.59375, 19.671875, 20.75, 21.828125, 22.90625, 23.984375, 25.0625, 26.140625, 27.21875, 28.296875, 29.375, 30.453125, 31.53125, 32.609375, 33.6875, 34.765625, 35.84375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 9.0, 10.0, 8.0, 12.0, 26.0, 40.0, 67.0, 119.0, 222.0, 324.0, 697.0, 1733.0, 4511.0, 15416.0, 67865.0, 733859.0, 180530.0, 29883.0, 8144.0, 2811.0, 1116.0, 513.0, 247.0, 121.0, 96.0, 62.0, 43.0, 17.0, 14.0, 17.0, 8.0, 2.0, 2.0, 6.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5546875, -12.2130126953125, -11.871337890625, -11.5296630859375, -11.18798828125, -10.8463134765625, -10.504638671875, -10.1629638671875, -9.8212890625, -9.4796142578125, -9.137939453125, -8.7962646484375, -8.45458984375, -8.1129150390625, -7.771240234375, -7.4295654296875, -7.087890625, -6.7462158203125, -6.404541015625, -6.0628662109375, -5.72119140625, -5.3795166015625, -5.037841796875, -4.6961669921875, -4.3544921875, -4.0128173828125, -3.671142578125, -3.3294677734375, -2.98779296875, -2.6461181640625, -2.304443359375, -1.9627685546875, -1.62109375, -1.2794189453125, -0.937744140625, -0.5960693359375, -0.25439453125, 0.0872802734375, 0.428955078125, 0.7706298828125, 1.1123046875, 1.4539794921875, 1.795654296875, 2.1373291015625, 2.47900390625, 2.8206787109375, 3.162353515625, 3.5040283203125, 3.845703125, 4.1873779296875, 4.529052734375, 4.8707275390625, 5.21240234375, 5.5540771484375, 5.895751953125, 6.2374267578125, 6.5791015625, 6.9207763671875, 7.262451171875, 7.6041259765625, 7.94580078125, 8.2874755859375, 8.629150390625, 8.9708251953125, 9.3125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 6.0, 13.0, 11.0, 16.0, 25.0, 35.0, 53.0, 79.0, 149.0, 252.0, 130.0, 65.0, 38.0, 36.0, 26.0, 18.0, 12.0, 5.0, 9.0, 3.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024700164794921875, -0.002348989248275757, -0.002227962017059326, -0.0021069347858428955, -0.001985907554626465, -0.0018648803234100342, -0.0017438530921936035, -0.0016228258609771729, -0.0015017986297607422, -0.0013807713985443115, -0.0012597441673278809, -0.0011387169361114502, -0.0010176897048950195, -0.0008966624736785889, -0.0007756352424621582, -0.0006546080112457275, -0.0005335807800292969, -0.0004125535488128662, -0.00029152631759643555, -0.00017049908638000488, -4.947185516357422e-05, 7.155537605285645e-05, 0.0001925826072692871, 0.0003136098384857178, 0.00043463706970214844, 0.0005556643009185791, 0.0006766915321350098, 0.0007977187633514404, 0.0009187459945678711, 0.0010397732257843018, 0.0011608004570007324, 0.001281827688217163, 0.0014028549194335938, 0.0015238821506500244, 0.001644909381866455, 0.0017659366130828857, 0.0018869638442993164, 0.002007991075515747, 0.0021290183067321777, 0.0022500455379486084, 0.002371072769165039, 0.0024921000003814697, 0.0026131272315979004, 0.002734154462814331, 0.0028551816940307617, 0.0029762089252471924, 0.003097236156463623, 0.0032182633876800537, 0.0033392906188964844, 0.003460317850112915, 0.0035813450813293457, 0.0037023723125457764, 0.003823399543762207, 0.003944426774978638, 0.004065454006195068, 0.004186481237411499, 0.00430750846862793, 0.00442853569984436, 0.004549562931060791, 0.004670590162277222, 0.004791617393493652, 0.004912644624710083, 0.005033671855926514, 0.005154699087142944, 0.005275726318359375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 8.0, 6.0, 9.0, 17.0, 22.0, 26.0, 38.0, 61.0, 70.0, 129.0, 187.0, 341.0, 564.0, 946.0, 1876.0, 3880.0, 8970.0, 25107.0, 95648.0, 695163.0, 157806.0, 35776.0, 11964.0, 4998.0, 2290.0, 1139.0, 611.0, 338.0, 200.0, 122.0, 79.0, 50.0, 28.0, 25.0, 17.0, 10.0, 12.0, 10.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.828125, -9.54443359375, -9.2607421875, -8.97705078125, -8.693359375, -8.40966796875, -8.1259765625, -7.84228515625, -7.55859375, -7.27490234375, -6.9912109375, -6.70751953125, -6.423828125, -6.14013671875, -5.8564453125, -5.57275390625, -5.2890625, -5.00537109375, -4.7216796875, -4.43798828125, -4.154296875, -3.87060546875, -3.5869140625, -3.30322265625, -3.01953125, -2.73583984375, -2.4521484375, -2.16845703125, -1.884765625, -1.60107421875, -1.3173828125, -1.03369140625, -0.75, -0.46630859375, -0.1826171875, 0.10107421875, 0.384765625, 0.66845703125, 0.9521484375, 1.23583984375, 1.51953125, 1.80322265625, 2.0869140625, 2.37060546875, 2.654296875, 2.93798828125, 3.2216796875, 3.50537109375, 3.7890625, 4.07275390625, 4.3564453125, 4.64013671875, 4.923828125, 5.20751953125, 5.4912109375, 5.77490234375, 6.05859375, 6.34228515625, 6.6259765625, 6.90966796875, 7.193359375, 7.47705078125, 7.7607421875, 8.04443359375, 8.328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 9.0, 2.0, 5.0, 8.0, 16.0, 7.0, 10.0, 12.0, 11.0, 27.0, 22.0, 31.0, 41.0, 48.0, 95.0, 117.0, 136.0, 108.0, 92.0, 53.0, 38.0, 30.0, 20.0, 13.0, 8.0, 11.0, 9.0, 4.0, 6.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.4405517578125, -8.131103515625, -7.8216552734375, -7.51220703125, -7.2027587890625, -6.893310546875, -6.5838623046875, -6.2744140625, -5.9649658203125, -5.655517578125, -5.3460693359375, -5.03662109375, -4.7271728515625, -4.417724609375, -4.1082763671875, -3.798828125, -3.4893798828125, -3.179931640625, -2.8704833984375, -2.56103515625, -2.2515869140625, -1.942138671875, -1.6326904296875, -1.3232421875, -1.0137939453125, -0.704345703125, -0.3948974609375, -0.08544921875, 0.2239990234375, 0.533447265625, 0.8428955078125, 1.15234375, 1.4617919921875, 1.771240234375, 2.0806884765625, 2.39013671875, 2.6995849609375, 3.009033203125, 3.3184814453125, 3.6279296875, 3.9373779296875, 4.246826171875, 4.5562744140625, 4.86572265625, 5.1751708984375, 5.484619140625, 5.7940673828125, 6.103515625, 6.4129638671875, 6.722412109375, 7.0318603515625, 7.34130859375, 7.6507568359375, 7.960205078125, 8.2696533203125, 8.5791015625, 8.8885498046875, 9.197998046875, 9.5074462890625, 9.81689453125, 10.1263427734375, 10.435791015625, 10.7452392578125, 11.0546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 9.0, 15.0, 19.0, 43.0, 128.0, 406.0, 243.0, 85.0, 31.0, 13.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.8371276855469, -339.8031311035156, -328.76910400390625, -317.735107421875, -306.7010803222656, -295.6670837402344, -284.633056640625, -273.59906005859375, -262.5650634765625, -251.5310516357422, -240.49703979492188, -229.46304321289062, -218.42901611328125, -207.39501953125, -196.3610076904297, -185.32699584960938, -174.29296875, -163.2589569091797, -152.22494506835938, -141.19094848632812, -130.15692138671875, -119.12291717529297, -108.08891296386719, -97.05490112304688, -86.02088928222656, -74.98687744140625, -63.9528694152832, -52.918861389160156, -41.884849548339844, -30.85083770751953, -19.81683349609375, -8.782821655273438, 2.251220703125, 13.28523063659668, 24.31924057006836, 35.353248596191406, 46.38726043701172, 57.42127227783203, 68.45527648925781, 79.48928833007812, 90.52330017089844, 101.55731201171875, 112.59132385253906, 123.62532806396484, 134.65933227539062, 145.693359375, 156.72735595703125, 167.76136779785156, 178.79537963867188, 189.8293914794922, 200.8634033203125, 211.89739990234375, 222.93142700195312, 233.96542358398438, 244.9994354248047, 256.033447265625, 267.06744384765625, 278.1014404296875, 289.1354675292969, 300.1694641113281, 311.2034912109375, 322.23748779296875, 333.271484375, 344.3055114746094, 355.33953857421875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 9.0, 11.0, 6.0, 12.0, 7.0, 21.0, 17.0, 29.0, 26.0, 22.0, 34.0, 28.0, 39.0, 50.0, 57.0, 77.0, 99.0, 90.0, 62.0, 30.0, 44.0, 31.0, 17.0, 25.0, 26.0, 18.0, 19.0, 11.0, 13.0, 13.0, 17.0, 11.0, 6.0, 3.0, 6.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-138.25018310546875, -133.57875061035156, -128.90731811523438, -124.23588562011719, -119.564453125, -114.89302062988281, -110.22159576416016, -105.55016326904297, -100.87873077392578, -96.2072982788086, -91.5358657836914, -86.86443328857422, -82.19300842285156, -77.52157592773438, -72.85014343261719, -68.1787109375, -63.50727844238281, -58.835845947265625, -54.16441345214844, -49.492984771728516, -44.82155227661133, -40.15011978149414, -35.47869110107422, -30.80725860595703, -26.135826110839844, -21.464393615722656, -16.7929630279541, -12.12153148651123, -7.450099945068359, -2.778667449951172, 1.8927631378173828, 6.5641937255859375, 11.235610961914062, 15.907042503356934, 20.578474044799805, 25.24990463256836, 29.921337127685547, 34.592769622802734, 39.264198303222656, 43.935630798339844, 48.60706329345703, 53.27849578857422, 57.949928283691406, 62.62135696411133, 67.29278564453125, 71.96421813964844, 76.63565063476562, 81.30708312988281, 85.978515625, 90.64994812011719, 95.32138061523438, 99.99281311035156, 104.66424560546875, 109.33567810058594, 114.0071029663086, 118.67853546142578, 123.34996795654297, 128.02139282226562, 132.6928253173828, 137.3642578125, 142.0356903076172, 146.70712280273438, 151.37855529785156, 156.04998779296875, 160.72142028808594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 9.0, 21.0, 36.0, 45.0, 73.0, 92.0, 183.0, 267.0, 433.0, 757.0, 1375.0, 2646.0, 6218.0, 20080.0, 132758.0, 1723233.0, 2103651.0, 166023.0, 22955.0, 6870.0, 2802.0, 1459.0, 766.0, 459.0, 334.0, 235.0, 153.0, 97.0, 74.0, 63.0, 24.0, 21.0, 11.0, 7.0, 6.0, 11.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.578125, -18.062744140625, -17.54736328125, -17.031982421875, -16.5166015625, -16.001220703125, -15.48583984375, -14.970458984375, -14.455078125, -13.939697265625, -13.42431640625, -12.908935546875, -12.3935546875, -11.878173828125, -11.36279296875, -10.847412109375, -10.33203125, -9.816650390625, -9.30126953125, -8.785888671875, -8.2705078125, -7.755126953125, -7.23974609375, -6.724365234375, -6.208984375, -5.693603515625, -5.17822265625, -4.662841796875, -4.1474609375, -3.632080078125, -3.11669921875, -2.601318359375, -2.0859375, -1.570556640625, -1.05517578125, -0.539794921875, -0.0244140625, 0.490966796875, 1.00634765625, 1.521728515625, 2.037109375, 2.552490234375, 3.06787109375, 3.583251953125, 4.0986328125, 4.614013671875, 5.12939453125, 5.644775390625, 6.16015625, 6.675537109375, 7.19091796875, 7.706298828125, 8.2216796875, 8.737060546875, 9.25244140625, 9.767822265625, 10.283203125, 10.798583984375, 11.31396484375, 11.829345703125, 12.3447265625, 12.860107421875, 13.37548828125, 13.890869140625, 14.40625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 2.0, 8.0, 7.0, 11.0, 4.0, 14.0, 15.0, 28.0, 28.0, 31.0, 32.0, 44.0, 37.0, 43.0, 49.0, 42.0, 66.0, 53.0, 55.0, 51.0, 60.0, 51.0, 35.0, 38.0, 33.0, 31.0, 28.0, 22.0, 12.0, 13.0, 12.0, 8.0, 11.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -9.0145263671875, -8.708740234375, -8.4029541015625, -8.09716796875, -7.7913818359375, -7.485595703125, -7.1798095703125, -6.8740234375, -6.5682373046875, -6.262451171875, -5.9566650390625, -5.65087890625, -5.3450927734375, -5.039306640625, -4.7335205078125, -4.427734375, -4.1219482421875, -3.816162109375, -3.5103759765625, -3.20458984375, -2.8988037109375, -2.593017578125, -2.2872314453125, -1.9814453125, -1.6756591796875, -1.369873046875, -1.0640869140625, -0.75830078125, -0.4525146484375, -0.146728515625, 0.1590576171875, 0.46484375, 0.7706298828125, 1.076416015625, 1.3822021484375, 1.68798828125, 1.9937744140625, 2.299560546875, 2.6053466796875, 2.9111328125, 3.2169189453125, 3.522705078125, 3.8284912109375, 4.13427734375, 4.4400634765625, 4.745849609375, 5.0516357421875, 5.357421875, 5.6632080078125, 5.968994140625, 6.2747802734375, 6.58056640625, 6.8863525390625, 7.192138671875, 7.4979248046875, 7.8037109375, 8.1094970703125, 8.415283203125, 8.7210693359375, 9.02685546875, 9.3326416015625, 9.638427734375, 9.9442138671875, 10.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 17.0, 12.0, 17.0, 24.0, 56.0, 74.0, 104.0, 163.0, 258.0, 441.0, 908.0, 3021.0, 17655.0, 1903801.0, 2243859.0, 18611.0, 3108.0, 998.0, 451.0, 257.0, 156.0, 107.0, 63.0, 28.0, 26.0, 20.0, 9.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.0625, -54.31103515625, -52.5595703125, -50.80810546875, -49.056640625, -47.30517578125, -45.5537109375, -43.80224609375, -42.05078125, -40.29931640625, -38.5478515625, -36.79638671875, -35.044921875, -33.29345703125, -31.5419921875, -29.79052734375, -28.0390625, -26.28759765625, -24.5361328125, -22.78466796875, -21.033203125, -19.28173828125, -17.5302734375, -15.77880859375, -14.02734375, -12.27587890625, -10.5244140625, -8.77294921875, -7.021484375, -5.27001953125, -3.5185546875, -1.76708984375, -0.015625, 1.73583984375, 3.4873046875, 5.23876953125, 6.990234375, 8.74169921875, 10.4931640625, 12.24462890625, 13.99609375, 15.74755859375, 17.4990234375, 19.25048828125, 21.001953125, 22.75341796875, 24.5048828125, 26.25634765625, 28.0078125, 29.75927734375, 31.5107421875, 33.26220703125, 35.013671875, 36.76513671875, 38.5166015625, 40.26806640625, 42.01953125, 43.77099609375, 45.5224609375, 47.27392578125, 49.025390625, 50.77685546875, 52.5283203125, 54.27978515625, 56.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 10.0, 10.0, 15.0, 25.0, 46.0, 89.0, 201.0, 628.0, 1436.0, 968.0, 359.0, 146.0, 48.0, 30.0, 20.0, 10.0, 12.0, 6.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-66.5625, -65.136474609375, -63.71044921875, -62.284423828125, -60.8583984375, -59.432373046875, -58.00634765625, -56.580322265625, -55.154296875, -53.728271484375, -52.30224609375, -50.876220703125, -49.4501953125, -48.024169921875, -46.59814453125, -45.172119140625, -43.74609375, -42.320068359375, -40.89404296875, -39.468017578125, -38.0419921875, -36.615966796875, -35.18994140625, -33.763916015625, -32.337890625, -30.911865234375, -29.48583984375, -28.059814453125, -26.6337890625, -25.207763671875, -23.78173828125, -22.355712890625, -20.9296875, -19.503662109375, -18.07763671875, -16.651611328125, -15.2255859375, -13.799560546875, -12.37353515625, -10.947509765625, -9.521484375, -8.095458984375, -6.66943359375, -5.243408203125, -3.8173828125, -2.391357421875, -0.96533203125, 0.460693359375, 1.88671875, 3.312744140625, 4.73876953125, 6.164794921875, 7.5908203125, 9.016845703125, 10.44287109375, 11.868896484375, 13.294921875, 14.720947265625, 16.14697265625, 17.572998046875, 18.9990234375, 20.425048828125, 21.85107421875, 23.277099609375, 24.703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 10.0, 19.0, 16.0, 37.0, 65.0, 86.0, 136.0, 153.0, 156.0, 115.0, 65.0, 44.0, 29.0, 22.0, 7.0, 8.0, 7.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.4371795654297, -221.63119506835938, -214.82522583007812, -208.0192413330078, -201.21327209472656, -194.40728759765625, -187.601318359375, -180.7953338623047, -173.98934936523438, -167.18336486816406, -160.3773956298828, -153.5714111328125, -146.76544189453125, -139.95945739746094, -133.15347290039062, -126.34750366210938, -119.5415267944336, -112.73554992675781, -105.92957305908203, -99.12359619140625, -92.31761169433594, -85.51163482666016, -78.70565795898438, -71.89967346191406, -65.09370422363281, -58.28772735595703, -51.481746673583984, -44.6757698059082, -37.869789123535156, -31.063812255859375, -24.257835388183594, -17.451854705810547, -10.6458740234375, -3.839895725250244, 2.9660825729370117, 9.77206039428711, 16.578039169311523, 23.384017944335938, 30.18999481201172, 36.995975494384766, 43.80195236206055, 50.60792922973633, 57.413909912109375, 64.21988677978516, 71.02586364746094, 77.83184814453125, 84.6378173828125, 91.44380187988281, 98.2497787475586, 105.05575561523438, 111.86173248291016, 118.66770935058594, 125.47369384765625, 132.2796630859375, 139.0856475830078, 145.89163208007812, 152.69760131835938, 159.5035858154297, 166.30955505371094, 173.11553955078125, 179.9215087890625, 186.7274932861328, 193.53347778320312, 200.33944702148438, 207.1454315185547]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 11.0, 6.0, 10.0, 14.0, 12.0, 19.0, 29.0, 29.0, 38.0, 29.0, 44.0, 45.0, 44.0, 44.0, 51.0, 53.0, 31.0, 57.0, 50.0, 48.0, 40.0, 38.0, 33.0, 26.0, 28.0, 26.0, 19.0, 22.0, 20.0, 16.0, 7.0, 12.0, 9.0, 7.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-117.62723541259766, -114.12811279296875, -110.62899017333984, -107.12986755371094, -103.63075256347656, -100.13162994384766, -96.63250732421875, -93.13338470458984, -89.63426208496094, -86.13513946533203, -82.63601684570312, -79.13690185546875, -75.63777923583984, -72.13865661621094, -68.63953399658203, -65.14041137695312, -61.64129638671875, -58.142173767089844, -54.6430549621582, -51.1439323425293, -47.644813537597656, -44.14569091796875, -40.646568298339844, -37.14744567871094, -33.6483268737793, -30.149206161499023, -26.65008544921875, -23.150962829589844, -19.65184211730957, -16.152721405029297, -12.65359878540039, -9.154478073120117, -5.6553497314453125, -2.156228542327881, 1.3428926467895508, 4.842014312744141, 8.341135025024414, 11.840255737304688, 15.339378356933594, 18.838499069213867, 22.33761978149414, 25.836740493774414, 29.335861206054688, 32.834983825683594, 36.3341064453125, 39.83322525024414, 43.33234786987305, 46.83146667480469, 50.330589294433594, 53.8297119140625, 57.32883071899414, 60.82795333862305, 64.32707214355469, 67.8261947631836, 71.3253173828125, 74.8244400024414, 78.32356262207031, 81.82268524169922, 85.32180786132812, 88.8209228515625, 92.3200454711914, 95.81916809082031, 99.31829071044922, 102.81741333007812, 106.3165283203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 16.0, 16.0, 28.0, 32.0, 47.0, 76.0, 129.0, 188.0, 300.0, 493.0, 796.0, 1466.0, 2739.0, 5640.0, 11875.0, 27647.0, 71623.0, 208162.0, 410534.0, 192466.0, 65738.0, 26079.0, 11114.0, 5251.0, 2632.0, 1394.0, 792.0, 438.0, 281.0, 180.0, 121.0, 79.0, 46.0, 37.0, 27.0, 10.0, 17.0, 7.0, 7.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.71875, -13.28271484375, -12.8466796875, -12.41064453125, -11.974609375, -11.53857421875, -11.1025390625, -10.66650390625, -10.23046875, -9.79443359375, -9.3583984375, -8.92236328125, -8.486328125, -8.05029296875, -7.6142578125, -7.17822265625, -6.7421875, -6.30615234375, -5.8701171875, -5.43408203125, -4.998046875, -4.56201171875, -4.1259765625, -3.68994140625, -3.25390625, -2.81787109375, -2.3818359375, -1.94580078125, -1.509765625, -1.07373046875, -0.6376953125, -0.20166015625, 0.234375, 0.67041015625, 1.1064453125, 1.54248046875, 1.978515625, 2.41455078125, 2.8505859375, 3.28662109375, 3.72265625, 4.15869140625, 4.5947265625, 5.03076171875, 5.466796875, 5.90283203125, 6.3388671875, 6.77490234375, 7.2109375, 7.64697265625, 8.0830078125, 8.51904296875, 8.955078125, 9.39111328125, 9.8271484375, 10.26318359375, 10.69921875, 11.13525390625, 11.5712890625, 12.00732421875, 12.443359375, 12.87939453125, 13.3154296875, 13.75146484375, 14.1875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 6.0, 6.0, 8.0, 5.0, 9.0, 11.0, 13.0, 11.0, 14.0, 18.0, 22.0, 25.0, 29.0, 32.0, 37.0, 39.0, 37.0, 47.0, 35.0, 47.0, 42.0, 40.0, 46.0, 33.0, 38.0, 40.0, 43.0, 35.0, 34.0, 31.0, 28.0, 21.0, 15.0, 11.0, 13.0, 11.0, 6.0, 8.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.0234375, -8.7315673828125, -8.439697265625, -8.1478271484375, -7.85595703125, -7.5640869140625, -7.272216796875, -6.9803466796875, -6.6884765625, -6.3966064453125, -6.104736328125, -5.8128662109375, -5.52099609375, -5.2291259765625, -4.937255859375, -4.6453857421875, -4.353515625, -4.0616455078125, -3.769775390625, -3.4779052734375, -3.18603515625, -2.8941650390625, -2.602294921875, -2.3104248046875, -2.0185546875, -1.7266845703125, -1.434814453125, -1.1429443359375, -0.85107421875, -0.5592041015625, -0.267333984375, 0.0245361328125, 0.31640625, 0.6082763671875, 0.900146484375, 1.1920166015625, 1.48388671875, 1.7757568359375, 2.067626953125, 2.3594970703125, 2.6513671875, 2.9432373046875, 3.235107421875, 3.5269775390625, 3.81884765625, 4.1107177734375, 4.402587890625, 4.6944580078125, 4.986328125, 5.2781982421875, 5.570068359375, 5.8619384765625, 6.15380859375, 6.4456787109375, 6.737548828125, 7.0294189453125, 7.3212890625, 7.6131591796875, 7.905029296875, 8.1968994140625, 8.48876953125, 8.7806396484375, 9.072509765625, 9.3643798828125, 9.65625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 11.0, 15.0, 13.0, 17.0, 33.0, 41.0, 58.0, 67.0, 121.0, 198.0, 339.0, 608.0, 1268.0, 3064.0, 10695.0, 61075.0, 782558.0, 159595.0, 20265.0, 4838.0, 1714.0, 773.0, 424.0, 241.0, 154.0, 97.0, 77.0, 44.0, 37.0, 28.0, 16.0, 16.0, 12.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.575927734375, -37.49560546875, -36.415283203125, -35.3349609375, -34.254638671875, -33.17431640625, -32.093994140625, -31.013671875, -29.933349609375, -28.85302734375, -27.772705078125, -26.6923828125, -25.612060546875, -24.53173828125, -23.451416015625, -22.37109375, -21.290771484375, -20.21044921875, -19.130126953125, -18.0498046875, -16.969482421875, -15.88916015625, -14.808837890625, -13.728515625, -12.648193359375, -11.56787109375, -10.487548828125, -9.4072265625, -8.326904296875, -7.24658203125, -6.166259765625, -5.0859375, -4.005615234375, -2.92529296875, -1.844970703125, -0.7646484375, 0.315673828125, 1.39599609375, 2.476318359375, 3.556640625, 4.636962890625, 5.71728515625, 6.797607421875, 7.8779296875, 8.958251953125, 10.03857421875, 11.118896484375, 12.19921875, 13.279541015625, 14.35986328125, 15.440185546875, 16.5205078125, 17.600830078125, 18.68115234375, 19.761474609375, 20.841796875, 21.922119140625, 23.00244140625, 24.082763671875, 25.1630859375, 26.243408203125, 27.32373046875, 28.404052734375, 29.484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 7.0, 8.0, 5.0, 5.0, 6.0, 12.0, 20.0, 12.0, 23.0, 18.0, 37.0, 31.0, 43.0, 38.0, 61.0, 57.0, 71.0, 58.0, 39.0, 50.0, 52.0, 43.0, 49.0, 41.0, 26.0, 26.0, 22.0, 29.0, 24.0, 10.0, 10.0, 16.0, 6.0, 3.0, 7.0, 6.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-47.75, -46.359375, -44.96875, -43.578125, -42.1875, -40.796875, -39.40625, -38.015625, -36.625, -35.234375, -33.84375, -32.453125, -31.0625, -29.671875, -28.28125, -26.890625, -25.5, -24.109375, -22.71875, -21.328125, -19.9375, -18.546875, -17.15625, -15.765625, -14.375, -12.984375, -11.59375, -10.203125, -8.8125, -7.421875, -6.03125, -4.640625, -3.25, -1.859375, -0.46875, 0.921875, 2.3125, 3.703125, 5.09375, 6.484375, 7.875, 9.265625, 10.65625, 12.046875, 13.4375, 14.828125, 16.21875, 17.609375, 19.0, 20.390625, 21.78125, 23.171875, 24.5625, 25.953125, 27.34375, 28.734375, 30.125, 31.515625, 32.90625, 34.296875, 35.6875, 37.078125, 38.46875, 39.859375, 41.25]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 23.0, 18.0, 33.0, 49.0, 65.0, 84.0, 174.0, 334.0, 666.0, 1406.0, 3563.0, 11206.0, 49599.0, 696141.0, 238838.0, 32765.0, 8228.0, 2907.0, 1149.0, 538.0, 297.0, 145.0, 95.0, 56.0, 37.0, 31.0, 19.0, 9.0, 13.0, 14.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.8515625, -13.4654541015625, -13.079345703125, -12.6932373046875, -12.30712890625, -11.9210205078125, -11.534912109375, -11.1488037109375, -10.7626953125, -10.3765869140625, -9.990478515625, -9.6043701171875, -9.21826171875, -8.8321533203125, -8.446044921875, -8.0599365234375, -7.673828125, -7.2877197265625, -6.901611328125, -6.5155029296875, -6.12939453125, -5.7432861328125, -5.357177734375, -4.9710693359375, -4.5849609375, -4.1988525390625, -3.812744140625, -3.4266357421875, -3.04052734375, -2.6544189453125, -2.268310546875, -1.8822021484375, -1.49609375, -1.1099853515625, -0.723876953125, -0.3377685546875, 0.04833984375, 0.4344482421875, 0.820556640625, 1.2066650390625, 1.5927734375, 1.9788818359375, 2.364990234375, 2.7510986328125, 3.13720703125, 3.5233154296875, 3.909423828125, 4.2955322265625, 4.681640625, 5.0677490234375, 5.453857421875, 5.8399658203125, 6.22607421875, 6.6121826171875, 6.998291015625, 7.3843994140625, 7.7705078125, 8.1566162109375, 8.542724609375, 8.9288330078125, 9.31494140625, 9.7010498046875, 10.087158203125, 10.4732666015625, 10.859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 7.0, 9.0, 11.0, 15.0, 15.0, 20.0, 25.0, 20.0, 39.0, 45.0, 61.0, 95.0, 134.0, 140.0, 77.0, 55.0, 39.0, 30.0, 40.0, 20.0, 16.0, 12.0, 17.0, 9.0, 6.0, 3.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00269317626953125, -0.002605259418487549, -0.0025173425674438477, -0.0024294257164001465, -0.0023415088653564453, -0.002253592014312744, -0.002165675163269043, -0.002077758312225342, -0.0019898414611816406, -0.0019019246101379395, -0.0018140077590942383, -0.0017260909080505371, -0.001638174057006836, -0.0015502572059631348, -0.0014623403549194336, -0.0013744235038757324, -0.0012865066528320312, -0.00119858980178833, -0.001110672950744629, -0.0010227560997009277, -0.0009348392486572266, -0.0008469223976135254, -0.0007590055465698242, -0.000671088695526123, -0.0005831718444824219, -0.0004952549934387207, -0.00040733814239501953, -0.00031942129135131836, -0.0002315044403076172, -0.00014358758926391602, -5.5670738220214844e-05, 3.224611282348633e-05, 0.0001201629638671875, 0.00020807981491088867, 0.00029599666595458984, 0.000383913516998291, 0.0004718303680419922, 0.0005597472190856934, 0.0006476640701293945, 0.0007355809211730957, 0.0008234977722167969, 0.000911414623260498, 0.0009993314743041992, 0.0010872483253479004, 0.0011751651763916016, 0.0012630820274353027, 0.001350998878479004, 0.001438915729522705, 0.0015268325805664062, 0.0016147494316101074, 0.0017026662826538086, 0.0017905831336975098, 0.001878499984741211, 0.001966416835784912, 0.0020543336868286133, 0.0021422505378723145, 0.0022301673889160156, 0.002318084239959717, 0.002406001091003418, 0.002493917942047119, 0.0025818347930908203, 0.0026697516441345215, 0.0027576684951782227, 0.002845585346221924, 0.002933502197265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 0.0, 2.0, 2.0, 11.0, 5.0, 8.0, 12.0, 17.0, 30.0, 38.0, 39.0, 42.0, 76.0, 135.0, 186.0, 318.0, 434.0, 801.0, 1597.0, 3486.0, 8492.0, 26689.0, 117316.0, 715520.0, 128621.0, 28121.0, 9095.0, 3508.0, 1673.0, 888.0, 505.0, 285.0, 195.0, 128.0, 73.0, 61.0, 46.0, 24.0, 22.0, 17.0, 15.0, 10.0, 7.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-10.59375, -10.3037109375, -10.013671875, -9.7236328125, -9.43359375, -9.1435546875, -8.853515625, -8.5634765625, -8.2734375, -7.9833984375, -7.693359375, -7.4033203125, -7.11328125, -6.8232421875, -6.533203125, -6.2431640625, -5.953125, -5.6630859375, -5.373046875, -5.0830078125, -4.79296875, -4.5029296875, -4.212890625, -3.9228515625, -3.6328125, -3.3427734375, -3.052734375, -2.7626953125, -2.47265625, -2.1826171875, -1.892578125, -1.6025390625, -1.3125, -1.0224609375, -0.732421875, -0.4423828125, -0.15234375, 0.1376953125, 0.427734375, 0.7177734375, 1.0078125, 1.2978515625, 1.587890625, 1.8779296875, 2.16796875, 2.4580078125, 2.748046875, 3.0380859375, 3.328125, 3.6181640625, 3.908203125, 4.1982421875, 4.48828125, 4.7783203125, 5.068359375, 5.3583984375, 5.6484375, 5.9384765625, 6.228515625, 6.5185546875, 6.80859375, 7.0986328125, 7.388671875, 7.6787109375, 7.96875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 3.0, 14.0, 20.0, 12.0, 23.0, 33.0, 43.0, 40.0, 42.0, 68.0, 71.0, 96.0, 113.0, 92.0, 58.0, 51.0, 41.0, 36.0, 34.0, 19.0, 12.0, 10.0, 9.0, 6.0, 11.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.3865966796875, -9.093505859375, -8.8004150390625, -8.50732421875, -8.2142333984375, -7.921142578125, -7.6280517578125, -7.3349609375, -7.0418701171875, -6.748779296875, -6.4556884765625, -6.16259765625, -5.8695068359375, -5.576416015625, -5.2833251953125, -4.990234375, -4.6971435546875, -4.404052734375, -4.1109619140625, -3.81787109375, -3.5247802734375, -3.231689453125, -2.9385986328125, -2.6455078125, -2.3524169921875, -2.059326171875, -1.7662353515625, -1.47314453125, -1.1800537109375, -0.886962890625, -0.5938720703125, -0.30078125, -0.0076904296875, 0.285400390625, 0.5784912109375, 0.87158203125, 1.1646728515625, 1.457763671875, 1.7508544921875, 2.0439453125, 2.3370361328125, 2.630126953125, 2.9232177734375, 3.21630859375, 3.5093994140625, 3.802490234375, 4.0955810546875, 4.388671875, 4.6817626953125, 4.974853515625, 5.2679443359375, 5.56103515625, 5.8541259765625, 6.147216796875, 6.4403076171875, 6.7333984375, 7.0264892578125, 7.319580078125, 7.6126708984375, 7.90576171875, 8.1988525390625, 8.491943359375, 8.7850341796875, 9.078125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 18.0, 25.0, 77.0, 241.0, 449.0, 108.0, 37.0, 22.0, 6.0, 4.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-550.93505859375, -535.275146484375, -519.615234375, -503.9552917480469, -488.29534912109375, -472.63543701171875, -456.97552490234375, -441.3155822753906, -425.6556396484375, -409.9957275390625, -394.3357849121094, -378.6758728027344, -363.01593017578125, -347.35601806640625, -331.69610595703125, -316.0361633300781, -300.3762512207031, -284.7163391113281, -269.056396484375, -253.396484375, -237.73654174804688, -222.07662963867188, -206.4167022705078, -190.75677490234375, -175.0968475341797, -159.43692016601562, -143.77699279785156, -128.1170654296875, -112.45714569091797, -96.7972183227539, -81.13729858398438, -65.47737121582031, -49.817413330078125, -34.15748596191406, -18.497562408447266, -2.8376388549804688, 12.822288513183594, 28.482215881347656, 44.14213562011719, 59.80206298828125, 75.46199035644531, 91.12191772460938, 106.78184509277344, 122.44176483154297, 138.1016845703125, 153.76162719726562, 169.42153930664062, 185.0814666748047, 200.74139404296875, 216.4013214111328, 232.06124877929688, 247.72116088867188, 263.381103515625, 279.041015625, 294.700927734375, 310.3608703613281, 326.02081298828125, 341.68072509765625, 357.3406677246094, 373.0005798339844, 388.6605224609375, 404.3204345703125, 419.9803466796875, 435.6402893066406, 451.3002014160156]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 3.0, 5.0, 13.0, 9.0, 17.0, 18.0, 15.0, 25.0, 16.0, 18.0, 31.0, 40.0, 46.0, 37.0, 65.0, 131.0, 134.0, 71.0, 47.0, 25.0, 39.0, 28.0, 23.0, 30.0, 17.0, 19.0, 14.0, 11.0, 9.0, 8.0, 4.0, 8.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.40194702148438, -201.4549102783203, -194.50787353515625, -187.5608367919922, -180.61380004882812, -173.66676330566406, -166.7197265625, -159.772705078125, -152.82565307617188, -145.8786163330078, -138.93157958984375, -131.9845428466797, -125.03750610351562, -118.09046936035156, -111.14344024658203, -104.19640350341797, -97.24937438964844, -90.30233764648438, -83.35530090332031, -76.40826416015625, -69.46122741699219, -62.51419448852539, -55.567161560058594, -48.62012481689453, -41.67308807373047, -34.726051330566406, -27.779016494750977, -20.831981658935547, -13.884944915771484, -6.937908172607422, 0.009124755859375, 6.9561614990234375, 13.903182983398438, 20.8502197265625, 27.79725456237793, 34.74428939819336, 41.69132614135742, 48.638362884521484, 55.58539581298828, 62.532432556152344, 69.4794692993164, 76.42650604248047, 83.37354278564453, 90.32057189941406, 97.26760864257812, 104.21464538574219, 111.16168212890625, 118.10871887207031, 125.05575561523438, 132.00279235839844, 138.9498291015625, 145.89686584472656, 152.84390258789062, 159.7909393310547, 166.73797607421875, 173.68499755859375, 180.63204956054688, 187.57908630371094, 194.526123046875, 201.47315979003906, 208.42019653320312, 215.3672332763672, 222.31427001953125, 229.26129150390625, 236.2083282470703]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 8.0, 17.0, 24.0, 40.0, 56.0, 134.0, 218.0, 485.0, 1062.0, 2505.0, 7451.0, 30530.0, 264749.0, 3017869.0, 792073.0, 58806.0, 11724.0, 3668.0, 1459.0, 661.0, 310.0, 167.0, 110.0, 55.0, 34.0, 19.0, 12.0, 10.0, 10.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.515625, -24.522216796875, -23.52880859375, -22.535400390625, -21.5419921875, -20.548583984375, -19.55517578125, -18.561767578125, -17.568359375, -16.574951171875, -15.58154296875, -14.588134765625, -13.5947265625, -12.601318359375, -11.60791015625, -10.614501953125, -9.62109375, -8.627685546875, -7.63427734375, -6.640869140625, -5.6474609375, -4.654052734375, -3.66064453125, -2.667236328125, -1.673828125, -0.680419921875, 0.31298828125, 1.306396484375, 2.2998046875, 3.293212890625, 4.28662109375, 5.280029296875, 6.2734375, 7.266845703125, 8.26025390625, 9.253662109375, 10.2470703125, 11.240478515625, 12.23388671875, 13.227294921875, 14.220703125, 15.214111328125, 16.20751953125, 17.200927734375, 18.1943359375, 19.187744140625, 20.18115234375, 21.174560546875, 22.16796875, 23.161376953125, 24.15478515625, 25.148193359375, 26.1416015625, 27.135009765625, 28.12841796875, 29.121826171875, 30.115234375, 31.108642578125, 32.10205078125, 33.095458984375, 34.0888671875, 35.082275390625, 36.07568359375, 37.069091796875, 38.0625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 16.0, 19.0, 19.0, 11.0, 28.0, 32.0, 31.0, 52.0, 43.0, 42.0, 47.0, 64.0, 48.0, 51.0, 68.0, 69.0, 45.0, 49.0, 47.0, 28.0, 29.0, 36.0, 23.0, 17.0, 12.0, 8.0, 13.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.857177734375, -9.49560546875, -9.134033203125, -8.7724609375, -8.410888671875, -8.04931640625, -7.687744140625, -7.326171875, -6.964599609375, -6.60302734375, -6.241455078125, -5.8798828125, -5.518310546875, -5.15673828125, -4.795166015625, -4.43359375, -4.072021484375, -3.71044921875, -3.348876953125, -2.9873046875, -2.625732421875, -2.26416015625, -1.902587890625, -1.541015625, -1.179443359375, -0.81787109375, -0.456298828125, -0.0947265625, 0.266845703125, 0.62841796875, 0.989990234375, 1.3515625, 1.713134765625, 2.07470703125, 2.436279296875, 2.7978515625, 3.159423828125, 3.52099609375, 3.882568359375, 4.244140625, 4.605712890625, 4.96728515625, 5.328857421875, 5.6904296875, 6.052001953125, 6.41357421875, 6.775146484375, 7.13671875, 7.498291015625, 7.85986328125, 8.221435546875, 8.5830078125, 8.944580078125, 9.30615234375, 9.667724609375, 10.029296875, 10.390869140625, 10.75244140625, 11.114013671875, 11.4755859375, 11.837158203125, 12.19873046875, 12.560302734375, 12.921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 14.0, 24.0, 57.0, 93.0, 154.0, 345.0, 945.0, 4746.0, 3971061.0, 212784.0, 2789.0, 709.0, 288.0, 115.0, 71.0, 33.0, 14.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.0, -165.828125, -159.65625, -153.484375, -147.3125, -141.140625, -134.96875, -128.796875, -122.625, -116.453125, -110.28125, -104.109375, -97.9375, -91.765625, -85.59375, -79.421875, -73.25, -67.078125, -60.90625, -54.734375, -48.5625, -42.390625, -36.21875, -30.046875, -23.875, -17.703125, -11.53125, -5.359375, 0.8125, 6.984375, 13.15625, 19.328125, 25.5, 31.671875, 37.84375, 44.015625, 50.1875, 56.359375, 62.53125, 68.703125, 74.875, 81.046875, 87.21875, 93.390625, 99.5625, 105.734375, 111.90625, 118.078125, 124.25, 130.421875, 136.59375, 142.765625, 148.9375, 155.109375, 161.28125, 167.453125, 173.625, 179.796875, 185.96875, 192.140625, 198.3125, 204.484375, 210.65625, 216.828125, 223.0]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 15.0, 19.0, 33.0, 75.0, 166.0, 437.0, 1212.0, 1257.0, 493.0, 186.0, 80.0, 40.0, 30.0, 14.0, 13.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-121.6875, -118.92333984375, -116.1591796875, -113.39501953125, -110.630859375, -107.86669921875, -105.1025390625, -102.33837890625, -99.57421875, -96.81005859375, -94.0458984375, -91.28173828125, -88.517578125, -85.75341796875, -82.9892578125, -80.22509765625, -77.4609375, -74.69677734375, -71.9326171875, -69.16845703125, -66.404296875, -63.64013671875, -60.8759765625, -58.11181640625, -55.34765625, -52.58349609375, -49.8193359375, -47.05517578125, -44.291015625, -41.52685546875, -38.7626953125, -35.99853515625, -33.234375, -30.47021484375, -27.7060546875, -24.94189453125, -22.177734375, -19.41357421875, -16.6494140625, -13.88525390625, -11.12109375, -8.35693359375, -5.5927734375, -2.82861328125, -0.064453125, 2.69970703125, 5.4638671875, 8.22802734375, 10.9921875, 13.75634765625, 16.5205078125, 19.28466796875, 22.048828125, 24.81298828125, 27.5771484375, 30.34130859375, 33.10546875, 35.86962890625, 38.6337890625, 41.39794921875, 44.162109375, 46.92626953125, 49.6904296875, 52.45458984375, 55.21875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 7.0, 10.0, 18.0, 34.0, 42.0, 104.0, 168.0, 238.0, 169.0, 99.0, 40.0, 23.0, 14.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-715.1956787109375, -696.035888671875, -676.8760375976562, -657.7161865234375, -638.556396484375, -619.3966064453125, -600.2367553710938, -581.076904296875, -561.9171142578125, -542.75732421875, -523.5974731445312, -504.4376525878906, -485.27783203125, -466.1180114746094, -446.95819091796875, -427.7983703613281, -408.6385498046875, -389.4787292480469, -370.31890869140625, -351.1590881347656, -331.999267578125, -312.8394470214844, -293.67962646484375, -274.5198059082031, -255.3599853515625, -236.20016479492188, -217.04034423828125, -197.88052368164062, -178.720703125, -159.56088256835938, -140.40106201171875, -121.24124145507812, -102.08139038085938, -82.92156982421875, -63.761749267578125, -44.6019287109375, -25.442108154296875, -6.28228759765625, 12.877532958984375, 32.037353515625, 51.197174072265625, 70.35699462890625, 89.51681518554688, 108.6766357421875, 127.83645629882812, 146.99627685546875, 166.15609741210938, 185.31591796875, 204.47573852539062, 223.63555908203125, 242.79537963867188, 261.9552001953125, 281.1150207519531, 300.27484130859375, 319.4346618652344, 338.594482421875, 357.7543029785156, 376.91412353515625, 396.0739440917969, 415.2337646484375, 434.3935852050781, 453.55340576171875, 472.7132263183594, 491.873046875, 511.0328674316406]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 7.0, 7.0, 7.0, 12.0, 9.0, 15.0, 16.0, 21.0, 31.0, 28.0, 36.0, 38.0, 46.0, 41.0, 53.0, 62.0, 82.0, 64.0, 62.0, 43.0, 51.0, 50.0, 45.0, 33.0, 34.0, 20.0, 20.0, 14.0, 12.0, 4.0, 11.0, 10.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-230.41290283203125, -222.38433837890625, -214.3557586669922, -206.3271942138672, -198.29861450195312, -190.27005004882812, -182.24148559570312, -174.21292114257812, -166.18434143066406, -158.15577697753906, -150.127197265625, -142.0986328125, -134.070068359375, -126.04148864746094, -118.01292419433594, -109.9843521118164, -101.95578002929688, -93.92720794677734, -85.89863586425781, -77.87007141113281, -69.84149932861328, -61.81292724609375, -53.784358978271484, -45.75579071044922, -37.72721862792969, -29.69864845275879, -21.67007827758789, -13.641508102416992, -5.612937927246094, 2.4156341552734375, 10.444202423095703, 18.47277069091797, 26.501373291015625, 34.529945373535156, 42.55851364135742, 50.58708190917969, 58.61565399169922, 66.64422607421875, 74.67279052734375, 82.70136260986328, 90.72993469238281, 98.75850677490234, 106.78707885742188, 114.81564331054688, 122.8442153930664, 130.87278747558594, 138.90135192871094, 146.929931640625, 154.95849609375, 162.987060546875, 171.01564025878906, 179.04420471191406, 187.07278442382812, 195.10134887695312, 203.12991333007812, 211.15847778320312, 219.1870574951172, 227.2156219482422, 235.24420166015625, 243.27276611328125, 251.30133056640625, 259.32989501953125, 267.3584899902344, 275.3870544433594, 283.4156188964844]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 6.0, 14.0, 17.0, 36.0, 40.0, 50.0, 94.0, 162.0, 254.0, 456.0, 816.0, 1686.0, 3487.0, 8302.0, 24096.0, 99887.0, 584361.0, 253375.0, 47117.0, 13781.0, 5418.0, 2396.0, 1214.0, 629.0, 315.0, 194.0, 120.0, 65.0, 41.0, 41.0, 31.0, 12.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.78125, -21.96044921875, -21.1396484375, -20.31884765625, -19.498046875, -18.67724609375, -17.8564453125, -17.03564453125, -16.21484375, -15.39404296875, -14.5732421875, -13.75244140625, -12.931640625, -12.11083984375, -11.2900390625, -10.46923828125, -9.6484375, -8.82763671875, -8.0068359375, -7.18603515625, -6.365234375, -5.54443359375, -4.7236328125, -3.90283203125, -3.08203125, -2.26123046875, -1.4404296875, -0.61962890625, 0.201171875, 1.02197265625, 1.8427734375, 2.66357421875, 3.484375, 4.30517578125, 5.1259765625, 5.94677734375, 6.767578125, 7.58837890625, 8.4091796875, 9.22998046875, 10.05078125, 10.87158203125, 11.6923828125, 12.51318359375, 13.333984375, 14.15478515625, 14.9755859375, 15.79638671875, 16.6171875, 17.43798828125, 18.2587890625, 19.07958984375, 19.900390625, 20.72119140625, 21.5419921875, 22.36279296875, 23.18359375, 24.00439453125, 24.8251953125, 25.64599609375, 26.466796875, 27.28759765625, 28.1083984375, 28.92919921875, 29.75]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 15.0, 10.0, 14.0, 8.0, 28.0, 28.0, 25.0, 28.0, 39.0, 68.0, 58.0, 63.0, 70.0, 54.0, 65.0, 51.0, 60.0, 63.0, 60.0, 32.0, 22.0, 33.0, 26.0, 20.0, 10.0, 17.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.609375, -17.01416015625, -16.4189453125, -15.82373046875, -15.228515625, -14.63330078125, -14.0380859375, -13.44287109375, -12.84765625, -12.25244140625, -11.6572265625, -11.06201171875, -10.466796875, -9.87158203125, -9.2763671875, -8.68115234375, -8.0859375, -7.49072265625, -6.8955078125, -6.30029296875, -5.705078125, -5.10986328125, -4.5146484375, -3.91943359375, -3.32421875, -2.72900390625, -2.1337890625, -1.53857421875, -0.943359375, -0.34814453125, 0.2470703125, 0.84228515625, 1.4375, 2.03271484375, 2.6279296875, 3.22314453125, 3.818359375, 4.41357421875, 5.0087890625, 5.60400390625, 6.19921875, 6.79443359375, 7.3896484375, 7.98486328125, 8.580078125, 9.17529296875, 9.7705078125, 10.36572265625, 10.9609375, 11.55615234375, 12.1513671875, 12.74658203125, 13.341796875, 13.93701171875, 14.5322265625, 15.12744140625, 15.72265625, 16.31787109375, 16.9130859375, 17.50830078125, 18.103515625, 18.69873046875, 19.2939453125, 19.88916015625, 20.484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 7.0, 10.0, 15.0, 29.0, 28.0, 38.0, 53.0, 103.0, 136.0, 256.0, 477.0, 1114.0, 3547.0, 19385.0, 669453.0, 332460.0, 16034.0, 3282.0, 1019.0, 471.0, 221.0, 116.0, 93.0, 62.0, 31.0, 26.0, 13.0, 14.0, 11.0, 5.0, 6.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.5263671875, -37.240234375, -35.9541015625, -34.66796875, -33.3818359375, -32.095703125, -30.8095703125, -29.5234375, -28.2373046875, -26.951171875, -25.6650390625, -24.37890625, -23.0927734375, -21.806640625, -20.5205078125, -19.234375, -17.9482421875, -16.662109375, -15.3759765625, -14.08984375, -12.8037109375, -11.517578125, -10.2314453125, -8.9453125, -7.6591796875, -6.373046875, -5.0869140625, -3.80078125, -2.5146484375, -1.228515625, 0.0576171875, 1.34375, 2.6298828125, 3.916015625, 5.2021484375, 6.48828125, 7.7744140625, 9.060546875, 10.3466796875, 11.6328125, 12.9189453125, 14.205078125, 15.4912109375, 16.77734375, 18.0634765625, 19.349609375, 20.6357421875, 21.921875, 23.2080078125, 24.494140625, 25.7802734375, 27.06640625, 28.3525390625, 29.638671875, 30.9248046875, 32.2109375, 33.4970703125, 34.783203125, 36.0693359375, 37.35546875, 38.6416015625, 39.927734375, 41.2138671875, 42.5]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 5.0, 8.0, 13.0, 12.0, 22.0, 21.0, 25.0, 21.0, 33.0, 44.0, 40.0, 66.0, 70.0, 75.0, 80.0, 64.0, 57.0, 60.0, 51.0, 50.0, 21.0, 22.0, 21.0, 19.0, 14.0, 10.0, 11.0, 8.0, 11.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-66.4375, -64.498046875, -62.55859375, -60.619140625, -58.6796875, -56.740234375, -54.80078125, -52.861328125, -50.921875, -48.982421875, -47.04296875, -45.103515625, -43.1640625, -41.224609375, -39.28515625, -37.345703125, -35.40625, -33.466796875, -31.52734375, -29.587890625, -27.6484375, -25.708984375, -23.76953125, -21.830078125, -19.890625, -17.951171875, -16.01171875, -14.072265625, -12.1328125, -10.193359375, -8.25390625, -6.314453125, -4.375, -2.435546875, -0.49609375, 1.443359375, 3.3828125, 5.322265625, 7.26171875, 9.201171875, 11.140625, 13.080078125, 15.01953125, 16.958984375, 18.8984375, 20.837890625, 22.77734375, 24.716796875, 26.65625, 28.595703125, 30.53515625, 32.474609375, 34.4140625, 36.353515625, 38.29296875, 40.232421875, 42.171875, 44.111328125, 46.05078125, 47.990234375, 49.9296875, 51.869140625, 53.80859375, 55.748046875, 57.6875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 5.0, 6.0, 8.0, 11.0, 15.0, 20.0, 34.0, 39.0, 59.0, 108.0, 196.0, 327.0, 597.0, 1259.0, 3662.0, 13969.0, 215657.0, 789120.0, 16472.0, 3994.0, 1490.0, 625.0, 315.0, 195.0, 115.0, 61.0, 45.0, 30.0, 28.0, 23.0, 21.0, 8.0, 5.0, 8.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.46875, -14.031005859375, -13.59326171875, -13.155517578125, -12.7177734375, -12.280029296875, -11.84228515625, -11.404541015625, -10.966796875, -10.529052734375, -10.09130859375, -9.653564453125, -9.2158203125, -8.778076171875, -8.34033203125, -7.902587890625, -7.46484375, -7.027099609375, -6.58935546875, -6.151611328125, -5.7138671875, -5.276123046875, -4.83837890625, -4.400634765625, -3.962890625, -3.525146484375, -3.08740234375, -2.649658203125, -2.2119140625, -1.774169921875, -1.33642578125, -0.898681640625, -0.4609375, -0.023193359375, 0.41455078125, 0.852294921875, 1.2900390625, 1.727783203125, 2.16552734375, 2.603271484375, 3.041015625, 3.478759765625, 3.91650390625, 4.354248046875, 4.7919921875, 5.229736328125, 5.66748046875, 6.105224609375, 6.54296875, 6.980712890625, 7.41845703125, 7.856201171875, 8.2939453125, 8.731689453125, 9.16943359375, 9.607177734375, 10.044921875, 10.482666015625, 10.92041015625, 11.358154296875, 11.7958984375, 12.233642578125, 12.67138671875, 13.109130859375, 13.546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 4.0, 4.0, 14.0, 9.0, 11.0, 25.0, 69.0, 159.0, 345.0, 177.0, 67.0, 32.0, 23.0, 19.0, 7.0, 10.0, 9.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006259918212890625, -0.006088733673095703, -0.005917549133300781, -0.005746364593505859, -0.0055751800537109375, -0.005403995513916016, -0.005232810974121094, -0.005061626434326172, -0.00489044189453125, -0.004719257354736328, -0.004548072814941406, -0.004376888275146484, -0.0042057037353515625, -0.004034519195556641, -0.0038633346557617188, -0.003692150115966797, -0.003520965576171875, -0.003349781036376953, -0.0031785964965820312, -0.0030074119567871094, -0.0028362274169921875, -0.0026650428771972656, -0.0024938583374023438, -0.002322673797607422, -0.0021514892578125, -0.001980304718017578, -0.0018091201782226562, -0.0016379356384277344, -0.0014667510986328125, -0.0012955665588378906, -0.0011243820190429688, -0.0009531974792480469, -0.000782012939453125, -0.0006108283996582031, -0.00043964385986328125, -0.0002684593200683594, -9.72747802734375e-05, 7.390975952148438e-05, 0.00024509429931640625, 0.0004162788391113281, 0.00058746337890625, 0.0007586479187011719, 0.0009298324584960938, 0.0011010169982910156, 0.0012722015380859375, 0.0014433860778808594, 0.0016145706176757812, 0.0017857551574707031, 0.001956939697265625, 0.002128124237060547, 0.0022993087768554688, 0.0024704933166503906, 0.0026416778564453125, 0.0028128623962402344, 0.0029840469360351562, 0.003155231475830078, 0.003326416015625, 0.003497600555419922, 0.0036687850952148438, 0.0038399696350097656, 0.0040111541748046875, 0.004182338714599609, 0.004353523254394531, 0.004524707794189453, 0.004695892333984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 8.0, 11.0, 22.0, 43.0, 54.0, 134.0, 279.0, 675.0, 2066.0, 8885.0, 126460.0, 890000.0, 15437.0, 2909.0, 884.0, 346.0, 152.0, 79.0, 35.0, 31.0, 11.0, 2.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.953125, -20.33935546875, -19.7255859375, -19.11181640625, -18.498046875, -17.88427734375, -17.2705078125, -16.65673828125, -16.04296875, -15.42919921875, -14.8154296875, -14.20166015625, -13.587890625, -12.97412109375, -12.3603515625, -11.74658203125, -11.1328125, -10.51904296875, -9.9052734375, -9.29150390625, -8.677734375, -8.06396484375, -7.4501953125, -6.83642578125, -6.22265625, -5.60888671875, -4.9951171875, -4.38134765625, -3.767578125, -3.15380859375, -2.5400390625, -1.92626953125, -1.3125, -0.69873046875, -0.0849609375, 0.52880859375, 1.142578125, 1.75634765625, 2.3701171875, 2.98388671875, 3.59765625, 4.21142578125, 4.8251953125, 5.43896484375, 6.052734375, 6.66650390625, 7.2802734375, 7.89404296875, 8.5078125, 9.12158203125, 9.7353515625, 10.34912109375, 10.962890625, 11.57666015625, 12.1904296875, 12.80419921875, 13.41796875, 14.03173828125, 14.6455078125, 15.25927734375, 15.873046875, 16.48681640625, 17.1005859375, 17.71435546875, 18.328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 8.0, 7.0, 11.0, 12.0, 6.0, 28.0, 62.0, 72.0, 133.0, 211.0, 157.0, 108.0, 65.0, 25.0, 18.0, 10.0, 7.0, 15.0, 8.0, 5.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.2890625, -10.92138671875, -10.5537109375, -10.18603515625, -9.818359375, -9.45068359375, -9.0830078125, -8.71533203125, -8.34765625, -7.97998046875, -7.6123046875, -7.24462890625, -6.876953125, -6.50927734375, -6.1416015625, -5.77392578125, -5.40625, -5.03857421875, -4.6708984375, -4.30322265625, -3.935546875, -3.56787109375, -3.2001953125, -2.83251953125, -2.46484375, -2.09716796875, -1.7294921875, -1.36181640625, -0.994140625, -0.62646484375, -0.2587890625, 0.10888671875, 0.4765625, 0.84423828125, 1.2119140625, 1.57958984375, 1.947265625, 2.31494140625, 2.6826171875, 3.05029296875, 3.41796875, 3.78564453125, 4.1533203125, 4.52099609375, 4.888671875, 5.25634765625, 5.6240234375, 5.99169921875, 6.359375, 6.72705078125, 7.0947265625, 7.46240234375, 7.830078125, 8.19775390625, 8.5654296875, 8.93310546875, 9.30078125, 9.66845703125, 10.0361328125, 10.40380859375, 10.771484375, 11.13916015625, 11.5068359375, 11.87451171875, 12.2421875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 21.0, 36.0, 100.0, 410.0, 278.0, 84.0, 34.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-231.27040100097656, -218.3673553466797, -205.46429443359375, -192.56124877929688, -179.658203125, -166.75515747070312, -153.8520965576172, -140.9490509033203, -128.04598999023438, -115.14293670654297, -102.2398910522461, -89.33683776855469, -76.43379211425781, -63.530738830566406, -50.627685546875, -37.724639892578125, -24.82159423828125, -11.918543815612793, 0.9845066070556641, 13.887557983398438, 26.790607452392578, 39.69365692138672, 52.596710205078125, 65.499755859375, 78.4028091430664, 91.30586242675781, 104.20890808105469, 117.1119613647461, 130.0150146484375, 142.91806030273438, 155.82110595703125, 168.72415161132812, 181.62722778320312, 194.5302734375, 207.43333435058594, 220.3363800048828, 233.2394256591797, 246.14248657226562, 259.0455322265625, 271.9485778808594, 284.85162353515625, 297.7546691894531, 310.65771484375, 323.560791015625, 336.4638366699219, 349.36688232421875, 362.2699279785156, 375.1729736328125, 388.0760498046875, 400.9790954589844, 413.88214111328125, 426.78521728515625, 439.6882629394531, 452.59130859375, 465.4943542480469, 478.39739990234375, 491.3004455566406, 504.2034912109375, 517.1065673828125, 530.0095825195312, 542.9126586914062, 555.815673828125, 568.71875, 581.621826171875, 594.5248413085938]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 8.0, 6.0, 15.0, 13.0, 12.0, 9.0, 11.0, 11.0, 21.0, 21.0, 19.0, 21.0, 20.0, 42.0, 77.0, 142.0, 183.0, 92.0, 46.0, 28.0, 18.0, 12.0, 17.0, 18.0, 12.0, 17.0, 10.0, 14.0, 10.0, 5.0, 12.0, 5.0, 8.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-135.93521118164062, -131.41534423828125, -126.8954849243164, -122.37562561035156, -117.85576629638672, -113.33590698242188, -108.8160400390625, -104.29618072509766, -99.77632141113281, -95.25646209716797, -90.7365951538086, -86.21673583984375, -81.6968765258789, -77.17701721191406, -72.65715026855469, -68.13729095458984, -63.61742401123047, -59.09756088256836, -54.577701568603516, -50.057838439941406, -45.53797912597656, -41.01811599731445, -36.498252868652344, -31.978391647338867, -27.45853042602539, -22.938669204711914, -18.418807983398438, -13.898944854736328, -9.379083633422852, -4.859222412109375, -0.3393592834472656, 4.180501937866211, 8.700363159179688, 13.220224380493164, 17.74008560180664, 22.25994873046875, 26.779809951782227, 31.299671173095703, 35.81953430175781, 40.339393615722656, 44.859256744384766, 49.379119873046875, 53.89897918701172, 58.41884231567383, 62.93870544433594, 67.45856475830078, 71.97842407226562, 76.498291015625, 81.01815032958984, 85.53800964355469, 90.05787658691406, 94.5777359008789, 99.09759521484375, 103.61746215820312, 108.13732147216797, 112.65718078613281, 117.17704772949219, 121.69690704345703, 126.2167739868164, 130.73663330078125, 135.25650024414062, 139.77635192871094, 144.2962188720703, 148.8160858154297, 153.3359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 9.0, 5.0, 9.0, 11.0, 8.0, 19.0, 13.0, 14.0, 23.0, 31.0, 36.0, 45.0, 41.0, 72.0, 182.0, 173.0, 60.0, 44.0, 32.0, 30.0, 34.0, 15.0, 23.0, 11.0, 14.0, 6.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.484375, -19.93115234375, -19.3779296875, -18.82470703125, -18.271484375, -17.71826171875, -17.1650390625, -16.61181640625, -16.05859375, -15.50537109375, -14.9521484375, -14.39892578125, -13.845703125, -13.29248046875, -12.7392578125, -12.18603515625, -11.6328125, -11.07958984375, -10.5263671875, -9.97314453125, -9.419921875, -8.86669921875, -8.3134765625, -7.76025390625, -7.20703125, -6.65380859375, -6.1005859375, -5.54736328125, -4.994140625, -4.44091796875, -3.8876953125, -3.33447265625, -2.78125, -2.22802734375, -1.6748046875, -1.12158203125, -0.568359375, -0.01513671875, 0.5380859375, 1.09130859375, 1.64453125, 2.19775390625, 2.7509765625, 3.30419921875, 3.857421875, 4.41064453125, 4.9638671875, 5.51708984375, 6.0703125, 6.62353515625, 7.1767578125, 7.72998046875, 8.283203125, 8.83642578125, 9.3896484375, 9.94287109375, 10.49609375, 11.04931640625, 11.6025390625, 12.15576171875, 12.708984375, 13.26220703125, 13.8154296875, 14.36865234375, 14.921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 8.0, 13.0, 12.0, 13.0, 15.0, 23.0, 37.0, 45.0, 69.0, 124.0, 202.0, 343.0, 969.0, 3103.0, 19210.0, 8342773.0, 16873.0, 2980.0, 879.0, 365.0, 195.0, 110.0, 80.0, 31.0, 34.0, 21.0, 13.0, 9.0, 8.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.67627716064453, -89.31395721435547, -84.95164489746094, -80.58932495117188, -76.22701263427734, -71.86469268798828, -67.50238037109375, -63.14006042480469, -58.77774429321289, -54.415428161621094, -50.0531120300293, -45.6907958984375, -41.32847595214844, -36.966163635253906, -32.603843688964844, -28.241527557373047, -23.87921142578125, -19.516895294189453, -15.15457820892334, -10.792261123657227, -6.42994499206543, -2.067628860473633, 2.294689178466797, 6.657005310058594, 11.01932144165039, 15.381637573242188, 19.743953704833984, 24.106271743774414, 28.46858787536621, 32.830902099609375, 37.19322204589844, 41.555538177490234, 45.91786193847656, 50.28017807006836, 54.642494201660156, 59.00481414794922, 63.36712646484375, 67.72944641113281, 72.09176635742188, 76.4540786743164, 80.81639099121094, 85.1787109375, 89.54102325439453, 93.9033432006836, 98.26565551757812, 102.62797546386719, 106.99029541015625, 111.35260772705078, 115.71492767333984, 120.0772476196289, 124.43955993652344, 128.8018798828125, 133.16419982910156, 137.52650451660156, 141.88882446289062, 146.2511444091797, 150.61346435546875, 154.9757843017578, 159.33810424804688, 163.70040893554688, 168.06272888183594, 172.425048828125, 176.78736877441406, 181.14968872070312, 185.51199340820312]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 3.0, 9.0, 4.0, 5.0, 2.0, 5.0, 4.0, 6.0, 6.0, 9.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-199.30096435546875, -193.9467010498047, -188.59242248535156, -183.2381591796875, -177.88389587402344, -172.52963256835938, -167.17535400390625, -161.8210906982422, -156.46682739257812, -151.11256408691406, -145.75828552246094, -140.40402221679688, -135.0497589111328, -129.69549560546875, -124.34121704101562, -118.98695373535156, -113.63267517089844, -108.27840423583984, -102.92414093017578, -97.56986999511719, -92.21560668945312, -86.86133575439453, -81.50706481933594, -76.15280151367188, -70.79853057861328, -65.44425964355469, -60.089996337890625, -54.73572540283203, -49.3814582824707, -44.027191162109375, -38.67292022705078, -33.31865310668945, -27.964401245117188, -22.61013412475586, -17.2558650970459, -11.901596069335938, -6.547328948974609, -1.1930618286132812, 4.1612091064453125, 9.51547622680664, 14.869743347167969, 20.224010467529297, 25.578279495239258, 30.93254852294922, 36.28681564331055, 41.641082763671875, 46.99535369873047, 52.3496208190918, 57.703887939453125, 63.05815505981445, 68.41242218017578, 73.76669311523438, 79.12095642089844, 84.47522735595703, 89.82949829101562, 95.18376159667969, 100.53803253173828, 105.89230346679688, 111.24656677246094, 116.60083770751953, 121.95510864257812, 127.30937194824219, 132.66363525390625, 138.01791381835938, 143.37217712402344]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 5.0, 3.0, 11.0, 9.0, 19.0, 23.0, 32.0, 42.0, 49.0, 46.0, 53.0, 51.0, 59.0, 47.0, 68.0, 70.0, 71.0, 68.0, 45.0, 36.0, 33.0, 37.0, 23.0, 21.0, 18.0, 13.0, 12.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.86370849609375, -7.6336669921875, -7.40362548828125, -7.173583984375, -6.94354248046875, -6.7135009765625, -6.48345947265625, -6.25341796875, -6.02337646484375, -5.7933349609375, -5.56329345703125, -5.333251953125, -5.10321044921875, -4.8731689453125, -4.64312744140625, -4.4130859375, -4.18304443359375, -3.9530029296875, -3.72296142578125, -3.492919921875, -3.26287841796875, -3.0328369140625, -2.80279541015625, -2.57275390625, -2.34271240234375, -2.1126708984375, -1.88262939453125, -1.652587890625, -1.42254638671875, -1.1925048828125, -0.96246337890625, -0.732421875, -0.50238037109375, -0.2723388671875, -0.04229736328125, 0.187744140625, 0.41778564453125, 0.6478271484375, 0.87786865234375, 1.10791015625, 1.33795166015625, 1.5679931640625, 1.79803466796875, 2.028076171875, 2.25811767578125, 2.4881591796875, 2.71820068359375, 2.9482421875, 3.17828369140625, 3.4083251953125, 3.63836669921875, 3.868408203125, 4.09844970703125, 4.3284912109375, 4.55853271484375, 4.78857421875, 5.01861572265625, 5.2486572265625, 5.47869873046875, 5.708740234375, 5.93878173828125, 6.1688232421875, 6.39886474609375, 6.62890625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 4.0, 12.0, 9.0, 17.0, 35.0, 51.0, 86.0, 140.0, 290.0, 515.0, 1119.0, 2681.0, 6630.0, 19541.0, 67899.0, 207901.0, 151732.0, 42779.0, 13495.0, 4938.0, 2114.0, 994.0, 539.0, 268.0, 155.0, 96.0, 70.0, 48.0, 32.0, 26.0, 8.0, 5.0, 12.0, 2.0, 7.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.3125, -93.2275390625, -89.142578125, -85.0576171875, -80.97265625, -76.8876953125, -72.802734375, -68.7177734375, -64.6328125, -60.5478515625, -56.462890625, -52.3779296875, -48.29296875, -44.2080078125, -40.123046875, -36.0380859375, -31.953125, -27.8681640625, -23.783203125, -19.6982421875, -15.61328125, -11.5283203125, -7.443359375, -3.3583984375, 0.7265625, 4.8115234375, 8.896484375, 12.9814453125, 17.06640625, 21.1513671875, 25.236328125, 29.3212890625, 33.40625, 37.4912109375, 41.576171875, 45.6611328125, 49.74609375, 53.8310546875, 57.916015625, 62.0009765625, 66.0859375, 70.1708984375, 74.255859375, 78.3408203125, 82.42578125, 86.5107421875, 90.595703125, 94.6806640625, 98.765625, 102.8505859375, 106.935546875, 111.0205078125, 115.10546875, 119.1904296875, 123.275390625, 127.3603515625, 131.4453125, 135.5302734375, 139.615234375, 143.7001953125, 147.78515625, 151.8701171875, 155.955078125, 160.0400390625, 164.125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 10.0, 10.0, 15.0, 23.0, 25.0, 30.0, 40.0, 41.0, 57.0, 43.0, 64.0, 61.0, 88.0, 57.0, 69.0, 66.0, 64.0, 44.0, 31.0, 34.0, 26.0, 22.0, 11.0, 9.0, 11.0, 9.0, 5.0, 8.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.96875, -17.39404296875, -16.8193359375, -16.24462890625, -15.669921875, -15.09521484375, -14.5205078125, -13.94580078125, -13.37109375, -12.79638671875, -12.2216796875, -11.64697265625, -11.072265625, -10.49755859375, -9.9228515625, -9.34814453125, -8.7734375, -8.19873046875, -7.6240234375, -7.04931640625, -6.474609375, -5.89990234375, -5.3251953125, -4.75048828125, -4.17578125, -3.60107421875, -3.0263671875, -2.45166015625, -1.876953125, -1.30224609375, -0.7275390625, -0.15283203125, 0.421875, 0.99658203125, 1.5712890625, 2.14599609375, 2.720703125, 3.29541015625, 3.8701171875, 4.44482421875, 5.01953125, 5.59423828125, 6.1689453125, 6.74365234375, 7.318359375, 7.89306640625, 8.4677734375, 9.04248046875, 9.6171875, 10.19189453125, 10.7666015625, 11.34130859375, 11.916015625, 12.49072265625, 13.0654296875, 13.64013671875, 14.21484375, 14.78955078125, 15.3642578125, 15.93896484375, 16.513671875, 17.08837890625, 17.6630859375, 18.23779296875, 18.8125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 2.0, 1.0, 7.0, 9.0, 12.0, 13.0, 17.0, 30.0, 33.0, 32.0, 42.0, 59.0, 66.0, 35.0, 42.0, 19.0, 16.0, 10.0, 13.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.818115234375, -90.95408630371094, -88.09005737304688, -85.22602844238281, -82.36199188232422, -79.49796295166016, -76.6339340209961, -73.76990509033203, -70.90586853027344, -68.04183959960938, -65.17781066894531, -62.313777923583984, -59.449745178222656, -56.585716247558594, -53.72168731689453, -50.85765838623047, -47.993629455566406, -45.129600524902344, -42.265567779541016, -39.40153884887695, -36.537506103515625, -33.67347717285156, -30.8094482421875, -27.945417404174805, -25.08138656616211, -22.217355728149414, -19.35332489013672, -16.489295959472656, -13.625265121459961, -10.761234283447266, -7.897205352783203, -5.033174514770508, -2.1691436767578125, 0.6948866844177246, 3.5589170455932617, 6.422946929931641, 9.286977767944336, 12.151008605957031, 15.015037536621094, 17.87906837463379, 20.743099212646484, 23.60713005065918, 26.471160888671875, 29.335189819335938, 32.19921875, 35.06325149536133, 37.92728042602539, 40.79131317138672, 43.65534210205078, 46.519371032714844, 49.38340377807617, 52.247432708740234, 55.11146545410156, 57.975494384765625, 60.83952331542969, 63.70355224609375, 66.56758117675781, 69.43161010742188, 72.29563903808594, 75.15966796875, 78.0237045288086, 80.88773345947266, 83.75176239013672, 86.61579132080078, 89.47982788085938]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 7.0, 5.0, 15.0, 25.0, 38.0, 55.0, 93.0, 89.0, 56.0, 29.0, 15.0, 5.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.83482360839844, -112.69192504882812, -109.54902648925781, -106.4061279296875, -103.26322937011719, -100.12033081054688, -96.97743225097656, -93.83454132080078, -90.69164276123047, -87.54874420166016, -84.40584564208984, -81.26294708251953, -78.12004852294922, -74.97715759277344, -71.83425903320312, -68.69136047363281, -65.5484619140625, -62.40556335449219, -59.262664794921875, -56.11976623535156, -52.976871490478516, -49.8339729309082, -46.69107437133789, -43.548179626464844, -40.4052734375, -37.26237487792969, -34.119476318359375, -30.976579666137695, -27.833683013916016, -24.690784454345703, -21.54788589477539, -18.40498924255371, -15.262092590332031, -12.119194984436035, -8.976297378540039, -5.833398818969727, -2.6905012130737305, 0.4523963928222656, 3.595294952392578, 6.738191604614258, 9.88109016418457, 13.023987770080566, 16.166885375976562, 19.309783935546875, 22.452682495117188, 25.595579147338867, 28.73847770690918, 31.88137435913086, 35.02427291870117, 38.167171478271484, 41.3100700378418, 44.452964782714844, 47.595863342285156, 50.73876190185547, 53.88166046142578, 57.024559020996094, 60.167457580566406, 63.31035614013672, 66.45325469970703, 69.59615325927734, 72.73905181884766, 75.88194274902344, 79.02484130859375, 82.16773986816406, 85.31063842773438]}, "eval/loss": 0.717689573764801, "eval/wer": 0.12834192780642603, "eval/runtime": 818.6465, "eval/samples_per_second": 3.227, "eval/steps_per_second": 0.404} \ No newline at end of file +{"train/loss": 0.4226, "train/learning_rate": 1.267605633802817e-08, "train/epoch": 25.0, "train/global_step": 22300, "_runtime": 35320, "_timestamp": 1648176660, "_step": 5803, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 6.0, 7.0, 11.0, 11.0, 20.0, 11.0, 14.0, 23.0, 26.0, 38.0, 45.0, 46.0, 65.0, 51.0, 60.0, 89.0, 87.0, 60.0, 64.0, 45.0, 40.0, 34.0, 22.0, 25.0, 14.0, 13.0, 11.0, 11.0, 8.0, 3.0, 5.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.9212875366211, -70.6487808227539, -68.37626647949219, -66.103759765625, -63.83124542236328, -61.558738708496094, -59.28622817993164, -57.01371765136719, -54.741207122802734, -52.46869659423828, -50.19618606567383, -47.923675537109375, -45.65116882324219, -43.37865447998047, -41.10614776611328, -38.83363723754883, -36.561126708984375, -34.28861618041992, -32.01610565185547, -29.74359703063965, -27.471086502075195, -25.198575973510742, -22.926067352294922, -20.65355682373047, -18.381046295166016, -16.108535766601562, -13.836026191711426, -11.563516616821289, -9.291006088256836, -7.018495559692383, -4.745985984802246, -2.4734764099121094, -0.200958251953125, 2.07155179977417, 4.344061851501465, 6.61657190322876, 8.889081954956055, 11.161592483520508, 13.434102058410645, 15.706611633300781, 17.979122161865234, 20.251632690429688, 22.52414321899414, 24.79665184020996, 27.069162368774414, 29.341672897338867, 31.614181518554688, 33.88669204711914, 36.159202575683594, 38.43171310424805, 40.7042236328125, 42.97673416137695, 45.249244689941406, 47.521751403808594, 49.79426193237305, 52.0667724609375, 54.33928298950195, 56.611793518066406, 58.88430404663086, 61.15681457519531, 63.4293212890625, 65.70183563232422, 67.9743423461914, 70.24685668945312, 72.51936340332031]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 10.0, 12.0, 19.0, 19.0, 23.0, 12.0, 26.0, 25.0, 37.0, 27.0, 17.0, 37.0, 38.0, 45.0, 38.0, 52.0, 47.0, 29.0, 52.0, 38.0, 43.0, 46.0, 35.0, 37.0, 25.0, 26.0, 29.0, 22.0, 33.0, 14.0, 17.0, 18.0, 12.0, 4.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.53594207763672, -54.687095642089844, -52.8382453918457, -50.98939895629883, -49.14055252075195, -47.29170227050781, -45.44285583496094, -43.59400939941406, -41.74516296386719, -39.89631652832031, -38.04746627807617, -36.1986198425293, -34.34977340698242, -32.50092315673828, -30.652076721191406, -28.80323028564453, -26.954381942749023, -25.105533599853516, -23.25668716430664, -21.407838821411133, -19.558992385864258, -17.71014404296875, -15.861296653747559, -14.012449264526367, -12.163601875305176, -10.314754486083984, -8.465907096862793, -6.617059230804443, -4.768211841583252, -2.9193639755249023, -1.070516586303711, 0.7783308029174805, 2.627178192138672, 4.476025581359863, 6.324872970581055, 8.173721313476562, 10.022567749023438, 11.871416091918945, 13.720263481140137, 15.569110870361328, 17.417957305908203, 19.26680564880371, 21.115652084350586, 22.964500427246094, 24.81334686279297, 26.662195205688477, 28.511043548583984, 30.35988998413086, 32.208740234375, 34.057586669921875, 35.906436920166016, 37.75528335571289, 39.604129791259766, 41.452980041503906, 43.30182647705078, 45.150672912597656, 46.99951934814453, 48.848365783691406, 50.69721603393555, 52.54606246948242, 54.3949089050293, 56.24375915527344, 58.09260559082031, 59.94145202636719, 61.79029846191406]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 10.0, 10.0, 21.0, 26.0, 44.0, 83.0, 134.0, 211.0, 327.0, 586.0, 931.0, 1394.0, 2381.0, 3782.0, 6175.0, 10901.0, 18717.0, 34611.0, 67966.0, 161762.0, 685990.0, 2363443.0, 548131.0, 146489.0, 64826.0, 32758.0, 17488.0, 9830.0, 5845.0, 3556.0, 2130.0, 1248.0, 867.0, 542.0, 362.0, 241.0, 149.0, 93.0, 73.0, 40.0, 38.0, 33.0, 15.0, 11.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-158.25, -152.685546875, -147.12109375, -141.556640625, -135.9921875, -130.427734375, -124.86328125, -119.298828125, -113.734375, -108.169921875, -102.60546875, -97.041015625, -91.4765625, -85.912109375, -80.34765625, -74.783203125, -69.21875, -63.654296875, -58.08984375, -52.525390625, -46.9609375, -41.396484375, -35.83203125, -30.267578125, -24.703125, -19.138671875, -13.57421875, -8.009765625, -2.4453125, 3.119140625, 8.68359375, 14.248046875, 19.8125, 25.376953125, 30.94140625, 36.505859375, 42.0703125, 47.634765625, 53.19921875, 58.763671875, 64.328125, 69.892578125, 75.45703125, 81.021484375, 86.5859375, 92.150390625, 97.71484375, 103.279296875, 108.84375, 114.408203125, 119.97265625, 125.537109375, 131.1015625, 136.666015625, 142.23046875, 147.794921875, 153.359375, 158.923828125, 164.48828125, 170.052734375, 175.6171875, 181.181640625, 186.74609375, 192.310546875, 197.875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 4.0, 10.0, 9.0, 13.0, 15.0, 20.0, 23.0, 15.0, 19.0, 24.0, 29.0, 28.0, 38.0, 39.0, 47.0, 41.0, 45.0, 41.0, 34.0, 49.0, 34.0, 40.0, 46.0, 35.0, 36.0, 35.0, 44.0, 21.0, 18.0, 35.0, 22.0, 16.0, 10.0, 6.0, 7.0, 10.0, 8.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-63.4375, -61.49560546875, -59.5537109375, -57.61181640625, -55.669921875, -53.72802734375, -51.7861328125, -49.84423828125, -47.90234375, -45.96044921875, -44.0185546875, -42.07666015625, -40.134765625, -38.19287109375, -36.2509765625, -34.30908203125, -32.3671875, -30.42529296875, -28.4833984375, -26.54150390625, -24.599609375, -22.65771484375, -20.7158203125, -18.77392578125, -16.83203125, -14.89013671875, -12.9482421875, -11.00634765625, -9.064453125, -7.12255859375, -5.1806640625, -3.23876953125, -1.296875, 0.64501953125, 2.5869140625, 4.52880859375, 6.470703125, 8.41259765625, 10.3544921875, 12.29638671875, 14.23828125, 16.18017578125, 18.1220703125, 20.06396484375, 22.005859375, 23.94775390625, 25.8896484375, 27.83154296875, 29.7734375, 31.71533203125, 33.6572265625, 35.59912109375, 37.541015625, 39.48291015625, 41.4248046875, 43.36669921875, 45.30859375, 47.25048828125, 49.1923828125, 51.13427734375, 53.076171875, 55.01806640625, 56.9599609375, 58.90185546875, 60.84375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 8.0, 18.0, 12.0, 27.0, 40.0, 59.0, 61.0, 123.0, 172.0, 219.0, 378.0, 518.0, 799.0, 1188.0, 1920.0, 2780.0, 4217.0, 6438.0, 10368.0, 17425.0, 29950.0, 54812.0, 111080.0, 264698.0, 961221.0, 1966680.0, 431117.0, 157512.0, 73304.0, 39152.0, 21986.0, 13041.0, 8045.0, 5078.0, 3254.0, 2147.0, 1441.0, 980.0, 662.0, 416.0, 313.0, 210.0, 133.0, 101.0, 55.0, 43.0, 30.0, 21.0, 10.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0], "bins": [-144.5, -140.27734375, -136.0546875, -131.83203125, -127.609375, -123.38671875, -119.1640625, -114.94140625, -110.71875, -106.49609375, -102.2734375, -98.05078125, -93.828125, -89.60546875, -85.3828125, -81.16015625, -76.9375, -72.71484375, -68.4921875, -64.26953125, -60.046875, -55.82421875, -51.6015625, -47.37890625, -43.15625, -38.93359375, -34.7109375, -30.48828125, -26.265625, -22.04296875, -17.8203125, -13.59765625, -9.375, -5.15234375, -0.9296875, 3.29296875, 7.515625, 11.73828125, 15.9609375, 20.18359375, 24.40625, 28.62890625, 32.8515625, 37.07421875, 41.296875, 45.51953125, 49.7421875, 53.96484375, 58.1875, 62.41015625, 66.6328125, 70.85546875, 75.078125, 79.30078125, 83.5234375, 87.74609375, 91.96875, 96.19140625, 100.4140625, 104.63671875, 108.859375, 113.08203125, 117.3046875, 121.52734375, 125.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 13.0, 10.0, 9.0, 24.0, 25.0, 23.0, 27.0, 39.0, 34.0, 58.0, 85.0, 121.0, 139.0, 177.0, 279.0, 392.0, 639.0, 571.0, 368.0, 270.0, 182.0, 125.0, 92.0, 82.0, 67.0, 38.0, 33.0, 21.0, 28.0, 15.0, 11.0, 12.0, 10.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.4375, -44.05517578125, -42.6728515625, -41.29052734375, -39.908203125, -38.52587890625, -37.1435546875, -35.76123046875, -34.37890625, -32.99658203125, -31.6142578125, -30.23193359375, -28.849609375, -27.46728515625, -26.0849609375, -24.70263671875, -23.3203125, -21.93798828125, -20.5556640625, -19.17333984375, -17.791015625, -16.40869140625, -15.0263671875, -13.64404296875, -12.26171875, -10.87939453125, -9.4970703125, -8.11474609375, -6.732421875, -5.35009765625, -3.9677734375, -2.58544921875, -1.203125, 0.17919921875, 1.5615234375, 2.94384765625, 4.326171875, 5.70849609375, 7.0908203125, 8.47314453125, 9.85546875, 11.23779296875, 12.6201171875, 14.00244140625, 15.384765625, 16.76708984375, 18.1494140625, 19.53173828125, 20.9140625, 22.29638671875, 23.6787109375, 25.06103515625, 26.443359375, 27.82568359375, 29.2080078125, 30.59033203125, 31.97265625, 33.35498046875, 34.7373046875, 36.11962890625, 37.501953125, 38.88427734375, 40.2666015625, 41.64892578125, 43.03125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 7.0, 16.0, 8.0, 20.0, 26.0, 29.0, 43.0, 62.0, 83.0, 100.0, 122.0, 107.0, 85.0, 76.0, 42.0, 34.0, 32.0, 24.0, 19.0, 6.0, 11.0, 12.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.39942932128906, -132.21673583984375, -128.0340576171875, -123.85136413574219, -119.66867065429688, -115.4859848022461, -111.30329895019531, -107.12060546875, -102.93791961669922, -98.75523376464844, -94.57254028320312, -90.38985443115234, -86.20716857910156, -82.02447509765625, -77.84178924560547, -73.65910339355469, -69.47640991210938, -65.2937240600586, -61.11103057861328, -56.9283447265625, -52.74565505981445, -48.562965393066406, -44.380279541015625, -40.19758987426758, -36.01490020751953, -31.832210540771484, -27.64952278137207, -23.466835021972656, -19.28414535522461, -15.101455688476562, -10.918767929077148, -6.736080169677734, -2.55340576171875, 1.6292829513549805, 5.811971664428711, 9.994660377502441, 14.177349090576172, 18.36003875732422, 22.542726516723633, 26.725414276123047, 30.908103942871094, 35.09079360961914, 39.27348327636719, 43.45616912841797, 47.638858795166016, 51.82154846191406, 56.004234313964844, 60.18692398071289, 64.36961364746094, 68.55229949951172, 72.73499298095703, 76.91767883300781, 81.10037231445312, 85.2830581665039, 89.46574401855469, 93.6484375, 97.83112335205078, 102.01380920410156, 106.19650268554688, 110.37918853759766, 114.56187438964844, 118.74456787109375, 122.92725372314453, 127.10993957519531, 131.29263305664062]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 13.0, 7.0, 15.0, 11.0, 20.0, 22.0, 25.0, 22.0, 38.0, 24.0, 36.0, 46.0, 43.0, 41.0, 46.0, 53.0, 46.0, 52.0, 39.0, 45.0, 42.0, 40.0, 20.0, 33.0, 29.0, 28.0, 20.0, 21.0, 16.0, 15.0, 12.0, 12.0, 8.0, 10.0, 10.0, 9.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-74.71490478515625, -72.24452209472656, -69.7741470336914, -67.30377197265625, -64.83338928222656, -62.36301040649414, -59.89263153076172, -57.4222526550293, -54.951873779296875, -52.48149490356445, -50.01111602783203, -47.54073715209961, -45.07035827636719, -42.599979400634766, -40.129600524902344, -37.65922164916992, -35.1888427734375, -32.71846389770508, -30.248085021972656, -27.777706146240234, -25.307327270507812, -22.83694839477539, -20.36656951904297, -17.896190643310547, -15.425811767578125, -12.955432891845703, -10.485054016113281, -8.01467514038086, -5.5442962646484375, -3.0739173889160156, -0.6035385131835938, 1.8668403625488281, 4.337226867675781, 6.807605743408203, 9.277984619140625, 11.748363494873047, 14.218742370605469, 16.68912124633789, 19.159500122070312, 21.629878997802734, 24.100257873535156, 26.570636749267578, 29.041015625, 31.511394500732422, 33.981773376464844, 36.452152252197266, 38.92253112792969, 41.39291000366211, 43.86328887939453, 46.33366775512695, 48.804046630859375, 51.2744255065918, 53.74480438232422, 56.21518325805664, 58.68556213378906, 61.155941009521484, 63.626319885253906, 66.09669494628906, 68.56707763671875, 71.03746032714844, 73.5078353881836, 75.97821044921875, 78.44859313964844, 80.91897583007812, 83.38935089111328]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 8.0, 19.0, 26.0, 35.0, 52.0, 72.0, 118.0, 150.0, 238.0, 300.0, 445.0, 676.0, 925.0, 1418.0, 2052.0, 3065.0, 4531.0, 6650.0, 10002.0, 15085.0, 23352.0, 37639.0, 62513.0, 109378.0, 212042.0, 244831.0, 125036.0, 69905.0, 41915.0, 26019.0, 16541.0, 10825.0, 7336.0, 4831.0, 3302.0, 2227.0, 1539.0, 1116.0, 706.0, 496.0, 325.0, 240.0, 180.0, 118.0, 93.0, 54.0, 35.0, 26.0, 21.0, 17.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-36.90625, -35.7568359375, -34.607421875, -33.4580078125, -32.30859375, -31.1591796875, -30.009765625, -28.8603515625, -27.7109375, -26.5615234375, -25.412109375, -24.2626953125, -23.11328125, -21.9638671875, -20.814453125, -19.6650390625, -18.515625, -17.3662109375, -16.216796875, -15.0673828125, -13.91796875, -12.7685546875, -11.619140625, -10.4697265625, -9.3203125, -8.1708984375, -7.021484375, -5.8720703125, -4.72265625, -3.5732421875, -2.423828125, -1.2744140625, -0.125, 1.0244140625, 2.173828125, 3.3232421875, 4.47265625, 5.6220703125, 6.771484375, 7.9208984375, 9.0703125, 10.2197265625, 11.369140625, 12.5185546875, 13.66796875, 14.8173828125, 15.966796875, 17.1162109375, 18.265625, 19.4150390625, 20.564453125, 21.7138671875, 22.86328125, 24.0126953125, 25.162109375, 26.3115234375, 27.4609375, 28.6103515625, 29.759765625, 30.9091796875, 32.05859375, 33.2080078125, 34.357421875, 35.5068359375, 36.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 12.0, 11.0, 15.0, 14.0, 22.0, 26.0, 31.0, 27.0, 31.0, 37.0, 43.0, 46.0, 40.0, 60.0, 61.0, 54.0, 51.0, 54.0, 39.0, 34.0, 39.0, 23.0, 29.0, 25.0, 22.0, 11.0, 21.0, 15.0, 15.0, 12.0, 8.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.875, -79.2421875, -76.609375, -73.9765625, -71.34375, -68.7109375, -66.078125, -63.4453125, -60.8125, -58.1796875, -55.546875, -52.9140625, -50.28125, -47.6484375, -45.015625, -42.3828125, -39.75, -37.1171875, -34.484375, -31.8515625, -29.21875, -26.5859375, -23.953125, -21.3203125, -18.6875, -16.0546875, -13.421875, -10.7890625, -8.15625, -5.5234375, -2.890625, -0.2578125, 2.375, 5.0078125, 7.640625, 10.2734375, 12.90625, 15.5390625, 18.171875, 20.8046875, 23.4375, 26.0703125, 28.703125, 31.3359375, 33.96875, 36.6015625, 39.234375, 41.8671875, 44.5, 47.1328125, 49.765625, 52.3984375, 55.03125, 57.6640625, 60.296875, 62.9296875, 65.5625, 68.1953125, 70.828125, 73.4609375, 76.09375, 78.7265625, 81.359375, 83.9921875, 86.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 16.0, 12.0, 21.0, 26.0, 45.0, 75.0, 131.0, 225.0, 492.0, 1114.0, 2880.0, 8596.0, 33849.0, 919540.0, 62954.0, 11954.0, 3874.0, 1440.0, 627.0, 265.0, 146.0, 87.0, 48.0, 29.0, 26.0, 13.0, 17.0, 10.0, 6.0, 9.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.75, -107.84765625, -103.9453125, -100.04296875, -96.140625, -92.23828125, -88.3359375, -84.43359375, -80.53125, -76.62890625, -72.7265625, -68.82421875, -64.921875, -61.01953125, -57.1171875, -53.21484375, -49.3125, -45.41015625, -41.5078125, -37.60546875, -33.703125, -29.80078125, -25.8984375, -21.99609375, -18.09375, -14.19140625, -10.2890625, -6.38671875, -2.484375, 1.41796875, 5.3203125, 9.22265625, 13.125, 17.02734375, 20.9296875, 24.83203125, 28.734375, 32.63671875, 36.5390625, 40.44140625, 44.34375, 48.24609375, 52.1484375, 56.05078125, 59.953125, 63.85546875, 67.7578125, 71.66015625, 75.5625, 79.46484375, 83.3671875, 87.26953125, 91.171875, 95.07421875, 98.9765625, 102.87890625, 106.78125, 110.68359375, 114.5859375, 118.48828125, 122.390625, 126.29296875, 130.1953125, 134.09765625, 138.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 11.0, 17.0, 13.0, 15.0, 23.0, 29.0, 22.0, 20.0, 23.0, 17.0, 31.0, 35.0, 43.0, 37.0, 34.0, 36.0, 47.0, 35.0, 40.0, 44.0, 33.0, 30.0, 41.0, 49.0, 24.0, 28.0, 34.0, 27.0, 28.0, 13.0, 15.0, 12.0, 18.0, 12.0, 9.0, 5.0, 8.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.53125, -48.93505859375, -47.3388671875, -45.74267578125, -44.146484375, -42.55029296875, -40.9541015625, -39.35791015625, -37.76171875, -36.16552734375, -34.5693359375, -32.97314453125, -31.376953125, -29.78076171875, -28.1845703125, -26.58837890625, -24.9921875, -23.39599609375, -21.7998046875, -20.20361328125, -18.607421875, -17.01123046875, -15.4150390625, -13.81884765625, -12.22265625, -10.62646484375, -9.0302734375, -7.43408203125, -5.837890625, -4.24169921875, -2.6455078125, -1.04931640625, 0.546875, 2.14306640625, 3.7392578125, 5.33544921875, 6.931640625, 8.52783203125, 10.1240234375, 11.72021484375, 13.31640625, 14.91259765625, 16.5087890625, 18.10498046875, 19.701171875, 21.29736328125, 22.8935546875, 24.48974609375, 26.0859375, 27.68212890625, 29.2783203125, 30.87451171875, 32.470703125, 34.06689453125, 35.6630859375, 37.25927734375, 38.85546875, 40.45166015625, 42.0478515625, 43.64404296875, 45.240234375, 46.83642578125, 48.4326171875, 50.02880859375, 51.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 11.0, 15.0, 21.0, 30.0, 33.0, 43.0, 59.0, 83.0, 126.0, 208.0, 435.0, 794.0, 1796.0, 5140.0, 21582.0, 946542.0, 57893.0, 8498.0, 2769.0, 1117.0, 524.0, 268.0, 146.0, 107.0, 76.0, 49.0, 30.0, 29.0, 30.0, 15.0, 12.0, 10.0, 5.0, 8.0, 2.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.3125, -25.5078125, -24.703125, -23.8984375, -23.09375, -22.2890625, -21.484375, -20.6796875, -19.875, -19.0703125, -18.265625, -17.4609375, -16.65625, -15.8515625, -15.046875, -14.2421875, -13.4375, -12.6328125, -11.828125, -11.0234375, -10.21875, -9.4140625, -8.609375, -7.8046875, -7.0, -6.1953125, -5.390625, -4.5859375, -3.78125, -2.9765625, -2.171875, -1.3671875, -0.5625, 0.2421875, 1.046875, 1.8515625, 2.65625, 3.4609375, 4.265625, 5.0703125, 5.875, 6.6796875, 7.484375, 8.2890625, 9.09375, 9.8984375, 10.703125, 11.5078125, 12.3125, 13.1171875, 13.921875, 14.7265625, 15.53125, 16.3359375, 17.140625, 17.9453125, 18.75, 19.5546875, 20.359375, 21.1640625, 21.96875, 22.7734375, 23.578125, 24.3828125, 25.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 10.0, 7.0, 16.0, 22.0, 27.0, 39.0, 49.0, 70.0, 83.0, 108.0, 101.0, 105.0, 96.0, 77.0, 44.0, 32.0, 31.0, 24.0, 13.0, 13.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014286041259765625, -0.0013845711946487427, -0.0013405382633209229, -0.001296505331993103, -0.0012524724006652832, -0.0012084394693374634, -0.0011644065380096436, -0.0011203736066818237, -0.001076340675354004, -0.001032307744026184, -0.0009882748126983643, -0.0009442418813705444, -0.0009002089500427246, -0.0008561760187149048, -0.000812143087387085, -0.0007681101560592651, -0.0007240772247314453, -0.0006800442934036255, -0.0006360113620758057, -0.0005919784307479858, -0.000547945499420166, -0.0005039125680923462, -0.00045987963676452637, -0.00041584670543670654, -0.0003718137741088867, -0.0003277808427810669, -0.00028374791145324707, -0.00023971498012542725, -0.00019568204879760742, -0.0001516491174697876, -0.00010761618614196777, -6.358325481414795e-05, -1.9550323486328125e-05, 2.44826078414917e-05, 6.851553916931152e-05, 0.00011254847049713135, 0.00015658140182495117, 0.000200614333152771, 0.0002446472644805908, 0.00028868019580841064, 0.00033271312713623047, 0.0003767460584640503, 0.0004207789897918701, 0.00046481192111968994, 0.0005088448524475098, 0.0005528777837753296, 0.0005969107151031494, 0.0006409436464309692, 0.0006849765777587891, 0.0007290095090866089, 0.0007730424404144287, 0.0008170753717422485, 0.0008611083030700684, 0.0009051412343978882, 0.000949174165725708, 0.0009932070970535278, 0.0010372400283813477, 0.0010812729597091675, 0.0011253058910369873, 0.0011693388223648071, 0.001213371753692627, 0.0012574046850204468, 0.0013014376163482666, 0.0013454705476760864, 0.0013895034790039062]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 11.0, 11.0, 10.0, 20.0, 33.0, 49.0, 44.0, 76.0, 108.0, 146.0, 217.0, 306.0, 352.0, 492.0, 681.0, 911.0, 1266.0, 1732.0, 2524.0, 3726.0, 6371.0, 12084.0, 28814.0, 88302.0, 439730.0, 333502.0, 73171.0, 25142.0, 10758.0, 5804.0, 3628.0, 2362.0, 1669.0, 1200.0, 856.0, 671.0, 457.0, 315.0, 284.0, 207.0, 162.0, 98.0, 58.0, 56.0, 45.0, 37.0, 27.0, 14.0, 5.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.589599609375, -18.00732421875, -17.425048828125, -16.8427734375, -16.260498046875, -15.67822265625, -15.095947265625, -14.513671875, -13.931396484375, -13.34912109375, -12.766845703125, -12.1845703125, -11.602294921875, -11.02001953125, -10.437744140625, -9.85546875, -9.273193359375, -8.69091796875, -8.108642578125, -7.5263671875, -6.944091796875, -6.36181640625, -5.779541015625, -5.197265625, -4.614990234375, -4.03271484375, -3.450439453125, -2.8681640625, -2.285888671875, -1.70361328125, -1.121337890625, -0.5390625, 0.043212890625, 0.62548828125, 1.207763671875, 1.7900390625, 2.372314453125, 2.95458984375, 3.536865234375, 4.119140625, 4.701416015625, 5.28369140625, 5.865966796875, 6.4482421875, 7.030517578125, 7.61279296875, 8.195068359375, 8.77734375, 9.359619140625, 9.94189453125, 10.524169921875, 11.1064453125, 11.688720703125, 12.27099609375, 12.853271484375, 13.435546875, 14.017822265625, 14.60009765625, 15.182373046875, 15.7646484375, 16.346923828125, 16.92919921875, 17.511474609375, 18.09375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 6.0, 12.0, 16.0, 18.0, 28.0, 24.0, 32.0, 61.0, 59.0, 70.0, 64.0, 81.0, 69.0, 77.0, 64.0, 57.0, 44.0, 43.0, 32.0, 42.0, 20.0, 9.0, 15.0, 8.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.880859375, -2.770904541015625, -2.66094970703125, -2.550994873046875, -2.4410400390625, -2.331085205078125, -2.22113037109375, -2.111175537109375, -2.001220703125, -1.891265869140625, -1.78131103515625, -1.671356201171875, -1.5614013671875, -1.451446533203125, -1.34149169921875, -1.231536865234375, -1.12158203125, -1.011627197265625, -0.90167236328125, -0.791717529296875, -0.6817626953125, -0.571807861328125, -0.46185302734375, -0.351898193359375, -0.241943359375, -0.131988525390625, -0.02203369140625, 0.087921142578125, 0.1978759765625, 0.307830810546875, 0.41778564453125, 0.527740478515625, 0.6376953125, 0.747650146484375, 0.85760498046875, 0.967559814453125, 1.0775146484375, 1.187469482421875, 1.29742431640625, 1.407379150390625, 1.517333984375, 1.627288818359375, 1.73724365234375, 1.847198486328125, 1.9571533203125, 2.067108154296875, 2.17706298828125, 2.287017822265625, 2.39697265625, 2.506927490234375, 2.61688232421875, 2.726837158203125, 2.8367919921875, 2.946746826171875, 3.05670166015625, 3.166656494140625, 3.276611328125, 3.386566162109375, 3.49652099609375, 3.606475830078125, 3.7164306640625, 3.826385498046875, 3.93634033203125, 4.046295166015625, 4.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 10.0, 13.0, 17.0, 13.0, 31.0, 45.0, 43.0, 69.0, 103.0, 116.0, 124.0, 102.0, 72.0, 56.0, 34.0, 42.0, 23.0, 22.0, 9.0, 13.0, 9.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.05120849609375, -131.8037872314453, -127.55636596679688, -123.30895233154297, -119.06153106689453, -114.8141098022461, -110.56669616699219, -106.31927490234375, -102.07185363769531, -97.82443237304688, -93.57701110839844, -89.32959747314453, -85.0821762084961, -80.83475494384766, -76.58734130859375, -72.33992004394531, -68.09249877929688, -63.84507751464844, -59.597660064697266, -55.350242614746094, -51.102821350097656, -46.85540008544922, -42.60798263549805, -38.360565185546875, -34.11314392089844, -29.865724563598633, -25.618305206298828, -21.370885848999023, -17.12346649169922, -12.876047134399414, -8.62862777709961, -4.381208419799805, -0.1337738037109375, 4.113645553588867, 8.361064910888672, 12.608484268188477, 16.85590362548828, 21.103322982788086, 25.35074234008789, 29.598161697387695, 33.8455810546875, 38.09300231933594, 42.34041976928711, 46.58783721923828, 50.83525848388672, 55.082679748535156, 59.33009719848633, 63.5775146484375, 67.82493591308594, 72.07235717773438, 76.31977844238281, 80.56719207763672, 84.81461334228516, 89.0620346069336, 93.3094482421875, 97.55686950683594, 101.80429077148438, 106.05171203613281, 110.29913330078125, 114.54654693603516, 118.7939682006836, 123.04138946533203, 127.28880310058594, 131.53622436523438, 135.7836456298828]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 10.0, 14.0, 15.0, 18.0, 21.0, 34.0, 28.0, 30.0, 25.0, 35.0, 50.0, 41.0, 44.0, 41.0, 57.0, 45.0, 47.0, 43.0, 39.0, 48.0, 24.0, 25.0, 35.0, 29.0, 26.0, 18.0, 20.0, 15.0, 16.0, 11.0, 10.0, 11.0, 10.0, 7.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.27301788330078, -69.8780288696289, -67.48304748535156, -65.08805847167969, -62.693077087402344, -60.298091888427734, -57.903106689453125, -55.50811767578125, -53.113136291503906, -50.7181510925293, -48.32316589355469, -45.92818069458008, -43.53319549560547, -41.13821029663086, -38.74322509765625, -36.348236083984375, -33.953250885009766, -31.558265686035156, -29.163280487060547, -26.768295288085938, -24.373310089111328, -21.97832489013672, -19.583337783813477, -17.188352584838867, -14.793367385864258, -12.398382186889648, -10.003396987915039, -7.608410835266113, -5.213425636291504, -2.8184404373168945, -0.42345428466796875, 1.9715309143066406, 4.36651611328125, 6.761501312255859, 9.156486511230469, 11.551472663879395, 13.946457862854004, 16.341442108154297, 18.73642921447754, 21.13141441345215, 23.526399612426758, 25.921384811401367, 28.316370010375977, 30.71135711669922, 33.10634231567383, 35.50132751464844, 37.89631271362305, 40.291297912597656, 42.686283111572266, 45.081268310546875, 47.476253509521484, 49.871238708496094, 52.2662239074707, 54.66120910644531, 57.05619812011719, 59.45117950439453, 61.846168518066406, 64.24115753173828, 66.63613891601562, 69.0311279296875, 71.42610931396484, 73.82109832763672, 76.21607971191406, 78.61106872558594, 81.00605010986328]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 7.0, 9.0, 9.0, 23.0, 35.0, 40.0, 64.0, 83.0, 136.0, 194.0, 277.0, 430.0, 640.0, 981.0, 1567.0, 2528.0, 3755.0, 6369.0, 11011.0, 19240.0, 36117.0, 71115.0, 146939.0, 287531.0, 228464.0, 110071.0, 54486.0, 27885.0, 15306.0, 8896.0, 5282.0, 3225.0, 1959.0, 1356.0, 830.0, 549.0, 357.0, 283.0, 166.0, 97.0, 80.0, 57.0, 39.0, 17.0, 18.0, 6.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-132.625, -128.455078125, -124.28515625, -120.115234375, -115.9453125, -111.775390625, -107.60546875, -103.435546875, -99.265625, -95.095703125, -90.92578125, -86.755859375, -82.5859375, -78.416015625, -74.24609375, -70.076171875, -65.90625, -61.736328125, -57.56640625, -53.396484375, -49.2265625, -45.056640625, -40.88671875, -36.716796875, -32.546875, -28.376953125, -24.20703125, -20.037109375, -15.8671875, -11.697265625, -7.52734375, -3.357421875, 0.8125, 4.982421875, 9.15234375, 13.322265625, 17.4921875, 21.662109375, 25.83203125, 30.001953125, 34.171875, 38.341796875, 42.51171875, 46.681640625, 50.8515625, 55.021484375, 59.19140625, 63.361328125, 67.53125, 71.701171875, 75.87109375, 80.041015625, 84.2109375, 88.380859375, 92.55078125, 96.720703125, 100.890625, 105.060546875, 109.23046875, 113.400390625, 117.5703125, 121.740234375, 125.91015625, 130.080078125, 134.25]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 11.0, 9.0, 22.0, 18.0, 28.0, 20.0, 33.0, 29.0, 41.0, 49.0, 44.0, 50.0, 51.0, 56.0, 51.0, 55.0, 50.0, 38.0, 44.0, 30.0, 29.0, 34.0, 26.0, 18.0, 18.0, 15.0, 17.0, 17.0, 8.0, 12.0, 9.0, 7.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.0, -73.4814453125, -70.962890625, -68.4443359375, -65.92578125, -63.4072265625, -60.888671875, -58.3701171875, -55.8515625, -53.3330078125, -50.814453125, -48.2958984375, -45.77734375, -43.2587890625, -40.740234375, -38.2216796875, -35.703125, -33.1845703125, -30.666015625, -28.1474609375, -25.62890625, -23.1103515625, -20.591796875, -18.0732421875, -15.5546875, -13.0361328125, -10.517578125, -7.9990234375, -5.48046875, -2.9619140625, -0.443359375, 2.0751953125, 4.59375, 7.1123046875, 9.630859375, 12.1494140625, 14.66796875, 17.1865234375, 19.705078125, 22.2236328125, 24.7421875, 27.2607421875, 29.779296875, 32.2978515625, 34.81640625, 37.3349609375, 39.853515625, 42.3720703125, 44.890625, 47.4091796875, 49.927734375, 52.4462890625, 54.96484375, 57.4833984375, 60.001953125, 62.5205078125, 65.0390625, 67.5576171875, 70.076171875, 72.5947265625, 75.11328125, 77.6318359375, 80.150390625, 82.6689453125, 85.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 6.0, 3.0, 8.0, 14.0, 17.0, 27.0, 40.0, 58.0, 91.0, 149.0, 217.0, 354.0, 521.0, 878.0, 1416.0, 2378.0, 3933.0, 6984.0, 12526.0, 22547.0, 43374.0, 86977.0, 176099.0, 293109.0, 195071.0, 96162.0, 48461.0, 25005.0, 13551.0, 7573.0, 4424.0, 2537.0, 1547.0, 925.0, 533.0, 357.0, 215.0, 148.0, 102.0, 62.0, 47.0, 40.0, 19.0, 18.0, 6.0, 9.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-167.125, -161.83203125, -156.5390625, -151.24609375, -145.953125, -140.66015625, -135.3671875, -130.07421875, -124.78125, -119.48828125, -114.1953125, -108.90234375, -103.609375, -98.31640625, -93.0234375, -87.73046875, -82.4375, -77.14453125, -71.8515625, -66.55859375, -61.265625, -55.97265625, -50.6796875, -45.38671875, -40.09375, -34.80078125, -29.5078125, -24.21484375, -18.921875, -13.62890625, -8.3359375, -3.04296875, 2.25, 7.54296875, 12.8359375, 18.12890625, 23.421875, 28.71484375, 34.0078125, 39.30078125, 44.59375, 49.88671875, 55.1796875, 60.47265625, 65.765625, 71.05859375, 76.3515625, 81.64453125, 86.9375, 92.23046875, 97.5234375, 102.81640625, 108.109375, 113.40234375, 118.6953125, 123.98828125, 129.28125, 134.57421875, 139.8671875, 145.16015625, 150.453125, 155.74609375, 161.0390625, 166.33203125, 171.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 11.0, 13.0, 16.0, 11.0, 17.0, 26.0, 28.0, 34.0, 29.0, 30.0, 34.0, 42.0, 50.0, 39.0, 53.0, 55.0, 47.0, 45.0, 46.0, 37.0, 31.0, 44.0, 40.0, 29.0, 17.0, 13.0, 20.0, 20.0, 16.0, 15.0, 14.0, 16.0, 4.0, 14.0, 6.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.0, -49.294921875, -47.58984375, -45.884765625, -44.1796875, -42.474609375, -40.76953125, -39.064453125, -37.359375, -35.654296875, -33.94921875, -32.244140625, -30.5390625, -28.833984375, -27.12890625, -25.423828125, -23.71875, -22.013671875, -20.30859375, -18.603515625, -16.8984375, -15.193359375, -13.48828125, -11.783203125, -10.078125, -8.373046875, -6.66796875, -4.962890625, -3.2578125, -1.552734375, 0.15234375, 1.857421875, 3.5625, 5.267578125, 6.97265625, 8.677734375, 10.3828125, 12.087890625, 13.79296875, 15.498046875, 17.203125, 18.908203125, 20.61328125, 22.318359375, 24.0234375, 25.728515625, 27.43359375, 29.138671875, 30.84375, 32.548828125, 34.25390625, 35.958984375, 37.6640625, 39.369140625, 41.07421875, 42.779296875, 44.484375, 46.189453125, 47.89453125, 49.599609375, 51.3046875, 53.009765625, 54.71484375, 56.419921875, 58.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 17.0, 19.0, 20.0, 45.0, 53.0, 57.0, 100.0, 137.0, 202.0, 312.0, 404.0, 590.0, 820.0, 1241.0, 2002.0, 3255.0, 5975.0, 11291.0, 23167.0, 55385.0, 187198.0, 545706.0, 126151.0, 42782.0, 19098.0, 9268.0, 4970.0, 2920.0, 1735.0, 1072.0, 742.0, 506.0, 376.0, 240.0, 214.0, 133.0, 109.0, 62.0, 39.0, 46.0, 19.0, 19.0, 10.0, 11.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-69.3125, -67.3525390625, -65.392578125, -63.4326171875, -61.47265625, -59.5126953125, -57.552734375, -55.5927734375, -53.6328125, -51.6728515625, -49.712890625, -47.7529296875, -45.79296875, -43.8330078125, -41.873046875, -39.9130859375, -37.953125, -35.9931640625, -34.033203125, -32.0732421875, -30.11328125, -28.1533203125, -26.193359375, -24.2333984375, -22.2734375, -20.3134765625, -18.353515625, -16.3935546875, -14.43359375, -12.4736328125, -10.513671875, -8.5537109375, -6.59375, -4.6337890625, -2.673828125, -0.7138671875, 1.24609375, 3.2060546875, 5.166015625, 7.1259765625, 9.0859375, 11.0458984375, 13.005859375, 14.9658203125, 16.92578125, 18.8857421875, 20.845703125, 22.8056640625, 24.765625, 26.7255859375, 28.685546875, 30.6455078125, 32.60546875, 34.5654296875, 36.525390625, 38.4853515625, 40.4453125, 42.4052734375, 44.365234375, 46.3251953125, 48.28515625, 50.2451171875, 52.205078125, 54.1650390625, 56.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 9.0, 15.0, 11.0, 15.0, 29.0, 45.0, 84.0, 195.0, 240.0, 131.0, 59.0, 55.0, 26.0, 21.0, 13.0, 10.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00860595703125, -0.008380889892578125, -0.00815582275390625, -0.007930755615234375, -0.0077056884765625, -0.007480621337890625, -0.00725555419921875, -0.007030487060546875, -0.006805419921875, -0.006580352783203125, -0.00635528564453125, -0.006130218505859375, -0.0059051513671875, -0.005680084228515625, -0.00545501708984375, -0.005229949951171875, -0.0050048828125, -0.004779815673828125, -0.00455474853515625, -0.004329681396484375, -0.0041046142578125, -0.003879547119140625, -0.00365447998046875, -0.003429412841796875, -0.003204345703125, -0.002979278564453125, -0.00275421142578125, -0.002529144287109375, -0.0023040771484375, -0.002079010009765625, -0.00185394287109375, -0.001628875732421875, -0.00140380859375, -0.001178741455078125, -0.00095367431640625, -0.000728607177734375, -0.0005035400390625, -0.000278472900390625, -5.340576171875e-05, 0.000171661376953125, 0.000396728515625, 0.000621795654296875, 0.00084686279296875, 0.001071929931640625, 0.0012969970703125, 0.001522064208984375, 0.00174713134765625, 0.001972198486328125, 0.002197265625, 0.002422332763671875, 0.00264739990234375, 0.002872467041015625, 0.0030975341796875, 0.003322601318359375, 0.00354766845703125, 0.003772735595703125, 0.003997802734375, 0.004222869873046875, 0.00444793701171875, 0.004673004150390625, 0.0048980712890625, 0.005123138427734375, 0.00534820556640625, 0.005573272705078125, 0.00579833984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 4.0, 2.0, 1.0, 4.0, 10.0, 3.0, 16.0, 10.0, 12.0, 27.0, 23.0, 40.0, 56.0, 50.0, 83.0, 129.0, 176.0, 254.0, 419.0, 660.0, 1048.0, 1755.0, 3284.0, 6307.0, 13183.0, 36162.0, 165814.0, 655669.0, 111946.0, 27938.0, 10890.0, 5448.0, 2752.0, 1637.0, 918.0, 583.0, 396.0, 260.0, 158.0, 112.0, 71.0, 63.0, 47.0, 44.0, 20.0, 19.0, 19.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-79.625, -77.0048828125, -74.384765625, -71.7646484375, -69.14453125, -66.5244140625, -63.904296875, -61.2841796875, -58.6640625, -56.0439453125, -53.423828125, -50.8037109375, -48.18359375, -45.5634765625, -42.943359375, -40.3232421875, -37.703125, -35.0830078125, -32.462890625, -29.8427734375, -27.22265625, -24.6025390625, -21.982421875, -19.3623046875, -16.7421875, -14.1220703125, -11.501953125, -8.8818359375, -6.26171875, -3.6416015625, -1.021484375, 1.5986328125, 4.21875, 6.8388671875, 9.458984375, 12.0791015625, 14.69921875, 17.3193359375, 19.939453125, 22.5595703125, 25.1796875, 27.7998046875, 30.419921875, 33.0400390625, 35.66015625, 38.2802734375, 40.900390625, 43.5205078125, 46.140625, 48.7607421875, 51.380859375, 54.0009765625, 56.62109375, 59.2412109375, 61.861328125, 64.4814453125, 67.1015625, 69.7216796875, 72.341796875, 74.9619140625, 77.58203125, 80.2021484375, 82.822265625, 85.4423828125, 88.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 5.0, 14.0, 8.0, 13.0, 20.0, 33.0, 48.0, 59.0, 104.0, 169.0, 164.0, 126.0, 67.0, 49.0, 24.0, 17.0, 16.0, 13.0, 7.0, 13.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.734375, -27.02783203125, -26.3212890625, -25.61474609375, -24.908203125, -24.20166015625, -23.4951171875, -22.78857421875, -22.08203125, -21.37548828125, -20.6689453125, -19.96240234375, -19.255859375, -18.54931640625, -17.8427734375, -17.13623046875, -16.4296875, -15.72314453125, -15.0166015625, -14.31005859375, -13.603515625, -12.89697265625, -12.1904296875, -11.48388671875, -10.77734375, -10.07080078125, -9.3642578125, -8.65771484375, -7.951171875, -7.24462890625, -6.5380859375, -5.83154296875, -5.125, -4.41845703125, -3.7119140625, -3.00537109375, -2.298828125, -1.59228515625, -0.8857421875, -0.17919921875, 0.52734375, 1.23388671875, 1.9404296875, 2.64697265625, 3.353515625, 4.06005859375, 4.7666015625, 5.47314453125, 6.1796875, 6.88623046875, 7.5927734375, 8.29931640625, 9.005859375, 9.71240234375, 10.4189453125, 11.12548828125, 11.83203125, 12.53857421875, 13.2451171875, 13.95166015625, 14.658203125, 15.36474609375, 16.0712890625, 16.77783203125, 17.484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 4.0, 4.0, 2.0, 16.0, 13.0, 18.0, 21.0, 33.0, 44.0, 58.0, 86.0, 88.0, 124.0, 107.0, 96.0, 73.0, 51.0, 55.0, 30.0, 17.0, 16.0, 9.0, 12.0, 3.0, 11.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.9215850830078, -139.4133758544922, -134.90516662597656, -130.39697265625, -125.88876342773438, -121.38055419921875, -116.87234497070312, -112.36414337158203, -107.85594177246094, -103.34773254394531, -98.83953094482422, -94.3313217163086, -89.8231201171875, -85.31491088867188, -80.80670166015625, -76.29850006103516, -71.79029083251953, -67.2820816040039, -62.77388000488281, -58.26567077636719, -53.757469177246094, -49.24925994873047, -44.74105453491211, -40.23284912109375, -35.72464370727539, -31.21643829345703, -26.708232879638672, -22.20002555847168, -17.69182014465332, -13.183614730834961, -8.675407409667969, -4.167201995849609, 0.34100341796875, 4.849209308624268, 9.357415199279785, 13.865621566772461, 18.37382698059082, 22.88203239440918, 27.390239715576172, 31.89844512939453, 36.40665054321289, 40.91485595703125, 45.42306137084961, 49.93126678466797, 54.439476013183594, 58.94767761230469, 63.45588684082031, 67.96409606933594, 72.47229766845703, 76.98050689697266, 81.48870849609375, 85.99691772460938, 90.50511932373047, 95.0133285522461, 99.52153015136719, 104.02973937988281, 108.53794860839844, 113.04615783691406, 117.55435943603516, 122.06256866455078, 126.57077026367188, 131.0789794921875, 135.58718872070312, 140.09539794921875, 144.6035919189453]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 4.0, 7.0, 6.0, 8.0, 19.0, 16.0, 12.0, 18.0, 13.0, 18.0, 39.0, 35.0, 39.0, 37.0, 58.0, 38.0, 45.0, 41.0, 45.0, 37.0, 52.0, 42.0, 39.0, 41.0, 39.0, 35.0, 31.0, 32.0, 24.0, 21.0, 18.0, 18.0, 13.0, 13.0, 9.0, 9.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-82.38619995117188, -79.71418762207031, -77.04216766357422, -74.37014770507812, -71.69813537597656, -69.026123046875, -66.3541030883789, -63.68208694458008, -61.01007080078125, -58.33805465698242, -55.666038513183594, -52.994022369384766, -50.32200622558594, -47.64999008178711, -44.97797393798828, -42.30595779418945, -39.633941650390625, -36.9619255065918, -34.28990936279297, -31.61789321899414, -28.945877075195312, -26.273860931396484, -23.601844787597656, -20.929828643798828, -18.2578125, -15.585796356201172, -12.913780212402344, -10.241764068603516, -7.5697479248046875, -4.897731781005859, -2.2257156372070312, 0.4463005065917969, 3.1183090209960938, 5.790325164794922, 8.46234130859375, 11.134357452392578, 13.806373596191406, 16.478389739990234, 19.150405883789062, 21.82242202758789, 24.49443817138672, 27.166454315185547, 29.838470458984375, 32.5104866027832, 35.18250274658203, 37.85451889038086, 40.52653503417969, 43.198551177978516, 45.870567321777344, 48.54258346557617, 51.214599609375, 53.88661575317383, 56.558631896972656, 59.230648040771484, 61.90266418457031, 64.57467651367188, 67.24669647216797, 69.91871643066406, 72.59072875976562, 75.26274108886719, 77.93476104736328, 80.60678100585938, 83.27879333496094, 85.9508056640625, 88.6228256225586]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 13.0, 23.0, 24.0, 36.0, 59.0, 76.0, 117.0, 171.0, 235.0, 328.0, 456.0, 715.0, 1101.0, 1630.0, 2577.0, 4263.0, 7237.0, 14243.0, 32081.0, 103856.0, 642103.0, 2644515.0, 576792.0, 96305.0, 31504.0, 14129.0, 7367.0, 4394.0, 2699.0, 1740.0, 1144.0, 770.0, 510.0, 368.0, 216.0, 147.0, 109.0, 65.0, 45.0, 31.0, 25.0, 12.0, 14.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-181.0, -175.59375, -170.1875, -164.78125, -159.375, -153.96875, -148.5625, -143.15625, -137.75, -132.34375, -126.9375, -121.53125, -116.125, -110.71875, -105.3125, -99.90625, -94.5, -89.09375, -83.6875, -78.28125, -72.875, -67.46875, -62.0625, -56.65625, -51.25, -45.84375, -40.4375, -35.03125, -29.625, -24.21875, -18.8125, -13.40625, -8.0, -2.59375, 2.8125, 8.21875, 13.625, 19.03125, 24.4375, 29.84375, 35.25, 40.65625, 46.0625, 51.46875, 56.875, 62.28125, 67.6875, 73.09375, 78.5, 83.90625, 89.3125, 94.71875, 100.125, 105.53125, 110.9375, 116.34375, 121.75, 127.15625, 132.5625, 137.96875, 143.375, 148.78125, 154.1875, 159.59375, 165.0]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 14.0, 10.0, 14.0, 13.0, 13.0, 22.0, 19.0, 37.0, 37.0, 38.0, 46.0, 54.0, 47.0, 49.0, 43.0, 59.0, 50.0, 47.0, 38.0, 47.0, 44.0, 38.0, 38.0, 28.0, 17.0, 22.0, 14.0, 22.0, 11.0, 15.0, 10.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-81.4375, -78.85546875, -76.2734375, -73.69140625, -71.109375, -68.52734375, -65.9453125, -63.36328125, -60.78125, -58.19921875, -55.6171875, -53.03515625, -50.453125, -47.87109375, -45.2890625, -42.70703125, -40.125, -37.54296875, -34.9609375, -32.37890625, -29.796875, -27.21484375, -24.6328125, -22.05078125, -19.46875, -16.88671875, -14.3046875, -11.72265625, -9.140625, -6.55859375, -3.9765625, -1.39453125, 1.1875, 3.76953125, 6.3515625, 8.93359375, 11.515625, 14.09765625, 16.6796875, 19.26171875, 21.84375, 24.42578125, 27.0078125, 29.58984375, 32.171875, 34.75390625, 37.3359375, 39.91796875, 42.5, 45.08203125, 47.6640625, 50.24609375, 52.828125, 55.41015625, 57.9921875, 60.57421875, 63.15625, 65.73828125, 68.3203125, 70.90234375, 73.484375, 76.06640625, 78.6484375, 81.23046875, 83.8125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 8.0, 15.0, 13.0, 19.0, 47.0, 49.0, 71.0, 82.0, 136.0, 206.0, 279.0, 389.0, 604.0, 880.0, 1234.0, 1931.0, 2954.0, 4645.0, 7504.0, 13340.0, 25530.0, 57206.0, 167293.0, 958999.0, 2459002.0, 323767.0, 88667.0, 35786.0, 17611.0, 9619.0, 5692.0, 3546.0, 2339.0, 1509.0, 1038.0, 655.0, 500.0, 333.0, 237.0, 166.0, 114.0, 72.0, 63.0, 42.0, 26.0, 17.0, 14.0, 14.0, 6.0, 9.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-163.875, -158.453125, -153.03125, -147.609375, -142.1875, -136.765625, -131.34375, -125.921875, -120.5, -115.078125, -109.65625, -104.234375, -98.8125, -93.390625, -87.96875, -82.546875, -77.125, -71.703125, -66.28125, -60.859375, -55.4375, -50.015625, -44.59375, -39.171875, -33.75, -28.328125, -22.90625, -17.484375, -12.0625, -6.640625, -1.21875, 4.203125, 9.625, 15.046875, 20.46875, 25.890625, 31.3125, 36.734375, 42.15625, 47.578125, 53.0, 58.421875, 63.84375, 69.265625, 74.6875, 80.109375, 85.53125, 90.953125, 96.375, 101.796875, 107.21875, 112.640625, 118.0625, 123.484375, 128.90625, 134.328125, 139.75, 145.171875, 150.59375, 156.015625, 161.4375, 166.859375, 172.28125, 177.703125, 183.125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 9.0, 7.0, 23.0, 19.0, 25.0, 38.0, 54.0, 77.0, 113.0, 194.0, 265.0, 528.0, 889.0, 689.0, 407.0, 236.0, 145.0, 97.0, 54.0, 40.0, 25.0, 23.0, 18.0, 12.0, 14.0, 7.0, 2.0, 13.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.5, -45.8486328125, -44.197265625, -42.5458984375, -40.89453125, -39.2431640625, -37.591796875, -35.9404296875, -34.2890625, -32.6376953125, -30.986328125, -29.3349609375, -27.68359375, -26.0322265625, -24.380859375, -22.7294921875, -21.078125, -19.4267578125, -17.775390625, -16.1240234375, -14.47265625, -12.8212890625, -11.169921875, -9.5185546875, -7.8671875, -6.2158203125, -4.564453125, -2.9130859375, -1.26171875, 0.3896484375, 2.041015625, 3.6923828125, 5.34375, 6.9951171875, 8.646484375, 10.2978515625, 11.94921875, 13.6005859375, 15.251953125, 16.9033203125, 18.5546875, 20.2060546875, 21.857421875, 23.5087890625, 25.16015625, 26.8115234375, 28.462890625, 30.1142578125, 31.765625, 33.4169921875, 35.068359375, 36.7197265625, 38.37109375, 40.0224609375, 41.673828125, 43.3251953125, 44.9765625, 46.6279296875, 48.279296875, 49.9306640625, 51.58203125, 53.2333984375, 54.884765625, 56.5361328125, 58.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 6.0, 4.0, 3.0, 5.0, 6.0, 8.0, 11.0, 14.0, 15.0, 18.0, 26.0, 31.0, 34.0, 54.0, 46.0, 76.0, 105.0, 98.0, 117.0, 69.0, 54.0, 49.0, 38.0, 30.0, 23.0, 20.0, 8.0, 3.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-119.2146987915039, -115.4179916381836, -111.62127685546875, -107.82456970214844, -104.02786254882812, -100.23114776611328, -96.43444061279297, -92.63772583007812, -88.84101867675781, -85.0443115234375, -81.24759674072266, -77.45088958740234, -73.6541748046875, -69.85746765136719, -66.06076049804688, -62.2640495300293, -58.46733856201172, -54.67062759399414, -50.87391662597656, -47.07720947265625, -43.28049850463867, -39.483787536621094, -35.68708038330078, -31.890369415283203, -28.093658447265625, -24.296947479248047, -20.5002384185791, -16.703529357910156, -12.906818389892578, -9.110107421875, -5.313398361206055, -1.5166893005371094, 2.2800140380859375, 6.076724052429199, 9.873434066772461, 13.670144081115723, 17.466854095458984, 21.263565063476562, 25.060274124145508, 28.856983184814453, 32.65369415283203, 36.45040512084961, 40.24711608886719, 44.0438232421875, 47.84053421020508, 51.637245178222656, 55.43395233154297, 59.23066329956055, 63.027374267578125, 66.82408142089844, 70.62079620361328, 74.4175033569336, 78.21421813964844, 82.01092529296875, 85.80763244628906, 89.60433959960938, 93.40105438232422, 97.19776153564453, 100.99447631835938, 104.79118347167969, 108.587890625, 112.38460540771484, 116.18131256103516, 119.97802734375, 123.77473449707031]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 10.0, 11.0, 7.0, 9.0, 7.0, 16.0, 24.0, 21.0, 30.0, 34.0, 25.0, 25.0, 28.0, 35.0, 47.0, 44.0, 39.0, 38.0, 40.0, 46.0, 50.0, 35.0, 43.0, 34.0, 33.0, 33.0, 28.0, 39.0, 24.0, 21.0, 20.0, 20.0, 21.0, 12.0, 7.0, 4.0, 5.0, 4.0, 8.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.59225463867188, -78.9365234375, -76.2807846069336, -73.62505340576172, -70.96931457519531, -68.31358337402344, -65.65784454345703, -63.002113342285156, -60.346378326416016, -57.690643310546875, -55.034908294677734, -52.379173278808594, -49.72344207763672, -47.06770324707031, -44.41197204589844, -41.7562370300293, -39.100502014160156, -36.444766998291016, -33.789031982421875, -31.133298873901367, -28.477563858032227, -25.821828842163086, -23.166095733642578, -20.510360717773438, -17.854625701904297, -15.198890686035156, -12.543156623840332, -9.887422561645508, -7.231687545776367, -4.575952529907227, -1.9202184677124023, 0.7355155944824219, 3.3912429809570312, 6.046977519989014, 8.702712059020996, 11.35844612121582, 14.014181137084961, 16.6699161529541, 19.32564926147461, 21.98138427734375, 24.63711929321289, 27.29285430908203, 29.948589324951172, 32.60432434082031, 35.26005554199219, 37.915794372558594, 40.57152557373047, 43.22726058959961, 45.88299560546875, 48.53873062133789, 51.19446563720703, 53.85020065307617, 56.50593566894531, 59.16166687011719, 61.81740188598633, 64.47313690185547, 67.12887573242188, 69.78460693359375, 72.44034576416016, 75.09607696533203, 77.75181579589844, 80.40754699707031, 83.06328582763672, 85.7190170288086, 88.37474822998047]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 15.0, 20.0, 34.0, 49.0, 74.0, 92.0, 130.0, 206.0, 277.0, 380.0, 596.0, 814.0, 1203.0, 1755.0, 2631.0, 3865.0, 5701.0, 8843.0, 13345.0, 21413.0, 34253.0, 56061.0, 91811.0, 151941.0, 210332.0, 169125.0, 103901.0, 63122.0, 38450.0, 23787.0, 15039.0, 9606.0, 6315.0, 4204.0, 2931.0, 1892.0, 1385.0, 918.0, 636.0, 431.0, 278.0, 216.0, 153.0, 80.0, 78.0, 51.0, 36.0, 26.0, 19.0, 11.0, 4.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-46.75, -45.271484375, -43.79296875, -42.314453125, -40.8359375, -39.357421875, -37.87890625, -36.400390625, -34.921875, -33.443359375, -31.96484375, -30.486328125, -29.0078125, -27.529296875, -26.05078125, -24.572265625, -23.09375, -21.615234375, -20.13671875, -18.658203125, -17.1796875, -15.701171875, -14.22265625, -12.744140625, -11.265625, -9.787109375, -8.30859375, -6.830078125, -5.3515625, -3.873046875, -2.39453125, -0.916015625, 0.5625, 2.041015625, 3.51953125, 4.998046875, 6.4765625, 7.955078125, 9.43359375, 10.912109375, 12.390625, 13.869140625, 15.34765625, 16.826171875, 18.3046875, 19.783203125, 21.26171875, 22.740234375, 24.21875, 25.697265625, 27.17578125, 28.654296875, 30.1328125, 31.611328125, 33.08984375, 34.568359375, 36.046875, 37.525390625, 39.00390625, 40.482421875, 41.9609375, 43.439453125, 44.91796875, 46.396484375, 47.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 9.0, 4.0, 6.0, 10.0, 23.0, 16.0, 22.0, 30.0, 31.0, 18.0, 31.0, 37.0, 38.0, 45.0, 51.0, 39.0, 49.0, 52.0, 49.0, 53.0, 43.0, 29.0, 39.0, 42.0, 31.0, 28.0, 32.0, 16.0, 17.0, 23.0, 16.0, 11.0, 8.0, 7.0, 4.0, 3.0, 2.0, 8.0, 3.0, 0.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.3125, -73.8701171875, -71.427734375, -68.9853515625, -66.54296875, -64.1005859375, -61.658203125, -59.2158203125, -56.7734375, -54.3310546875, -51.888671875, -49.4462890625, -47.00390625, -44.5615234375, -42.119140625, -39.6767578125, -37.234375, -34.7919921875, -32.349609375, -29.9072265625, -27.46484375, -25.0224609375, -22.580078125, -20.1376953125, -17.6953125, -15.2529296875, -12.810546875, -10.3681640625, -7.92578125, -5.4833984375, -3.041015625, -0.5986328125, 1.84375, 4.2861328125, 6.728515625, 9.1708984375, 11.61328125, 14.0556640625, 16.498046875, 18.9404296875, 21.3828125, 23.8251953125, 26.267578125, 28.7099609375, 31.15234375, 33.5947265625, 36.037109375, 38.4794921875, 40.921875, 43.3642578125, 45.806640625, 48.2490234375, 50.69140625, 53.1337890625, 55.576171875, 58.0185546875, 60.4609375, 62.9033203125, 65.345703125, 67.7880859375, 70.23046875, 72.6728515625, 75.115234375, 77.5576171875, 80.0]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 10.0, 6.0, 15.0, 23.0, 36.0, 46.0, 76.0, 102.0, 159.0, 237.0, 315.0, 526.0, 838.0, 1217.0, 2032.0, 3343.0, 5691.0, 10545.0, 24046.0, 159398.0, 761680.0, 44644.0, 14880.0, 7445.0, 4291.0, 2548.0, 1576.0, 982.0, 642.0, 400.0, 265.0, 183.0, 116.0, 73.0, 65.0, 31.0, 28.0, 11.0, 10.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.3125, -110.2646484375, -106.216796875, -102.1689453125, -98.12109375, -94.0732421875, -90.025390625, -85.9775390625, -81.9296875, -77.8818359375, -73.833984375, -69.7861328125, -65.73828125, -61.6904296875, -57.642578125, -53.5947265625, -49.546875, -45.4990234375, -41.451171875, -37.4033203125, -33.35546875, -29.3076171875, -25.259765625, -21.2119140625, -17.1640625, -13.1162109375, -9.068359375, -5.0205078125, -0.97265625, 3.0751953125, 7.123046875, 11.1708984375, 15.21875, 19.2666015625, 23.314453125, 27.3623046875, 31.41015625, 35.4580078125, 39.505859375, 43.5537109375, 47.6015625, 51.6494140625, 55.697265625, 59.7451171875, 63.79296875, 67.8408203125, 71.888671875, 75.9365234375, 79.984375, 84.0322265625, 88.080078125, 92.1279296875, 96.17578125, 100.2236328125, 104.271484375, 108.3193359375, 112.3671875, 116.4150390625, 120.462890625, 124.5107421875, 128.55859375, 132.6064453125, 136.654296875, 140.7021484375, 144.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 5.0, 5.0, 9.0, 25.0, 14.0, 18.0, 19.0, 25.0, 22.0, 37.0, 25.0, 40.0, 43.0, 46.0, 46.0, 46.0, 46.0, 58.0, 42.0, 54.0, 57.0, 49.0, 35.0, 34.0, 31.0, 23.0, 20.0, 17.0, 16.0, 19.0, 17.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.375, -93.3330078125, -90.291015625, -87.2490234375, -84.20703125, -81.1650390625, -78.123046875, -75.0810546875, -72.0390625, -68.9970703125, -65.955078125, -62.9130859375, -59.87109375, -56.8291015625, -53.787109375, -50.7451171875, -47.703125, -44.6611328125, -41.619140625, -38.5771484375, -35.53515625, -32.4931640625, -29.451171875, -26.4091796875, -23.3671875, -20.3251953125, -17.283203125, -14.2412109375, -11.19921875, -8.1572265625, -5.115234375, -2.0732421875, 0.96875, 4.0107421875, 7.052734375, 10.0947265625, 13.13671875, 16.1787109375, 19.220703125, 22.2626953125, 25.3046875, 28.3466796875, 31.388671875, 34.4306640625, 37.47265625, 40.5146484375, 43.556640625, 46.5986328125, 49.640625, 52.6826171875, 55.724609375, 58.7666015625, 61.80859375, 64.8505859375, 67.892578125, 70.9345703125, 73.9765625, 77.0185546875, 80.060546875, 83.1025390625, 86.14453125, 89.1865234375, 92.228515625, 95.2705078125, 98.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 2.0, 5.0, 5.0, 12.0, 6.0, 15.0, 14.0, 24.0, 26.0, 35.0, 50.0, 75.0, 96.0, 138.0, 205.0, 310.0, 523.0, 1063.0, 3121.0, 23556.0, 985493.0, 27788.0, 3314.0, 1097.0, 566.0, 306.0, 197.0, 148.0, 97.0, 78.0, 47.0, 26.0, 23.0, 27.0, 14.0, 10.0, 11.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.84375, -49.3271484375, -47.810546875, -46.2939453125, -44.77734375, -43.2607421875, -41.744140625, -40.2275390625, -38.7109375, -37.1943359375, -35.677734375, -34.1611328125, -32.64453125, -31.1279296875, -29.611328125, -28.0947265625, -26.578125, -25.0615234375, -23.544921875, -22.0283203125, -20.51171875, -18.9951171875, -17.478515625, -15.9619140625, -14.4453125, -12.9287109375, -11.412109375, -9.8955078125, -8.37890625, -6.8623046875, -5.345703125, -3.8291015625, -2.3125, -0.7958984375, 0.720703125, 2.2373046875, 3.75390625, 5.2705078125, 6.787109375, 8.3037109375, 9.8203125, 11.3369140625, 12.853515625, 14.3701171875, 15.88671875, 17.4033203125, 18.919921875, 20.4365234375, 21.953125, 23.4697265625, 24.986328125, 26.5029296875, 28.01953125, 29.5361328125, 31.052734375, 32.5693359375, 34.0859375, 35.6025390625, 37.119140625, 38.6357421875, 40.15234375, 41.6689453125, 43.185546875, 44.7021484375, 46.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 2.0, 3.0, 4.0, 9.0, 12.0, 23.0, 41.0, 47.0, 75.0, 124.0, 257.0, 150.0, 74.0, 51.0, 32.0, 23.0, 14.0, 13.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008209228515625, -0.007932066917419434, -0.007654905319213867, -0.007377743721008301, -0.007100582122802734, -0.006823420524597168, -0.0065462589263916016, -0.006269097328186035, -0.005991935729980469, -0.005714774131774902, -0.005437612533569336, -0.0051604509353637695, -0.004883289337158203, -0.004606127738952637, -0.00432896614074707, -0.004051804542541504, -0.0037746429443359375, -0.003497481346130371, -0.0032203197479248047, -0.0029431581497192383, -0.002665996551513672, -0.0023888349533081055, -0.002111673355102539, -0.0018345117568969727, -0.0015573501586914062, -0.0012801885604858398, -0.0010030269622802734, -0.000725865364074707, -0.0004487037658691406, -0.00017154216766357422, 0.00010561943054199219, 0.0003827810287475586, 0.000659942626953125, 0.0009371042251586914, 0.0012142658233642578, 0.0014914274215698242, 0.0017685890197753906, 0.002045750617980957, 0.0023229122161865234, 0.00260007381439209, 0.0028772354125976562, 0.0031543970108032227, 0.003431558609008789, 0.0037087202072143555, 0.003985881805419922, 0.004263043403625488, 0.004540205001831055, 0.004817366600036621, 0.0050945281982421875, 0.005371689796447754, 0.00564885139465332, 0.005926012992858887, 0.006203174591064453, 0.0064803361892700195, 0.006757497787475586, 0.007034659385681152, 0.007311820983886719, 0.007588982582092285, 0.007866144180297852, 0.008143305778503418, 0.008420467376708984, 0.00869762897491455, 0.008974790573120117, 0.009251952171325684, 0.00952911376953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 9.0, 7.0, 11.0, 11.0, 7.0, 14.0, 17.0, 34.0, 34.0, 69.0, 79.0, 106.0, 145.0, 207.0, 330.0, 403.0, 586.0, 855.0, 1199.0, 1746.0, 2423.0, 3593.0, 6543.0, 34229.0, 857977.0, 114131.0, 10087.0, 4229.0, 2767.0, 1996.0, 1345.0, 982.0, 706.0, 461.0, 323.0, 250.0, 170.0, 124.0, 89.0, 60.0, 54.0, 32.0, 33.0, 24.0, 17.0, 14.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 4.0], "bins": [-41.28125, -40.12451171875, -38.9677734375, -37.81103515625, -36.654296875, -35.49755859375, -34.3408203125, -33.18408203125, -32.02734375, -30.87060546875, -29.7138671875, -28.55712890625, -27.400390625, -26.24365234375, -25.0869140625, -23.93017578125, -22.7734375, -21.61669921875, -20.4599609375, -19.30322265625, -18.146484375, -16.98974609375, -15.8330078125, -14.67626953125, -13.51953125, -12.36279296875, -11.2060546875, -10.04931640625, -8.892578125, -7.73583984375, -6.5791015625, -5.42236328125, -4.265625, -3.10888671875, -1.9521484375, -0.79541015625, 0.361328125, 1.51806640625, 2.6748046875, 3.83154296875, 4.98828125, 6.14501953125, 7.3017578125, 8.45849609375, 9.615234375, 10.77197265625, 11.9287109375, 13.08544921875, 14.2421875, 15.39892578125, 16.5556640625, 17.71240234375, 18.869140625, 20.02587890625, 21.1826171875, 22.33935546875, 23.49609375, 24.65283203125, 25.8095703125, 26.96630859375, 28.123046875, 29.27978515625, 30.4365234375, 31.59326171875, 32.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 18.0, 44.0, 167.0, 367.0, 242.0, 85.0, 29.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.78125, -11.45166015625, -11.1220703125, -10.79248046875, -10.462890625, -10.13330078125, -9.8037109375, -9.47412109375, -9.14453125, -8.81494140625, -8.4853515625, -8.15576171875, -7.826171875, -7.49658203125, -7.1669921875, -6.83740234375, -6.5078125, -6.17822265625, -5.8486328125, -5.51904296875, -5.189453125, -4.85986328125, -4.5302734375, -4.20068359375, -3.87109375, -3.54150390625, -3.2119140625, -2.88232421875, -2.552734375, -2.22314453125, -1.8935546875, -1.56396484375, -1.234375, -0.90478515625, -0.5751953125, -0.24560546875, 0.083984375, 0.41357421875, 0.7431640625, 1.07275390625, 1.40234375, 1.73193359375, 2.0615234375, 2.39111328125, 2.720703125, 3.05029296875, 3.3798828125, 3.70947265625, 4.0390625, 4.36865234375, 4.6982421875, 5.02783203125, 5.357421875, 5.68701171875, 6.0166015625, 6.34619140625, 6.67578125, 7.00537109375, 7.3349609375, 7.66455078125, 7.994140625, 8.32373046875, 8.6533203125, 8.98291015625, 9.3125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 5.0, 7.0, 15.0, 15.0, 20.0, 25.0, 22.0, 49.0, 37.0, 72.0, 83.0, 110.0, 112.0, 93.0, 65.0, 67.0, 37.0, 35.0, 27.0, 19.0, 14.0, 8.0, 11.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-91.28695678710938, -88.04277801513672, -84.79859924316406, -81.5544204711914, -78.31024169921875, -75.06607055664062, -71.82189178466797, -68.57771301269531, -65.33353424072266, -62.08935546875, -58.845176696777344, -55.60100173950195, -52.3568229675293, -49.11264419555664, -45.86846923828125, -42.624290466308594, -39.38011169433594, -36.13593292236328, -32.891754150390625, -29.647579193115234, -26.403400421142578, -23.159221649169922, -19.9150447845459, -16.670867919921875, -13.426689147949219, -10.182511329650879, -6.938333511352539, -3.694155693054199, -0.4499778747558594, 2.794200897216797, 6.03837776184082, 9.282554626464844, 12.526741027832031, 15.770918846130371, 19.01509666442871, 22.259273529052734, 25.50345230102539, 28.747631072998047, 31.99180793762207, 35.235984802246094, 38.48016357421875, 41.724342346191406, 44.96852111816406, 48.21269607543945, 51.45687484741211, 54.701053619384766, 57.945228576660156, 61.18940734863281, 64.43358612060547, 67.67776489257812, 70.92194366455078, 74.16612243652344, 77.41029357910156, 80.65447998046875, 83.89865112304688, 87.14282989501953, 90.38700866699219, 93.63118743896484, 96.8753662109375, 100.11954498291016, 103.36372375488281, 106.60789489746094, 109.8520736694336, 113.09625244140625, 116.3404312133789]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 5.0, 8.0, 10.0, 13.0, 13.0, 13.0, 24.0, 27.0, 31.0, 29.0, 27.0, 31.0, 37.0, 37.0, 45.0, 49.0, 43.0, 44.0, 36.0, 43.0, 48.0, 30.0, 50.0, 39.0, 32.0, 22.0, 31.0, 30.0, 31.0, 19.0, 22.0, 15.0, 12.0, 6.0, 6.0, 5.0, 4.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-72.8456039428711, -70.57373809814453, -68.30186462402344, -66.02999877929688, -63.75812530517578, -61.48625946044922, -59.21438980102539, -56.94252014160156, -54.670650482177734, -52.398780822753906, -50.12691116333008, -47.85504150390625, -45.58317565917969, -43.311302185058594, -41.03943634033203, -38.7675666809082, -36.495697021484375, -34.22382736206055, -31.95195770263672, -29.680089950561523, -27.408220291137695, -25.136350631713867, -22.864482879638672, -20.592613220214844, -18.320743560791016, -16.048873901367188, -13.777005195617676, -11.505136489868164, -9.233266830444336, -6.961397171020508, -4.689528465270996, -2.4176597595214844, -0.1457977294921875, 2.1260714530944824, 4.397940635681152, 6.669809818267822, 8.941679000854492, 11.21354866027832, 13.485417366027832, 15.757286071777344, 18.029155731201172, 20.301025390625, 22.572895050048828, 24.844762802124023, 27.11663246154785, 29.38850212097168, 31.660369873046875, 33.9322395324707, 36.20410919189453, 38.47597885131836, 40.74784851074219, 43.019718170166016, 45.291587829589844, 47.563453674316406, 49.835323333740234, 52.10719299316406, 54.37906265258789, 56.65093231201172, 58.92280197143555, 61.194671630859375, 63.46653747558594, 65.73841094970703, 68.0102767944336, 70.28215026855469, 72.55401611328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 12.0, 17.0, 12.0, 16.0, 45.0, 57.0, 60.0, 74.0, 107.0, 174.0, 220.0, 307.0, 387.0, 561.0, 720.0, 1052.0, 1650.0, 2321.0, 3428.0, 5235.0, 8205.0, 13795.0, 24568.0, 46528.0, 94904.0, 197038.0, 299615.0, 168472.0, 81753.0, 40703.0, 21725.0, 12154.0, 7455.0, 4795.0, 3154.0, 2101.0, 1442.0, 1046.0, 760.0, 520.0, 364.0, 255.0, 218.0, 144.0, 113.0, 81.0, 60.0, 39.0, 26.0, 27.0, 19.0, 5.0, 8.0, 4.0, 6.0, 4.0, 0.0, 2.0], "bins": [-102.5625, -99.396484375, -96.23046875, -93.064453125, -89.8984375, -86.732421875, -83.56640625, -80.400390625, -77.234375, -74.068359375, -70.90234375, -67.736328125, -64.5703125, -61.404296875, -58.23828125, -55.072265625, -51.90625, -48.740234375, -45.57421875, -42.408203125, -39.2421875, -36.076171875, -32.91015625, -29.744140625, -26.578125, -23.412109375, -20.24609375, -17.080078125, -13.9140625, -10.748046875, -7.58203125, -4.416015625, -1.25, 1.916015625, 5.08203125, 8.248046875, 11.4140625, 14.580078125, 17.74609375, 20.912109375, 24.078125, 27.244140625, 30.41015625, 33.576171875, 36.7421875, 39.908203125, 43.07421875, 46.240234375, 49.40625, 52.572265625, 55.73828125, 58.904296875, 62.0703125, 65.236328125, 68.40234375, 71.568359375, 74.734375, 77.900390625, 81.06640625, 84.232421875, 87.3984375, 90.564453125, 93.73046875, 96.896484375, 100.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 12.0, 9.0, 5.0, 14.0, 11.0, 20.0, 16.0, 25.0, 23.0, 32.0, 35.0, 27.0, 40.0, 47.0, 40.0, 65.0, 46.0, 45.0, 49.0, 40.0, 46.0, 46.0, 45.0, 41.0, 30.0, 20.0, 33.0, 31.0, 15.0, 19.0, 11.0, 12.0, 9.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.375, -73.0029296875, -70.630859375, -68.2587890625, -65.88671875, -63.5146484375, -61.142578125, -58.7705078125, -56.3984375, -54.0263671875, -51.654296875, -49.2822265625, -46.91015625, -44.5380859375, -42.166015625, -39.7939453125, -37.421875, -35.0498046875, -32.677734375, -30.3056640625, -27.93359375, -25.5615234375, -23.189453125, -20.8173828125, -18.4453125, -16.0732421875, -13.701171875, -11.3291015625, -8.95703125, -6.5849609375, -4.212890625, -1.8408203125, 0.53125, 2.9033203125, 5.275390625, 7.6474609375, 10.01953125, 12.3916015625, 14.763671875, 17.1357421875, 19.5078125, 21.8798828125, 24.251953125, 26.6240234375, 28.99609375, 31.3681640625, 33.740234375, 36.1123046875, 38.484375, 40.8564453125, 43.228515625, 45.6005859375, 47.97265625, 50.3447265625, 52.716796875, 55.0888671875, 57.4609375, 59.8330078125, 62.205078125, 64.5771484375, 66.94921875, 69.3212890625, 71.693359375, 74.0654296875, 76.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 16.0, 15.0, 23.0, 34.0, 41.0, 67.0, 101.0, 136.0, 199.0, 271.0, 390.0, 559.0, 877.0, 1241.0, 1888.0, 2949.0, 4544.0, 7184.0, 11756.0, 19451.0, 33787.0, 60047.0, 113745.0, 211251.0, 249728.0, 146605.0, 76940.0, 42174.0, 23823.0, 14193.0, 8636.0, 5484.0, 3411.0, 2258.0, 1544.0, 971.0, 670.0, 484.0, 323.0, 231.0, 154.0, 105.0, 68.0, 48.0, 49.0, 25.0, 25.0, 8.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-109.125, -105.626953125, -102.12890625, -98.630859375, -95.1328125, -91.634765625, -88.13671875, -84.638671875, -81.140625, -77.642578125, -74.14453125, -70.646484375, -67.1484375, -63.650390625, -60.15234375, -56.654296875, -53.15625, -49.658203125, -46.16015625, -42.662109375, -39.1640625, -35.666015625, -32.16796875, -28.669921875, -25.171875, -21.673828125, -18.17578125, -14.677734375, -11.1796875, -7.681640625, -4.18359375, -0.685546875, 2.8125, 6.310546875, 9.80859375, 13.306640625, 16.8046875, 20.302734375, 23.80078125, 27.298828125, 30.796875, 34.294921875, 37.79296875, 41.291015625, 44.7890625, 48.287109375, 51.78515625, 55.283203125, 58.78125, 62.279296875, 65.77734375, 69.275390625, 72.7734375, 76.271484375, 79.76953125, 83.267578125, 86.765625, 90.263671875, 93.76171875, 97.259765625, 100.7578125, 104.255859375, 107.75390625, 111.251953125, 114.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 13.0, 6.0, 11.0, 11.0, 15.0, 11.0, 22.0, 27.0, 29.0, 29.0, 20.0, 36.0, 32.0, 39.0, 34.0, 51.0, 40.0, 44.0, 52.0, 31.0, 45.0, 49.0, 47.0, 42.0, 31.0, 27.0, 26.0, 23.0, 20.0, 21.0, 18.0, 13.0, 14.0, 7.0, 6.0, 11.0, 8.0, 7.0, 4.0, 6.0, 6.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-47.875, -46.46728515625, -45.0595703125, -43.65185546875, -42.244140625, -40.83642578125, -39.4287109375, -38.02099609375, -36.61328125, -35.20556640625, -33.7978515625, -32.39013671875, -30.982421875, -29.57470703125, -28.1669921875, -26.75927734375, -25.3515625, -23.94384765625, -22.5361328125, -21.12841796875, -19.720703125, -18.31298828125, -16.9052734375, -15.49755859375, -14.08984375, -12.68212890625, -11.2744140625, -9.86669921875, -8.458984375, -7.05126953125, -5.6435546875, -4.23583984375, -2.828125, -1.42041015625, -0.0126953125, 1.39501953125, 2.802734375, 4.21044921875, 5.6181640625, 7.02587890625, 8.43359375, 9.84130859375, 11.2490234375, 12.65673828125, 14.064453125, 15.47216796875, 16.8798828125, 18.28759765625, 19.6953125, 21.10302734375, 22.5107421875, 23.91845703125, 25.326171875, 26.73388671875, 28.1416015625, 29.54931640625, 30.95703125, 32.36474609375, 33.7724609375, 35.18017578125, 36.587890625, 37.99560546875, 39.4033203125, 40.81103515625, 42.21875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 9.0, 20.0, 18.0, 40.0, 41.0, 77.0, 79.0, 129.0, 178.0, 243.0, 324.0, 547.0, 855.0, 1118.0, 1674.0, 2496.0, 3813.0, 5671.0, 8954.0, 14596.0, 25014.0, 46461.0, 99405.0, 271165.0, 324018.0, 116227.0, 52997.0, 27832.0, 15975.0, 9834.0, 6291.0, 3961.0, 2738.0, 1715.0, 1267.0, 843.0, 567.0, 391.0, 294.0, 178.0, 132.0, 100.0, 74.0, 51.0, 31.0, 24.0, 11.0, 14.0, 10.0, 9.0, 4.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-27.28125, -26.40380859375, -25.5263671875, -24.64892578125, -23.771484375, -22.89404296875, -22.0166015625, -21.13916015625, -20.26171875, -19.38427734375, -18.5068359375, -17.62939453125, -16.751953125, -15.87451171875, -14.9970703125, -14.11962890625, -13.2421875, -12.36474609375, -11.4873046875, -10.60986328125, -9.732421875, -8.85498046875, -7.9775390625, -7.10009765625, -6.22265625, -5.34521484375, -4.4677734375, -3.59033203125, -2.712890625, -1.83544921875, -0.9580078125, -0.08056640625, 0.796875, 1.67431640625, 2.5517578125, 3.42919921875, 4.306640625, 5.18408203125, 6.0615234375, 6.93896484375, 7.81640625, 8.69384765625, 9.5712890625, 10.44873046875, 11.326171875, 12.20361328125, 13.0810546875, 13.95849609375, 14.8359375, 15.71337890625, 16.5908203125, 17.46826171875, 18.345703125, 19.22314453125, 20.1005859375, 20.97802734375, 21.85546875, 22.73291015625, 23.6103515625, 24.48779296875, 25.365234375, 26.24267578125, 27.1201171875, 27.99755859375, 28.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 8.0, 8.0, 10.0, 15.0, 24.0, 23.0, 35.0, 38.0, 47.0, 98.0, 123.0, 143.0, 110.0, 82.0, 52.0, 29.0, 25.0, 21.0, 20.0, 21.0, 9.0, 8.0, 4.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003299713134765625, -0.0031915903091430664, -0.003083467483520508, -0.0029753446578979492, -0.0028672218322753906, -0.002759099006652832, -0.0026509761810302734, -0.002542853355407715, -0.0024347305297851562, -0.0023266077041625977, -0.002218484878540039, -0.0021103620529174805, -0.002002239227294922, -0.0018941164016723633, -0.0017859935760498047, -0.001677870750427246, -0.0015697479248046875, -0.001461625099182129, -0.0013535022735595703, -0.0012453794479370117, -0.0011372566223144531, -0.0010291337966918945, -0.0009210109710693359, -0.0008128881454467773, -0.0007047653198242188, -0.0005966424942016602, -0.0004885196685791016, -0.00038039684295654297, -0.0002722740173339844, -0.00016415119171142578, -5.602836608886719e-05, 5.2094459533691406e-05, 0.00016021728515625, 0.0002683401107788086, 0.0003764629364013672, 0.0004845857620239258, 0.0005927085876464844, 0.000700831413269043, 0.0008089542388916016, 0.0009170770645141602, 0.0010251998901367188, 0.0011333227157592773, 0.001241445541381836, 0.0013495683670043945, 0.0014576911926269531, 0.0015658140182495117, 0.0016739368438720703, 0.001782059669494629, 0.0018901824951171875, 0.001998305320739746, 0.0021064281463623047, 0.0022145509719848633, 0.002322673797607422, 0.0024307966232299805, 0.002538919448852539, 0.0026470422744750977, 0.0027551651000976562, 0.002863287925720215, 0.0029714107513427734, 0.003079533576965332, 0.0031876564025878906, 0.0032957792282104492, 0.003403902053833008, 0.0035120248794555664, 0.003620147705078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 3.0, 9.0, 7.0, 14.0, 24.0, 36.0, 44.0, 70.0, 94.0, 131.0, 180.0, 272.0, 357.0, 562.0, 782.0, 1032.0, 1514.0, 2173.0, 3234.0, 4971.0, 7552.0, 12484.0, 21635.0, 41535.0, 90180.0, 236375.0, 350754.0, 139604.0, 58968.0, 29456.0, 16032.0, 9657.0, 5995.0, 4087.0, 2716.0, 1796.0, 1276.0, 872.0, 619.0, 424.0, 315.0, 206.0, 154.0, 107.0, 68.0, 62.0, 38.0, 28.0, 19.0, 9.0, 14.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.890625, -28.021484375, -27.15234375, -26.283203125, -25.4140625, -24.544921875, -23.67578125, -22.806640625, -21.9375, -21.068359375, -20.19921875, -19.330078125, -18.4609375, -17.591796875, -16.72265625, -15.853515625, -14.984375, -14.115234375, -13.24609375, -12.376953125, -11.5078125, -10.638671875, -9.76953125, -8.900390625, -8.03125, -7.162109375, -6.29296875, -5.423828125, -4.5546875, -3.685546875, -2.81640625, -1.947265625, -1.078125, -0.208984375, 0.66015625, 1.529296875, 2.3984375, 3.267578125, 4.13671875, 5.005859375, 5.875, 6.744140625, 7.61328125, 8.482421875, 9.3515625, 10.220703125, 11.08984375, 11.958984375, 12.828125, 13.697265625, 14.56640625, 15.435546875, 16.3046875, 17.173828125, 18.04296875, 18.912109375, 19.78125, 20.650390625, 21.51953125, 22.388671875, 23.2578125, 24.126953125, 24.99609375, 25.865234375, 26.734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 5.0, 12.0, 16.0, 18.0, 17.0, 27.0, 45.0, 38.0, 46.0, 69.0, 87.0, 90.0, 84.0, 74.0, 58.0, 52.0, 49.0, 45.0, 18.0, 18.0, 17.0, 14.0, 10.0, 11.0, 6.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.4375, -9.15966796875, -8.8818359375, -8.60400390625, -8.326171875, -8.04833984375, -7.7705078125, -7.49267578125, -7.21484375, -6.93701171875, -6.6591796875, -6.38134765625, -6.103515625, -5.82568359375, -5.5478515625, -5.27001953125, -4.9921875, -4.71435546875, -4.4365234375, -4.15869140625, -3.880859375, -3.60302734375, -3.3251953125, -3.04736328125, -2.76953125, -2.49169921875, -2.2138671875, -1.93603515625, -1.658203125, -1.38037109375, -1.1025390625, -0.82470703125, -0.546875, -0.26904296875, 0.0087890625, 0.28662109375, 0.564453125, 0.84228515625, 1.1201171875, 1.39794921875, 1.67578125, 1.95361328125, 2.2314453125, 2.50927734375, 2.787109375, 3.06494140625, 3.3427734375, 3.62060546875, 3.8984375, 4.17626953125, 4.4541015625, 4.73193359375, 5.009765625, 5.28759765625, 5.5654296875, 5.84326171875, 6.12109375, 6.39892578125, 6.6767578125, 6.95458984375, 7.232421875, 7.51025390625, 7.7880859375, 8.06591796875, 8.34375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 13.0, 11.0, 14.0, 21.0, 27.0, 35.0, 54.0, 72.0, 92.0, 104.0, 114.0, 97.0, 70.0, 63.0, 40.0, 33.0, 32.0, 20.0, 9.0, 14.0, 10.0, 8.0, 4.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.12782287597656, -90.66825103759766, -87.20867919921875, -83.74910736083984, -80.28953552246094, -76.82996368408203, -73.37039184570312, -69.91082000732422, -66.45124816894531, -62.991676330566406, -59.5321044921875, -56.072532653808594, -52.61296081542969, -49.15338897705078, -45.693817138671875, -42.23424530029297, -38.7746696472168, -35.31509780883789, -31.855525970458984, -28.395954132080078, -24.936382293701172, -21.476808547973633, -18.017236709594727, -14.55766487121582, -11.098093032836914, -7.638521194458008, -4.178948879241943, -0.7193765640258789, 2.7401952743530273, 6.19976806640625, 9.659339904785156, 13.118911743164062, 16.57848358154297, 20.038055419921875, 23.49762725830078, 26.957199096679688, 30.416770935058594, 33.8763427734375, 37.335914611816406, 40.79548645019531, 44.25505828857422, 47.714630126953125, 51.17420196533203, 54.63377380371094, 58.093345642089844, 61.55291748046875, 65.01248931884766, 68.47206115722656, 71.931640625, 75.3912124633789, 78.85078430175781, 82.31035614013672, 85.76992797851562, 89.22949981689453, 92.68907165527344, 96.14864349365234, 99.60821533203125, 103.06778717041016, 106.52735900878906, 109.98693084716797, 113.44650268554688, 116.90607452392578, 120.36564636230469, 123.8252182006836, 127.2847900390625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 11.0, 8.0, 9.0, 11.0, 6.0, 12.0, 9.0, 11.0, 19.0, 24.0, 21.0, 27.0, 36.0, 39.0, 40.0, 26.0, 37.0, 45.0, 42.0, 35.0, 38.0, 39.0, 48.0, 33.0, 40.0, 29.0, 34.0, 29.0, 34.0, 27.0, 23.0, 19.0, 24.0, 15.0, 19.0, 14.0, 11.0, 5.0, 13.0, 6.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-65.30443572998047, -63.186561584472656, -61.068687438964844, -58.9508171081543, -56.832942962646484, -54.71506881713867, -52.597198486328125, -50.47932434082031, -48.3614501953125, -46.24357604980469, -44.125701904296875, -42.00783157348633, -39.889957427978516, -37.7720832824707, -35.654212951660156, -33.536338806152344, -31.41846466064453, -29.30059051513672, -27.18271827697754, -25.06484603881836, -22.946971893310547, -20.829097747802734, -18.711225509643555, -16.593353271484375, -14.475479125976562, -12.357605934143066, -10.23973274230957, -8.121859550476074, -6.003986358642578, -3.886113166809082, -1.768239974975586, 0.34963321685791016, 2.4675140380859375, 4.585387229919434, 6.70326042175293, 8.821133613586426, 10.939006805419922, 13.056879997253418, 15.174753189086914, 17.292625427246094, 19.410499572753906, 21.52837371826172, 23.6462459564209, 25.764118194580078, 27.88199234008789, 29.999866485595703, 32.11773681640625, 34.23561096191406, 36.353485107421875, 38.47135925292969, 40.5892333984375, 42.70710372924805, 44.82497787475586, 46.94285202026367, 49.06072235107422, 51.17859649658203, 53.296470642089844, 55.414344787597656, 57.53221893310547, 59.650089263916016, 61.76796340942383, 63.88583755493164, 66.00370788574219, 68.12158203125, 70.23945617675781]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 3.0, 17.0, 21.0, 12.0, 36.0, 43.0, 63.0, 73.0, 113.0, 164.0, 233.0, 357.0, 489.0, 767.0, 1070.0, 1631.0, 2544.0, 3880.0, 6081.0, 10112.0, 18614.0, 45417.0, 161411.0, 749467.0, 2216903.0, 734247.0, 153075.0, 41293.0, 18124.0, 10063.0, 6150.0, 3793.0, 2489.0, 1710.0, 1181.0, 771.0, 549.0, 351.0, 295.0, 201.0, 142.0, 88.0, 71.0, 49.0, 37.0, 23.0, 18.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-120.0625, -116.4775390625, -112.892578125, -109.3076171875, -105.72265625, -102.1376953125, -98.552734375, -94.9677734375, -91.3828125, -87.7978515625, -84.212890625, -80.6279296875, -77.04296875, -73.4580078125, -69.873046875, -66.2880859375, -62.703125, -59.1181640625, -55.533203125, -51.9482421875, -48.36328125, -44.7783203125, -41.193359375, -37.6083984375, -34.0234375, -30.4384765625, -26.853515625, -23.2685546875, -19.68359375, -16.0986328125, -12.513671875, -8.9287109375, -5.34375, -1.7587890625, 1.826171875, 5.4111328125, 8.99609375, 12.5810546875, 16.166015625, 19.7509765625, 23.3359375, 26.9208984375, 30.505859375, 34.0908203125, 37.67578125, 41.2607421875, 44.845703125, 48.4306640625, 52.015625, 55.6005859375, 59.185546875, 62.7705078125, 66.35546875, 69.9404296875, 73.525390625, 77.1103515625, 80.6953125, 84.2802734375, 87.865234375, 91.4501953125, 95.03515625, 98.6201171875, 102.205078125, 105.7900390625, 109.375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 9.0, 9.0, 9.0, 9.0, 11.0, 15.0, 20.0, 27.0, 21.0, 40.0, 36.0, 28.0, 41.0, 37.0, 55.0, 46.0, 57.0, 43.0, 54.0, 42.0, 32.0, 35.0, 39.0, 24.0, 35.0, 35.0, 31.0, 20.0, 17.0, 18.0, 11.0, 14.0, 13.0, 10.0, 6.0, 9.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.4375, -59.421875, -57.40625, -55.390625, -53.375, -51.359375, -49.34375, -47.328125, -45.3125, -43.296875, -41.28125, -39.265625, -37.25, -35.234375, -33.21875, -31.203125, -29.1875, -27.171875, -25.15625, -23.140625, -21.125, -19.109375, -17.09375, -15.078125, -13.0625, -11.046875, -9.03125, -7.015625, -5.0, -2.984375, -0.96875, 1.046875, 3.0625, 5.078125, 7.09375, 9.109375, 11.125, 13.140625, 15.15625, 17.171875, 19.1875, 21.203125, 23.21875, 25.234375, 27.25, 29.265625, 31.28125, 33.296875, 35.3125, 37.328125, 39.34375, 41.359375, 43.375, 45.390625, 47.40625, 49.421875, 51.4375, 53.453125, 55.46875, 57.484375, 59.5, 61.515625, 63.53125, 65.546875, 67.5625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 6.0, 6.0, 11.0, 12.0, 15.0, 26.0, 35.0, 53.0, 86.0, 84.0, 153.0, 167.0, 296.0, 392.0, 575.0, 796.0, 1136.0, 1634.0, 2451.0, 3782.0, 5765.0, 9065.0, 15447.0, 27695.0, 55778.0, 144545.0, 592342.0, 2443917.0, 613597.0, 147094.0, 56999.0, 27776.0, 15623.0, 9236.0, 5954.0, 3765.0, 2586.0, 1632.0, 1130.0, 787.0, 527.0, 390.0, 258.0, 172.0, 139.0, 106.0, 60.0, 56.0, 37.0, 36.0, 11.0, 21.0, 14.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-118.6875, -114.5244140625, -110.361328125, -106.1982421875, -102.03515625, -97.8720703125, -93.708984375, -89.5458984375, -85.3828125, -81.2197265625, -77.056640625, -72.8935546875, -68.73046875, -64.5673828125, -60.404296875, -56.2412109375, -52.078125, -47.9150390625, -43.751953125, -39.5888671875, -35.42578125, -31.2626953125, -27.099609375, -22.9365234375, -18.7734375, -14.6103515625, -10.447265625, -6.2841796875, -2.12109375, 2.0419921875, 6.205078125, 10.3681640625, 14.53125, 18.6943359375, 22.857421875, 27.0205078125, 31.18359375, 35.3466796875, 39.509765625, 43.6728515625, 47.8359375, 51.9990234375, 56.162109375, 60.3251953125, 64.48828125, 68.6513671875, 72.814453125, 76.9775390625, 81.140625, 85.3037109375, 89.466796875, 93.6298828125, 97.79296875, 101.9560546875, 106.119140625, 110.2822265625, 114.4453125, 118.6083984375, 122.771484375, 126.9345703125, 131.09765625, 135.2607421875, 139.423828125, 143.5869140625, 147.75]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 9.0, 8.0, 13.0, 11.0, 21.0, 27.0, 23.0, 27.0, 38.0, 56.0, 74.0, 92.0, 154.0, 241.0, 329.0, 524.0, 692.0, 564.0, 355.0, 253.0, 145.0, 96.0, 64.0, 49.0, 35.0, 39.0, 28.0, 13.0, 7.0, 12.0, 11.0, 14.0, 6.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.40625, -35.17578125, -33.9453125, -32.71484375, -31.484375, -30.25390625, -29.0234375, -27.79296875, -26.5625, -25.33203125, -24.1015625, -22.87109375, -21.640625, -20.41015625, -19.1796875, -17.94921875, -16.71875, -15.48828125, -14.2578125, -13.02734375, -11.796875, -10.56640625, -9.3359375, -8.10546875, -6.875, -5.64453125, -4.4140625, -3.18359375, -1.953125, -0.72265625, 0.5078125, 1.73828125, 2.96875, 4.19921875, 5.4296875, 6.66015625, 7.890625, 9.12109375, 10.3515625, 11.58203125, 12.8125, 14.04296875, 15.2734375, 16.50390625, 17.734375, 18.96484375, 20.1953125, 21.42578125, 22.65625, 23.88671875, 25.1171875, 26.34765625, 27.578125, 28.80859375, 30.0390625, 31.26953125, 32.5, 33.73046875, 34.9609375, 36.19140625, 37.421875, 38.65234375, 39.8828125, 41.11328125, 42.34375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 10.0, 8.0, 8.0, 12.0, 22.0, 19.0, 29.0, 29.0, 36.0, 61.0, 70.0, 82.0, 103.0, 102.0, 77.0, 63.0, 53.0, 35.0, 27.0, 36.0, 20.0, 10.0, 10.0, 12.0, 12.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.34141540527344, -89.34625244140625, -86.35108947753906, -83.35592651367188, -80.36076354980469, -77.36560821533203, -74.37044525146484, -71.37528228759766, -68.38011932373047, -65.38495635986328, -62.389793395996094, -59.39463424682617, -56.399471282958984, -53.4043083190918, -50.409149169921875, -47.41398620605469, -44.4188232421875, -41.42366027832031, -38.428497314453125, -35.4333381652832, -32.438175201416016, -29.443012237548828, -26.447851181030273, -23.45269012451172, -20.45752716064453, -17.462364196777344, -14.467203140258789, -11.472041130065918, -8.476879119873047, -5.481717109680176, -2.4865550994873047, 0.50860595703125, 3.5037689208984375, 6.498930931091309, 9.49409294128418, 12.48925495147705, 15.484416961669922, 18.47957992553711, 21.474740982055664, 24.46990203857422, 27.465065002441406, 30.460227966308594, 33.45539093017578, 36.4505500793457, 39.44571304321289, 42.44087600708008, 45.43603515625, 48.43119812011719, 51.426361083984375, 54.42152404785156, 57.41668701171875, 60.41184616088867, 63.40700912475586, 66.40216827392578, 69.39733123779297, 72.39249420166016, 75.38765716552734, 78.38282012939453, 81.37798309326172, 84.3731460571289, 87.36830139160156, 90.36346435546875, 93.35862731933594, 96.35379028320312, 99.34895324707031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 3.0, 7.0, 14.0, 13.0, 7.0, 11.0, 11.0, 13.0, 10.0, 25.0, 23.0, 35.0, 29.0, 22.0, 41.0, 45.0, 42.0, 39.0, 55.0, 40.0, 37.0, 40.0, 35.0, 44.0, 34.0, 38.0, 30.0, 38.0, 33.0, 28.0, 19.0, 19.0, 19.0, 18.0, 13.0, 11.0, 8.0, 12.0, 7.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-76.96728515625, -74.66474914550781, -72.36222076416016, -70.05968475341797, -67.75715637207031, -65.45462036132812, -63.15208435058594, -60.849552154541016, -58.547019958496094, -56.24448776245117, -53.94195556640625, -51.63941955566406, -49.33688735961914, -47.03435516357422, -44.73181915283203, -42.42928695678711, -40.12675476074219, -37.824222564697266, -35.521690368652344, -33.219154357910156, -30.916622161865234, -28.614089965820312, -26.311555862426758, -24.009021759033203, -21.70648956298828, -19.40395736694336, -17.101423263549805, -14.798890113830566, -12.496356964111328, -10.19382381439209, -7.891290664672852, -5.588756561279297, -3.2862319946289062, -0.983698844909668, 1.3188343048095703, 3.6213674545288086, 5.923900604248047, 8.226433753967285, 10.528966903686523, 12.831501007080078, 15.134033203125, 17.436565399169922, 19.739099502563477, 22.04163360595703, 24.344165802001953, 26.646697998046875, 28.94923210144043, 31.251766204833984, 33.554298400878906, 35.85683059692383, 38.15936279296875, 40.46189880371094, 42.76443099975586, 45.06696319580078, 47.36949920654297, 49.67203140258789, 51.97456359863281, 54.277095794677734, 56.579627990722656, 58.882164001464844, 61.184696197509766, 63.48722839355469, 65.78976440429688, 68.09230041503906, 70.39482879638672]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 3.0, 8.0, 11.0, 13.0, 24.0, 21.0, 43.0, 40.0, 83.0, 136.0, 185.0, 232.0, 332.0, 467.0, 690.0, 1081.0, 1592.0, 2219.0, 3195.0, 4603.0, 6663.0, 9962.0, 15354.0, 24012.0, 38506.0, 67407.0, 121743.0, 207951.0, 219141.0, 132586.0, 73632.0, 41731.0, 24984.0, 16176.0, 10742.0, 7151.0, 4883.0, 3388.0, 2266.0, 1664.0, 1102.0, 753.0, 535.0, 387.0, 275.0, 197.0, 110.0, 96.0, 54.0, 53.0, 31.0, 20.0, 12.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-42.9375, -41.5556640625, -40.173828125, -38.7919921875, -37.41015625, -36.0283203125, -34.646484375, -33.2646484375, -31.8828125, -30.5009765625, -29.119140625, -27.7373046875, -26.35546875, -24.9736328125, -23.591796875, -22.2099609375, -20.828125, -19.4462890625, -18.064453125, -16.6826171875, -15.30078125, -13.9189453125, -12.537109375, -11.1552734375, -9.7734375, -8.3916015625, -7.009765625, -5.6279296875, -4.24609375, -2.8642578125, -1.482421875, -0.1005859375, 1.28125, 2.6630859375, 4.044921875, 5.4267578125, 6.80859375, 8.1904296875, 9.572265625, 10.9541015625, 12.3359375, 13.7177734375, 15.099609375, 16.4814453125, 17.86328125, 19.2451171875, 20.626953125, 22.0087890625, 23.390625, 24.7724609375, 26.154296875, 27.5361328125, 28.91796875, 30.2998046875, 31.681640625, 33.0634765625, 34.4453125, 35.8271484375, 37.208984375, 38.5908203125, 39.97265625, 41.3544921875, 42.736328125, 44.1181640625, 45.5]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 13.0, 8.0, 8.0, 6.0, 9.0, 11.0, 15.0, 6.0, 17.0, 26.0, 25.0, 24.0, 30.0, 31.0, 34.0, 39.0, 43.0, 46.0, 40.0, 48.0, 44.0, 44.0, 47.0, 38.0, 34.0, 39.0, 25.0, 33.0, 28.0, 24.0, 22.0, 14.0, 17.0, 14.0, 17.0, 11.0, 9.0, 7.0, 13.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-62.96875, -61.078125, -59.1875, -57.296875, -55.40625, -53.515625, -51.625, -49.734375, -47.84375, -45.953125, -44.0625, -42.171875, -40.28125, -38.390625, -36.5, -34.609375, -32.71875, -30.828125, -28.9375, -27.046875, -25.15625, -23.265625, -21.375, -19.484375, -17.59375, -15.703125, -13.8125, -11.921875, -10.03125, -8.140625, -6.25, -4.359375, -2.46875, -0.578125, 1.3125, 3.203125, 5.09375, 6.984375, 8.875, 10.765625, 12.65625, 14.546875, 16.4375, 18.328125, 20.21875, 22.109375, 24.0, 25.890625, 27.78125, 29.671875, 31.5625, 33.453125, 35.34375, 37.234375, 39.125, 41.015625, 42.90625, 44.796875, 46.6875, 48.578125, 50.46875, 52.359375, 54.25, 56.140625, 58.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 6.0, 9.0, 20.0, 17.0, 35.0, 33.0, 49.0, 90.0, 97.0, 157.0, 225.0, 334.0, 458.0, 646.0, 959.0, 1376.0, 2119.0, 3473.0, 5545.0, 9245.0, 18258.0, 62497.0, 778120.0, 113903.0, 22633.0, 10939.0, 6113.0, 3891.0, 2457.0, 1563.0, 1044.0, 679.0, 439.0, 336.0, 228.0, 156.0, 94.0, 84.0, 60.0, 44.0, 27.0, 22.0, 20.0, 10.0, 9.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-120.375, -116.169921875, -111.96484375, -107.759765625, -103.5546875, -99.349609375, -95.14453125, -90.939453125, -86.734375, -82.529296875, -78.32421875, -74.119140625, -69.9140625, -65.708984375, -61.50390625, -57.298828125, -53.09375, -48.888671875, -44.68359375, -40.478515625, -36.2734375, -32.068359375, -27.86328125, -23.658203125, -19.453125, -15.248046875, -11.04296875, -6.837890625, -2.6328125, 1.572265625, 5.77734375, 9.982421875, 14.1875, 18.392578125, 22.59765625, 26.802734375, 31.0078125, 35.212890625, 39.41796875, 43.623046875, 47.828125, 52.033203125, 56.23828125, 60.443359375, 64.6484375, 68.853515625, 73.05859375, 77.263671875, 81.46875, 85.673828125, 89.87890625, 94.083984375, 98.2890625, 102.494140625, 106.69921875, 110.904296875, 115.109375, 119.314453125, 123.51953125, 127.724609375, 131.9296875, 136.134765625, 140.33984375, 144.544921875, 148.75]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 16.0, 10.0, 13.0, 22.0, 22.0, 15.0, 35.0, 31.0, 29.0, 38.0, 35.0, 41.0, 36.0, 36.0, 51.0, 45.0, 42.0, 41.0, 43.0, 35.0, 45.0, 28.0, 38.0, 43.0, 36.0, 23.0, 21.0, 19.0, 22.0, 18.0, 10.0, 13.0, 8.0, 8.0, 9.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-121.375, -118.064453125, -114.75390625, -111.443359375, -108.1328125, -104.822265625, -101.51171875, -98.201171875, -94.890625, -91.580078125, -88.26953125, -84.958984375, -81.6484375, -78.337890625, -75.02734375, -71.716796875, -68.40625, -65.095703125, -61.78515625, -58.474609375, -55.1640625, -51.853515625, -48.54296875, -45.232421875, -41.921875, -38.611328125, -35.30078125, -31.990234375, -28.6796875, -25.369140625, -22.05859375, -18.748046875, -15.4375, -12.126953125, -8.81640625, -5.505859375, -2.1953125, 1.115234375, 4.42578125, 7.736328125, 11.046875, 14.357421875, 17.66796875, 20.978515625, 24.2890625, 27.599609375, 30.91015625, 34.220703125, 37.53125, 40.841796875, 44.15234375, 47.462890625, 50.7734375, 54.083984375, 57.39453125, 60.705078125, 64.015625, 67.326171875, 70.63671875, 73.947265625, 77.2578125, 80.568359375, 83.87890625, 87.189453125, 90.5]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 6.0, 14.0, 15.0, 14.0, 23.0, 32.0, 52.0, 75.0, 106.0, 145.0, 194.0, 344.0, 521.0, 829.0, 1396.0, 2421.0, 4610.0, 9688.0, 29265.0, 394399.0, 550328.0, 32458.0, 10268.0, 4793.0, 2495.0, 1491.0, 909.0, 555.0, 313.0, 228.0, 182.0, 114.0, 89.0, 50.0, 37.0, 25.0, 12.0, 10.0, 15.0, 5.0, 8.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.375, -16.776611328125, -16.17822265625, -15.579833984375, -14.9814453125, -14.383056640625, -13.78466796875, -13.186279296875, -12.587890625, -11.989501953125, -11.39111328125, -10.792724609375, -10.1943359375, -9.595947265625, -8.99755859375, -8.399169921875, -7.80078125, -7.202392578125, -6.60400390625, -6.005615234375, -5.4072265625, -4.808837890625, -4.21044921875, -3.612060546875, -3.013671875, -2.415283203125, -1.81689453125, -1.218505859375, -0.6201171875, -0.021728515625, 0.57666015625, 1.175048828125, 1.7734375, 2.371826171875, 2.97021484375, 3.568603515625, 4.1669921875, 4.765380859375, 5.36376953125, 5.962158203125, 6.560546875, 7.158935546875, 7.75732421875, 8.355712890625, 8.9541015625, 9.552490234375, 10.15087890625, 10.749267578125, 11.34765625, 11.946044921875, 12.54443359375, 13.142822265625, 13.7412109375, 14.339599609375, 14.93798828125, 15.536376953125, 16.134765625, 16.733154296875, 17.33154296875, 17.929931640625, 18.5283203125, 19.126708984375, 19.72509765625, 20.323486328125, 20.921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 11.0, 19.0, 21.0, 43.0, 51.0, 106.0, 167.0, 193.0, 138.0, 80.0, 49.0, 25.0, 20.0, 22.0, 9.0, 11.0, 5.0, 2.0, 6.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0109100341796875, -0.010509371757507324, -0.010108709335327148, -0.009708046913146973, -0.009307384490966797, -0.008906722068786621, -0.008506059646606445, -0.00810539722442627, -0.007704734802246094, -0.007304072380065918, -0.006903409957885742, -0.006502747535705566, -0.006102085113525391, -0.005701422691345215, -0.005300760269165039, -0.004900097846984863, -0.0044994354248046875, -0.004098773002624512, -0.003698110580444336, -0.00329744815826416, -0.0028967857360839844, -0.0024961233139038086, -0.002095460891723633, -0.001694798469543457, -0.0012941360473632812, -0.0008934736251831055, -0.0004928112030029297, -9.21487808227539e-05, 0.0003085136413574219, 0.0007091760635375977, 0.0011098384857177734, 0.0015105009078979492, 0.001911163330078125, 0.0023118257522583008, 0.0027124881744384766, 0.0031131505966186523, 0.003513813018798828, 0.003914475440979004, 0.00431513786315918, 0.0047158002853393555, 0.005116462707519531, 0.005517125129699707, 0.005917787551879883, 0.006318449974060059, 0.006719112396240234, 0.00711977481842041, 0.007520437240600586, 0.007921099662780762, 0.008321762084960938, 0.008722424507141113, 0.009123086929321289, 0.009523749351501465, 0.00992441177368164, 0.010325074195861816, 0.010725736618041992, 0.011126399040222168, 0.011527061462402344, 0.01192772388458252, 0.012328386306762695, 0.012729048728942871, 0.013129711151123047, 0.013530373573303223, 0.013931035995483398, 0.014331698417663574, 0.01473236083984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 2.0, 8.0, 6.0, 14.0, 23.0, 32.0, 47.0, 57.0, 99.0, 126.0, 139.0, 214.0, 294.0, 447.0, 635.0, 961.0, 1454.0, 2228.0, 3488.0, 5456.0, 8998.0, 15452.0, 28021.0, 53898.0, 122910.0, 323168.0, 270496.0, 101860.0, 47224.0, 24509.0, 13869.0, 8089.0, 4999.0, 3096.0, 2011.0, 1334.0, 862.0, 609.0, 445.0, 300.0, 192.0, 129.0, 98.0, 69.0, 61.0, 29.0, 26.0, 26.0, 11.0, 7.0, 14.0, 5.0, 7.0, 3.0, 3.0, 2.0], "bins": [-7.60546875, -7.381103515625, -7.15673828125, -6.932373046875, -6.7080078125, -6.483642578125, -6.25927734375, -6.034912109375, -5.810546875, -5.586181640625, -5.36181640625, -5.137451171875, -4.9130859375, -4.688720703125, -4.46435546875, -4.239990234375, -4.015625, -3.791259765625, -3.56689453125, -3.342529296875, -3.1181640625, -2.893798828125, -2.66943359375, -2.445068359375, -2.220703125, -1.996337890625, -1.77197265625, -1.547607421875, -1.3232421875, -1.098876953125, -0.87451171875, -0.650146484375, -0.42578125, -0.201416015625, 0.02294921875, 0.247314453125, 0.4716796875, 0.696044921875, 0.92041015625, 1.144775390625, 1.369140625, 1.593505859375, 1.81787109375, 2.042236328125, 2.2666015625, 2.490966796875, 2.71533203125, 2.939697265625, 3.1640625, 3.388427734375, 3.61279296875, 3.837158203125, 4.0615234375, 4.285888671875, 4.51025390625, 4.734619140625, 4.958984375, 5.183349609375, 5.40771484375, 5.632080078125, 5.8564453125, 6.080810546875, 6.30517578125, 6.529541015625, 6.75390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 5.0, 7.0, 5.0, 12.0, 13.0, 12.0, 22.0, 20.0, 24.0, 34.0, 47.0, 46.0, 48.0, 57.0, 60.0, 82.0, 62.0, 60.0, 62.0, 64.0, 42.0, 29.0, 27.0, 39.0, 15.0, 19.0, 17.0, 15.0, 11.0, 10.0, 8.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.33984375, -2.274261474609375, -2.20867919921875, -2.143096923828125, -2.0775146484375, -2.011932373046875, -1.94635009765625, -1.880767822265625, -1.815185546875, -1.749603271484375, -1.68402099609375, -1.618438720703125, -1.5528564453125, -1.487274169921875, -1.42169189453125, -1.356109619140625, -1.29052734375, -1.224945068359375, -1.15936279296875, -1.093780517578125, -1.0281982421875, -0.962615966796875, -0.89703369140625, -0.831451416015625, -0.765869140625, -0.700286865234375, -0.63470458984375, -0.569122314453125, -0.5035400390625, -0.437957763671875, -0.37237548828125, -0.306793212890625, -0.2412109375, -0.175628662109375, -0.11004638671875, -0.044464111328125, 0.0211181640625, 0.086700439453125, 0.15228271484375, 0.217864990234375, 0.283447265625, 0.349029541015625, 0.41461181640625, 0.480194091796875, 0.5457763671875, 0.611358642578125, 0.67694091796875, 0.742523193359375, 0.80810546875, 0.873687744140625, 0.93927001953125, 1.004852294921875, 1.0704345703125, 1.136016845703125, 1.20159912109375, 1.267181396484375, 1.332763671875, 1.398345947265625, 1.46392822265625, 1.529510498046875, 1.5950927734375, 1.660675048828125, 1.72625732421875, 1.791839599609375, 1.857421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 10.0, 8.0, 11.0, 12.0, 11.0, 18.0, 22.0, 24.0, 36.0, 52.0, 74.0, 85.0, 104.0, 107.0, 110.0, 76.0, 63.0, 42.0, 39.0, 28.0, 11.0, 8.0, 15.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.31333923339844, -87.32707214355469, -84.3407974243164, -81.35453033447266, -78.36825561523438, -75.38198852539062, -72.39572143554688, -69.40945434570312, -66.42317962646484, -63.43690872192383, -60.45063781738281, -57.46437072753906, -54.47809982299805, -51.49182891845703, -48.50556182861328, -45.519290924072266, -42.53302001953125, -39.546749114990234, -36.56047821044922, -33.57421112060547, -30.587940216064453, -27.601669311523438, -24.615400314331055, -21.629131317138672, -18.642860412597656, -15.656590461730957, -12.670320510864258, -9.684050559997559, -6.697780609130859, -3.71151065826416, -0.7252407073974609, 2.261028289794922, 5.247291564941406, 8.233561515808105, 11.219831466674805, 14.206101417541504, 17.192371368408203, 20.17864227294922, 23.1649112701416, 26.151180267333984, 29.137451171875, 32.123722076416016, 35.10999298095703, 38.09626007080078, 41.0825309753418, 44.06880187988281, 47.05506896972656, 50.04133987426758, 53.027610778808594, 56.01388168334961, 59.000152587890625, 61.986419677734375, 64.97268676757812, 67.9589614868164, 70.94522857666016, 73.93150329589844, 76.91777038574219, 79.90403747558594, 82.89031219482422, 85.87657928466797, 88.86285400390625, 91.84912109375, 94.83538818359375, 97.8216552734375, 100.80792999267578]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 14.0, 9.0, 3.0, 11.0, 13.0, 14.0, 13.0, 21.0, 22.0, 23.0, 34.0, 35.0, 34.0, 30.0, 44.0, 42.0, 43.0, 43.0, 39.0, 39.0, 41.0, 42.0, 46.0, 30.0, 28.0, 42.0, 24.0, 34.0, 22.0, 21.0, 19.0, 17.0, 16.0, 18.0, 11.0, 8.0, 8.0, 8.0, 10.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-61.97907257080078, -60.09901809692383, -58.21896743774414, -56.33891296386719, -54.4588623046875, -52.57880783081055, -50.698753356933594, -48.818702697753906, -46.93865203857422, -45.058597564697266, -43.17854690551758, -41.298492431640625, -39.41844177246094, -37.538387298583984, -35.65833282470703, -33.778282165527344, -31.89822769165039, -30.01817512512207, -28.13812255859375, -26.258068084716797, -24.37801742553711, -22.497962951660156, -20.617910385131836, -18.737857818603516, -16.857805252075195, -14.977752685546875, -13.097700119018555, -11.217646598815918, -9.337594032287598, -7.457541465759277, -5.577487945556641, -3.6974353790283203, -1.8173866271972656, 0.06266617774963379, 1.9427189826965332, 3.8227720260620117, 5.702824592590332, 7.582877159118652, 9.462930679321289, 11.34298324584961, 13.22303581237793, 15.10308837890625, 16.98314094543457, 18.86319351196289, 20.743247985839844, 22.62329864501953, 24.503353118896484, 26.383405685424805, 28.263458251953125, 30.143510818481445, 32.023563385009766, 33.90361785888672, 35.783668518066406, 37.66372299194336, 39.54377746582031, 41.423828125, 43.30387878417969, 45.18393325805664, 47.06398391723633, 48.94403839111328, 50.82408905029297, 52.70414352416992, 54.584197998046875, 56.46424865722656, 58.344303131103516]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 11.0, 7.0, 8.0, 13.0, 17.0, 23.0, 29.0, 35.0, 67.0, 88.0, 115.0, 171.0, 192.0, 332.0, 449.0, 619.0, 839.0, 1197.0, 1637.0, 2352.0, 3245.0, 4653.0, 6610.0, 9804.0, 14832.0, 23296.0, 36802.0, 62077.0, 107403.0, 189793.0, 230199.0, 140221.0, 79113.0, 46716.0, 28566.0, 18159.0, 11967.0, 8089.0, 5464.0, 3868.0, 2590.0, 1944.0, 1401.0, 1018.0, 728.0, 521.0, 373.0, 258.0, 184.0, 134.0, 104.0, 74.0, 51.0, 35.0, 37.0, 18.0, 8.0, 4.0, 7.0, 1.0, 2.0, 2.0], "bins": [-56.125, -54.3837890625, -52.642578125, -50.9013671875, -49.16015625, -47.4189453125, -45.677734375, -43.9365234375, -42.1953125, -40.4541015625, -38.712890625, -36.9716796875, -35.23046875, -33.4892578125, -31.748046875, -30.0068359375, -28.265625, -26.5244140625, -24.783203125, -23.0419921875, -21.30078125, -19.5595703125, -17.818359375, -16.0771484375, -14.3359375, -12.5947265625, -10.853515625, -9.1123046875, -7.37109375, -5.6298828125, -3.888671875, -2.1474609375, -0.40625, 1.3349609375, 3.076171875, 4.8173828125, 6.55859375, 8.2998046875, 10.041015625, 11.7822265625, 13.5234375, 15.2646484375, 17.005859375, 18.7470703125, 20.48828125, 22.2294921875, 23.970703125, 25.7119140625, 27.453125, 29.1943359375, 30.935546875, 32.6767578125, 34.41796875, 36.1591796875, 37.900390625, 39.6416015625, 41.3828125, 43.1240234375, 44.865234375, 46.6064453125, 48.34765625, 50.0888671875, 51.830078125, 53.5712890625, 55.3125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 0.0, 9.0, 14.0, 10.0, 4.0, 8.0, 11.0, 13.0, 17.0, 11.0, 23.0, 22.0, 29.0, 28.0, 30.0, 33.0, 45.0, 45.0, 44.0, 52.0, 39.0, 60.0, 46.0, 46.0, 47.0, 37.0, 31.0, 36.0, 28.0, 20.0, 24.0, 22.0, 18.0, 14.0, 20.0, 13.0, 11.0, 6.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.625, -62.67578125, -60.7265625, -58.77734375, -56.828125, -54.87890625, -52.9296875, -50.98046875, -49.03125, -47.08203125, -45.1328125, -43.18359375, -41.234375, -39.28515625, -37.3359375, -35.38671875, -33.4375, -31.48828125, -29.5390625, -27.58984375, -25.640625, -23.69140625, -21.7421875, -19.79296875, -17.84375, -15.89453125, -13.9453125, -11.99609375, -10.046875, -8.09765625, -6.1484375, -4.19921875, -2.25, -0.30078125, 1.6484375, 3.59765625, 5.546875, 7.49609375, 9.4453125, 11.39453125, 13.34375, 15.29296875, 17.2421875, 19.19140625, 21.140625, 23.08984375, 25.0390625, 26.98828125, 28.9375, 30.88671875, 32.8359375, 34.78515625, 36.734375, 38.68359375, 40.6328125, 42.58203125, 44.53125, 46.48046875, 48.4296875, 50.37890625, 52.328125, 54.27734375, 56.2265625, 58.17578125, 60.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 10.0, 8.0, 21.0, 36.0, 30.0, 70.0, 95.0, 129.0, 188.0, 293.0, 378.0, 613.0, 964.0, 1368.0, 2149.0, 3299.0, 4962.0, 7663.0, 12243.0, 19353.0, 31074.0, 52935.0, 93617.0, 176373.0, 259329.0, 164268.0, 87096.0, 49309.0, 29634.0, 18439.0, 11450.0, 7314.0, 4662.0, 3155.0, 1983.0, 1338.0, 866.0, 581.0, 422.0, 269.0, 184.0, 128.0, 83.0, 51.0, 47.0, 33.0, 12.0, 13.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-73.875, -71.525390625, -69.17578125, -66.826171875, -64.4765625, -62.126953125, -59.77734375, -57.427734375, -55.078125, -52.728515625, -50.37890625, -48.029296875, -45.6796875, -43.330078125, -40.98046875, -38.630859375, -36.28125, -33.931640625, -31.58203125, -29.232421875, -26.8828125, -24.533203125, -22.18359375, -19.833984375, -17.484375, -15.134765625, -12.78515625, -10.435546875, -8.0859375, -5.736328125, -3.38671875, -1.037109375, 1.3125, 3.662109375, 6.01171875, 8.361328125, 10.7109375, 13.060546875, 15.41015625, 17.759765625, 20.109375, 22.458984375, 24.80859375, 27.158203125, 29.5078125, 31.857421875, 34.20703125, 36.556640625, 38.90625, 41.255859375, 43.60546875, 45.955078125, 48.3046875, 50.654296875, 53.00390625, 55.353515625, 57.703125, 60.052734375, 62.40234375, 64.751953125, 67.1015625, 69.451171875, 71.80078125, 74.150390625, 76.5]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 16.0, 20.0, 11.0, 17.0, 20.0, 17.0, 29.0, 16.0, 28.0, 49.0, 36.0, 41.0, 40.0, 39.0, 41.0, 32.0, 33.0, 53.0, 43.0, 42.0, 49.0, 44.0, 28.0, 25.0, 27.0, 36.0, 20.0, 18.0, 18.0, 16.0, 13.0, 17.0, 9.0, 9.0, 4.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -39.47216796875, -38.2568359375, -37.04150390625, -35.826171875, -34.61083984375, -33.3955078125, -32.18017578125, -30.96484375, -29.74951171875, -28.5341796875, -27.31884765625, -26.103515625, -24.88818359375, -23.6728515625, -22.45751953125, -21.2421875, -20.02685546875, -18.8115234375, -17.59619140625, -16.380859375, -15.16552734375, -13.9501953125, -12.73486328125, -11.51953125, -10.30419921875, -9.0888671875, -7.87353515625, -6.658203125, -5.44287109375, -4.2275390625, -3.01220703125, -1.796875, -0.58154296875, 0.6337890625, 1.84912109375, 3.064453125, 4.27978515625, 5.4951171875, 6.71044921875, 7.92578125, 9.14111328125, 10.3564453125, 11.57177734375, 12.787109375, 14.00244140625, 15.2177734375, 16.43310546875, 17.6484375, 18.86376953125, 20.0791015625, 21.29443359375, 22.509765625, 23.72509765625, 24.9404296875, 26.15576171875, 27.37109375, 28.58642578125, 29.8017578125, 31.01708984375, 32.232421875, 33.44775390625, 34.6630859375, 35.87841796875, 37.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 11.0, 13.0, 28.0, 31.0, 50.0, 62.0, 115.0, 169.0, 230.0, 337.0, 494.0, 853.0, 1206.0, 1815.0, 2819.0, 4538.0, 7407.0, 12567.0, 22327.0, 41592.0, 85897.0, 204944.0, 349283.0, 159600.0, 69540.0, 35007.0, 18955.0, 10650.0, 6570.0, 3948.0, 2575.0, 1621.0, 1074.0, 723.0, 486.0, 350.0, 212.0, 142.0, 102.0, 68.0, 42.0, 34.0, 22.0, 10.0, 12.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.109375, -24.308837890625, -23.50830078125, -22.707763671875, -21.9072265625, -21.106689453125, -20.30615234375, -19.505615234375, -18.705078125, -17.904541015625, -17.10400390625, -16.303466796875, -15.5029296875, -14.702392578125, -13.90185546875, -13.101318359375, -12.30078125, -11.500244140625, -10.69970703125, -9.899169921875, -9.0986328125, -8.298095703125, -7.49755859375, -6.697021484375, -5.896484375, -5.095947265625, -4.29541015625, -3.494873046875, -2.6943359375, -1.893798828125, -1.09326171875, -0.292724609375, 0.5078125, 1.308349609375, 2.10888671875, 2.909423828125, 3.7099609375, 4.510498046875, 5.31103515625, 6.111572265625, 6.912109375, 7.712646484375, 8.51318359375, 9.313720703125, 10.1142578125, 10.914794921875, 11.71533203125, 12.515869140625, 13.31640625, 14.116943359375, 14.91748046875, 15.718017578125, 16.5185546875, 17.319091796875, 18.11962890625, 18.920166015625, 19.720703125, 20.521240234375, 21.32177734375, 22.122314453125, 22.9228515625, 23.723388671875, 24.52392578125, 25.324462890625, 26.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 4.0, 6.0, 9.0, 10.0, 14.0, 20.0, 18.0, 19.0, 27.0, 47.0, 56.0, 84.0, 121.0, 127.0, 107.0, 68.0, 60.0, 46.0, 30.0, 18.0, 20.0, 14.0, 11.0, 9.0, 13.0, 4.0, 4.0, 9.0, 4.0, 0.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00307464599609375, -0.0029824376106262207, -0.0028902292251586914, -0.002798020839691162, -0.002705812454223633, -0.0026136040687561035, -0.0025213956832885742, -0.002429187297821045, -0.0023369789123535156, -0.0022447705268859863, -0.002152562141418457, -0.0020603537559509277, -0.0019681453704833984, -0.0018759369850158691, -0.0017837285995483398, -0.0016915202140808105, -0.0015993118286132812, -0.001507103443145752, -0.0014148950576782227, -0.0013226866722106934, -0.001230478286743164, -0.0011382699012756348, -0.0010460615158081055, -0.0009538531303405762, -0.0008616447448730469, -0.0007694363594055176, -0.0006772279739379883, -0.000585019588470459, -0.0004928112030029297, -0.0004006028175354004, -0.0003083944320678711, -0.0002161860466003418, -0.0001239776611328125, -3.17692756652832e-05, 6.0439109802246094e-05, 0.0001526474952697754, 0.0002448558807373047, 0.000337064266204834, 0.0004292726516723633, 0.0005214810371398926, 0.0006136894226074219, 0.0007058978080749512, 0.0007981061935424805, 0.0008903145790100098, 0.000982522964477539, 0.0010747313499450684, 0.0011669397354125977, 0.001259148120880127, 0.0013513565063476562, 0.0014435648918151855, 0.0015357732772827148, 0.0016279816627502441, 0.0017201900482177734, 0.0018123984336853027, 0.001904606819152832, 0.0019968152046203613, 0.0020890235900878906, 0.00218123197555542, 0.0022734403610229492, 0.0023656487464904785, 0.002457857131958008, 0.002550065517425537, 0.0026422739028930664, 0.0027344822883605957, 0.002826690673828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 14.0, 14.0, 24.0, 35.0, 29.0, 55.0, 75.0, 110.0, 156.0, 261.0, 346.0, 460.0, 736.0, 1108.0, 1740.0, 2711.0, 4487.0, 7552.0, 13167.0, 23971.0, 47476.0, 102829.0, 249473.0, 321777.0, 138656.0, 61541.0, 30030.0, 15892.0, 9004.0, 5419.0, 3294.0, 2072.0, 1373.0, 824.0, 566.0, 361.0, 276.0, 158.0, 149.0, 85.0, 75.0, 36.0, 40.0, 35.0, 25.0, 12.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.421875, -23.662841796875, -22.90380859375, -22.144775390625, -21.3857421875, -20.626708984375, -19.86767578125, -19.108642578125, -18.349609375, -17.590576171875, -16.83154296875, -16.072509765625, -15.3134765625, -14.554443359375, -13.79541015625, -13.036376953125, -12.27734375, -11.518310546875, -10.75927734375, -10.000244140625, -9.2412109375, -8.482177734375, -7.72314453125, -6.964111328125, -6.205078125, -5.446044921875, -4.68701171875, -3.927978515625, -3.1689453125, -2.409912109375, -1.65087890625, -0.891845703125, -0.1328125, 0.626220703125, 1.38525390625, 2.144287109375, 2.9033203125, 3.662353515625, 4.42138671875, 5.180419921875, 5.939453125, 6.698486328125, 7.45751953125, 8.216552734375, 8.9755859375, 9.734619140625, 10.49365234375, 11.252685546875, 12.01171875, 12.770751953125, 13.52978515625, 14.288818359375, 15.0478515625, 15.806884765625, 16.56591796875, 17.324951171875, 18.083984375, 18.843017578125, 19.60205078125, 20.361083984375, 21.1201171875, 21.879150390625, 22.63818359375, 23.397216796875, 24.15625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 9.0, 10.0, 8.0, 20.0, 20.0, 15.0, 28.0, 40.0, 41.0, 40.0, 46.0, 61.0, 62.0, 58.0, 64.0, 71.0, 59.0, 48.0, 46.0, 42.0, 33.0, 24.0, 37.0, 25.0, 18.0, 11.0, 9.0, 10.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.9169921875, -7.685546875, -7.4541015625, -7.22265625, -6.9912109375, -6.759765625, -6.5283203125, -6.296875, -6.0654296875, -5.833984375, -5.6025390625, -5.37109375, -5.1396484375, -4.908203125, -4.6767578125, -4.4453125, -4.2138671875, -3.982421875, -3.7509765625, -3.51953125, -3.2880859375, -3.056640625, -2.8251953125, -2.59375, -2.3623046875, -2.130859375, -1.8994140625, -1.66796875, -1.4365234375, -1.205078125, -0.9736328125, -0.7421875, -0.5107421875, -0.279296875, -0.0478515625, 0.18359375, 0.4150390625, 0.646484375, 0.8779296875, 1.109375, 1.3408203125, 1.572265625, 1.8037109375, 2.03515625, 2.2666015625, 2.498046875, 2.7294921875, 2.9609375, 3.1923828125, 3.423828125, 3.6552734375, 3.88671875, 4.1181640625, 4.349609375, 4.5810546875, 4.8125, 5.0439453125, 5.275390625, 5.5068359375, 5.73828125, 5.9697265625, 6.201171875, 6.4326171875, 6.6640625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 7.0, 11.0, 14.0, 13.0, 14.0, 21.0, 38.0, 39.0, 48.0, 62.0, 94.0, 112.0, 109.0, 101.0, 77.0, 56.0, 47.0, 29.0, 23.0, 17.0, 17.0, 11.0, 8.0, 5.0, 11.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.94277954101562, -82.0176773071289, -79.09258270263672, -76.16748046875, -73.24238586425781, -70.3172836303711, -67.39218139648438, -64.46708679199219, -61.541988372802734, -58.61688995361328, -55.69179153442383, -52.766693115234375, -49.841590881347656, -46.91649627685547, -43.99139404296875, -41.0662956237793, -38.141197204589844, -35.21609878540039, -32.29100036621094, -29.36590003967285, -26.4408016204834, -23.515703201293945, -20.59060287475586, -17.665504455566406, -14.740406036376953, -11.8153076171875, -8.89020824432373, -5.965108871459961, -3.040010452270508, -0.11491203308105469, 2.8101882934570312, 5.735286712646484, 8.660385131835938, 11.58548355102539, 14.51058292388916, 17.43568229675293, 20.360780715942383, 23.285879135131836, 26.210979461669922, 29.136077880859375, 32.06117630004883, 34.98627471923828, 37.911373138427734, 40.83647155761719, 43.761573791503906, 46.686668395996094, 49.61177062988281, 52.536869049072266, 55.46196746826172, 58.38706588745117, 61.312164306640625, 64.23726654052734, 67.16236114501953, 70.08746337890625, 73.01255798339844, 75.93766021728516, 78.86276245117188, 81.7878646850586, 84.71295928955078, 87.6380615234375, 90.56315612792969, 93.4882583618164, 96.41336059570312, 99.33845520019531, 102.2635498046875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 9.0, 4.0, 9.0, 4.0, 9.0, 11.0, 18.0, 22.0, 13.0, 21.0, 20.0, 30.0, 41.0, 40.0, 36.0, 43.0, 34.0, 39.0, 46.0, 35.0, 26.0, 42.0, 31.0, 41.0, 37.0, 32.0, 29.0, 39.0, 27.0, 23.0, 24.0, 22.0, 23.0, 13.0, 24.0, 12.0, 13.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-62.063899993896484, -60.25804138183594, -58.452186584472656, -56.646331787109375, -54.84047317504883, -53.03461456298828, -51.228759765625, -49.42290496826172, -47.61704635620117, -45.811187744140625, -44.005332946777344, -42.19947814941406, -40.393619537353516, -38.58776092529297, -36.78190612792969, -34.976051330566406, -33.17019271850586, -31.364336013793945, -29.55847930908203, -27.752622604370117, -25.946765899658203, -24.14090919494629, -22.335052490234375, -20.52919578552246, -18.723339080810547, -16.917482376098633, -15.111625671386719, -13.305768966674805, -11.49991226196289, -9.694055557250977, -7.8881988525390625, -6.082342147827148, -4.276485443115234, -2.4706287384033203, -0.6647720336914062, 1.1410846710205078, 2.946941375732422, 4.752798080444336, 6.55865478515625, 8.364511489868164, 10.170368194580078, 11.976224899291992, 13.782081604003906, 15.58793830871582, 17.393795013427734, 19.19965171813965, 21.005508422851562, 22.811365127563477, 24.61722183227539, 26.423078536987305, 28.22893524169922, 30.034791946411133, 31.840648651123047, 33.646507263183594, 35.452362060546875, 37.258216857910156, 39.0640754699707, 40.86993408203125, 42.67578887939453, 44.48164367675781, 46.28750228881836, 48.093360900878906, 49.89921569824219, 51.70507049560547, 53.510929107666016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 21.0, 12.0, 18.0, 21.0, 40.0, 50.0, 84.0, 84.0, 136.0, 185.0, 268.0, 399.0, 595.0, 862.0, 1369.0, 2142.0, 3378.0, 5803.0, 10013.0, 20067.0, 56019.0, 285590.0, 1523091.0, 1841127.0, 328792.0, 66079.0, 21586.0, 10408.0, 5894.0, 3518.0, 2325.0, 1398.0, 951.0, 618.0, 392.0, 290.0, 206.0, 119.0, 73.0, 68.0, 45.0, 40.0, 34.0, 15.0, 5.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 1.0], "bins": [-120.875, -117.4267578125, -113.978515625, -110.5302734375, -107.08203125, -103.6337890625, -100.185546875, -96.7373046875, -93.2890625, -89.8408203125, -86.392578125, -82.9443359375, -79.49609375, -76.0478515625, -72.599609375, -69.1513671875, -65.703125, -62.2548828125, -58.806640625, -55.3583984375, -51.91015625, -48.4619140625, -45.013671875, -41.5654296875, -38.1171875, -34.6689453125, -31.220703125, -27.7724609375, -24.32421875, -20.8759765625, -17.427734375, -13.9794921875, -10.53125, -7.0830078125, -3.634765625, -0.1865234375, 3.26171875, 6.7099609375, 10.158203125, 13.6064453125, 17.0546875, 20.5029296875, 23.951171875, 27.3994140625, 30.84765625, 34.2958984375, 37.744140625, 41.1923828125, 44.640625, 48.0888671875, 51.537109375, 54.9853515625, 58.43359375, 61.8818359375, 65.330078125, 68.7783203125, 72.2265625, 75.6748046875, 79.123046875, 82.5712890625, 86.01953125, 89.4677734375, 92.916015625, 96.3642578125, 99.8125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 6.0, 7.0, 5.0, 7.0, 14.0, 15.0, 10.0, 23.0, 16.0, 18.0, 19.0, 30.0, 39.0, 29.0, 42.0, 56.0, 40.0, 46.0, 47.0, 32.0, 40.0, 36.0, 42.0, 44.0, 31.0, 35.0, 38.0, 28.0, 31.0, 28.0, 13.0, 17.0, 17.0, 20.0, 9.0, 17.0, 5.0, 12.0, 13.0, 6.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-57.3125, -55.6328125, -53.953125, -52.2734375, -50.59375, -48.9140625, -47.234375, -45.5546875, -43.875, -42.1953125, -40.515625, -38.8359375, -37.15625, -35.4765625, -33.796875, -32.1171875, -30.4375, -28.7578125, -27.078125, -25.3984375, -23.71875, -22.0390625, -20.359375, -18.6796875, -17.0, -15.3203125, -13.640625, -11.9609375, -10.28125, -8.6015625, -6.921875, -5.2421875, -3.5625, -1.8828125, -0.203125, 1.4765625, 3.15625, 4.8359375, 6.515625, 8.1953125, 9.875, 11.5546875, 13.234375, 14.9140625, 16.59375, 18.2734375, 19.953125, 21.6328125, 23.3125, 24.9921875, 26.671875, 28.3515625, 30.03125, 31.7109375, 33.390625, 35.0703125, 36.75, 38.4296875, 40.109375, 41.7890625, 43.46875, 45.1484375, 46.828125, 48.5078125, 50.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 9.0, 17.0, 34.0, 36.0, 48.0, 51.0, 93.0, 108.0, 205.0, 275.0, 430.0, 596.0, 1048.0, 1497.0, 2428.0, 3990.0, 6548.0, 11268.0, 20502.0, 40339.0, 93729.0, 315349.0, 2183670.0, 1163809.0, 203724.0, 70404.0, 32446.0, 17036.0, 9339.0, 5665.0, 3438.0, 2184.0, 1436.0, 849.0, 542.0, 358.0, 235.0, 159.0, 114.0, 82.0, 49.0, 42.0, 16.0, 25.0, 16.0, 14.0, 8.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-123.8125, -120.04296875, -116.2734375, -112.50390625, -108.734375, -104.96484375, -101.1953125, -97.42578125, -93.65625, -89.88671875, -86.1171875, -82.34765625, -78.578125, -74.80859375, -71.0390625, -67.26953125, -63.5, -59.73046875, -55.9609375, -52.19140625, -48.421875, -44.65234375, -40.8828125, -37.11328125, -33.34375, -29.57421875, -25.8046875, -22.03515625, -18.265625, -14.49609375, -10.7265625, -6.95703125, -3.1875, 0.58203125, 4.3515625, 8.12109375, 11.890625, 15.66015625, 19.4296875, 23.19921875, 26.96875, 30.73828125, 34.5078125, 38.27734375, 42.046875, 45.81640625, 49.5859375, 53.35546875, 57.125, 60.89453125, 64.6640625, 68.43359375, 72.203125, 75.97265625, 79.7421875, 83.51171875, 87.28125, 91.05078125, 94.8203125, 98.58984375, 102.359375, 106.12890625, 109.8984375, 113.66796875, 117.4375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 10.0, 14.0, 13.0, 12.0, 18.0, 24.0, 17.0, 28.0, 45.0, 69.0, 87.0, 96.0, 163.0, 294.0, 423.0, 656.0, 717.0, 471.0, 298.0, 187.0, 100.0, 73.0, 58.0, 54.0, 26.0, 37.0, 16.0, 11.0, 17.0, 10.0, 6.0, 9.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.125, -37.97802734375, -36.8310546875, -35.68408203125, -34.537109375, -33.39013671875, -32.2431640625, -31.09619140625, -29.94921875, -28.80224609375, -27.6552734375, -26.50830078125, -25.361328125, -24.21435546875, -23.0673828125, -21.92041015625, -20.7734375, -19.62646484375, -18.4794921875, -17.33251953125, -16.185546875, -15.03857421875, -13.8916015625, -12.74462890625, -11.59765625, -10.45068359375, -9.3037109375, -8.15673828125, -7.009765625, -5.86279296875, -4.7158203125, -3.56884765625, -2.421875, -1.27490234375, -0.1279296875, 1.01904296875, 2.166015625, 3.31298828125, 4.4599609375, 5.60693359375, 6.75390625, 7.90087890625, 9.0478515625, 10.19482421875, 11.341796875, 12.48876953125, 13.6357421875, 14.78271484375, 15.9296875, 17.07666015625, 18.2236328125, 19.37060546875, 20.517578125, 21.66455078125, 22.8115234375, 23.95849609375, 25.10546875, 26.25244140625, 27.3994140625, 28.54638671875, 29.693359375, 30.84033203125, 31.9873046875, 33.13427734375, 34.28125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 4.0, 8.0, 14.0, 23.0, 22.0, 32.0, 31.0, 51.0, 70.0, 82.0, 112.0, 96.0, 100.0, 74.0, 61.0, 37.0, 41.0, 28.0, 21.0, 12.0, 14.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.39539337158203, -62.81571960449219, -60.236045837402344, -57.656368255615234, -55.07669448852539, -52.49702072143555, -49.91734313964844, -47.337669372558594, -44.75799560546875, -42.178321838378906, -39.59864807128906, -37.01897048950195, -34.43929672241211, -31.859622955322266, -29.27994728088379, -26.700271606445312, -24.12059783935547, -21.540924072265625, -18.96124839782715, -16.381572723388672, -13.801898956298828, -11.222224235534668, -8.642549514770508, -6.062873840332031, -3.4832000732421875, -0.9035253524780273, 1.6761493682861328, 4.255824089050293, 6.835498809814453, 9.415173530578613, 11.994848251342773, 14.57452392578125, 17.154205322265625, 19.73387908935547, 22.313554763793945, 24.893230438232422, 27.472904205322266, 30.05257797241211, 32.63225555419922, 35.21192932128906, 37.791603088378906, 40.37127685546875, 42.950950622558594, 45.5306282043457, 48.11030197143555, 50.68997573852539, 53.2696533203125, 55.849327087402344, 58.42900085449219, 61.00867462158203, 63.588348388671875, 66.16802215576172, 68.74769592285156, 71.32737731933594, 73.90705108642578, 76.48672485351562, 79.06639862060547, 81.64607238769531, 84.22574615478516, 86.805419921875, 89.38510131835938, 91.96477508544922, 94.54444885253906, 97.1241226196289, 99.70379638671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 11.0, 14.0, 17.0, 14.0, 16.0, 14.0, 21.0, 30.0, 41.0, 37.0, 40.0, 44.0, 43.0, 37.0, 52.0, 37.0, 41.0, 36.0, 42.0, 52.0, 36.0, 37.0, 27.0, 26.0, 29.0, 20.0, 23.0, 17.0, 20.0, 17.0, 21.0, 15.0, 8.0, 8.0, 9.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.66313934326172, -53.819252014160156, -51.97536087036133, -50.131473541259766, -48.28758239746094, -46.443695068359375, -44.59980773925781, -42.755916595458984, -40.91202926635742, -39.06814193725586, -37.22425079345703, -35.38036346435547, -33.53647232055664, -31.692584991455078, -29.848695755004883, -28.004806518554688, -26.160917282104492, -24.317028045654297, -22.4731388092041, -20.629249572753906, -18.785362243652344, -16.94147300720215, -15.097583770751953, -13.253695487976074, -11.409806251525879, -9.565917015075684, -7.722028732299805, -5.878139495849609, -4.034250736236572, -2.190361976623535, -0.34647274017333984, 1.497415542602539, 3.3413047790527344, 5.1851935386657715, 7.029082298278809, 8.872971534729004, 10.716859817504883, 12.560749053955078, 14.404638290405273, 16.24852752685547, 18.09241485595703, 19.936304092407227, 21.780193328857422, 23.624080657958984, 25.46796989440918, 27.311859130859375, 29.15574836730957, 30.999637603759766, 32.843528747558594, 34.687416076660156, 36.531307220458984, 38.37519454956055, 40.219085693359375, 42.06297302246094, 43.9068603515625, 45.75075149536133, 47.59463882446289, 49.43852615356445, 51.28241729736328, 53.126304626464844, 54.97019577026367, 56.814083099365234, 58.65797424316406, 60.501861572265625, 62.34574890136719]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 10.0, 15.0, 18.0, 28.0, 29.0, 50.0, 69.0, 93.0, 149.0, 191.0, 268.0, 387.0, 624.0, 931.0, 1403.0, 2199.0, 3430.0, 5581.0, 9211.0, 15981.0, 27662.0, 51669.0, 105641.0, 226523.0, 287755.0, 150110.0, 70745.0, 36370.0, 20332.0, 11906.0, 7000.0, 4414.0, 2655.0, 1765.0, 1104.0, 722.0, 481.0, 320.0, 204.0, 159.0, 97.0, 74.0, 54.0, 41.0, 27.0, 13.0, 18.0, 7.0, 12.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.5, -39.16015625, -37.8203125, -36.48046875, -35.140625, -33.80078125, -32.4609375, -31.12109375, -29.78125, -28.44140625, -27.1015625, -25.76171875, -24.421875, -23.08203125, -21.7421875, -20.40234375, -19.0625, -17.72265625, -16.3828125, -15.04296875, -13.703125, -12.36328125, -11.0234375, -9.68359375, -8.34375, -7.00390625, -5.6640625, -4.32421875, -2.984375, -1.64453125, -0.3046875, 1.03515625, 2.375, 3.71484375, 5.0546875, 6.39453125, 7.734375, 9.07421875, 10.4140625, 11.75390625, 13.09375, 14.43359375, 15.7734375, 17.11328125, 18.453125, 19.79296875, 21.1328125, 22.47265625, 23.8125, 25.15234375, 26.4921875, 27.83203125, 29.171875, 30.51171875, 31.8515625, 33.19140625, 34.53125, 35.87109375, 37.2109375, 38.55078125, 39.890625, 41.23046875, 42.5703125, 43.91015625, 45.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 0.0, 4.0, 4.0, 6.0, 3.0, 3.0, 5.0, 13.0, 15.0, 10.0, 10.0, 11.0, 17.0, 24.0, 27.0, 39.0, 37.0, 37.0, 42.0, 38.0, 58.0, 35.0, 43.0, 45.0, 50.0, 56.0, 52.0, 42.0, 37.0, 34.0, 23.0, 21.0, 20.0, 18.0, 21.0, 17.0, 17.0, 15.0, 11.0, 12.0, 3.0, 6.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.21875, -55.3896484375, -53.560546875, -51.7314453125, -49.90234375, -48.0732421875, -46.244140625, -44.4150390625, -42.5859375, -40.7568359375, -38.927734375, -37.0986328125, -35.26953125, -33.4404296875, -31.611328125, -29.7822265625, -27.953125, -26.1240234375, -24.294921875, -22.4658203125, -20.63671875, -18.8076171875, -16.978515625, -15.1494140625, -13.3203125, -11.4912109375, -9.662109375, -7.8330078125, -6.00390625, -4.1748046875, -2.345703125, -0.5166015625, 1.3125, 3.1416015625, 4.970703125, 6.7998046875, 8.62890625, 10.4580078125, 12.287109375, 14.1162109375, 15.9453125, 17.7744140625, 19.603515625, 21.4326171875, 23.26171875, 25.0908203125, 26.919921875, 28.7490234375, 30.578125, 32.4072265625, 34.236328125, 36.0654296875, 37.89453125, 39.7236328125, 41.552734375, 43.3818359375, 45.2109375, 47.0400390625, 48.869140625, 50.6982421875, 52.52734375, 54.3564453125, 56.185546875, 58.0146484375, 59.84375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 8.0, 20.0, 26.0, 20.0, 37.0, 52.0, 62.0, 90.0, 121.0, 194.0, 287.0, 409.0, 585.0, 888.0, 1365.0, 2045.0, 3108.0, 5291.0, 9013.0, 17725.0, 57607.0, 772324.0, 125551.0, 23524.0, 10947.0, 6253.0, 3898.0, 2355.0, 1559.0, 962.0, 674.0, 442.0, 317.0, 216.0, 159.0, 122.0, 81.0, 57.0, 39.0, 27.0, 18.0, 16.0, 17.0, 9.0, 9.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0], "bins": [-80.9375, -78.6025390625, -76.267578125, -73.9326171875, -71.59765625, -69.2626953125, -66.927734375, -64.5927734375, -62.2578125, -59.9228515625, -57.587890625, -55.2529296875, -52.91796875, -50.5830078125, -48.248046875, -45.9130859375, -43.578125, -41.2431640625, -38.908203125, -36.5732421875, -34.23828125, -31.9033203125, -29.568359375, -27.2333984375, -24.8984375, -22.5634765625, -20.228515625, -17.8935546875, -15.55859375, -13.2236328125, -10.888671875, -8.5537109375, -6.21875, -3.8837890625, -1.548828125, 0.7861328125, 3.12109375, 5.4560546875, 7.791015625, 10.1259765625, 12.4609375, 14.7958984375, 17.130859375, 19.4658203125, 21.80078125, 24.1357421875, 26.470703125, 28.8056640625, 31.140625, 33.4755859375, 35.810546875, 38.1455078125, 40.48046875, 42.8154296875, 45.150390625, 47.4853515625, 49.8203125, 52.1552734375, 54.490234375, 56.8251953125, 59.16015625, 61.4951171875, 63.830078125, 66.1650390625, 68.5]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 9.0, 3.0, 11.0, 7.0, 7.0, 11.0, 14.0, 14.0, 25.0, 18.0, 21.0, 34.0, 37.0, 49.0, 32.0, 39.0, 51.0, 35.0, 42.0, 45.0, 58.0, 35.0, 23.0, 39.0, 39.0, 39.0, 31.0, 39.0, 25.0, 26.0, 27.0, 18.0, 23.0, 11.0, 16.0, 16.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.46875, -49.71044921875, -47.9521484375, -46.19384765625, -44.435546875, -42.67724609375, -40.9189453125, -39.16064453125, -37.40234375, -35.64404296875, -33.8857421875, -32.12744140625, -30.369140625, -28.61083984375, -26.8525390625, -25.09423828125, -23.3359375, -21.57763671875, -19.8193359375, -18.06103515625, -16.302734375, -14.54443359375, -12.7861328125, -11.02783203125, -9.26953125, -7.51123046875, -5.7529296875, -3.99462890625, -2.236328125, -0.47802734375, 1.2802734375, 3.03857421875, 4.796875, 6.55517578125, 8.3134765625, 10.07177734375, 11.830078125, 13.58837890625, 15.3466796875, 17.10498046875, 18.86328125, 20.62158203125, 22.3798828125, 24.13818359375, 25.896484375, 27.65478515625, 29.4130859375, 31.17138671875, 32.9296875, 34.68798828125, 36.4462890625, 38.20458984375, 39.962890625, 41.72119140625, 43.4794921875, 45.23779296875, 46.99609375, 48.75439453125, 50.5126953125, 52.27099609375, 54.029296875, 55.78759765625, 57.5458984375, 59.30419921875, 61.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 7.0, 8.0, 13.0, 14.0, 22.0, 35.0, 40.0, 65.0, 83.0, 122.0, 161.0, 224.0, 358.0, 544.0, 891.0, 1513.0, 2936.0, 6597.0, 18550.0, 106298.0, 834851.0, 51279.0, 12980.0, 5021.0, 2317.0, 1290.0, 790.0, 489.0, 314.0, 203.0, 147.0, 106.0, 68.0, 44.0, 47.0, 28.0, 22.0, 15.0, 15.0, 10.0, 10.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -5.988037109375, -5.76904296875, -5.550048828125, -5.3310546875, -5.112060546875, -4.89306640625, -4.674072265625, -4.455078125, -4.236083984375, -4.01708984375, -3.798095703125, -3.5791015625, -3.360107421875, -3.14111328125, -2.922119140625, -2.703125, -2.484130859375, -2.26513671875, -2.046142578125, -1.8271484375, -1.608154296875, -1.38916015625, -1.170166015625, -0.951171875, -0.732177734375, -0.51318359375, -0.294189453125, -0.0751953125, 0.143798828125, 0.36279296875, 0.581787109375, 0.80078125, 1.019775390625, 1.23876953125, 1.457763671875, 1.6767578125, 1.895751953125, 2.11474609375, 2.333740234375, 2.552734375, 2.771728515625, 2.99072265625, 3.209716796875, 3.4287109375, 3.647705078125, 3.86669921875, 4.085693359375, 4.3046875, 4.523681640625, 4.74267578125, 4.961669921875, 5.1806640625, 5.399658203125, 5.61865234375, 5.837646484375, 6.056640625, 6.275634765625, 6.49462890625, 6.713623046875, 6.9326171875, 7.151611328125, 7.37060546875, 7.589599609375, 7.80859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 8.0, 4.0, 8.0, 12.0, 12.0, 14.0, 29.0, 35.0, 48.0, 68.0, 82.0, 99.0, 135.0, 112.0, 79.0, 52.0, 45.0, 30.0, 28.0, 12.0, 22.0, 14.0, 8.0, 8.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0030670166015625, -0.0029805004596710205, -0.002893984317779541, -0.0028074681758880615, -0.002720952033996582, -0.0026344358921051025, -0.002547919750213623, -0.0024614036083221436, -0.002374887466430664, -0.0022883713245391846, -0.002201855182647705, -0.0021153390407562256, -0.002028822898864746, -0.0019423067569732666, -0.0018557906150817871, -0.0017692744731903076, -0.0016827583312988281, -0.0015962421894073486, -0.0015097260475158691, -0.0014232099056243896, -0.0013366937637329102, -0.0012501776218414307, -0.0011636614799499512, -0.0010771453380584717, -0.0009906291961669922, -0.0009041130542755127, -0.0008175969123840332, -0.0007310807704925537, -0.0006445646286010742, -0.0005580484867095947, -0.00047153234481811523, -0.00038501620292663574, -0.00029850006103515625, -0.00021198391914367676, -0.00012546777725219727, -3.8951635360717773e-05, 4.756450653076172e-05, 0.0001340806484222412, 0.0002205967903137207, 0.0003071129322052002, 0.0003936290740966797, 0.0004801452159881592, 0.0005666613578796387, 0.0006531774997711182, 0.0007396936416625977, 0.0008262097835540771, 0.0009127259254455566, 0.0009992420673370361, 0.0010857582092285156, 0.0011722743511199951, 0.0012587904930114746, 0.001345306634902954, 0.0014318227767944336, 0.001518338918685913, 0.0016048550605773926, 0.001691371202468872, 0.0017778873443603516, 0.001864403486251831, 0.0019509196281433105, 0.00203743577003479, 0.0021239519119262695, 0.002210468053817749, 0.0022969841957092285, 0.002383500337600708, 0.0024700164794921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 13.0, 22.0, 32.0, 38.0, 56.0, 85.0, 120.0, 175.0, 231.0, 337.0, 538.0, 709.0, 1204.0, 1912.0, 3128.0, 5291.0, 9407.0, 18284.0, 37906.0, 92937.0, 284961.0, 368469.0, 125288.0, 47848.0, 22115.0, 11466.0, 6249.0, 3480.0, 2174.0, 1318.0, 882.0, 548.0, 377.0, 296.0, 196.0, 123.0, 96.0, 60.0, 47.0, 34.0, 28.0, 19.0, 14.0, 6.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-3.146484375, -3.05694580078125, -2.9674072265625, -2.87786865234375, -2.788330078125, -2.69879150390625, -2.6092529296875, -2.51971435546875, -2.43017578125, -2.34063720703125, -2.2510986328125, -2.16156005859375, -2.072021484375, -1.98248291015625, -1.8929443359375, -1.80340576171875, -1.7138671875, -1.62432861328125, -1.5347900390625, -1.44525146484375, -1.355712890625, -1.26617431640625, -1.1766357421875, -1.08709716796875, -0.99755859375, -0.90802001953125, -0.8184814453125, -0.72894287109375, -0.639404296875, -0.54986572265625, -0.4603271484375, -0.37078857421875, -0.28125, -0.19171142578125, -0.1021728515625, -0.01263427734375, 0.076904296875, 0.16644287109375, 0.2559814453125, 0.34552001953125, 0.43505859375, 0.52459716796875, 0.6141357421875, 0.70367431640625, 0.793212890625, 0.88275146484375, 0.9722900390625, 1.06182861328125, 1.1513671875, 1.24090576171875, 1.3304443359375, 1.41998291015625, 1.509521484375, 1.59906005859375, 1.6885986328125, 1.77813720703125, 1.86767578125, 1.95721435546875, 2.0467529296875, 2.13629150390625, 2.225830078125, 2.31536865234375, 2.4049072265625, 2.49444580078125, 2.583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 9.0, 15.0, 17.0, 18.0, 12.0, 28.0, 33.0, 30.0, 60.0, 69.0, 101.0, 90.0, 85.0, 79.0, 81.0, 49.0, 40.0, 35.0, 22.0, 14.0, 13.0, 18.0, 22.0, 11.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8797149658203125, -0.852203369140625, -0.8246917724609375, -0.79718017578125, -0.7696685791015625, -0.742156982421875, -0.7146453857421875, -0.6871337890625, -0.6596221923828125, -0.632110595703125, -0.6045989990234375, -0.57708740234375, -0.5495758056640625, -0.522064208984375, -0.4945526123046875, -0.467041015625, -0.4395294189453125, -0.412017822265625, -0.3845062255859375, -0.35699462890625, -0.3294830322265625, -0.301971435546875, -0.2744598388671875, -0.2469482421875, -0.2194366455078125, -0.191925048828125, -0.1644134521484375, -0.13690185546875, -0.1093902587890625, -0.081878662109375, -0.0543670654296875, -0.02685546875, 0.0006561279296875, 0.028167724609375, 0.0556793212890625, 0.08319091796875, 0.1107025146484375, 0.138214111328125, 0.1657257080078125, 0.1932373046875, 0.2207489013671875, 0.248260498046875, 0.2757720947265625, 0.30328369140625, 0.3307952880859375, 0.358306884765625, 0.3858184814453125, 0.413330078125, 0.4408416748046875, 0.468353271484375, 0.4958648681640625, 0.52337646484375, 0.5508880615234375, 0.578399658203125, 0.6059112548828125, 0.6334228515625, 0.6609344482421875, 0.688446044921875, 0.7159576416015625, 0.74346923828125, 0.7709808349609375, 0.798492431640625, 0.8260040283203125, 0.853515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 4.0, 14.0, 14.0, 24.0, 20.0, 36.0, 34.0, 55.0, 78.0, 97.0, 98.0, 113.0, 105.0, 68.0, 55.0, 37.0, 37.0, 19.0, 19.0, 15.0, 14.0, 6.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0177001953125, -71.4654769897461, -68.91324615478516, -66.36102294921875, -63.80879592895508, -61.256568908691406, -58.704341888427734, -56.15211486816406, -53.599891662597656, -51.047664642333984, -48.49543762207031, -45.943214416503906, -43.390987396240234, -40.83876037597656, -38.28653335571289, -35.73430633544922, -33.18207931518555, -30.629852294921875, -28.077627182006836, -25.525400161743164, -22.973175048828125, -20.420948028564453, -17.86872100830078, -15.316495895385742, -12.76426887512207, -10.212042808532715, -7.659816265106201, -5.1075897216796875, -2.555363655090332, -0.0031375885009765625, 2.5490894317626953, 5.101314544677734, 7.653541564941406, 10.205767631530762, 12.757993698120117, 15.310220718383789, 17.862445831298828, 20.4146728515625, 22.966899871826172, 25.51912498474121, 28.071352005004883, 30.623579025268555, 33.175804138183594, 35.728031158447266, 38.28025817871094, 40.832481384277344, 43.38471221923828, 45.93693542480469, 48.48916244506836, 51.04138946533203, 53.5936164855957, 56.145843505859375, 58.69806671142578, 61.25029373168945, 63.802520751953125, 66.35474395751953, 68.90697479248047, 71.45919799804688, 74.01142883300781, 76.56365203857422, 79.11588287353516, 81.66810607910156, 84.2203369140625, 86.7725601196289, 89.32478332519531]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 2.0, 6.0, 5.0, 5.0, 7.0, 11.0, 14.0, 19.0, 15.0, 17.0, 14.0, 18.0, 33.0, 42.0, 37.0, 45.0, 33.0, 51.0, 39.0, 46.0, 42.0, 36.0, 39.0, 52.0, 43.0, 37.0, 33.0, 28.0, 27.0, 24.0, 22.0, 23.0, 22.0, 17.0, 16.0, 21.0, 15.0, 6.0, 8.0, 5.0, 11.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.7095947265625, -49.992801666259766, -48.27600860595703, -46.5592155456543, -44.84242248535156, -43.12562942504883, -41.408836364746094, -39.69204330444336, -37.975250244140625, -36.25845718383789, -34.541664123535156, -32.82487106323242, -31.108078002929688, -29.391284942626953, -27.67449188232422, -25.957698822021484, -24.24090576171875, -22.524112701416016, -20.80731964111328, -19.090526580810547, -17.373733520507812, -15.656940460205078, -13.940147399902344, -12.22335433959961, -10.506561279296875, -8.78976821899414, -7.072975158691406, -5.356182098388672, -3.6393890380859375, -1.9225959777832031, -0.20580291748046875, 1.5109901428222656, 3.2277870178222656, 4.944580078125, 6.661373138427734, 8.378166198730469, 10.094959259033203, 11.811752319335938, 13.528545379638672, 15.245338439941406, 16.96213150024414, 18.678924560546875, 20.39571762084961, 22.112510681152344, 23.829303741455078, 25.546096801757812, 27.262889862060547, 28.97968292236328, 30.696475982666016, 32.41326904296875, 34.130062103271484, 35.84685516357422, 37.56364822387695, 39.28044128417969, 40.99723434448242, 42.714027404785156, 44.43082046508789, 46.147613525390625, 47.86440658569336, 49.581199645996094, 51.29799270629883, 53.01478576660156, 54.7315788269043, 56.44837188720703, 58.165164947509766]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 7.0, 14.0, 24.0, 41.0, 40.0, 72.0, 110.0, 146.0, 197.0, 302.0, 519.0, 841.0, 1245.0, 2151.0, 3449.0, 6096.0, 10942.0, 20134.0, 40966.0, 90703.0, 230498.0, 350087.0, 156873.0, 65342.0, 30976.0, 15804.0, 8525.0, 4897.0, 2757.0, 1731.0, 1065.0, 630.0, 435.0, 307.0, 190.0, 122.0, 86.0, 69.0, 39.0, 30.0, 27.0, 12.0, 18.0, 7.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-89.875, -87.2548828125, -84.634765625, -82.0146484375, -79.39453125, -76.7744140625, -74.154296875, -71.5341796875, -68.9140625, -66.2939453125, -63.673828125, -61.0537109375, -58.43359375, -55.8134765625, -53.193359375, -50.5732421875, -47.953125, -45.3330078125, -42.712890625, -40.0927734375, -37.47265625, -34.8525390625, -32.232421875, -29.6123046875, -26.9921875, -24.3720703125, -21.751953125, -19.1318359375, -16.51171875, -13.8916015625, -11.271484375, -8.6513671875, -6.03125, -3.4111328125, -0.791015625, 1.8291015625, 4.44921875, 7.0693359375, 9.689453125, 12.3095703125, 14.9296875, 17.5498046875, 20.169921875, 22.7900390625, 25.41015625, 28.0302734375, 30.650390625, 33.2705078125, 35.890625, 38.5107421875, 41.130859375, 43.7509765625, 46.37109375, 48.9912109375, 51.611328125, 54.2314453125, 56.8515625, 59.4716796875, 62.091796875, 64.7119140625, 67.33203125, 69.9521484375, 72.572265625, 75.1923828125, 77.8125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 3.0, 3.0, 7.0, 7.0, 10.0, 10.0, 12.0, 15.0, 17.0, 15.0, 22.0, 24.0, 40.0, 33.0, 28.0, 43.0, 46.0, 45.0, 51.0, 44.0, 42.0, 40.0, 50.0, 47.0, 42.0, 33.0, 40.0, 24.0, 24.0, 17.0, 24.0, 14.0, 26.0, 16.0, 18.0, 16.0, 7.0, 7.0, 10.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.90625, -53.15966796875, -51.4130859375, -49.66650390625, -47.919921875, -46.17333984375, -44.4267578125, -42.68017578125, -40.93359375, -39.18701171875, -37.4404296875, -35.69384765625, -33.947265625, -32.20068359375, -30.4541015625, -28.70751953125, -26.9609375, -25.21435546875, -23.4677734375, -21.72119140625, -19.974609375, -18.22802734375, -16.4814453125, -14.73486328125, -12.98828125, -11.24169921875, -9.4951171875, -7.74853515625, -6.001953125, -4.25537109375, -2.5087890625, -0.76220703125, 0.984375, 2.73095703125, 4.4775390625, 6.22412109375, 7.970703125, 9.71728515625, 11.4638671875, 13.21044921875, 14.95703125, 16.70361328125, 18.4501953125, 20.19677734375, 21.943359375, 23.68994140625, 25.4365234375, 27.18310546875, 28.9296875, 30.67626953125, 32.4228515625, 34.16943359375, 35.916015625, 37.66259765625, 39.4091796875, 41.15576171875, 42.90234375, 44.64892578125, 46.3955078125, 48.14208984375, 49.888671875, 51.63525390625, 53.3818359375, 55.12841796875, 56.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 16.0, 18.0, 24.0, 43.0, 54.0, 67.0, 101.0, 153.0, 213.0, 313.0, 429.0, 582.0, 797.0, 1205.0, 1765.0, 2599.0, 3822.0, 6030.0, 9499.0, 14855.0, 24829.0, 42357.0, 75776.0, 148133.0, 270766.0, 204209.0, 101660.0, 54464.0, 31501.0, 18802.0, 11559.0, 7316.0, 4664.0, 3089.0, 2060.0, 1444.0, 992.0, 687.0, 482.0, 335.0, 259.0, 171.0, 121.0, 95.0, 62.0, 41.0, 40.0, 22.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0], "bins": [-69.0, -66.8916015625, -64.783203125, -62.6748046875, -60.56640625, -58.4580078125, -56.349609375, -54.2412109375, -52.1328125, -50.0244140625, -47.916015625, -45.8076171875, -43.69921875, -41.5908203125, -39.482421875, -37.3740234375, -35.265625, -33.1572265625, -31.048828125, -28.9404296875, -26.83203125, -24.7236328125, -22.615234375, -20.5068359375, -18.3984375, -16.2900390625, -14.181640625, -12.0732421875, -9.96484375, -7.8564453125, -5.748046875, -3.6396484375, -1.53125, 0.5771484375, 2.685546875, 4.7939453125, 6.90234375, 9.0107421875, 11.119140625, 13.2275390625, 15.3359375, 17.4443359375, 19.552734375, 21.6611328125, 23.76953125, 25.8779296875, 27.986328125, 30.0947265625, 32.203125, 34.3115234375, 36.419921875, 38.5283203125, 40.63671875, 42.7451171875, 44.853515625, 46.9619140625, 49.0703125, 51.1787109375, 53.287109375, 55.3955078125, 57.50390625, 59.6123046875, 61.720703125, 63.8291015625, 65.9375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 1.0, 9.0, 3.0, 11.0, 17.0, 13.0, 15.0, 30.0, 21.0, 24.0, 20.0, 37.0, 34.0, 43.0, 38.0, 46.0, 32.0, 43.0, 51.0, 45.0, 42.0, 43.0, 39.0, 39.0, 35.0, 31.0, 27.0, 24.0, 26.0, 29.0, 23.0, 19.0, 13.0, 14.0, 7.0, 8.0, 8.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.296875, -30.258056640625, -29.21923828125, -28.180419921875, -27.1416015625, -26.102783203125, -25.06396484375, -24.025146484375, -22.986328125, -21.947509765625, -20.90869140625, -19.869873046875, -18.8310546875, -17.792236328125, -16.75341796875, -15.714599609375, -14.67578125, -13.636962890625, -12.59814453125, -11.559326171875, -10.5205078125, -9.481689453125, -8.44287109375, -7.404052734375, -6.365234375, -5.326416015625, -4.28759765625, -3.248779296875, -2.2099609375, -1.171142578125, -0.13232421875, 0.906494140625, 1.9453125, 2.984130859375, 4.02294921875, 5.061767578125, 6.1005859375, 7.139404296875, 8.17822265625, 9.217041015625, 10.255859375, 11.294677734375, 12.33349609375, 13.372314453125, 14.4111328125, 15.449951171875, 16.48876953125, 17.527587890625, 18.56640625, 19.605224609375, 20.64404296875, 21.682861328125, 22.7216796875, 23.760498046875, 24.79931640625, 25.838134765625, 26.876953125, 27.915771484375, 28.95458984375, 29.993408203125, 31.0322265625, 32.071044921875, 33.10986328125, 34.148681640625, 35.1875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 8.0, 13.0, 18.0, 27.0, 39.0, 75.0, 110.0, 142.0, 186.0, 289.0, 472.0, 644.0, 1091.0, 1557.0, 2546.0, 4299.0, 7424.0, 13200.0, 24625.0, 48574.0, 103069.0, 231129.0, 311932.0, 151716.0, 69418.0, 33698.0, 17848.0, 9842.0, 5394.0, 3314.0, 2096.0, 1295.0, 818.0, 551.0, 346.0, 242.0, 166.0, 111.0, 71.0, 49.0, 34.0, 24.0, 16.0, 12.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.953125, -22.2412109375, -21.529296875, -20.8173828125, -20.10546875, -19.3935546875, -18.681640625, -17.9697265625, -17.2578125, -16.5458984375, -15.833984375, -15.1220703125, -14.41015625, -13.6982421875, -12.986328125, -12.2744140625, -11.5625, -10.8505859375, -10.138671875, -9.4267578125, -8.71484375, -8.0029296875, -7.291015625, -6.5791015625, -5.8671875, -5.1552734375, -4.443359375, -3.7314453125, -3.01953125, -2.3076171875, -1.595703125, -0.8837890625, -0.171875, 0.5400390625, 1.251953125, 1.9638671875, 2.67578125, 3.3876953125, 4.099609375, 4.8115234375, 5.5234375, 6.2353515625, 6.947265625, 7.6591796875, 8.37109375, 9.0830078125, 9.794921875, 10.5068359375, 11.21875, 11.9306640625, 12.642578125, 13.3544921875, 14.06640625, 14.7783203125, 15.490234375, 16.2021484375, 16.9140625, 17.6259765625, 18.337890625, 19.0498046875, 19.76171875, 20.4736328125, 21.185546875, 21.8974609375, 22.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 2.0, 5.0, 7.0, 8.0, 13.0, 13.0, 17.0, 19.0, 23.0, 36.0, 66.0, 58.0, 92.0, 90.0, 126.0, 76.0, 61.0, 66.0, 52.0, 31.0, 19.0, 27.0, 19.0, 15.0, 11.0, 6.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002597808837890625, -0.0025197267532348633, -0.0024416446685791016, -0.00236356258392334, -0.002285480499267578, -0.0022073984146118164, -0.0021293163299560547, -0.002051234245300293, -0.0019731521606445312, -0.0018950700759887695, -0.0018169879913330078, -0.001738905906677246, -0.0016608238220214844, -0.0015827417373657227, -0.001504659652709961, -0.0014265775680541992, -0.0013484954833984375, -0.0012704133987426758, -0.001192331314086914, -0.0011142492294311523, -0.0010361671447753906, -0.0009580850601196289, -0.0008800029754638672, -0.0008019208908081055, -0.0007238388061523438, -0.000645756721496582, -0.0005676746368408203, -0.0004895925521850586, -0.0004115104675292969, -0.00033342838287353516, -0.00025534629821777344, -0.00017726421356201172, -9.918212890625e-05, -2.110004425048828e-05, 5.698204040527344e-05, 0.00013506412506103516, 0.00021314620971679688, 0.0002912282943725586, 0.0003693103790283203, 0.00044739246368408203, 0.0005254745483398438, 0.0006035566329956055, 0.0006816387176513672, 0.0007597208023071289, 0.0008378028869628906, 0.0009158849716186523, 0.000993967056274414, 0.0010720491409301758, 0.0011501312255859375, 0.0012282133102416992, 0.001306295394897461, 0.0013843774795532227, 0.0014624595642089844, 0.001540541648864746, 0.0016186237335205078, 0.0016967058181762695, 0.0017747879028320312, 0.001852869987487793, 0.0019309520721435547, 0.0020090341567993164, 0.002087116241455078, 0.00216519832611084, 0.0022432804107666016, 0.0023213624954223633, 0.002399444580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 6.0, 6.0, 4.0, 14.0, 15.0, 32.0, 32.0, 40.0, 48.0, 95.0, 90.0, 152.0, 222.0, 295.0, 413.0, 589.0, 933.0, 1524.0, 2370.0, 3967.0, 6747.0, 12311.0, 22781.0, 44619.0, 91834.0, 197118.0, 307393.0, 180473.0, 84442.0, 40751.0, 21095.0, 11157.0, 6588.0, 3805.0, 2301.0, 1464.0, 859.0, 584.0, 404.0, 272.0, 180.0, 153.0, 100.0, 67.0, 59.0, 48.0, 29.0, 25.0, 14.0, 10.0, 10.0, 5.0, 9.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-19.53125, -18.92919921875, -18.3271484375, -17.72509765625, -17.123046875, -16.52099609375, -15.9189453125, -15.31689453125, -14.71484375, -14.11279296875, -13.5107421875, -12.90869140625, -12.306640625, -11.70458984375, -11.1025390625, -10.50048828125, -9.8984375, -9.29638671875, -8.6943359375, -8.09228515625, -7.490234375, -6.88818359375, -6.2861328125, -5.68408203125, -5.08203125, -4.47998046875, -3.8779296875, -3.27587890625, -2.673828125, -2.07177734375, -1.4697265625, -0.86767578125, -0.265625, 0.33642578125, 0.9384765625, 1.54052734375, 2.142578125, 2.74462890625, 3.3466796875, 3.94873046875, 4.55078125, 5.15283203125, 5.7548828125, 6.35693359375, 6.958984375, 7.56103515625, 8.1630859375, 8.76513671875, 9.3671875, 9.96923828125, 10.5712890625, 11.17333984375, 11.775390625, 12.37744140625, 12.9794921875, 13.58154296875, 14.18359375, 14.78564453125, 15.3876953125, 15.98974609375, 16.591796875, 17.19384765625, 17.7958984375, 18.39794921875, 19.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 11.0, 9.0, 11.0, 16.0, 20.0, 30.0, 29.0, 34.0, 43.0, 47.0, 70.0, 76.0, 84.0, 70.0, 73.0, 82.0, 59.0, 58.0, 37.0, 27.0, 23.0, 16.0, 14.0, 19.0, 12.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6640625, -6.45135498046875, -6.2386474609375, -6.02593994140625, -5.813232421875, -5.60052490234375, -5.3878173828125, -5.17510986328125, -4.96240234375, -4.74969482421875, -4.5369873046875, -4.32427978515625, -4.111572265625, -3.89886474609375, -3.6861572265625, -3.47344970703125, -3.2607421875, -3.04803466796875, -2.8353271484375, -2.62261962890625, -2.409912109375, -2.19720458984375, -1.9844970703125, -1.77178955078125, -1.55908203125, -1.34637451171875, -1.1336669921875, -0.92095947265625, -0.708251953125, -0.49554443359375, -0.2828369140625, -0.07012939453125, 0.142578125, 0.35528564453125, 0.5679931640625, 0.78070068359375, 0.993408203125, 1.20611572265625, 1.4188232421875, 1.63153076171875, 1.84423828125, 2.05694580078125, 2.2696533203125, 2.48236083984375, 2.695068359375, 2.90777587890625, 3.1204833984375, 3.33319091796875, 3.5458984375, 3.75860595703125, 3.9713134765625, 4.18402099609375, 4.396728515625, 4.60943603515625, 4.8221435546875, 5.03485107421875, 5.24755859375, 5.46026611328125, 5.6729736328125, 5.88568115234375, 6.098388671875, 6.31109619140625, 6.5238037109375, 6.73651123046875, 6.94921875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 5.0, 8.0, 9.0, 13.0, 13.0, 18.0, 24.0, 50.0, 40.0, 78.0, 103.0, 115.0, 109.0, 104.0, 85.0, 58.0, 40.0, 26.0, 31.0, 24.0, 14.0, 12.0, 11.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.49870300292969, -74.7408676147461, -71.9830322265625, -69.2251968383789, -66.46736145019531, -63.70952224731445, -60.951683044433594, -58.19384765625, -55.436012268066406, -52.67817687988281, -49.92034149169922, -47.16250228881836, -44.404666900634766, -41.64683151245117, -38.88899230957031, -36.13115692138672, -33.373321533203125, -30.61548614501953, -27.857648849487305, -25.099811553955078, -22.341976165771484, -19.58414077758789, -16.826303482055664, -14.068466186523438, -11.310630798339844, -8.552794456481934, -5.794958114624023, -3.0371217727661133, -0.2792854309082031, 2.478550910949707, 5.236387252807617, 7.994224548339844, 10.752067565917969, 13.509903907775879, 16.26774024963379, 19.025577545166016, 21.78341293334961, 24.541248321533203, 27.29908561706543, 30.056922912597656, 32.81475830078125, 35.572593688964844, 38.33042907714844, 41.0882682800293, 43.84610366821289, 46.603939056396484, 49.361778259277344, 52.11961364746094, 54.87744903564453, 57.635284423828125, 60.39311981201172, 63.15095901489258, 65.90879821777344, 68.66663360595703, 71.42446899414062, 74.18230438232422, 76.94013977050781, 79.6979751586914, 82.455810546875, 85.2136459350586, 87.97148132324219, 90.72932434082031, 93.4871597290039, 96.2449951171875, 99.0028305053711]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 8.0, 6.0, 6.0, 6.0, 11.0, 10.0, 18.0, 14.0, 13.0, 15.0, 16.0, 25.0, 23.0, 34.0, 44.0, 42.0, 30.0, 42.0, 45.0, 42.0, 45.0, 45.0, 36.0, 43.0, 39.0, 35.0, 34.0, 28.0, 32.0, 24.0, 27.0, 17.0, 22.0, 21.0, 20.0, 15.0, 11.0, 11.0, 6.0, 3.0, 9.0, 7.0, 3.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-53.536766052246094, -51.87102127075195, -50.20528030395508, -48.53953552246094, -46.87379455566406, -45.20804977416992, -43.54230499267578, -41.876564025878906, -40.21082305908203, -38.54507827758789, -36.879337310791016, -35.213592529296875, -33.5478515625, -31.88210678100586, -30.21636390686035, -28.550621032714844, -26.884876251220703, -25.219133377075195, -23.553390502929688, -21.887645721435547, -20.221904754638672, -18.55615997314453, -16.890417098999023, -15.224674224853516, -13.558931350708008, -11.8931884765625, -10.227445602416992, -8.561701774597168, -6.89595890045166, -5.230216026306152, -3.564472198486328, -1.8987293243408203, -0.23298263549804688, 1.43276047706604, 3.098503589630127, 4.764246940612793, 6.429989814758301, 8.095732688903809, 9.761476516723633, 11.42721939086914, 13.092962265014648, 14.758705139160156, 16.424448013305664, 18.090190887451172, 19.755935668945312, 21.421676635742188, 23.087421417236328, 24.753164291381836, 26.418907165527344, 28.08465003967285, 29.75039291381836, 31.4161376953125, 33.081878662109375, 34.747623443603516, 36.413368225097656, 38.07910919189453, 39.744850158691406, 41.41059494018555, 43.07633590698242, 44.74208068847656, 46.40782165527344, 48.07356643676758, 49.73931121826172, 51.405052185058594, 53.070796966552734]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 11.0, 5.0, 15.0, 29.0, 23.0, 35.0, 70.0, 87.0, 119.0, 151.0, 236.0, 289.0, 440.0, 629.0, 904.0, 1241.0, 1882.0, 2686.0, 3940.0, 6084.0, 9984.0, 17171.0, 38349.0, 119400.0, 459895.0, 1670667.0, 1357458.0, 343094.0, 85731.0, 30357.0, 15307.0, 8928.0, 5921.0, 3915.0, 2643.0, 1902.0, 1328.0, 987.0, 663.0, 474.0, 342.0, 251.0, 183.0, 127.0, 98.0, 65.0, 47.0, 41.0, 24.0, 16.0, 12.0, 7.0, 6.0, 4.0, 6.0, 4.0], "bins": [-79.9375, -77.5791015625, -75.220703125, -72.8623046875, -70.50390625, -68.1455078125, -65.787109375, -63.4287109375, -61.0703125, -58.7119140625, -56.353515625, -53.9951171875, -51.63671875, -49.2783203125, -46.919921875, -44.5615234375, -42.203125, -39.8447265625, -37.486328125, -35.1279296875, -32.76953125, -30.4111328125, -28.052734375, -25.6943359375, -23.3359375, -20.9775390625, -18.619140625, -16.2607421875, -13.90234375, -11.5439453125, -9.185546875, -6.8271484375, -4.46875, -2.1103515625, 0.248046875, 2.6064453125, 4.96484375, 7.3232421875, 9.681640625, 12.0400390625, 14.3984375, 16.7568359375, 19.115234375, 21.4736328125, 23.83203125, 26.1904296875, 28.548828125, 30.9072265625, 33.265625, 35.6240234375, 37.982421875, 40.3408203125, 42.69921875, 45.0576171875, 47.416015625, 49.7744140625, 52.1328125, 54.4912109375, 56.849609375, 59.2080078125, 61.56640625, 63.9248046875, 66.283203125, 68.6416015625, 71.0]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 8.0, 8.0, 5.0, 8.0, 7.0, 15.0, 13.0, 12.0, 17.0, 15.0, 27.0, 22.0, 23.0, 51.0, 34.0, 46.0, 33.0, 47.0, 38.0, 49.0, 52.0, 44.0, 39.0, 48.0, 41.0, 30.0, 33.0, 39.0, 25.0, 21.0, 17.0, 19.0, 18.0, 16.0, 15.0, 12.0, 10.0, 7.0, 6.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-48.25, -46.75732421875, -45.2646484375, -43.77197265625, -42.279296875, -40.78662109375, -39.2939453125, -37.80126953125, -36.30859375, -34.81591796875, -33.3232421875, -31.83056640625, -30.337890625, -28.84521484375, -27.3525390625, -25.85986328125, -24.3671875, -22.87451171875, -21.3818359375, -19.88916015625, -18.396484375, -16.90380859375, -15.4111328125, -13.91845703125, -12.42578125, -10.93310546875, -9.4404296875, -7.94775390625, -6.455078125, -4.96240234375, -3.4697265625, -1.97705078125, -0.484375, 1.00830078125, 2.5009765625, 3.99365234375, 5.486328125, 6.97900390625, 8.4716796875, 9.96435546875, 11.45703125, 12.94970703125, 14.4423828125, 15.93505859375, 17.427734375, 18.92041015625, 20.4130859375, 21.90576171875, 23.3984375, 24.89111328125, 26.3837890625, 27.87646484375, 29.369140625, 30.86181640625, 32.3544921875, 33.84716796875, 35.33984375, 36.83251953125, 38.3251953125, 39.81787109375, 41.310546875, 42.80322265625, 44.2958984375, 45.78857421875, 47.28125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 17.0, 22.0, 31.0, 26.0, 35.0, 81.0, 99.0, 158.0, 254.0, 341.0, 547.0, 834.0, 1227.0, 2133.0, 3408.0, 5598.0, 9726.0, 18011.0, 36415.0, 86317.0, 293724.0, 2051764.0, 1328752.0, 215736.0, 70236.0, 30996.0, 15668.0, 8924.0, 4976.0, 2950.0, 1865.0, 1169.0, 737.0, 471.0, 341.0, 208.0, 144.0, 114.0, 92.0, 38.0, 36.0, 21.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.4375, -100.1943359375, -96.951171875, -93.7080078125, -90.46484375, -87.2216796875, -83.978515625, -80.7353515625, -77.4921875, -74.2490234375, -71.005859375, -67.7626953125, -64.51953125, -61.2763671875, -58.033203125, -54.7900390625, -51.546875, -48.3037109375, -45.060546875, -41.8173828125, -38.57421875, -35.3310546875, -32.087890625, -28.8447265625, -25.6015625, -22.3583984375, -19.115234375, -15.8720703125, -12.62890625, -9.3857421875, -6.142578125, -2.8994140625, 0.34375, 3.5869140625, 6.830078125, 10.0732421875, 13.31640625, 16.5595703125, 19.802734375, 23.0458984375, 26.2890625, 29.5322265625, 32.775390625, 36.0185546875, 39.26171875, 42.5048828125, 45.748046875, 48.9912109375, 52.234375, 55.4775390625, 58.720703125, 61.9638671875, 65.20703125, 68.4501953125, 71.693359375, 74.9365234375, 78.1796875, 81.4228515625, 84.666015625, 87.9091796875, 91.15234375, 94.3955078125, 97.638671875, 100.8818359375, 104.125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 9.0, 5.0, 14.0, 10.0, 15.0, 23.0, 19.0, 29.0, 45.0, 48.0, 65.0, 97.0, 118.0, 200.0, 311.0, 477.0, 681.0, 593.0, 437.0, 251.0, 176.0, 83.0, 84.0, 56.0, 56.0, 32.0, 36.0, 27.0, 12.0, 10.0, 8.0, 12.0, 7.0, 8.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.9375, -25.037353515625, -24.13720703125, -23.237060546875, -22.3369140625, -21.436767578125, -20.53662109375, -19.636474609375, -18.736328125, -17.836181640625, -16.93603515625, -16.035888671875, -15.1357421875, -14.235595703125, -13.33544921875, -12.435302734375, -11.53515625, -10.635009765625, -9.73486328125, -8.834716796875, -7.9345703125, -7.034423828125, -6.13427734375, -5.234130859375, -4.333984375, -3.433837890625, -2.53369140625, -1.633544921875, -0.7333984375, 0.166748046875, 1.06689453125, 1.967041015625, 2.8671875, 3.767333984375, 4.66748046875, 5.567626953125, 6.4677734375, 7.367919921875, 8.26806640625, 9.168212890625, 10.068359375, 10.968505859375, 11.86865234375, 12.768798828125, 13.6689453125, 14.569091796875, 15.46923828125, 16.369384765625, 17.26953125, 18.169677734375, 19.06982421875, 19.969970703125, 20.8701171875, 21.770263671875, 22.67041015625, 23.570556640625, 24.470703125, 25.370849609375, 26.27099609375, 27.171142578125, 28.0712890625, 28.971435546875, 29.87158203125, 30.771728515625, 31.671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 11.0, 16.0, 21.0, 29.0, 38.0, 58.0, 47.0, 78.0, 72.0, 105.0, 88.0, 106.0, 63.0, 47.0, 46.0, 36.0, 22.0, 18.0, 15.0, 7.0, 9.0, 7.0, 6.0, 11.0, 4.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.113773345947266, -49.06436538696289, -47.014957427978516, -44.96554946899414, -42.9161376953125, -40.866729736328125, -38.81732177734375, -36.767913818359375, -34.718505859375, -32.669097900390625, -30.61968994140625, -28.570280075073242, -26.520872116088867, -24.471464157104492, -22.422054290771484, -20.37264633178711, -18.323238372802734, -16.27383041381836, -14.224421501159668, -12.175012588500977, -10.125604629516602, -8.076196670532227, -6.026787757873535, -3.9773788452148438, -1.9279708862304688, 0.12143754959106445, 2.1708459854125977, 4.220254421234131, 6.269662857055664, 8.319070816040039, 10.36847972869873, 12.417888641357422, 14.467292785644531, 16.516700744628906, 18.56610870361328, 20.61551856994629, 22.664926528930664, 24.71433448791504, 26.763744354248047, 28.813152313232422, 30.862560272216797, 32.91196823120117, 34.96137619018555, 37.01078414916992, 39.06019592285156, 41.10960388183594, 43.15901184082031, 45.20841979980469, 47.25782775878906, 49.30723571777344, 51.35664367675781, 53.40605163574219, 55.45545959472656, 57.50486755371094, 59.55427932739258, 61.60368728637695, 63.65309524536133, 65.70250701904297, 67.75191497802734, 69.80132293701172, 71.8507308959961, 73.90013885498047, 75.94954681396484, 77.99895477294922, 80.0483627319336]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 7.0, 7.0, 10.0, 12.0, 11.0, 14.0, 13.0, 15.0, 18.0, 25.0, 32.0, 22.0, 25.0, 30.0, 41.0, 39.0, 48.0, 28.0, 41.0, 37.0, 38.0, 35.0, 41.0, 48.0, 46.0, 36.0, 23.0, 28.0, 22.0, 28.0, 25.0, 25.0, 15.0, 21.0, 9.0, 13.0, 12.0, 11.0, 4.0, 4.0, 8.0, 5.0, 5.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-46.545711517333984, -45.09880447387695, -43.65189743041992, -42.204986572265625, -40.758079528808594, -39.31117248535156, -37.86426544189453, -36.4173583984375, -34.97045135498047, -33.52354431152344, -32.076637268066406, -30.629728317260742, -29.18282127380371, -27.735912322998047, -26.289005279541016, -24.842098236083984, -23.39518928527832, -21.94828224182129, -20.501373291015625, -19.054466247558594, -17.607559204101562, -16.16065216064453, -14.713743209838867, -13.266836166381836, -11.819928169250488, -10.37302017211914, -8.92611312866211, -7.479205131530762, -6.032297611236572, -4.585390090942383, -3.138482093811035, -1.691575050354004, -0.24466705322265625, 1.2022405862808228, 2.6491482257843018, 4.09605598449707, 5.54296350479126, 6.989871025085449, 8.436779022216797, 9.883686065673828, 11.330594062805176, 12.777502059936523, 14.224409103393555, 15.671317100524902, 17.11822509765625, 18.56513214111328, 20.012039184570312, 21.458946228027344, 22.905855178833008, 24.35276222229004, 25.799671173095703, 27.246578216552734, 28.693485260009766, 30.140392303466797, 31.58730125427246, 33.034210205078125, 34.481117248535156, 35.92802429199219, 37.37493133544922, 38.82183837890625, 40.26874923706055, 41.71565628051758, 43.16256332397461, 44.60947036743164, 46.05637741088867]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 21.0, 25.0, 38.0, 64.0, 103.0, 146.0, 224.0, 267.0, 438.0, 598.0, 873.0, 1366.0, 1955.0, 3010.0, 4458.0, 6704.0, 10614.0, 16668.0, 27408.0, 48098.0, 89532.0, 181472.0, 286326.0, 167579.0, 83517.0, 45485.0, 26361.0, 15884.0, 9951.0, 6469.0, 4164.0, 2863.0, 1889.0, 1273.0, 882.0, 566.0, 427.0, 258.0, 159.0, 137.0, 95.0, 63.0, 42.0, 22.0, 21.0, 10.0, 12.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.34375, -29.34716796875, -28.3505859375, -27.35400390625, -26.357421875, -25.36083984375, -24.3642578125, -23.36767578125, -22.37109375, -21.37451171875, -20.3779296875, -19.38134765625, -18.384765625, -17.38818359375, -16.3916015625, -15.39501953125, -14.3984375, -13.40185546875, -12.4052734375, -11.40869140625, -10.412109375, -9.41552734375, -8.4189453125, -7.42236328125, -6.42578125, -5.42919921875, -4.4326171875, -3.43603515625, -2.439453125, -1.44287109375, -0.4462890625, 0.55029296875, 1.546875, 2.54345703125, 3.5400390625, 4.53662109375, 5.533203125, 6.52978515625, 7.5263671875, 8.52294921875, 9.51953125, 10.51611328125, 11.5126953125, 12.50927734375, 13.505859375, 14.50244140625, 15.4990234375, 16.49560546875, 17.4921875, 18.48876953125, 19.4853515625, 20.48193359375, 21.478515625, 22.47509765625, 23.4716796875, 24.46826171875, 25.46484375, 26.46142578125, 27.4580078125, 28.45458984375, 29.451171875, 30.44775390625, 31.4443359375, 32.44091796875, 33.4375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 3.0, 7.0, 8.0, 10.0, 14.0, 14.0, 16.0, 14.0, 26.0, 20.0, 22.0, 31.0, 22.0, 34.0, 33.0, 41.0, 48.0, 39.0, 42.0, 41.0, 51.0, 51.0, 52.0, 45.0, 28.0, 38.0, 20.0, 32.0, 19.0, 24.0, 23.0, 15.0, 21.0, 19.0, 4.0, 9.0, 11.0, 12.0, 0.0, 7.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-50.15625, -48.62353515625, -47.0908203125, -45.55810546875, -44.025390625, -42.49267578125, -40.9599609375, -39.42724609375, -37.89453125, -36.36181640625, -34.8291015625, -33.29638671875, -31.763671875, -30.23095703125, -28.6982421875, -27.16552734375, -25.6328125, -24.10009765625, -22.5673828125, -21.03466796875, -19.501953125, -17.96923828125, -16.4365234375, -14.90380859375, -13.37109375, -11.83837890625, -10.3056640625, -8.77294921875, -7.240234375, -5.70751953125, -4.1748046875, -2.64208984375, -1.109375, 0.42333984375, 1.9560546875, 3.48876953125, 5.021484375, 6.55419921875, 8.0869140625, 9.61962890625, 11.15234375, 12.68505859375, 14.2177734375, 15.75048828125, 17.283203125, 18.81591796875, 20.3486328125, 21.88134765625, 23.4140625, 24.94677734375, 26.4794921875, 28.01220703125, 29.544921875, 31.07763671875, 32.6103515625, 34.14306640625, 35.67578125, 37.20849609375, 38.7412109375, 40.27392578125, 41.806640625, 43.33935546875, 44.8720703125, 46.40478515625, 47.9375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 12.0, 6.0, 8.0, 12.0, 26.0, 36.0, 47.0, 47.0, 75.0, 92.0, 156.0, 224.0, 310.0, 439.0, 660.0, 979.0, 1412.0, 2182.0, 3259.0, 5399.0, 8749.0, 15760.0, 40602.0, 598207.0, 302423.0, 31726.0, 13823.0, 7839.0, 4822.0, 3073.0, 2022.0, 1310.0, 914.0, 596.0, 385.0, 276.0, 188.0, 152.0, 93.0, 60.0, 53.0, 32.0, 17.0, 9.0, 20.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.23291015625, -45.6533203125, -44.07373046875, -42.494140625, -40.91455078125, -39.3349609375, -37.75537109375, -36.17578125, -34.59619140625, -33.0166015625, -31.43701171875, -29.857421875, -28.27783203125, -26.6982421875, -25.11865234375, -23.5390625, -21.95947265625, -20.3798828125, -18.80029296875, -17.220703125, -15.64111328125, -14.0615234375, -12.48193359375, -10.90234375, -9.32275390625, -7.7431640625, -6.16357421875, -4.583984375, -3.00439453125, -1.4248046875, 0.15478515625, 1.734375, 3.31396484375, 4.8935546875, 6.47314453125, 8.052734375, 9.63232421875, 11.2119140625, 12.79150390625, 14.37109375, 15.95068359375, 17.5302734375, 19.10986328125, 20.689453125, 22.26904296875, 23.8486328125, 25.42822265625, 27.0078125, 28.58740234375, 30.1669921875, 31.74658203125, 33.326171875, 34.90576171875, 36.4853515625, 38.06494140625, 39.64453125, 41.22412109375, 42.8037109375, 44.38330078125, 45.962890625, 47.54248046875, 49.1220703125, 50.70166015625, 52.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 0.0, 6.0, 8.0, 9.0, 14.0, 7.0, 24.0, 17.0, 17.0, 13.0, 20.0, 24.0, 29.0, 29.0, 27.0, 37.0, 36.0, 24.0, 36.0, 39.0, 43.0, 41.0, 46.0, 43.0, 39.0, 37.0, 33.0, 29.0, 37.0, 30.0, 18.0, 24.0, 19.0, 18.0, 18.0, 11.0, 21.0, 14.0, 8.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-36.34375, -35.21142578125, -34.0791015625, -32.94677734375, -31.814453125, -30.68212890625, -29.5498046875, -28.41748046875, -27.28515625, -26.15283203125, -25.0205078125, -23.88818359375, -22.755859375, -21.62353515625, -20.4912109375, -19.35888671875, -18.2265625, -17.09423828125, -15.9619140625, -14.82958984375, -13.697265625, -12.56494140625, -11.4326171875, -10.30029296875, -9.16796875, -8.03564453125, -6.9033203125, -5.77099609375, -4.638671875, -3.50634765625, -2.3740234375, -1.24169921875, -0.109375, 1.02294921875, 2.1552734375, 3.28759765625, 4.419921875, 5.55224609375, 6.6845703125, 7.81689453125, 8.94921875, 10.08154296875, 11.2138671875, 12.34619140625, 13.478515625, 14.61083984375, 15.7431640625, 16.87548828125, 18.0078125, 19.14013671875, 20.2724609375, 21.40478515625, 22.537109375, 23.66943359375, 24.8017578125, 25.93408203125, 27.06640625, 28.19873046875, 29.3310546875, 30.46337890625, 31.595703125, 32.72802734375, 33.8603515625, 34.99267578125, 36.125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 10.0, 10.0, 13.0, 19.0, 45.0, 59.0, 76.0, 139.0, 207.0, 344.0, 510.0, 883.0, 1723.0, 3089.0, 6628.0, 17092.0, 90258.0, 847303.0, 54581.0, 13704.0, 5571.0, 2687.0, 1476.0, 801.0, 480.0, 291.0, 170.0, 114.0, 91.0, 52.0, 41.0, 24.0, 15.0, 15.0, 8.0, 5.0, 3.0, 9.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9453125, -3.830596923828125, -3.71588134765625, -3.601165771484375, -3.4864501953125, -3.371734619140625, -3.25701904296875, -3.142303466796875, -3.027587890625, -2.912872314453125, -2.79815673828125, -2.683441162109375, -2.5687255859375, -2.454010009765625, -2.33929443359375, -2.224578857421875, -2.10986328125, -1.995147705078125, -1.88043212890625, -1.765716552734375, -1.6510009765625, -1.536285400390625, -1.42156982421875, -1.306854248046875, -1.192138671875, -1.077423095703125, -0.96270751953125, -0.847991943359375, -0.7332763671875, -0.618560791015625, -0.50384521484375, -0.389129638671875, -0.2744140625, -0.159698486328125, -0.04498291015625, 0.069732666015625, 0.1844482421875, 0.299163818359375, 0.41387939453125, 0.528594970703125, 0.643310546875, 0.758026123046875, 0.87274169921875, 0.987457275390625, 1.1021728515625, 1.216888427734375, 1.33160400390625, 1.446319580078125, 1.56103515625, 1.675750732421875, 1.79046630859375, 1.905181884765625, 2.0198974609375, 2.134613037109375, 2.24932861328125, 2.364044189453125, 2.478759765625, 2.593475341796875, 2.70819091796875, 2.822906494140625, 2.9376220703125, 3.052337646484375, 3.16705322265625, 3.281768798828125, 3.396484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 4.0, 15.0, 22.0, 23.0, 44.0, 47.0, 83.0, 135.0, 184.0, 119.0, 72.0, 52.0, 32.0, 41.0, 26.0, 3.0, 11.0, 10.0, 15.0, 4.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001567840576171875, -0.001516297459602356, -0.001464754343032837, -0.0014132112264633179, -0.0013616681098937988, -0.0013101249933242798, -0.0012585818767547607, -0.0012070387601852417, -0.0011554956436157227, -0.0011039525270462036, -0.0010524094104766846, -0.0010008662939071655, -0.0009493231773376465, -0.0008977800607681274, -0.0008462369441986084, -0.0007946938276290894, -0.0007431507110595703, -0.0006916075944900513, -0.0006400644779205322, -0.0005885213613510132, -0.0005369782447814941, -0.0004854351282119751, -0.00043389201164245605, -0.000382348895072937, -0.00033080577850341797, -0.0002792626619338989, -0.00022771954536437988, -0.00017617642879486084, -0.0001246333122253418, -7.309019565582275e-05, -2.154707908630371e-05, 2.9996037483215332e-05, 8.153915405273438e-05, 0.00013308227062225342, 0.00018462538719177246, 0.0002361685037612915, 0.00028771162033081055, 0.0003392547369003296, 0.00039079785346984863, 0.0004423409700393677, 0.0004938840866088867, 0.0005454272031784058, 0.0005969703197479248, 0.0006485134363174438, 0.0007000565528869629, 0.0007515996694564819, 0.000803142786026001, 0.00085468590259552, 0.0009062290191650391, 0.0009577721357345581, 0.0010093152523040771, 0.0010608583688735962, 0.0011124014854431152, 0.0011639446020126343, 0.0012154877185821533, 0.0012670308351516724, 0.0013185739517211914, 0.0013701170682907104, 0.0014216601848602295, 0.0014732033014297485, 0.0015247464179992676, 0.0015762895345687866, 0.0016278326511383057, 0.0016793757677078247, 0.0017309188842773438]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 11.0, 13.0, 24.0, 33.0, 62.0, 90.0, 147.0, 217.0, 324.0, 485.0, 737.0, 1085.0, 1663.0, 2684.0, 4147.0, 7056.0, 12425.0, 22024.0, 43134.0, 94126.0, 241105.0, 342000.0, 143488.0, 61374.0, 30199.0, 16103.0, 9192.0, 5347.0, 3325.0, 2090.0, 1294.0, 844.0, 553.0, 393.0, 268.0, 178.0, 122.0, 79.0, 46.0, 23.0, 11.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.951171875, -1.8957977294921875, -1.840423583984375, -1.7850494384765625, -1.72967529296875, -1.6743011474609375, -1.618927001953125, -1.5635528564453125, -1.5081787109375, -1.4528045654296875, -1.397430419921875, -1.3420562744140625, -1.28668212890625, -1.2313079833984375, -1.175933837890625, -1.1205596923828125, -1.065185546875, -1.0098114013671875, -0.954437255859375, -0.8990631103515625, -0.84368896484375, -0.7883148193359375, -0.732940673828125, -0.6775665283203125, -0.6221923828125, -0.5668182373046875, -0.511444091796875, -0.4560699462890625, -0.40069580078125, -0.3453216552734375, -0.289947509765625, -0.2345733642578125, -0.17919921875, -0.1238250732421875, -0.068450927734375, -0.0130767822265625, 0.04229736328125, 0.0976715087890625, 0.153045654296875, 0.2084197998046875, 0.2637939453125, 0.3191680908203125, 0.374542236328125, 0.4299163818359375, 0.48529052734375, 0.5406646728515625, 0.596038818359375, 0.6514129638671875, 0.706787109375, 0.7621612548828125, 0.817535400390625, 0.8729095458984375, 0.92828369140625, 0.9836578369140625, 1.039031982421875, 1.0944061279296875, 1.1497802734375, 1.2051544189453125, 1.260528564453125, 1.3159027099609375, 1.37127685546875, 1.4266510009765625, 1.482025146484375, 1.5373992919921875, 1.5927734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 9.0, 9.0, 11.0, 14.0, 17.0, 25.0, 29.0, 21.0, 32.0, 26.0, 55.0, 69.0, 64.0, 77.0, 67.0, 76.0, 62.0, 60.0, 41.0, 55.0, 28.0, 28.0, 17.0, 14.0, 11.0, 11.0, 7.0, 8.0, 7.0, 5.0, 2.0, 7.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470703125, -0.4547576904296875, -0.438812255859375, -0.4228668212890625, -0.40692138671875, -0.3909759521484375, -0.375030517578125, -0.3590850830078125, -0.3431396484375, -0.3271942138671875, -0.311248779296875, -0.2953033447265625, -0.27935791015625, -0.2634124755859375, -0.247467041015625, -0.2315216064453125, -0.215576171875, -0.1996307373046875, -0.183685302734375, -0.1677398681640625, -0.15179443359375, -0.1358489990234375, -0.119903564453125, -0.1039581298828125, -0.0880126953125, -0.0720672607421875, -0.056121826171875, -0.0401763916015625, -0.02423095703125, -0.0082855224609375, 0.007659912109375, 0.0236053466796875, 0.03955078125, 0.0554962158203125, 0.071441650390625, 0.0873870849609375, 0.10333251953125, 0.1192779541015625, 0.135223388671875, 0.1511688232421875, 0.1671142578125, 0.1830596923828125, 0.199005126953125, 0.2149505615234375, 0.23089599609375, 0.2468414306640625, 0.262786865234375, 0.2787322998046875, 0.294677734375, 0.3106231689453125, 0.326568603515625, 0.3425140380859375, 0.35845947265625, 0.3744049072265625, 0.390350341796875, 0.4062957763671875, 0.4222412109375, 0.4381866455078125, 0.454132080078125, 0.4700775146484375, 0.48602294921875, 0.5019683837890625, 0.517913818359375, 0.5338592529296875, 0.5498046875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 6.0, 16.0, 13.0, 17.0, 25.0, 41.0, 43.0, 53.0, 49.0, 71.0, 85.0, 101.0, 85.0, 85.0, 77.0, 47.0, 41.0, 19.0, 20.0, 21.0, 12.0, 11.0, 7.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.05890655517578, -47.134620666503906, -45.21033477783203, -43.286048889160156, -41.361759185791016, -39.43747329711914, -37.513187408447266, -35.58890151977539, -33.66461181640625, -31.740325927734375, -29.816038131713867, -27.891752243041992, -25.967464447021484, -24.04317855834961, -22.118892669677734, -20.19460678100586, -18.270320892333984, -16.34603500366211, -14.421747207641602, -12.497461318969727, -10.573174476623535, -8.648887634277344, -6.724601745605469, -4.800314903259277, -2.876028060913086, -0.9517414569854736, 0.9725451469421387, 2.896831512451172, 4.821118354797363, 6.745405197143555, 8.66969108581543, 10.593977928161621, 12.518264770507812, 14.442551612854004, 16.366838455200195, 18.29112434387207, 20.215412139892578, 22.139698028564453, 24.063983917236328, 25.988269805908203, 27.91255760192871, 29.836843490600586, 31.761131286621094, 33.68541717529297, 35.609703063964844, 37.53398895263672, 39.458274841308594, 41.382564544677734, 43.30685043334961, 45.231136322021484, 47.15542221069336, 49.0797119140625, 51.003997802734375, 52.92828369140625, 54.852569580078125, 56.77685546875, 58.701141357421875, 60.62542724609375, 62.549713134765625, 64.4739990234375, 66.39828491210938, 68.32257080078125, 70.24685668945312, 72.17115020751953, 74.0954360961914]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 9.0, 9.0, 11.0, 14.0, 15.0, 9.0, 16.0, 19.0, 25.0, 32.0, 24.0, 22.0, 32.0, 45.0, 35.0, 50.0, 27.0, 38.0, 35.0, 49.0, 33.0, 39.0, 50.0, 42.0, 32.0, 25.0, 31.0, 21.0, 31.0, 23.0, 22.0, 17.0, 18.0, 10.0, 14.0, 10.0, 13.0, 2.0, 7.0, 5.0, 6.0, 4.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-45.38300323486328, -43.97460174560547, -42.56620407104492, -41.15780258178711, -39.74940490722656, -38.34100341796875, -36.93260192871094, -35.52420425415039, -34.115806579589844, -32.70740509033203, -31.299007415771484, -29.890605926513672, -28.482208251953125, -27.073806762695312, -25.665407180786133, -24.257007598876953, -22.84860610961914, -21.44020652770996, -20.03180694580078, -18.62340545654297, -17.215007781982422, -15.806607246398926, -14.39820671081543, -12.98980712890625, -11.58140754699707, -10.17300796508789, -8.764608383178711, -7.356207847595215, -5.947808265686035, -4.5394086837768555, -3.1310081481933594, -1.7226085662841797, -0.314208984375, 1.0941908359527588, 2.5025906562805176, 3.9109907150268555, 5.319390296936035, 6.727789878845215, 8.136190414428711, 9.54458999633789, 10.95298957824707, 12.36138916015625, 13.76978874206543, 15.178189277648926, 16.586589813232422, 17.99498748779297, 19.40338897705078, 20.81178855895996, 22.22018814086914, 23.62858772277832, 25.0369873046875, 26.445388793945312, 27.85378646850586, 29.262187957763672, 30.67058753967285, 32.07898712158203, 33.487388610839844, 34.895790100097656, 36.3041877746582, 37.712589263916016, 39.12098693847656, 40.529388427734375, 41.93778991699219, 43.346187591552734, 44.75458526611328]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 14.0, 22.0, 23.0, 29.0, 49.0, 73.0, 121.0, 161.0, 257.0, 369.0, 520.0, 763.0, 1171.0, 1785.0, 2876.0, 4437.0, 7131.0, 11923.0, 20813.0, 38368.0, 76848.0, 169996.0, 314269.0, 202439.0, 90743.0, 44412.0, 23646.0, 13419.0, 7987.0, 4952.0, 3019.0, 1987.0, 1273.0, 868.0, 551.0, 408.0, 240.0, 172.0, 128.0, 87.0, 61.0, 43.0, 30.0, 18.0, 20.0, 9.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -63.609375, -61.53125, -59.453125, -57.375, -55.296875, -53.21875, -51.140625, -49.0625, -46.984375, -44.90625, -42.828125, -40.75, -38.671875, -36.59375, -34.515625, -32.4375, -30.359375, -28.28125, -26.203125, -24.125, -22.046875, -19.96875, -17.890625, -15.8125, -13.734375, -11.65625, -9.578125, -7.5, -5.421875, -3.34375, -1.265625, 0.8125, 2.890625, 4.96875, 7.046875, 9.125, 11.203125, 13.28125, 15.359375, 17.4375, 19.515625, 21.59375, 23.671875, 25.75, 27.828125, 29.90625, 31.984375, 34.0625, 36.140625, 38.21875, 40.296875, 42.375, 44.453125, 46.53125, 48.609375, 50.6875, 52.765625, 54.84375, 56.921875, 59.0, 61.078125, 63.15625, 65.234375, 67.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 5.0, 6.0, 8.0, 9.0, 14.0, 14.0, 12.0, 15.0, 13.0, 30.0, 29.0, 19.0, 25.0, 40.0, 40.0, 41.0, 48.0, 38.0, 34.0, 50.0, 43.0, 45.0, 39.0, 60.0, 37.0, 40.0, 22.0, 27.0, 26.0, 21.0, 20.0, 19.0, 16.0, 17.0, 15.0, 7.0, 7.0, 7.0, 3.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-47.90625, -46.44677734375, -44.9873046875, -43.52783203125, -42.068359375, -40.60888671875, -39.1494140625, -37.68994140625, -36.23046875, -34.77099609375, -33.3115234375, -31.85205078125, -30.392578125, -28.93310546875, -27.4736328125, -26.01416015625, -24.5546875, -23.09521484375, -21.6357421875, -20.17626953125, -18.716796875, -17.25732421875, -15.7978515625, -14.33837890625, -12.87890625, -11.41943359375, -9.9599609375, -8.50048828125, -7.041015625, -5.58154296875, -4.1220703125, -2.66259765625, -1.203125, 0.25634765625, 1.7158203125, 3.17529296875, 4.634765625, 6.09423828125, 7.5537109375, 9.01318359375, 10.47265625, 11.93212890625, 13.3916015625, 14.85107421875, 16.310546875, 17.77001953125, 19.2294921875, 20.68896484375, 22.1484375, 23.60791015625, 25.0673828125, 26.52685546875, 27.986328125, 29.44580078125, 30.9052734375, 32.36474609375, 33.82421875, 35.28369140625, 36.7431640625, 38.20263671875, 39.662109375, 41.12158203125, 42.5810546875, 44.04052734375, 45.5]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 19.0, 31.0, 38.0, 60.0, 82.0, 144.0, 215.0, 302.0, 436.0, 628.0, 1019.0, 1491.0, 2362.0, 3954.0, 6219.0, 10073.0, 17239.0, 29389.0, 53034.0, 98802.0, 194391.0, 270292.0, 163985.0, 84473.0, 45533.0, 25556.0, 14862.0, 8885.0, 5315.0, 3459.0, 2128.0, 1378.0, 931.0, 629.0, 405.0, 264.0, 190.0, 101.0, 83.0, 44.0, 25.0, 29.0, 19.0, 12.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-64.0625, -62.0205078125, -59.978515625, -57.9365234375, -55.89453125, -53.8525390625, -51.810546875, -49.7685546875, -47.7265625, -45.6845703125, -43.642578125, -41.6005859375, -39.55859375, -37.5166015625, -35.474609375, -33.4326171875, -31.390625, -29.3486328125, -27.306640625, -25.2646484375, -23.22265625, -21.1806640625, -19.138671875, -17.0966796875, -15.0546875, -13.0126953125, -10.970703125, -8.9287109375, -6.88671875, -4.8447265625, -2.802734375, -0.7607421875, 1.28125, 3.3232421875, 5.365234375, 7.4072265625, 9.44921875, 11.4912109375, 13.533203125, 15.5751953125, 17.6171875, 19.6591796875, 21.701171875, 23.7431640625, 25.78515625, 27.8271484375, 29.869140625, 31.9111328125, 33.953125, 35.9951171875, 38.037109375, 40.0791015625, 42.12109375, 44.1630859375, 46.205078125, 48.2470703125, 50.2890625, 52.3310546875, 54.373046875, 56.4150390625, 58.45703125, 60.4990234375, 62.541015625, 64.5830078125, 66.625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 4.0, 9.0, 9.0, 10.0, 10.0, 19.0, 16.0, 25.0, 21.0, 38.0, 32.0, 36.0, 34.0, 28.0, 47.0, 41.0, 47.0, 34.0, 44.0, 52.0, 45.0, 29.0, 40.0, 40.0, 33.0, 37.0, 35.0, 24.0, 26.0, 27.0, 16.0, 17.0, 12.0, 9.0, 8.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.90625, -29.94970703125, -28.9931640625, -28.03662109375, -27.080078125, -26.12353515625, -25.1669921875, -24.21044921875, -23.25390625, -22.29736328125, -21.3408203125, -20.38427734375, -19.427734375, -18.47119140625, -17.5146484375, -16.55810546875, -15.6015625, -14.64501953125, -13.6884765625, -12.73193359375, -11.775390625, -10.81884765625, -9.8623046875, -8.90576171875, -7.94921875, -6.99267578125, -6.0361328125, -5.07958984375, -4.123046875, -3.16650390625, -2.2099609375, -1.25341796875, -0.296875, 0.65966796875, 1.6162109375, 2.57275390625, 3.529296875, 4.48583984375, 5.4423828125, 6.39892578125, 7.35546875, 8.31201171875, 9.2685546875, 10.22509765625, 11.181640625, 12.13818359375, 13.0947265625, 14.05126953125, 15.0078125, 15.96435546875, 16.9208984375, 17.87744140625, 18.833984375, 19.79052734375, 20.7470703125, 21.70361328125, 22.66015625, 23.61669921875, 24.5732421875, 25.52978515625, 26.486328125, 27.44287109375, 28.3994140625, 29.35595703125, 30.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 6.0, 5.0, 6.0, 18.0, 26.0, 25.0, 57.0, 94.0, 122.0, 183.0, 276.0, 541.0, 851.0, 1485.0, 2746.0, 5031.0, 9630.0, 19718.0, 45165.0, 116411.0, 338007.0, 318268.0, 108346.0, 42627.0, 18830.0, 9125.0, 4763.0, 2507.0, 1455.0, 843.0, 542.0, 311.0, 207.0, 106.0, 81.0, 50.0, 36.0, 24.0, 15.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.62255859375, -27.6982421875, -26.77392578125, -25.849609375, -24.92529296875, -24.0009765625, -23.07666015625, -22.15234375, -21.22802734375, -20.3037109375, -19.37939453125, -18.455078125, -17.53076171875, -16.6064453125, -15.68212890625, -14.7578125, -13.83349609375, -12.9091796875, -11.98486328125, -11.060546875, -10.13623046875, -9.2119140625, -8.28759765625, -7.36328125, -6.43896484375, -5.5146484375, -4.59033203125, -3.666015625, -2.74169921875, -1.8173828125, -0.89306640625, 0.03125, 0.95556640625, 1.8798828125, 2.80419921875, 3.728515625, 4.65283203125, 5.5771484375, 6.50146484375, 7.42578125, 8.35009765625, 9.2744140625, 10.19873046875, 11.123046875, 12.04736328125, 12.9716796875, 13.89599609375, 14.8203125, 15.74462890625, 16.6689453125, 17.59326171875, 18.517578125, 19.44189453125, 20.3662109375, 21.29052734375, 22.21484375, 23.13916015625, 24.0634765625, 24.98779296875, 25.912109375, 26.83642578125, 27.7607421875, 28.68505859375, 29.609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 1.0, 10.0, 12.0, 7.0, 12.0, 15.0, 19.0, 22.0, 33.0, 53.0, 60.0, 106.0, 125.0, 114.0, 105.0, 81.0, 52.0, 52.0, 37.0, 16.0, 14.0, 5.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028018951416015625, -0.0027174949645996094, -0.0026330947875976562, -0.002548694610595703, -0.00246429443359375, -0.002379894256591797, -0.0022954940795898438, -0.0022110939025878906, -0.0021266937255859375, -0.0020422935485839844, -0.0019578933715820312, -0.0018734931945800781, -0.001789093017578125, -0.0017046928405761719, -0.0016202926635742188, -0.0015358924865722656, -0.0014514923095703125, -0.0013670921325683594, -0.0012826919555664062, -0.0011982917785644531, -0.0011138916015625, -0.0010294914245605469, -0.0009450912475585938, -0.0008606910705566406, -0.0007762908935546875, -0.0006918907165527344, -0.0006074905395507812, -0.0005230903625488281, -0.000438690185546875, -0.0003542900085449219, -0.00026988983154296875, -0.00018548965454101562, -0.0001010894775390625, -1.6689300537109375e-05, 6.771087646484375e-05, 0.00015211105346679688, 0.00023651123046875, 0.0003209114074707031, 0.00040531158447265625, 0.0004897117614746094, 0.0005741119384765625, 0.0006585121154785156, 0.0007429122924804688, 0.0008273124694824219, 0.000911712646484375, 0.0009961128234863281, 0.0010805130004882812, 0.0011649131774902344, 0.0012493133544921875, 0.0013337135314941406, 0.0014181137084960938, 0.0015025138854980469, 0.0015869140625, 0.0016713142395019531, 0.0017557144165039062, 0.0018401145935058594, 0.0019245147705078125, 0.0020089149475097656, 0.0020933151245117188, 0.002177715301513672, 0.002262115478515625, 0.002346515655517578, 0.0024309158325195312, 0.0025153160095214844, 0.0025997161865234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 10.0, 20.0, 25.0, 22.0, 32.0, 54.0, 73.0, 110.0, 180.0, 255.0, 391.0, 585.0, 909.0, 1467.0, 2336.0, 3798.0, 6491.0, 11101.0, 19807.0, 37407.0, 74294.0, 157066.0, 287984.0, 223804.0, 105806.0, 51425.0, 26989.0, 14645.0, 8559.0, 4814.0, 2953.0, 1865.0, 1163.0, 701.0, 463.0, 285.0, 219.0, 145.0, 101.0, 65.0, 41.0, 36.0, 18.0, 13.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0], "bins": [-21.28125, -20.668701171875, -20.05615234375, -19.443603515625, -18.8310546875, -18.218505859375, -17.60595703125, -16.993408203125, -16.380859375, -15.768310546875, -15.15576171875, -14.543212890625, -13.9306640625, -13.318115234375, -12.70556640625, -12.093017578125, -11.48046875, -10.867919921875, -10.25537109375, -9.642822265625, -9.0302734375, -8.417724609375, -7.80517578125, -7.192626953125, -6.580078125, -5.967529296875, -5.35498046875, -4.742431640625, -4.1298828125, -3.517333984375, -2.90478515625, -2.292236328125, -1.6796875, -1.067138671875, -0.45458984375, 0.157958984375, 0.7705078125, 1.383056640625, 1.99560546875, 2.608154296875, 3.220703125, 3.833251953125, 4.44580078125, 5.058349609375, 5.6708984375, 6.283447265625, 6.89599609375, 7.508544921875, 8.12109375, 8.733642578125, 9.34619140625, 9.958740234375, 10.5712890625, 11.183837890625, 11.79638671875, 12.408935546875, 13.021484375, 13.634033203125, 14.24658203125, 14.859130859375, 15.4716796875, 16.084228515625, 16.69677734375, 17.309326171875, 17.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 9.0, 12.0, 19.0, 19.0, 41.0, 23.0, 37.0, 49.0, 39.0, 50.0, 56.0, 69.0, 74.0, 62.0, 60.0, 58.0, 47.0, 51.0, 35.0, 26.0, 35.0, 23.0, 21.0, 18.0, 9.0, 14.0, 10.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.0164794921875, -5.810302734375, -5.6041259765625, -5.39794921875, -5.1917724609375, -4.985595703125, -4.7794189453125, -4.5732421875, -4.3670654296875, -4.160888671875, -3.9547119140625, -3.74853515625, -3.5423583984375, -3.336181640625, -3.1300048828125, -2.923828125, -2.7176513671875, -2.511474609375, -2.3052978515625, -2.09912109375, -1.8929443359375, -1.686767578125, -1.4805908203125, -1.2744140625, -1.0682373046875, -0.862060546875, -0.6558837890625, -0.44970703125, -0.2435302734375, -0.037353515625, 0.1688232421875, 0.375, 0.5811767578125, 0.787353515625, 0.9935302734375, 1.19970703125, 1.4058837890625, 1.612060546875, 1.8182373046875, 2.0244140625, 2.2305908203125, 2.436767578125, 2.6429443359375, 2.84912109375, 3.0552978515625, 3.261474609375, 3.4676513671875, 3.673828125, 3.8800048828125, 4.086181640625, 4.2923583984375, 4.49853515625, 4.7047119140625, 4.910888671875, 5.1170654296875, 5.3232421875, 5.5294189453125, 5.735595703125, 5.9417724609375, 6.14794921875, 6.3541259765625, 6.560302734375, 6.7664794921875, 6.97265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 13.0, 14.0, 19.0, 23.0, 31.0, 30.0, 43.0, 47.0, 70.0, 61.0, 76.0, 80.0, 80.0, 78.0, 66.0, 48.0, 46.0, 34.0, 20.0, 18.0, 22.0, 12.0, 10.0, 9.0, 2.0, 5.0, 6.0, 7.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.28619384765625, -44.47490310668945, -42.663612365722656, -40.85232162475586, -39.04103088378906, -37.229740142822266, -35.41844940185547, -33.60715866088867, -31.795867919921875, -29.984577178955078, -28.17328643798828, -26.361995697021484, -24.550704956054688, -22.73941421508789, -20.928123474121094, -19.116832733154297, -17.305543899536133, -15.494253158569336, -13.682962417602539, -11.871671676635742, -10.060380935668945, -8.249091148376465, -6.437800407409668, -4.626509666442871, -2.815218925476074, -1.003928303718567, 0.8073623180389404, 2.618652820587158, 4.429943561553955, 6.241233825683594, 8.05252456665039, 9.863815307617188, 11.675106048583984, 13.486396789550781, 15.297687530517578, 17.108978271484375, 18.920269012451172, 20.73155975341797, 22.542850494384766, 24.354141235351562, 26.16543197631836, 27.976722717285156, 29.788013458251953, 31.59930419921875, 33.41059494018555, 35.221885681152344, 37.03317642211914, 38.84446716308594, 40.65575408935547, 42.467044830322266, 44.27833557128906, 46.08962631225586, 47.900917053222656, 49.71220779418945, 51.52349853515625, 53.33478927612305, 55.146080017089844, 56.95737075805664, 58.76866149902344, 60.579952239990234, 62.39124298095703, 64.20252990722656, 66.01382446289062, 67.82511138916016, 69.63640594482422]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 4.0, 10.0, 11.0, 12.0, 14.0, 22.0, 16.0, 21.0, 24.0, 23.0, 22.0, 26.0, 31.0, 38.0, 41.0, 37.0, 31.0, 33.0, 47.0, 30.0, 50.0, 28.0, 41.0, 50.0, 36.0, 38.0, 32.0, 31.0, 21.0, 20.0, 25.0, 17.0, 19.0, 11.0, 7.0, 18.0, 9.0, 6.0, 11.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-45.57964324951172, -44.09043502807617, -42.601226806640625, -41.11201858520508, -39.62281036376953, -38.133602142333984, -36.64439392089844, -35.15518569946289, -33.665977478027344, -32.1767692565918, -30.68756103515625, -29.198352813720703, -27.709144592285156, -26.21993637084961, -24.730728149414062, -23.241519927978516, -21.75231170654297, -20.263103485107422, -18.773895263671875, -17.284687042236328, -15.795478820800781, -14.306270599365234, -12.817062377929688, -11.32785415649414, -9.838645935058594, -8.349437713623047, -6.8602294921875, -5.371021270751953, -3.8818130493164062, -2.3926048278808594, -0.9033966064453125, 0.5858116149902344, 2.0750198364257812, 3.564228057861328, 5.053436279296875, 6.542644500732422, 8.031852722167969, 9.521060943603516, 11.010269165039062, 12.49947738647461, 13.988685607910156, 15.477893829345703, 16.96710205078125, 18.456310272216797, 19.945518493652344, 21.43472671508789, 22.923934936523438, 24.413143157958984, 25.90235137939453, 27.391559600830078, 28.880767822265625, 30.369976043701172, 31.85918426513672, 33.348392486572266, 34.83760070800781, 36.32680892944336, 37.816017150878906, 39.30522537231445, 40.79443359375, 42.28364181518555, 43.772850036621094, 45.26205825805664, 46.75126647949219, 48.240474700927734, 49.72968292236328]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 9.0, 16.0, 22.0, 29.0, 45.0, 53.0, 84.0, 96.0, 172.0, 284.0, 414.0, 585.0, 897.0, 1299.0, 2154.0, 3219.0, 5348.0, 9672.0, 19459.0, 54626.0, 259882.0, 1364810.0, 1924529.0, 418698.0, 76868.0, 23226.0, 10986.0, 6048.0, 3631.0, 2318.0, 1558.0, 1061.0, 670.0, 467.0, 300.0, 232.0, 172.0, 103.0, 70.0, 46.0, 34.0, 27.0, 24.0, 11.0, 4.0, 13.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-82.875, -80.3740234375, -77.873046875, -75.3720703125, -72.87109375, -70.3701171875, -67.869140625, -65.3681640625, -62.8671875, -60.3662109375, -57.865234375, -55.3642578125, -52.86328125, -50.3623046875, -47.861328125, -45.3603515625, -42.859375, -40.3583984375, -37.857421875, -35.3564453125, -32.85546875, -30.3544921875, -27.853515625, -25.3525390625, -22.8515625, -20.3505859375, -17.849609375, -15.3486328125, -12.84765625, -10.3466796875, -7.845703125, -5.3447265625, -2.84375, -0.3427734375, 2.158203125, 4.6591796875, 7.16015625, 9.6611328125, 12.162109375, 14.6630859375, 17.1640625, 19.6650390625, 22.166015625, 24.6669921875, 27.16796875, 29.6689453125, 32.169921875, 34.6708984375, 37.171875, 39.6728515625, 42.173828125, 44.6748046875, 47.17578125, 49.6767578125, 52.177734375, 54.6787109375, 57.1796875, 59.6806640625, 62.181640625, 64.6826171875, 67.18359375, 69.6845703125, 72.185546875, 74.6865234375, 77.1875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 13.0, 20.0, 14.0, 9.0, 23.0, 23.0, 18.0, 19.0, 18.0, 28.0, 46.0, 29.0, 32.0, 43.0, 31.0, 50.0, 46.0, 28.0, 41.0, 51.0, 40.0, 49.0, 32.0, 37.0, 29.0, 35.0, 26.0, 19.0, 20.0, 14.0, 14.0, 12.0, 7.0, 14.0, 7.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.4296875, -35.140625, -33.8515625, -32.5625, -31.2734375, -29.984375, -28.6953125, -27.40625, -26.1171875, -24.828125, -23.5390625, -22.25, -20.9609375, -19.671875, -18.3828125, -17.09375, -15.8046875, -14.515625, -13.2265625, -11.9375, -10.6484375, -9.359375, -8.0703125, -6.78125, -5.4921875, -4.203125, -2.9140625, -1.625, -0.3359375, 0.953125, 2.2421875, 3.53125, 4.8203125, 6.109375, 7.3984375, 8.6875, 9.9765625, 11.265625, 12.5546875, 13.84375, 15.1328125, 16.421875, 17.7109375, 19.0, 20.2890625, 21.578125, 22.8671875, 24.15625, 25.4453125, 26.734375, 28.0234375, 29.3125, 30.6015625, 31.890625, 33.1796875, 34.46875, 35.7578125, 37.046875, 38.3359375, 39.625, 40.9140625, 42.203125, 43.4921875, 44.78125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 13.0, 13.0, 20.0, 32.0, 29.0, 53.0, 80.0, 109.0, 139.0, 247.0, 319.0, 528.0, 723.0, 1200.0, 1995.0, 3363.0, 5920.0, 11272.0, 23008.0, 53835.0, 158527.0, 787917.0, 2525035.0, 431163.0, 108627.0, 40480.0, 18090.0, 9063.0, 4876.0, 2872.0, 1669.0, 1021.0, 655.0, 425.0, 303.0, 197.0, 123.0, 104.0, 76.0, 31.0, 39.0, 21.0, 16.0, 9.0, 13.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-92.0, -88.9677734375, -85.935546875, -82.9033203125, -79.87109375, -76.8388671875, -73.806640625, -70.7744140625, -67.7421875, -64.7099609375, -61.677734375, -58.6455078125, -55.61328125, -52.5810546875, -49.548828125, -46.5166015625, -43.484375, -40.4521484375, -37.419921875, -34.3876953125, -31.35546875, -28.3232421875, -25.291015625, -22.2587890625, -19.2265625, -16.1943359375, -13.162109375, -10.1298828125, -7.09765625, -4.0654296875, -1.033203125, 1.9990234375, 5.03125, 8.0634765625, 11.095703125, 14.1279296875, 17.16015625, 20.1923828125, 23.224609375, 26.2568359375, 29.2890625, 32.3212890625, 35.353515625, 38.3857421875, 41.41796875, 44.4501953125, 47.482421875, 50.5146484375, 53.546875, 56.5791015625, 59.611328125, 62.6435546875, 65.67578125, 68.7080078125, 71.740234375, 74.7724609375, 77.8046875, 80.8369140625, 83.869140625, 86.9013671875, 89.93359375, 92.9658203125, 95.998046875, 99.0302734375, 102.0625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 8.0, 13.0, 11.0, 13.0, 21.0, 32.0, 58.0, 50.0, 89.0, 111.0, 185.0, 293.0, 470.0, 688.0, 672.0, 457.0, 269.0, 161.0, 139.0, 81.0, 66.0, 48.0, 34.0, 19.0, 20.0, 10.0, 14.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.3935546875, -19.505859375, -18.6181640625, -17.73046875, -16.8427734375, -15.955078125, -15.0673828125, -14.1796875, -13.2919921875, -12.404296875, -11.5166015625, -10.62890625, -9.7412109375, -8.853515625, -7.9658203125, -7.078125, -6.1904296875, -5.302734375, -4.4150390625, -3.52734375, -2.6396484375, -1.751953125, -0.8642578125, 0.0234375, 0.9111328125, 1.798828125, 2.6865234375, 3.57421875, 4.4619140625, 5.349609375, 6.2373046875, 7.125, 8.0126953125, 8.900390625, 9.7880859375, 10.67578125, 11.5634765625, 12.451171875, 13.3388671875, 14.2265625, 15.1142578125, 16.001953125, 16.8896484375, 17.77734375, 18.6650390625, 19.552734375, 20.4404296875, 21.328125, 22.2158203125, 23.103515625, 23.9912109375, 24.87890625, 25.7666015625, 26.654296875, 27.5419921875, 28.4296875, 29.3173828125, 30.205078125, 31.0927734375, 31.98046875, 32.8681640625, 33.755859375, 34.6435546875, 35.53125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 4.0, 14.0, 12.0, 16.0, 24.0, 25.0, 35.0, 41.0, 49.0, 69.0, 82.0, 94.0, 82.0, 80.0, 70.0, 70.0, 34.0, 34.0, 44.0, 16.0, 11.0, 21.0, 12.0, 8.0, 9.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.37342071533203, -52.585872650146484, -50.7983283996582, -49.010780334472656, -47.223236083984375, -45.43568801879883, -43.64813995361328, -41.860595703125, -40.07304763793945, -38.285499572753906, -36.497955322265625, -34.71040725708008, -32.9228630065918, -31.13531494140625, -29.347768783569336, -27.560222625732422, -25.772676467895508, -23.985130310058594, -22.19758415222168, -20.410037994384766, -18.62248992919922, -16.834943771362305, -15.04739761352539, -13.25985050201416, -11.472304344177246, -9.684758186340332, -7.897211074829102, -6.1096649169921875, -4.322118282318115, -2.534571647644043, -0.7470254898071289, 1.0405216217041016, 2.8280677795410156, 4.615614414215088, 6.40316104888916, 8.190707206726074, 9.978254318237305, 11.765800476074219, 13.553346633911133, 15.340893745422363, 17.128440856933594, 18.915987014770508, 20.703533172607422, 22.49108123779297, 24.278627395629883, 26.066173553466797, 27.85371971130371, 29.641265869140625, 31.42881202697754, 33.21635818481445, 35.00390625, 36.79145050048828, 38.57899856567383, 40.366546630859375, 42.154090881347656, 43.9416389465332, 45.729183197021484, 47.51673126220703, 49.30427551269531, 51.09182357788086, 52.87936782836914, 54.66691589355469, 56.45446014404297, 58.242008209228516, 60.02955627441406]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 8.0, 3.0, 2.0, 5.0, 12.0, 16.0, 8.0, 12.0, 18.0, 14.0, 37.0, 30.0, 26.0, 28.0, 29.0, 38.0, 40.0, 39.0, 43.0, 44.0, 48.0, 53.0, 37.0, 50.0, 50.0, 32.0, 34.0, 29.0, 32.0, 23.0, 29.0, 26.0, 16.0, 20.0, 15.0, 11.0, 10.0, 13.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.65070724487305, -41.14067459106445, -39.630645751953125, -38.12061309814453, -36.6105842590332, -35.10055160522461, -33.59052276611328, -32.08049011230469, -30.570457458496094, -29.060426712036133, -27.550395965576172, -26.040363311767578, -24.530332565307617, -23.020301818847656, -21.510271072387695, -20.000240325927734, -18.490209579467773, -16.980178833007812, -15.470147132873535, -13.960116386413574, -12.450084686279297, -10.940053939819336, -9.430023193359375, -7.919991493225098, -6.409960746765137, -4.899929523468018, -3.3898985385894775, -1.8798675537109375, -0.36983633041381836, 1.1401948928833008, 2.6502256393432617, 4.160257339477539, 5.6702880859375, 7.180319309234619, 8.690350532531738, 10.2003812789917, 11.710412979125977, 13.220443725585938, 14.730474472045898, 16.24050521850586, 17.750537872314453, 19.260568618774414, 20.770599365234375, 22.28063201904297, 23.79066276550293, 25.30069351196289, 26.81072425842285, 28.320755004882812, 29.830785751342773, 31.340816497802734, 32.85084915161133, 34.360877990722656, 35.87091064453125, 37.380943298339844, 38.89097213745117, 40.401004791259766, 41.911033630371094, 43.42106628417969, 44.931095123291016, 46.44112777709961, 47.95115661621094, 49.46118927001953, 50.971221923828125, 52.48125076293945, 53.99128341674805]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 27.0, 28.0, 54.0, 66.0, 72.0, 134.0, 194.0, 286.0, 390.0, 541.0, 725.0, 1064.0, 1450.0, 2105.0, 3069.0, 4193.0, 5958.0, 8662.0, 12837.0, 19312.0, 29646.0, 46993.0, 77466.0, 132686.0, 215853.0, 187610.0, 111730.0, 65657.0, 40066.0, 25483.0, 16950.0, 11420.0, 7660.0, 5381.0, 3735.0, 2707.0, 1896.0, 1288.0, 893.0, 708.0, 459.0, 340.0, 217.0, 163.0, 124.0, 83.0, 54.0, 41.0, 28.0, 11.0, 11.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-18.25, -17.6767578125, -17.103515625, -16.5302734375, -15.95703125, -15.3837890625, -14.810546875, -14.2373046875, -13.6640625, -13.0908203125, -12.517578125, -11.9443359375, -11.37109375, -10.7978515625, -10.224609375, -9.6513671875, -9.078125, -8.5048828125, -7.931640625, -7.3583984375, -6.78515625, -6.2119140625, -5.638671875, -5.0654296875, -4.4921875, -3.9189453125, -3.345703125, -2.7724609375, -2.19921875, -1.6259765625, -1.052734375, -0.4794921875, 0.09375, 0.6669921875, 1.240234375, 1.8134765625, 2.38671875, 2.9599609375, 3.533203125, 4.1064453125, 4.6796875, 5.2529296875, 5.826171875, 6.3994140625, 6.97265625, 7.5458984375, 8.119140625, 8.6923828125, 9.265625, 9.8388671875, 10.412109375, 10.9853515625, 11.55859375, 12.1318359375, 12.705078125, 13.2783203125, 13.8515625, 14.4248046875, 14.998046875, 15.5712890625, 16.14453125, 16.7177734375, 17.291015625, 17.8642578125, 18.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 14.0, 18.0, 13.0, 10.0, 21.0, 25.0, 29.0, 26.0, 23.0, 28.0, 43.0, 36.0, 46.0, 52.0, 39.0, 46.0, 44.0, 42.0, 48.0, 45.0, 34.0, 30.0, 31.0, 29.0, 23.0, 29.0, 28.0, 21.0, 19.0, 9.0, 22.0, 7.0, 10.0, 7.0, 10.0, 2.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.8125, -40.3369140625, -38.861328125, -37.3857421875, -35.91015625, -34.4345703125, -32.958984375, -31.4833984375, -30.0078125, -28.5322265625, -27.056640625, -25.5810546875, -24.10546875, -22.6298828125, -21.154296875, -19.6787109375, -18.203125, -16.7275390625, -15.251953125, -13.7763671875, -12.30078125, -10.8251953125, -9.349609375, -7.8740234375, -6.3984375, -4.9228515625, -3.447265625, -1.9716796875, -0.49609375, 0.9794921875, 2.455078125, 3.9306640625, 5.40625, 6.8818359375, 8.357421875, 9.8330078125, 11.30859375, 12.7841796875, 14.259765625, 15.7353515625, 17.2109375, 18.6865234375, 20.162109375, 21.6376953125, 23.11328125, 24.5888671875, 26.064453125, 27.5400390625, 29.015625, 30.4912109375, 31.966796875, 33.4423828125, 34.91796875, 36.3935546875, 37.869140625, 39.3447265625, 40.8203125, 42.2958984375, 43.771484375, 45.2470703125, 46.72265625, 48.1982421875, 49.673828125, 51.1494140625, 52.625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 13.0, 18.0, 34.0, 25.0, 44.0, 60.0, 82.0, 112.0, 154.0, 222.0, 313.0, 436.0, 663.0, 952.0, 1460.0, 2140.0, 3464.0, 5492.0, 9665.0, 19171.0, 60702.0, 760320.0, 127792.0, 25056.0, 11909.0, 6716.0, 4035.0, 2507.0, 1568.0, 1069.0, 688.0, 492.0, 343.0, 234.0, 161.0, 121.0, 101.0, 51.0, 52.0, 30.0, 22.0, 15.0, 11.0, 5.0, 14.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-42.5, -41.30810546875, -40.1162109375, -38.92431640625, -37.732421875, -36.54052734375, -35.3486328125, -34.15673828125, -32.96484375, -31.77294921875, -30.5810546875, -29.38916015625, -28.197265625, -27.00537109375, -25.8134765625, -24.62158203125, -23.4296875, -22.23779296875, -21.0458984375, -19.85400390625, -18.662109375, -17.47021484375, -16.2783203125, -15.08642578125, -13.89453125, -12.70263671875, -11.5107421875, -10.31884765625, -9.126953125, -7.93505859375, -6.7431640625, -5.55126953125, -4.359375, -3.16748046875, -1.9755859375, -0.78369140625, 0.408203125, 1.60009765625, 2.7919921875, 3.98388671875, 5.17578125, 6.36767578125, 7.5595703125, 8.75146484375, 9.943359375, 11.13525390625, 12.3271484375, 13.51904296875, 14.7109375, 15.90283203125, 17.0947265625, 18.28662109375, 19.478515625, 20.67041015625, 21.8623046875, 23.05419921875, 24.24609375, 25.43798828125, 26.6298828125, 27.82177734375, 29.013671875, 30.20556640625, 31.3974609375, 32.58935546875, 33.78125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 11.0, 11.0, 10.0, 10.0, 13.0, 13.0, 20.0, 23.0, 23.0, 23.0, 24.0, 25.0, 33.0, 27.0, 47.0, 38.0, 45.0, 42.0, 34.0, 38.0, 46.0, 39.0, 36.0, 41.0, 46.0, 27.0, 46.0, 26.0, 35.0, 20.0, 15.0, 18.0, 15.0, 10.0, 13.0, 3.0, 5.0, 9.0, 10.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-30.484375, -29.447021484375, -28.40966796875, -27.372314453125, -26.3349609375, -25.297607421875, -24.26025390625, -23.222900390625, -22.185546875, -21.148193359375, -20.11083984375, -19.073486328125, -18.0361328125, -16.998779296875, -15.96142578125, -14.924072265625, -13.88671875, -12.849365234375, -11.81201171875, -10.774658203125, -9.7373046875, -8.699951171875, -7.66259765625, -6.625244140625, -5.587890625, -4.550537109375, -3.51318359375, -2.475830078125, -1.4384765625, -0.401123046875, 0.63623046875, 1.673583984375, 2.7109375, 3.748291015625, 4.78564453125, 5.822998046875, 6.8603515625, 7.897705078125, 8.93505859375, 9.972412109375, 11.009765625, 12.047119140625, 13.08447265625, 14.121826171875, 15.1591796875, 16.196533203125, 17.23388671875, 18.271240234375, 19.30859375, 20.345947265625, 21.38330078125, 22.420654296875, 23.4580078125, 24.495361328125, 25.53271484375, 26.570068359375, 27.607421875, 28.644775390625, 29.68212890625, 30.719482421875, 31.7568359375, 32.794189453125, 33.83154296875, 34.868896484375, 35.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 21.0, 34.0, 45.0, 88.0, 178.0, 330.0, 596.0, 1518.0, 4573.0, 21986.0, 929529.0, 76471.0, 8848.0, 2417.0, 1007.0, 403.0, 204.0, 98.0, 59.0, 48.0, 27.0, 13.0, 8.0, 8.0, 7.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1796875, -6.9208984375, -6.662109375, -6.4033203125, -6.14453125, -5.8857421875, -5.626953125, -5.3681640625, -5.109375, -4.8505859375, -4.591796875, -4.3330078125, -4.07421875, -3.8154296875, -3.556640625, -3.2978515625, -3.0390625, -2.7802734375, -2.521484375, -2.2626953125, -2.00390625, -1.7451171875, -1.486328125, -1.2275390625, -0.96875, -0.7099609375, -0.451171875, -0.1923828125, 0.06640625, 0.3251953125, 0.583984375, 0.8427734375, 1.1015625, 1.3603515625, 1.619140625, 1.8779296875, 2.13671875, 2.3955078125, 2.654296875, 2.9130859375, 3.171875, 3.4306640625, 3.689453125, 3.9482421875, 4.20703125, 4.4658203125, 4.724609375, 4.9833984375, 5.2421875, 5.5009765625, 5.759765625, 6.0185546875, 6.27734375, 6.5361328125, 6.794921875, 7.0537109375, 7.3125, 7.5712890625, 7.830078125, 8.0888671875, 8.34765625, 8.6064453125, 8.865234375, 9.1240234375, 9.3828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 11.0, 25.0, 27.0, 36.0, 59.0, 77.0, 140.0, 147.0, 148.0, 89.0, 62.0, 44.0, 34.0, 17.0, 13.0, 11.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000743865966796875, -0.0007168799638748169, -0.0006898939609527588, -0.0006629079580307007, -0.0006359219551086426, -0.0006089359521865845, -0.0005819499492645264, -0.0005549639463424683, -0.0005279779434204102, -0.000500991940498352, -0.00047400593757629395, -0.00044701993465423584, -0.00042003393173217773, -0.00039304792881011963, -0.0003660619258880615, -0.0003390759229660034, -0.0003120899200439453, -0.0002851039171218872, -0.0002581179141998291, -0.000231131911277771, -0.0002041459083557129, -0.00017715990543365479, -0.00015017390251159668, -0.00012318789958953857, -9.620189666748047e-05, -6.921589374542236e-05, -4.222989082336426e-05, -1.5243887901306152e-05, 1.1742115020751953e-05, 3.872811794281006e-05, 6.571412086486816e-05, 9.270012378692627e-05, 0.00011968612670898438, 0.00014667212963104248, 0.00017365813255310059, 0.0002006441354751587, 0.0002276301383972168, 0.0002546161413192749, 0.000281602144241333, 0.0003085881471633911, 0.0003355741500854492, 0.0003625601530075073, 0.00038954615592956543, 0.00041653215885162354, 0.00044351816177368164, 0.00047050416469573975, 0.0004974901676177979, 0.000524476170539856, 0.0005514621734619141, 0.0005784481763839722, 0.0006054341793060303, 0.0006324201822280884, 0.0006594061851501465, 0.0006863921880722046, 0.0007133781909942627, 0.0007403641939163208, 0.0007673501968383789, 0.000794336199760437, 0.0008213222026824951, 0.0008483082056045532, 0.0008752942085266113, 0.0009022802114486694, 0.0009292662143707275, 0.0009562522172927856, 0.0009832382202148438]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 8.0, 22.0, 18.0, 36.0, 50.0, 55.0, 99.0, 144.0, 166.0, 258.0, 386.0, 587.0, 912.0, 1456.0, 2508.0, 4546.0, 9346.0, 22490.0, 69919.0, 330441.0, 457919.0, 95073.0, 28121.0, 11159.0, 5315.0, 2871.0, 1615.0, 1047.0, 636.0, 410.0, 275.0, 167.0, 136.0, 97.0, 69.0, 51.0, 27.0, 24.0, 18.0, 11.0, 15.0, 12.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.15625, -5.9583740234375, -5.760498046875, -5.5626220703125, -5.36474609375, -5.1668701171875, -4.968994140625, -4.7711181640625, -4.5732421875, -4.3753662109375, -4.177490234375, -3.9796142578125, -3.78173828125, -3.5838623046875, -3.385986328125, -3.1881103515625, -2.990234375, -2.7923583984375, -2.594482421875, -2.3966064453125, -2.19873046875, -2.0008544921875, -1.802978515625, -1.6051025390625, -1.4072265625, -1.2093505859375, -1.011474609375, -0.8135986328125, -0.61572265625, -0.4178466796875, -0.219970703125, -0.0220947265625, 0.17578125, 0.3736572265625, 0.571533203125, 0.7694091796875, 0.96728515625, 1.1651611328125, 1.363037109375, 1.5609130859375, 1.7587890625, 1.9566650390625, 2.154541015625, 2.3524169921875, 2.55029296875, 2.7481689453125, 2.946044921875, 3.1439208984375, 3.341796875, 3.5396728515625, 3.737548828125, 3.9354248046875, 4.13330078125, 4.3311767578125, 4.529052734375, 4.7269287109375, 4.9248046875, 5.1226806640625, 5.320556640625, 5.5184326171875, 5.71630859375, 5.9141845703125, 6.112060546875, 6.3099365234375, 6.5078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 9.0, 5.0, 11.0, 17.0, 25.0, 36.0, 53.0, 95.0, 116.0, 174.0, 144.0, 114.0, 52.0, 38.0, 20.0, 20.0, 19.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6865234375, -1.629425048828125, -1.57232666015625, -1.515228271484375, -1.4581298828125, -1.401031494140625, -1.34393310546875, -1.286834716796875, -1.229736328125, -1.172637939453125, -1.11553955078125, -1.058441162109375, -1.0013427734375, -0.944244384765625, -0.88714599609375, -0.830047607421875, -0.77294921875, -0.715850830078125, -0.65875244140625, -0.601654052734375, -0.5445556640625, -0.487457275390625, -0.43035888671875, -0.373260498046875, -0.316162109375, -0.259063720703125, -0.20196533203125, -0.144866943359375, -0.0877685546875, -0.030670166015625, 0.02642822265625, 0.083526611328125, 0.140625, 0.197723388671875, 0.25482177734375, 0.311920166015625, 0.3690185546875, 0.426116943359375, 0.48321533203125, 0.540313720703125, 0.597412109375, 0.654510498046875, 0.71160888671875, 0.768707275390625, 0.8258056640625, 0.882904052734375, 0.94000244140625, 0.997100830078125, 1.05419921875, 1.111297607421875, 1.16839599609375, 1.225494384765625, 1.2825927734375, 1.339691162109375, 1.39678955078125, 1.453887939453125, 1.510986328125, 1.568084716796875, 1.62518310546875, 1.682281494140625, 1.7393798828125, 1.796478271484375, 1.85357666015625, 1.910675048828125, 1.9677734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 3.0, 8.0, 11.0, 10.0, 7.0, 21.0, 19.0, 23.0, 43.0, 41.0, 61.0, 58.0, 84.0, 90.0, 85.0, 77.0, 77.0, 58.0, 40.0, 41.0, 33.0, 21.0, 17.0, 10.0, 11.0, 10.0, 10.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.22563552856445, -45.49348449707031, -43.76133346557617, -42.02918243408203, -40.297035217285156, -38.564884185791016, -36.832733154296875, -35.100582122802734, -33.368431091308594, -31.636280059814453, -29.904130935668945, -28.171979904174805, -26.439828872680664, -24.707679748535156, -22.975528717041016, -21.243377685546875, -19.511228561401367, -17.779077529907227, -16.04692840576172, -14.314777374267578, -12.582626342773438, -10.850476264953613, -9.118326187133789, -7.386175155639648, -5.654025077819824, -3.921874523162842, -2.1897242069244385, -0.45757389068603516, 1.2745766639709473, 3.0067272186279297, 4.738877296447754, 6.4710283279418945, 8.203178405761719, 9.935328483581543, 11.667479515075684, 13.399629592895508, 15.131780624389648, 16.863929748535156, 18.596080780029297, 20.328231811523438, 22.060382843017578, 23.79253387451172, 25.524682998657227, 27.256834030151367, 28.988985061645508, 30.721134185791016, 32.453285217285156, 34.1854362487793, 35.91758728027344, 37.64973831176758, 39.38188934326172, 41.114036560058594, 42.846187591552734, 44.578338623046875, 46.310489654541016, 48.042640686035156, 49.77478790283203, 51.50693893432617, 53.23908996582031, 54.97123718261719, 56.70338821411133, 58.43553924560547, 60.16769027709961, 61.89984130859375, 63.63199234008789]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 2.0, 4.0, 10.0, 17.0, 8.0, 12.0, 16.0, 13.0, 39.0, 28.0, 32.0, 25.0, 28.0, 36.0, 41.0, 42.0, 42.0, 46.0, 47.0, 50.0, 39.0, 51.0, 47.0, 33.0, 36.0, 29.0, 33.0, 24.0, 26.0, 26.0, 21.0, 19.0, 14.0, 9.0, 12.0, 11.0, 8.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.657379150390625, -40.182823181152344, -38.70826721191406, -37.23371505737305, -35.759159088134766, -34.284603118896484, -32.81005096435547, -31.335494995117188, -29.860939025878906, -28.386383056640625, -26.911828994750977, -25.437274932861328, -23.962718963623047, -22.488162994384766, -21.013608932495117, -19.53905487060547, -18.064498901367188, -16.589942932128906, -15.115388870239258, -13.640833854675293, -12.166278839111328, -10.691723823547363, -9.217168807983398, -7.742613792419434, -6.268058776855469, -4.793503761291504, -3.318948745727539, -1.8443937301635742, -0.3698387145996094, 1.1047163009643555, 2.5792713165283203, 4.053826332092285, 5.528385162353516, 7.0029401779174805, 8.477495193481445, 9.95205020904541, 11.426605224609375, 12.90116024017334, 14.375715255737305, 15.85027027130127, 17.324825286865234, 18.799381256103516, 20.273935317993164, 21.748489379882812, 23.223045349121094, 24.697601318359375, 26.172155380249023, 27.646709442138672, 29.121265411376953, 30.595821380615234, 32.07037353515625, 33.54492950439453, 35.01948547363281, 36.494041442871094, 37.968597412109375, 39.44314956665039, 40.91770553588867, 42.39226150512695, 43.86681365966797, 45.34136962890625, 46.81592559814453, 48.29048156738281, 49.765037536621094, 51.23958969116211, 52.71414566040039]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 16.0, 34.0, 19.0, 38.0, 64.0, 96.0, 150.0, 211.0, 330.0, 438.0, 719.0, 1004.0, 1617.0, 2487.0, 3842.0, 5950.0, 9954.0, 16658.0, 28735.0, 53169.0, 105241.0, 218391.0, 282525.0, 149215.0, 73524.0, 38526.0, 21692.0, 12624.0, 7650.0, 4796.0, 3107.0, 1872.0, 1276.0, 822.0, 568.0, 368.0, 263.0, 175.0, 113.0, 88.0, 54.0, 35.0, 28.0, 21.0, 16.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-56.0, -54.20751953125, -52.4150390625, -50.62255859375, -48.830078125, -47.03759765625, -45.2451171875, -43.45263671875, -41.66015625, -39.86767578125, -38.0751953125, -36.28271484375, -34.490234375, -32.69775390625, -30.9052734375, -29.11279296875, -27.3203125, -25.52783203125, -23.7353515625, -21.94287109375, -20.150390625, -18.35791015625, -16.5654296875, -14.77294921875, -12.98046875, -11.18798828125, -9.3955078125, -7.60302734375, -5.810546875, -4.01806640625, -2.2255859375, -0.43310546875, 1.359375, 3.15185546875, 4.9443359375, 6.73681640625, 8.529296875, 10.32177734375, 12.1142578125, 13.90673828125, 15.69921875, 17.49169921875, 19.2841796875, 21.07666015625, 22.869140625, 24.66162109375, 26.4541015625, 28.24658203125, 30.0390625, 31.83154296875, 33.6240234375, 35.41650390625, 37.208984375, 39.00146484375, 40.7939453125, 42.58642578125, 44.37890625, 46.17138671875, 47.9638671875, 49.75634765625, 51.548828125, 53.34130859375, 55.1337890625, 56.92626953125, 58.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 13.0, 7.0, 10.0, 14.0, 18.0, 27.0, 30.0, 24.0, 24.0, 32.0, 36.0, 40.0, 49.0, 45.0, 54.0, 53.0, 48.0, 55.0, 61.0, 50.0, 38.0, 31.0, 33.0, 26.0, 29.0, 25.0, 23.0, 19.0, 16.0, 11.0, 8.0, 10.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.03125, -42.470703125, -40.91015625, -39.349609375, -37.7890625, -36.228515625, -34.66796875, -33.107421875, -31.546875, -29.986328125, -28.42578125, -26.865234375, -25.3046875, -23.744140625, -22.18359375, -20.623046875, -19.0625, -17.501953125, -15.94140625, -14.380859375, -12.8203125, -11.259765625, -9.69921875, -8.138671875, -6.578125, -5.017578125, -3.45703125, -1.896484375, -0.3359375, 1.224609375, 2.78515625, 4.345703125, 5.90625, 7.466796875, 9.02734375, 10.587890625, 12.1484375, 13.708984375, 15.26953125, 16.830078125, 18.390625, 19.951171875, 21.51171875, 23.072265625, 24.6328125, 26.193359375, 27.75390625, 29.314453125, 30.875, 32.435546875, 33.99609375, 35.556640625, 37.1171875, 38.677734375, 40.23828125, 41.798828125, 43.359375, 44.919921875, 46.48046875, 48.041015625, 49.6015625, 51.162109375, 52.72265625, 54.283203125, 55.84375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 5.0, 9.0, 15.0, 20.0, 23.0, 36.0, 70.0, 87.0, 149.0, 235.0, 352.0, 532.0, 740.0, 1168.0, 1754.0, 2792.0, 4189.0, 6369.0, 10309.0, 16229.0, 26510.0, 44146.0, 77424.0, 140489.0, 235193.0, 204504.0, 114224.0, 63065.0, 37174.0, 22100.0, 13894.0, 8586.0, 5684.0, 3523.0, 2368.0, 1614.0, 966.0, 673.0, 476.0, 291.0, 207.0, 115.0, 94.0, 59.0, 34.0, 23.0, 23.0, 5.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-58.90625, -57.21484375, -55.5234375, -53.83203125, -52.140625, -50.44921875, -48.7578125, -47.06640625, -45.375, -43.68359375, -41.9921875, -40.30078125, -38.609375, -36.91796875, -35.2265625, -33.53515625, -31.84375, -30.15234375, -28.4609375, -26.76953125, -25.078125, -23.38671875, -21.6953125, -20.00390625, -18.3125, -16.62109375, -14.9296875, -13.23828125, -11.546875, -9.85546875, -8.1640625, -6.47265625, -4.78125, -3.08984375, -1.3984375, 0.29296875, 1.984375, 3.67578125, 5.3671875, 7.05859375, 8.75, 10.44140625, 12.1328125, 13.82421875, 15.515625, 17.20703125, 18.8984375, 20.58984375, 22.28125, 23.97265625, 25.6640625, 27.35546875, 29.046875, 30.73828125, 32.4296875, 34.12109375, 35.8125, 37.50390625, 39.1953125, 40.88671875, 42.578125, 44.26953125, 45.9609375, 47.65234375, 49.34375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 11.0, 12.0, 10.0, 13.0, 18.0, 19.0, 29.0, 25.0, 22.0, 27.0, 30.0, 40.0, 30.0, 39.0, 23.0, 36.0, 45.0, 39.0, 53.0, 41.0, 38.0, 43.0, 37.0, 35.0, 32.0, 28.0, 26.0, 16.0, 24.0, 19.0, 20.0, 16.0, 10.0, 13.0, 4.0, 11.0, 8.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-28.484375, -27.630126953125, -26.77587890625, -25.921630859375, -25.0673828125, -24.213134765625, -23.35888671875, -22.504638671875, -21.650390625, -20.796142578125, -19.94189453125, -19.087646484375, -18.2333984375, -17.379150390625, -16.52490234375, -15.670654296875, -14.81640625, -13.962158203125, -13.10791015625, -12.253662109375, -11.3994140625, -10.545166015625, -9.69091796875, -8.836669921875, -7.982421875, -7.128173828125, -6.27392578125, -5.419677734375, -4.5654296875, -3.711181640625, -2.85693359375, -2.002685546875, -1.1484375, -0.294189453125, 0.56005859375, 1.414306640625, 2.2685546875, 3.122802734375, 3.97705078125, 4.831298828125, 5.685546875, 6.539794921875, 7.39404296875, 8.248291015625, 9.1025390625, 9.956787109375, 10.81103515625, 11.665283203125, 12.51953125, 13.373779296875, 14.22802734375, 15.082275390625, 15.9365234375, 16.790771484375, 17.64501953125, 18.499267578125, 19.353515625, 20.207763671875, 21.06201171875, 21.916259765625, 22.7705078125, 23.624755859375, 24.47900390625, 25.333251953125, 26.1875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 1.0, 6.0, 12.0, 20.0, 23.0, 28.0, 48.0, 70.0, 100.0, 165.0, 248.0, 440.0, 731.0, 1199.0, 2183.0, 4312.0, 9951.0, 25476.0, 80189.0, 315661.0, 434965.0, 113867.0, 34590.0, 12793.0, 5330.0, 2576.0, 1432.0, 817.0, 493.0, 287.0, 185.0, 124.0, 59.0, 49.0, 51.0, 17.0, 18.0, 14.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.0625, -38.77587890625, -37.4892578125, -36.20263671875, -34.916015625, -33.62939453125, -32.3427734375, -31.05615234375, -29.76953125, -28.48291015625, -27.1962890625, -25.90966796875, -24.623046875, -23.33642578125, -22.0498046875, -20.76318359375, -19.4765625, -18.18994140625, -16.9033203125, -15.61669921875, -14.330078125, -13.04345703125, -11.7568359375, -10.47021484375, -9.18359375, -7.89697265625, -6.6103515625, -5.32373046875, -4.037109375, -2.75048828125, -1.4638671875, -0.17724609375, 1.109375, 2.39599609375, 3.6826171875, 4.96923828125, 6.255859375, 7.54248046875, 8.8291015625, 10.11572265625, 11.40234375, 12.68896484375, 13.9755859375, 15.26220703125, 16.548828125, 17.83544921875, 19.1220703125, 20.40869140625, 21.6953125, 22.98193359375, 24.2685546875, 25.55517578125, 26.841796875, 28.12841796875, 29.4150390625, 30.70166015625, 31.98828125, 33.27490234375, 34.5615234375, 35.84814453125, 37.134765625, 38.42138671875, 39.7080078125, 40.99462890625, 42.28125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 9.0, 7.0, 17.0, 18.0, 29.0, 37.0, 79.0, 141.0, 179.0, 169.0, 107.0, 76.0, 43.0, 27.0, 24.0, 16.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028438568115234375, -0.0027130544185638428, -0.002582252025604248, -0.0024514496326446533, -0.0023206472396850586, -0.002189844846725464, -0.002059042453765869, -0.0019282400608062744, -0.0017974376678466797, -0.001666635274887085, -0.0015358328819274902, -0.0014050304889678955, -0.0012742280960083008, -0.001143425703048706, -0.0010126233100891113, -0.0008818209171295166, -0.0007510185241699219, -0.0006202161312103271, -0.0004894137382507324, -0.0003586113452911377, -0.00022780895233154297, -9.700655937194824e-05, 3.3795833587646484e-05, 0.0001645982265472412, 0.00029540061950683594, 0.00042620301246643066, 0.0005570054054260254, 0.0006878077983856201, 0.0008186101913452148, 0.0009494125843048096, 0.0010802149772644043, 0.001211017370223999, 0.0013418197631835938, 0.0014726221561431885, 0.0016034245491027832, 0.001734226942062378, 0.0018650293350219727, 0.0019958317279815674, 0.002126634120941162, 0.002257436513900757, 0.0023882389068603516, 0.0025190412998199463, 0.002649843692779541, 0.0027806460857391357, 0.0029114484786987305, 0.003042250871658325, 0.00317305326461792, 0.0033038556575775146, 0.0034346580505371094, 0.003565460443496704, 0.003696262836456299, 0.0038270652294158936, 0.003957867622375488, 0.004088670015335083, 0.004219472408294678, 0.0043502748012542725, 0.004481077194213867, 0.004611879587173462, 0.004742681980133057, 0.004873484373092651, 0.005004286766052246, 0.005135089159011841, 0.0052658915519714355, 0.00539669394493103, 0.005527496337890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 16.0, 11.0, 25.0, 21.0, 26.0, 45.0, 77.0, 93.0, 142.0, 217.0, 308.0, 467.0, 776.0, 1194.0, 2061.0, 3830.0, 7562.0, 16503.0, 40236.0, 112003.0, 328009.0, 341590.0, 116624.0, 42287.0, 17161.0, 7786.0, 3994.0, 2010.0, 1251.0, 735.0, 502.0, 285.0, 188.0, 151.0, 95.0, 81.0, 41.0, 43.0, 25.0, 23.0, 13.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.328125, -27.384521484375, -26.44091796875, -25.497314453125, -24.5537109375, -23.610107421875, -22.66650390625, -21.722900390625, -20.779296875, -19.835693359375, -18.89208984375, -17.948486328125, -17.0048828125, -16.061279296875, -15.11767578125, -14.174072265625, -13.23046875, -12.286865234375, -11.34326171875, -10.399658203125, -9.4560546875, -8.512451171875, -7.56884765625, -6.625244140625, -5.681640625, -4.738037109375, -3.79443359375, -2.850830078125, -1.9072265625, -0.963623046875, -0.02001953125, 0.923583984375, 1.8671875, 2.810791015625, 3.75439453125, 4.697998046875, 5.6416015625, 6.585205078125, 7.52880859375, 8.472412109375, 9.416015625, 10.359619140625, 11.30322265625, 12.246826171875, 13.1904296875, 14.134033203125, 15.07763671875, 16.021240234375, 16.96484375, 17.908447265625, 18.85205078125, 19.795654296875, 20.7392578125, 21.682861328125, 22.62646484375, 23.570068359375, 24.513671875, 25.457275390625, 26.40087890625, 27.344482421875, 28.2880859375, 29.231689453125, 30.17529296875, 31.118896484375, 32.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 8.0, 13.0, 9.0, 11.0, 22.0, 23.0, 30.0, 50.0, 50.0, 69.0, 62.0, 74.0, 83.0, 85.0, 73.0, 62.0, 51.0, 40.0, 38.0, 33.0, 25.0, 15.0, 19.0, 12.0, 4.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.890625, -7.650634765625, -7.41064453125, -7.170654296875, -6.9306640625, -6.690673828125, -6.45068359375, -6.210693359375, -5.970703125, -5.730712890625, -5.49072265625, -5.250732421875, -5.0107421875, -4.770751953125, -4.53076171875, -4.290771484375, -4.05078125, -3.810791015625, -3.57080078125, -3.330810546875, -3.0908203125, -2.850830078125, -2.61083984375, -2.370849609375, -2.130859375, -1.890869140625, -1.65087890625, -1.410888671875, -1.1708984375, -0.930908203125, -0.69091796875, -0.450927734375, -0.2109375, 0.029052734375, 0.26904296875, 0.509033203125, 0.7490234375, 0.989013671875, 1.22900390625, 1.468994140625, 1.708984375, 1.948974609375, 2.18896484375, 2.428955078125, 2.6689453125, 2.908935546875, 3.14892578125, 3.388916015625, 3.62890625, 3.868896484375, 4.10888671875, 4.348876953125, 4.5888671875, 4.828857421875, 5.06884765625, 5.308837890625, 5.548828125, 5.788818359375, 6.02880859375, 6.268798828125, 6.5087890625, 6.748779296875, 6.98876953125, 7.228759765625, 7.46875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 3.0, 7.0, 14.0, 15.0, 23.0, 23.0, 21.0, 36.0, 52.0, 49.0, 77.0, 66.0, 86.0, 96.0, 74.0, 77.0, 45.0, 48.0, 37.0, 38.0, 27.0, 21.0, 8.0, 11.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.10462951660156, -46.39650344848633, -44.688377380371094, -42.98025131225586, -41.272125244140625, -39.56399917602539, -37.855873107910156, -36.14774703979492, -34.43962097167969, -32.73149490356445, -31.02336883544922, -29.315242767333984, -27.60711669921875, -25.898990631103516, -24.19086456298828, -22.482738494873047, -20.774612426757812, -19.066486358642578, -17.358360290527344, -15.65023422241211, -13.942108154296875, -12.23398208618164, -10.525856018066406, -8.817729949951172, -7.1096038818359375, -5.401477813720703, -3.6933517456054688, -1.9852256774902344, -0.277099609375, 1.4310264587402344, 3.1391525268554688, 4.847278594970703, 6.555408477783203, 8.263534545898438, 9.971660614013672, 11.679786682128906, 13.38791275024414, 15.096038818359375, 16.80416488647461, 18.512290954589844, 20.220417022705078, 21.928543090820312, 23.636669158935547, 25.34479522705078, 27.052921295166016, 28.76104736328125, 30.469173431396484, 32.17729949951172, 33.88542556762695, 35.59355163574219, 37.30167770385742, 39.009803771972656, 40.71792984008789, 42.426055908203125, 44.13418197631836, 45.842308044433594, 47.55043411254883, 49.25856018066406, 50.9666862487793, 52.67481231689453, 54.382938385009766, 56.091064453125, 57.799190521240234, 59.50731658935547, 61.2154426574707]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 11.0, 12.0, 10.0, 22.0, 21.0, 23.0, 39.0, 38.0, 41.0, 42.0, 42.0, 56.0, 44.0, 47.0, 48.0, 36.0, 52.0, 41.0, 43.0, 40.0, 40.0, 39.0, 24.0, 34.0, 19.0, 20.0, 24.0, 14.0, 11.0, 13.0, 11.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.30747604370117, -44.63785934448242, -42.968238830566406, -41.298622131347656, -39.629005432128906, -37.959388732910156, -36.289772033691406, -34.62015151977539, -32.95053482055664, -31.28091812133789, -29.611299514770508, -27.941680908203125, -26.272064208984375, -24.602447509765625, -22.932828903198242, -21.26321029663086, -19.59359359741211, -17.92397689819336, -16.254358291625977, -14.58474063873291, -12.915122985839844, -11.245505332946777, -9.575887680053711, -7.9062700271606445, -6.236652374267578, -4.567034721374512, -2.8974170684814453, -1.227799415588379, 0.4418182373046875, 2.111435890197754, 3.7810535430908203, 5.450671195983887, 7.120288848876953, 8.78990650177002, 10.459524154663086, 12.129141807556152, 13.798759460449219, 15.468377113342285, 17.13799476623535, 18.807613372802734, 20.477230072021484, 22.146846771240234, 23.816465377807617, 25.486083984375, 27.15570068359375, 28.8253173828125, 30.494935989379883, 32.164554595947266, 33.834171295166016, 35.503787994384766, 37.17340850830078, 38.84302520751953, 40.51264190673828, 42.18225860595703, 43.85187530517578, 45.5214958190918, 47.19111251831055, 48.8607292175293, 50.53034973144531, 52.19996643066406, 53.86958312988281, 55.53919982910156, 57.20881652832031, 58.87843704223633, 60.54805374145508]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 9.0, 16.0, 18.0, 22.0, 42.0, 49.0, 78.0, 105.0, 190.0, 232.0, 303.0, 488.0, 733.0, 1007.0, 1568.0, 2430.0, 3651.0, 6001.0, 10176.0, 19867.0, 46041.0, 143957.0, 517808.0, 1595474.0, 1303254.0, 365226.0, 97405.0, 35240.0, 16718.0, 9416.0, 5473.0, 3545.0, 2304.0, 1531.0, 1090.0, 828.0, 526.0, 422.0, 278.0, 220.0, 142.0, 117.0, 91.0, 48.0, 37.0, 33.0, 27.0, 14.0, 19.0, 9.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.71875, -47.86865234375, -46.0185546875, -44.16845703125, -42.318359375, -40.46826171875, -38.6181640625, -36.76806640625, -34.91796875, -33.06787109375, -31.2177734375, -29.36767578125, -27.517578125, -25.66748046875, -23.8173828125, -21.96728515625, -20.1171875, -18.26708984375, -16.4169921875, -14.56689453125, -12.716796875, -10.86669921875, -9.0166015625, -7.16650390625, -5.31640625, -3.46630859375, -1.6162109375, 0.23388671875, 2.083984375, 3.93408203125, 5.7841796875, 7.63427734375, 9.484375, 11.33447265625, 13.1845703125, 15.03466796875, 16.884765625, 18.73486328125, 20.5849609375, 22.43505859375, 24.28515625, 26.13525390625, 27.9853515625, 29.83544921875, 31.685546875, 33.53564453125, 35.3857421875, 37.23583984375, 39.0859375, 40.93603515625, 42.7861328125, 44.63623046875, 46.486328125, 48.33642578125, 50.1865234375, 52.03662109375, 53.88671875, 55.73681640625, 57.5869140625, 59.43701171875, 61.287109375, 63.13720703125, 64.9873046875, 66.83740234375, 68.6875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 10.0, 8.0, 10.0, 8.0, 7.0, 19.0, 17.0, 25.0, 24.0, 32.0, 31.0, 49.0, 45.0, 47.0, 57.0, 53.0, 60.0, 40.0, 51.0, 48.0, 53.0, 46.0, 36.0, 41.0, 28.0, 31.0, 29.0, 23.0, 21.0, 11.0, 9.0, 10.0, 11.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.40625, -39.896484375, -38.38671875, -36.876953125, -35.3671875, -33.857421875, -32.34765625, -30.837890625, -29.328125, -27.818359375, -26.30859375, -24.798828125, -23.2890625, -21.779296875, -20.26953125, -18.759765625, -17.25, -15.740234375, -14.23046875, -12.720703125, -11.2109375, -9.701171875, -8.19140625, -6.681640625, -5.171875, -3.662109375, -2.15234375, -0.642578125, 0.8671875, 2.376953125, 3.88671875, 5.396484375, 6.90625, 8.416015625, 9.92578125, 11.435546875, 12.9453125, 14.455078125, 15.96484375, 17.474609375, 18.984375, 20.494140625, 22.00390625, 23.513671875, 25.0234375, 26.533203125, 28.04296875, 29.552734375, 31.0625, 32.572265625, 34.08203125, 35.591796875, 37.1015625, 38.611328125, 40.12109375, 41.630859375, 43.140625, 44.650390625, 46.16015625, 47.669921875, 49.1796875, 50.689453125, 52.19921875, 53.708984375, 55.21875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 13.0, 13.0, 21.0, 26.0, 52.0, 90.0, 121.0, 193.0, 240.0, 385.0, 586.0, 928.0, 1359.0, 2169.0, 3688.0, 6189.0, 11245.0, 22359.0, 50400.0, 137311.0, 507643.0, 2188399.0, 912934.0, 213288.0, 71314.0, 29546.0, 14459.0, 7693.0, 4341.0, 2609.0, 1607.0, 1031.0, 648.0, 438.0, 298.0, 205.0, 143.0, 109.0, 62.0, 34.0, 30.0, 16.0, 11.0, 13.0, 2.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.0, -72.5556640625, -70.111328125, -67.6669921875, -65.22265625, -62.7783203125, -60.333984375, -57.8896484375, -55.4453125, -53.0009765625, -50.556640625, -48.1123046875, -45.66796875, -43.2236328125, -40.779296875, -38.3349609375, -35.890625, -33.4462890625, -31.001953125, -28.5576171875, -26.11328125, -23.6689453125, -21.224609375, -18.7802734375, -16.3359375, -13.8916015625, -11.447265625, -9.0029296875, -6.55859375, -4.1142578125, -1.669921875, 0.7744140625, 3.21875, 5.6630859375, 8.107421875, 10.5517578125, 12.99609375, 15.4404296875, 17.884765625, 20.3291015625, 22.7734375, 25.2177734375, 27.662109375, 30.1064453125, 32.55078125, 34.9951171875, 37.439453125, 39.8837890625, 42.328125, 44.7724609375, 47.216796875, 49.6611328125, 52.10546875, 54.5498046875, 56.994140625, 59.4384765625, 61.8828125, 64.3271484375, 66.771484375, 69.2158203125, 71.66015625, 74.1044921875, 76.548828125, 78.9931640625, 81.4375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 2.0, 9.0, 5.0, 10.0, 16.0, 18.0, 20.0, 27.0, 35.0, 60.0, 87.0, 108.0, 150.0, 202.0, 274.0, 373.0, 516.0, 603.0, 421.0, 286.0, 246.0, 164.0, 116.0, 74.0, 64.0, 34.0, 34.0, 25.0, 23.0, 9.0, 8.0, 7.0, 10.0, 15.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.20849609375, -21.4951171875, -20.78173828125, -20.068359375, -19.35498046875, -18.6416015625, -17.92822265625, -17.21484375, -16.50146484375, -15.7880859375, -15.07470703125, -14.361328125, -13.64794921875, -12.9345703125, -12.22119140625, -11.5078125, -10.79443359375, -10.0810546875, -9.36767578125, -8.654296875, -7.94091796875, -7.2275390625, -6.51416015625, -5.80078125, -5.08740234375, -4.3740234375, -3.66064453125, -2.947265625, -2.23388671875, -1.5205078125, -0.80712890625, -0.09375, 0.61962890625, 1.3330078125, 2.04638671875, 2.759765625, 3.47314453125, 4.1865234375, 4.89990234375, 5.61328125, 6.32666015625, 7.0400390625, 7.75341796875, 8.466796875, 9.18017578125, 9.8935546875, 10.60693359375, 11.3203125, 12.03369140625, 12.7470703125, 13.46044921875, 14.173828125, 14.88720703125, 15.6005859375, 16.31396484375, 17.02734375, 17.74072265625, 18.4541015625, 19.16748046875, 19.880859375, 20.59423828125, 21.3076171875, 22.02099609375, 22.734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 8.0, 11.0, 6.0, 9.0, 16.0, 16.0, 16.0, 15.0, 23.0, 40.0, 54.0, 59.0, 55.0, 74.0, 89.0, 69.0, 72.0, 62.0, 49.0, 50.0, 40.0, 39.0, 23.0, 17.0, 22.0, 15.0, 14.0, 3.0, 7.0, 4.0, 2.0, 1.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-44.840267181396484, -43.35997772216797, -41.87968826293945, -40.39939880371094, -38.91911315917969, -37.43882369995117, -35.958534240722656, -34.47824478149414, -32.997955322265625, -31.51766586303711, -30.037378311157227, -28.55708885192871, -27.076801300048828, -25.596511840820312, -24.116222381591797, -22.63593292236328, -21.15564727783203, -19.675357818603516, -18.195070266723633, -16.714780807495117, -15.234492301940918, -13.754203796386719, -12.273914337158203, -10.793625831604004, -9.313337326049805, -7.8330488204956055, -6.352759838104248, -4.872470855712891, -3.3921823501586914, -1.9118938446044922, -0.43160438537597656, 1.0486841201782227, 2.5289764404296875, 4.009264945983887, 5.489553928375244, 6.969842910766602, 8.4501314163208, 9.930419921875, 11.410709381103516, 12.890997886657715, 14.371286392211914, 15.851574897766113, 17.331863403320312, 18.812152862548828, 20.292442321777344, 21.772729873657227, 23.253019332885742, 24.733306884765625, 26.21359634399414, 27.693885803222656, 29.17417335510254, 30.654462814331055, 32.13475036621094, 33.61503982543945, 35.09532928466797, 36.575618743896484, 38.055908203125, 39.536197662353516, 41.01648712158203, 42.49677276611328, 43.9770622253418, 45.45735168457031, 46.93764114379883, 48.417930603027344, 49.898216247558594]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 10.0, 12.0, 10.0, 15.0, 15.0, 18.0, 12.0, 26.0, 27.0, 26.0, 39.0, 34.0, 36.0, 49.0, 41.0, 41.0, 44.0, 37.0, 47.0, 45.0, 41.0, 41.0, 38.0, 32.0, 43.0, 24.0, 33.0, 25.0, 28.0, 14.0, 20.0, 12.0, 11.0, 17.0, 8.0, 5.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.163185119628906, -39.7889404296875, -38.41469192504883, -37.04044723510742, -35.66619873046875, -34.291954040527344, -32.91770935058594, -31.543460845947266, -30.16921615600586, -28.79496955871582, -27.42072296142578, -26.046478271484375, -24.672231674194336, -23.297985076904297, -21.923738479614258, -20.54949188232422, -19.17524528503418, -17.80099868774414, -16.4267520904541, -15.052506446838379, -13.678260803222656, -12.304014205932617, -10.929767608642578, -9.555521965026855, -8.181275367736816, -6.8070292472839355, -5.432783126831055, -4.058536529541016, -2.6842904090881348, -1.310044288635254, 0.06420230865478516, 1.4384479522705078, 2.812694549560547, 4.186940670013428, 5.561186790466309, 6.935433387756348, 8.30967903137207, 9.68392562866211, 11.058172225952148, 12.432417869567871, 13.80666446685791, 15.18091106414795, 16.555156707763672, 17.92940330505371, 19.30364990234375, 20.677894592285156, 22.052143096923828, 23.426387786865234, 24.800634384155273, 26.174880981445312, 27.54912757873535, 28.92337417602539, 30.297618865966797, 31.671865463256836, 33.046112060546875, 34.42035675048828, 35.79460525512695, 37.16884994506836, 38.54309844970703, 39.91734313964844, 41.29159164428711, 42.665836334228516, 44.04008483886719, 45.414329528808594, 46.78857421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 13.0, 11.0, 21.0, 22.0, 42.0, 56.0, 60.0, 126.0, 150.0, 209.0, 306.0, 470.0, 677.0, 931.0, 1393.0, 2202.0, 3149.0, 4741.0, 6992.0, 11121.0, 17308.0, 27710.0, 47300.0, 82841.0, 151644.0, 249589.0, 188215.0, 102670.0, 56757.0, 33219.0, 20518.0, 13123.0, 8265.0, 5372.0, 3574.0, 2459.0, 1690.0, 1132.0, 787.0, 523.0, 324.0, 267.0, 172.0, 139.0, 81.0, 59.0, 48.0, 30.0, 22.0, 15.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.46875, -17.903564453125, -17.33837890625, -16.773193359375, -16.2080078125, -15.642822265625, -15.07763671875, -14.512451171875, -13.947265625, -13.382080078125, -12.81689453125, -12.251708984375, -11.6865234375, -11.121337890625, -10.55615234375, -9.990966796875, -9.42578125, -8.860595703125, -8.29541015625, -7.730224609375, -7.1650390625, -6.599853515625, -6.03466796875, -5.469482421875, -4.904296875, -4.339111328125, -3.77392578125, -3.208740234375, -2.6435546875, -2.078369140625, -1.51318359375, -0.947998046875, -0.3828125, 0.182373046875, 0.74755859375, 1.312744140625, 1.8779296875, 2.443115234375, 3.00830078125, 3.573486328125, 4.138671875, 4.703857421875, 5.26904296875, 5.834228515625, 6.3994140625, 6.964599609375, 7.52978515625, 8.094970703125, 8.66015625, 9.225341796875, 9.79052734375, 10.355712890625, 10.9208984375, 11.486083984375, 12.05126953125, 12.616455078125, 13.181640625, 13.746826171875, 14.31201171875, 14.877197265625, 15.4423828125, 16.007568359375, 16.57275390625, 17.137939453125, 17.703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 11.0, 14.0, 13.0, 10.0, 10.0, 25.0, 23.0, 24.0, 31.0, 35.0, 29.0, 38.0, 50.0, 43.0, 45.0, 39.0, 36.0, 37.0, 41.0, 47.0, 58.0, 33.0, 36.0, 37.0, 32.0, 25.0, 28.0, 21.0, 15.0, 14.0, 17.0, 10.0, 6.0, 13.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.84375, -39.48291015625, -38.1220703125, -36.76123046875, -35.400390625, -34.03955078125, -32.6787109375, -31.31787109375, -29.95703125, -28.59619140625, -27.2353515625, -25.87451171875, -24.513671875, -23.15283203125, -21.7919921875, -20.43115234375, -19.0703125, -17.70947265625, -16.3486328125, -14.98779296875, -13.626953125, -12.26611328125, -10.9052734375, -9.54443359375, -8.18359375, -6.82275390625, -5.4619140625, -4.10107421875, -2.740234375, -1.37939453125, -0.0185546875, 1.34228515625, 2.703125, 4.06396484375, 5.4248046875, 6.78564453125, 8.146484375, 9.50732421875, 10.8681640625, 12.22900390625, 13.58984375, 14.95068359375, 16.3115234375, 17.67236328125, 19.033203125, 20.39404296875, 21.7548828125, 23.11572265625, 24.4765625, 25.83740234375, 27.1982421875, 28.55908203125, 29.919921875, 31.28076171875, 32.6416015625, 34.00244140625, 35.36328125, 36.72412109375, 38.0849609375, 39.44580078125, 40.806640625, 42.16748046875, 43.5283203125, 44.88916015625, 46.25]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 14.0, 13.0, 21.0, 33.0, 46.0, 59.0, 85.0, 148.0, 214.0, 341.0, 571.0, 899.0, 1348.0, 2400.0, 3880.0, 6731.0, 12190.0, 26185.0, 158199.0, 742604.0, 52341.0, 17785.0, 9336.0, 5135.0, 2995.0, 1806.0, 1166.0, 733.0, 442.0, 303.0, 167.0, 132.0, 59.0, 50.0, 46.0, 26.0, 13.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.22265625, -34.1640625, -33.10546875, -32.046875, -30.98828125, -29.9296875, -28.87109375, -27.8125, -26.75390625, -25.6953125, -24.63671875, -23.578125, -22.51953125, -21.4609375, -20.40234375, -19.34375, -18.28515625, -17.2265625, -16.16796875, -15.109375, -14.05078125, -12.9921875, -11.93359375, -10.875, -9.81640625, -8.7578125, -7.69921875, -6.640625, -5.58203125, -4.5234375, -3.46484375, -2.40625, -1.34765625, -0.2890625, 0.76953125, 1.828125, 2.88671875, 3.9453125, 5.00390625, 6.0625, 7.12109375, 8.1796875, 9.23828125, 10.296875, 11.35546875, 12.4140625, 13.47265625, 14.53125, 15.58984375, 16.6484375, 17.70703125, 18.765625, 19.82421875, 20.8828125, 21.94140625, 23.0, 24.05859375, 25.1171875, 26.17578125, 27.234375, 28.29296875, 29.3515625, 30.41015625, 31.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 10.0, 17.0, 10.0, 15.0, 21.0, 15.0, 22.0, 20.0, 34.0, 37.0, 26.0, 40.0, 47.0, 37.0, 36.0, 45.0, 50.0, 46.0, 38.0, 43.0, 46.0, 35.0, 28.0, 40.0, 27.0, 34.0, 31.0, 14.0, 19.0, 18.0, 19.0, 17.0, 15.0, 13.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.84375, -28.8251953125, -27.806640625, -26.7880859375, -25.76953125, -24.7509765625, -23.732421875, -22.7138671875, -21.6953125, -20.6767578125, -19.658203125, -18.6396484375, -17.62109375, -16.6025390625, -15.583984375, -14.5654296875, -13.546875, -12.5283203125, -11.509765625, -10.4912109375, -9.47265625, -8.4541015625, -7.435546875, -6.4169921875, -5.3984375, -4.3798828125, -3.361328125, -2.3427734375, -1.32421875, -0.3056640625, 0.712890625, 1.7314453125, 2.75, 3.7685546875, 4.787109375, 5.8056640625, 6.82421875, 7.8427734375, 8.861328125, 9.8798828125, 10.8984375, 11.9169921875, 12.935546875, 13.9541015625, 14.97265625, 15.9912109375, 17.009765625, 18.0283203125, 19.046875, 20.0654296875, 21.083984375, 22.1025390625, 23.12109375, 24.1396484375, 25.158203125, 26.1767578125, 27.1953125, 28.2138671875, 29.232421875, 30.2509765625, 31.26953125, 32.2880859375, 33.306640625, 34.3251953125, 35.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 18.0, 20.0, 37.0, 52.0, 60.0, 86.0, 125.0, 174.0, 282.0, 431.0, 728.0, 1230.0, 2253.0, 4399.0, 9206.0, 22871.0, 128126.0, 804883.0, 44743.0, 14834.0, 6411.0, 3205.0, 1740.0, 971.0, 562.0, 377.0, 198.0, 151.0, 106.0, 65.0, 63.0, 35.0, 30.0, 15.0, 15.0, 9.0, 10.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.232574462890625, -3.12921142578125, -3.025848388671875, -2.9224853515625, -2.819122314453125, -2.71575927734375, -2.612396240234375, -2.509033203125, -2.405670166015625, -2.30230712890625, -2.198944091796875, -2.0955810546875, -1.992218017578125, -1.88885498046875, -1.785491943359375, -1.68212890625, -1.578765869140625, -1.47540283203125, -1.372039794921875, -1.2686767578125, -1.165313720703125, -1.06195068359375, -0.958587646484375, -0.855224609375, -0.751861572265625, -0.64849853515625, -0.545135498046875, -0.4417724609375, -0.338409423828125, -0.23504638671875, -0.131683349609375, -0.0283203125, 0.075042724609375, 0.17840576171875, 0.281768798828125, 0.3851318359375, 0.488494873046875, 0.59185791015625, 0.695220947265625, 0.798583984375, 0.901947021484375, 1.00531005859375, 1.108673095703125, 1.2120361328125, 1.315399169921875, 1.41876220703125, 1.522125244140625, 1.62548828125, 1.728851318359375, 1.83221435546875, 1.935577392578125, 2.0389404296875, 2.142303466796875, 2.24566650390625, 2.349029541015625, 2.452392578125, 2.555755615234375, 2.65911865234375, 2.762481689453125, 2.8658447265625, 2.969207763671875, 3.07257080078125, 3.175933837890625, 3.279296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 16.0, 23.0, 52.0, 70.0, 108.0, 145.0, 176.0, 124.0, 106.0, 75.0, 40.0, 18.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006508827209472656, -0.0006280690431594849, -0.0006052553653717041, -0.0005824416875839233, -0.0005596280097961426, -0.0005368143320083618, -0.0005140006542205811, -0.0004911869764328003, -0.00046837329864501953, -0.00044555962085723877, -0.000422745943069458, -0.00039993226528167725, -0.0003771185874938965, -0.0003543049097061157, -0.00033149123191833496, -0.0003086775541305542, -0.00028586387634277344, -0.0002630501985549927, -0.00024023652076721191, -0.00021742284297943115, -0.0001946091651916504, -0.00017179548740386963, -0.00014898180961608887, -0.0001261681318283081, -0.00010335445404052734, -8.054077625274658e-05, -5.772709846496582e-05, -3.491342067718506e-05, -1.2099742889404297e-05, 1.0713934898376465e-05, 3.3527612686157227e-05, 5.634129047393799e-05, 7.915496826171875e-05, 0.00010196864604949951, 0.00012478232383728027, 0.00014759600162506104, 0.0001704096794128418, 0.00019322335720062256, 0.00021603703498840332, 0.00023885071277618408, 0.00026166439056396484, 0.0002844780683517456, 0.00030729174613952637, 0.00033010542392730713, 0.0003529191017150879, 0.00037573277950286865, 0.0003985464572906494, 0.0004213601350784302, 0.00044417381286621094, 0.0004669874906539917, 0.0004898011684417725, 0.0005126148462295532, 0.000535428524017334, 0.0005582422018051147, 0.0005810558795928955, 0.0006038695573806763, 0.000626683235168457, 0.0006494969129562378, 0.0006723105907440186, 0.0006951242685317993, 0.0007179379463195801, 0.0007407516241073608, 0.0007635653018951416, 0.0007863789796829224, 0.0008091926574707031]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 9.0, 9.0, 9.0, 12.0, 15.0, 25.0, 40.0, 52.0, 77.0, 138.0, 151.0, 240.0, 351.0, 468.0, 696.0, 982.0, 1435.0, 2188.0, 3121.0, 4755.0, 7134.0, 10908.0, 16831.0, 27006.0, 44433.0, 75589.0, 133211.0, 211581.0, 202320.0, 121976.0, 70137.0, 40940.0, 24780.0, 15852.0, 10240.0, 6722.0, 4461.0, 3083.0, 2052.0, 1392.0, 1013.0, 659.0, 424.0, 318.0, 245.0, 121.0, 101.0, 82.0, 60.0, 37.0, 30.0, 22.0, 10.0, 9.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.13671875, -2.067626953125, -1.99853515625, -1.929443359375, -1.8603515625, -1.791259765625, -1.72216796875, -1.653076171875, -1.583984375, -1.514892578125, -1.44580078125, -1.376708984375, -1.3076171875, -1.238525390625, -1.16943359375, -1.100341796875, -1.03125, -0.962158203125, -0.89306640625, -0.823974609375, -0.7548828125, -0.685791015625, -0.61669921875, -0.547607421875, -0.478515625, -0.409423828125, -0.34033203125, -0.271240234375, -0.2021484375, -0.133056640625, -0.06396484375, 0.005126953125, 0.07421875, 0.143310546875, 0.21240234375, 0.281494140625, 0.3505859375, 0.419677734375, 0.48876953125, 0.557861328125, 0.626953125, 0.696044921875, 0.76513671875, 0.834228515625, 0.9033203125, 0.972412109375, 1.04150390625, 1.110595703125, 1.1796875, 1.248779296875, 1.31787109375, 1.386962890625, 1.4560546875, 1.525146484375, 1.59423828125, 1.663330078125, 1.732421875, 1.801513671875, 1.87060546875, 1.939697265625, 2.0087890625, 2.077880859375, 2.14697265625, 2.216064453125, 2.28515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 8.0, 5.0, 10.0, 10.0, 11.0, 12.0, 12.0, 21.0, 18.0, 23.0, 28.0, 25.0, 38.0, 37.0, 44.0, 42.0, 70.0, 72.0, 72.0, 68.0, 57.0, 44.0, 41.0, 32.0, 25.0, 23.0, 24.0, 31.0, 10.0, 13.0, 12.0, 11.0, 14.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74658203125, -0.72076416015625, -0.6949462890625, -0.66912841796875, -0.643310546875, -0.61749267578125, -0.5916748046875, -0.56585693359375, -0.5400390625, -0.51422119140625, -0.4884033203125, -0.46258544921875, -0.436767578125, -0.41094970703125, -0.3851318359375, -0.35931396484375, -0.33349609375, -0.30767822265625, -0.2818603515625, -0.25604248046875, -0.230224609375, -0.20440673828125, -0.1785888671875, -0.15277099609375, -0.126953125, -0.10113525390625, -0.0753173828125, -0.04949951171875, -0.023681640625, 0.00213623046875, 0.0279541015625, 0.05377197265625, 0.07958984375, 0.10540771484375, 0.1312255859375, 0.15704345703125, 0.182861328125, 0.20867919921875, 0.2344970703125, 0.26031494140625, 0.2861328125, 0.31195068359375, 0.3377685546875, 0.36358642578125, 0.389404296875, 0.41522216796875, 0.4410400390625, 0.46685791015625, 0.49267578125, 0.51849365234375, 0.5443115234375, 0.57012939453125, 0.595947265625, 0.62176513671875, 0.6475830078125, 0.67340087890625, 0.69921875, 0.72503662109375, 0.7508544921875, 0.77667236328125, 0.802490234375, 0.82830810546875, 0.8541259765625, 0.87994384765625, 0.90576171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 0.0, 3.0, 7.0, 5.0, 8.0, 9.0, 15.0, 10.0, 11.0, 22.0, 23.0, 37.0, 52.0, 62.0, 61.0, 85.0, 95.0, 92.0, 65.0, 70.0, 54.0, 45.0, 40.0, 39.0, 14.0, 23.0, 15.0, 11.0, 5.0, 3.0, 5.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.892513275146484, -47.27054977416992, -45.648590087890625, -44.02662658691406, -42.4046630859375, -40.7827033996582, -39.16073989868164, -37.538780212402344, -35.91681671142578, -34.29485321044922, -32.67289352416992, -31.05093002319336, -29.42896842956543, -27.8070068359375, -26.185043334960938, -24.563081741333008, -22.941118240356445, -21.319156646728516, -19.697193145751953, -18.075231552124023, -16.453269958496094, -14.831307411193848, -13.209344863891602, -11.587383270263672, -9.965420722961426, -8.34345817565918, -6.72149658203125, -5.099534034729004, -3.477571964263916, -1.8556098937988281, -0.23364734649658203, 1.3883142471313477, 3.0102767944335938, 4.632238864898682, 6.2542009353637695, 7.876163482666016, 9.498125076293945, 11.120087623596191, 12.742050170898438, 14.364011764526367, 15.985974311828613, 17.60793685913086, 19.22989845275879, 20.85186004638672, 22.47382354736328, 24.09578514099121, 25.71774673461914, 27.339710235595703, 28.961671829223633, 30.583633422851562, 32.205596923828125, 33.82756042480469, 35.449520111083984, 37.07148361206055, 38.693443298339844, 40.315406799316406, 41.93737030029297, 43.55933380126953, 45.18129348754883, 46.80325698852539, 48.42522048950195, 50.04718017578125, 51.66914367675781, 53.291107177734375, 54.91306686401367]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 10.0, 8.0, 12.0, 11.0, 19.0, 16.0, 16.0, 23.0, 25.0, 29.0, 32.0, 34.0, 37.0, 44.0, 52.0, 45.0, 42.0, 32.0, 44.0, 47.0, 47.0, 42.0, 38.0, 37.0, 38.0, 31.0, 29.0, 27.0, 27.0, 13.0, 18.0, 13.0, 11.0, 18.0, 9.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.21173858642578, -39.8424186706543, -38.47309494018555, -37.10377502441406, -35.73445510864258, -34.365135192871094, -32.995811462402344, -31.62649154663086, -30.257169723510742, -28.887847900390625, -27.51852798461914, -26.149206161499023, -24.779884338378906, -23.410564422607422, -22.041242599487305, -20.671920776367188, -19.302600860595703, -17.933279037475586, -16.5639591217041, -15.194637298583984, -13.825316429138184, -12.455995559692383, -11.086673736572266, -9.717352867126465, -8.348031997680664, -6.978711128234863, -5.609389781951904, -4.240068435668945, -2.8707475662231445, -1.5014266967773438, -0.13210487365722656, 1.2372159957885742, 2.6065330505371094, 3.9758541584014893, 5.345175266265869, 6.714496612548828, 8.083817481994629, 9.45313835144043, 10.822460174560547, 12.191781044006348, 13.561101913452148, 14.93042278289795, 16.29974365234375, 17.669065475463867, 19.038387298583984, 20.40770721435547, 21.777029037475586, 23.146350860595703, 24.515670776367188, 25.884992599487305, 27.25431251525879, 28.623634338378906, 29.99295425415039, 31.362276077270508, 32.731597900390625, 34.10091781616211, 35.470237731933594, 36.83955764770508, 38.20888137817383, 39.57820129394531, 40.9475212097168, 42.31684112548828, 43.68616485595703, 45.055484771728516, 46.424808502197266]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 11.0, 18.0, 34.0, 47.0, 70.0, 87.0, 172.0, 252.0, 365.0, 554.0, 787.0, 1213.0, 1881.0, 2633.0, 4179.0, 6529.0, 10543.0, 16626.0, 26977.0, 44716.0, 77811.0, 143249.0, 238386.0, 202275.0, 111432.0, 61406.0, 36234.0, 22017.0, 13596.0, 8568.0, 5426.0, 3545.0, 2252.0, 1589.0, 1012.0, 726.0, 430.0, 315.0, 208.0, 124.0, 94.0, 50.0, 32.0, 32.0, 15.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.38525390625, -42.8955078125, -41.40576171875, -39.916015625, -38.42626953125, -36.9365234375, -35.44677734375, -33.95703125, -32.46728515625, -30.9775390625, -29.48779296875, -27.998046875, -26.50830078125, -25.0185546875, -23.52880859375, -22.0390625, -20.54931640625, -19.0595703125, -17.56982421875, -16.080078125, -14.59033203125, -13.1005859375, -11.61083984375, -10.12109375, -8.63134765625, -7.1416015625, -5.65185546875, -4.162109375, -2.67236328125, -1.1826171875, 0.30712890625, 1.796875, 3.28662109375, 4.7763671875, 6.26611328125, 7.755859375, 9.24560546875, 10.7353515625, 12.22509765625, 13.71484375, 15.20458984375, 16.6943359375, 18.18408203125, 19.673828125, 21.16357421875, 22.6533203125, 24.14306640625, 25.6328125, 27.12255859375, 28.6123046875, 30.10205078125, 31.591796875, 33.08154296875, 34.5712890625, 36.06103515625, 37.55078125, 39.04052734375, 40.5302734375, 42.02001953125, 43.509765625, 44.99951171875, 46.4892578125, 47.97900390625, 49.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 13.0, 8.0, 12.0, 17.0, 17.0, 12.0, 21.0, 21.0, 28.0, 22.0, 32.0, 39.0, 48.0, 47.0, 50.0, 39.0, 41.0, 40.0, 40.0, 43.0, 60.0, 29.0, 36.0, 26.0, 42.0, 30.0, 26.0, 20.0, 24.0, 20.0, 20.0, 13.0, 9.0, 6.0, 9.0, 8.0, 3.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.203125, -36.90625, -35.609375, -34.3125, -33.015625, -31.71875, -30.421875, -29.125, -27.828125, -26.53125, -25.234375, -23.9375, -22.640625, -21.34375, -20.046875, -18.75, -17.453125, -16.15625, -14.859375, -13.5625, -12.265625, -10.96875, -9.671875, -8.375, -7.078125, -5.78125, -4.484375, -3.1875, -1.890625, -0.59375, 0.703125, 2.0, 3.296875, 4.59375, 5.890625, 7.1875, 8.484375, 9.78125, 11.078125, 12.375, 13.671875, 14.96875, 16.265625, 17.5625, 18.859375, 20.15625, 21.453125, 22.75, 24.046875, 25.34375, 26.640625, 27.9375, 29.234375, 30.53125, 31.828125, 33.125, 34.421875, 35.71875, 37.015625, 38.3125, 39.609375, 40.90625, 42.203125, 43.5]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 22.0, 33.0, 51.0, 89.0, 106.0, 152.0, 213.0, 355.0, 446.0, 745.0, 1098.0, 1681.0, 2496.0, 3876.0, 6036.0, 9300.0, 14857.0, 23634.0, 39460.0, 66401.0, 113235.0, 188531.0, 216807.0, 144651.0, 84477.0, 49242.0, 29672.0, 18212.0, 11595.0, 7309.0, 4582.0, 3015.0, 2002.0, 1304.0, 933.0, 577.0, 415.0, 284.0, 181.0, 148.0, 96.0, 68.0, 38.0, 36.0, 22.0, 12.0, 9.0, 5.0, 3.0, 0.0, 1.0, 3.0], "bins": [-53.375, -51.8154296875, -50.255859375, -48.6962890625, -47.13671875, -45.5771484375, -44.017578125, -42.4580078125, -40.8984375, -39.3388671875, -37.779296875, -36.2197265625, -34.66015625, -33.1005859375, -31.541015625, -29.9814453125, -28.421875, -26.8623046875, -25.302734375, -23.7431640625, -22.18359375, -20.6240234375, -19.064453125, -17.5048828125, -15.9453125, -14.3857421875, -12.826171875, -11.2666015625, -9.70703125, -8.1474609375, -6.587890625, -5.0283203125, -3.46875, -1.9091796875, -0.349609375, 1.2099609375, 2.76953125, 4.3291015625, 5.888671875, 7.4482421875, 9.0078125, 10.5673828125, 12.126953125, 13.6865234375, 15.24609375, 16.8056640625, 18.365234375, 19.9248046875, 21.484375, 23.0439453125, 24.603515625, 26.1630859375, 27.72265625, 29.2822265625, 30.841796875, 32.4013671875, 33.9609375, 35.5205078125, 37.080078125, 38.6396484375, 40.19921875, 41.7587890625, 43.318359375, 44.8779296875, 46.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 9.0, 5.0, 10.0, 11.0, 10.0, 10.0, 7.0, 13.0, 13.0, 8.0, 22.0, 16.0, 32.0, 40.0, 30.0, 27.0, 32.0, 46.0, 41.0, 48.0, 47.0, 34.0, 31.0, 40.0, 38.0, 27.0, 43.0, 39.0, 28.0, 28.0, 30.0, 16.0, 21.0, 23.0, 18.0, 16.0, 13.0, 19.0, 16.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.875, -25.0791015625, -24.283203125, -23.4873046875, -22.69140625, -21.8955078125, -21.099609375, -20.3037109375, -19.5078125, -18.7119140625, -17.916015625, -17.1201171875, -16.32421875, -15.5283203125, -14.732421875, -13.9365234375, -13.140625, -12.3447265625, -11.548828125, -10.7529296875, -9.95703125, -9.1611328125, -8.365234375, -7.5693359375, -6.7734375, -5.9775390625, -5.181640625, -4.3857421875, -3.58984375, -2.7939453125, -1.998046875, -1.2021484375, -0.40625, 0.3896484375, 1.185546875, 1.9814453125, 2.77734375, 3.5732421875, 4.369140625, 5.1650390625, 5.9609375, 6.7568359375, 7.552734375, 8.3486328125, 9.14453125, 9.9404296875, 10.736328125, 11.5322265625, 12.328125, 13.1240234375, 13.919921875, 14.7158203125, 15.51171875, 16.3076171875, 17.103515625, 17.8994140625, 18.6953125, 19.4912109375, 20.287109375, 21.0830078125, 21.87890625, 22.6748046875, 23.470703125, 24.2666015625, 25.0625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 9.0, 15.0, 21.0, 26.0, 47.0, 76.0, 61.0, 98.0, 153.0, 227.0, 346.0, 472.0, 773.0, 1094.0, 1693.0, 2703.0, 4318.0, 6887.0, 11244.0, 18874.0, 33375.0, 61340.0, 117326.0, 227908.0, 256274.0, 138319.0, 70837.0, 38361.0, 21979.0, 12616.0, 7686.0, 4654.0, 2930.0, 1881.0, 1235.0, 897.0, 581.0, 414.0, 264.0, 187.0, 104.0, 75.0, 50.0, 33.0, 32.0, 17.0, 13.0, 11.0, 5.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.828125, -23.108642578125, -22.38916015625, -21.669677734375, -20.9501953125, -20.230712890625, -19.51123046875, -18.791748046875, -18.072265625, -17.352783203125, -16.63330078125, -15.913818359375, -15.1943359375, -14.474853515625, -13.75537109375, -13.035888671875, -12.31640625, -11.596923828125, -10.87744140625, -10.157958984375, -9.4384765625, -8.718994140625, -7.99951171875, -7.280029296875, -6.560546875, -5.841064453125, -5.12158203125, -4.402099609375, -3.6826171875, -2.963134765625, -2.24365234375, -1.524169921875, -0.8046875, -0.085205078125, 0.63427734375, 1.353759765625, 2.0732421875, 2.792724609375, 3.51220703125, 4.231689453125, 4.951171875, 5.670654296875, 6.39013671875, 7.109619140625, 7.8291015625, 8.548583984375, 9.26806640625, 9.987548828125, 10.70703125, 11.426513671875, 12.14599609375, 12.865478515625, 13.5849609375, 14.304443359375, 15.02392578125, 15.743408203125, 16.462890625, 17.182373046875, 17.90185546875, 18.621337890625, 19.3408203125, 20.060302734375, 20.77978515625, 21.499267578125, 22.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 8.0, 20.0, 18.0, 29.0, 35.0, 32.0, 54.0, 67.0, 85.0, 97.0, 98.0, 89.0, 80.0, 49.0, 54.0, 40.0, 32.0, 22.0, 19.0, 15.0, 6.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0025501251220703125, -0.002465665340423584, -0.0023812055587768555, -0.002296745777130127, -0.0022122859954833984, -0.00212782621383667, -0.0020433664321899414, -0.001958906650543213, -0.0018744468688964844, -0.0017899870872497559, -0.0017055273056030273, -0.0016210675239562988, -0.0015366077423095703, -0.0014521479606628418, -0.0013676881790161133, -0.0012832283973693848, -0.0011987686157226562, -0.0011143088340759277, -0.0010298490524291992, -0.0009453892707824707, -0.0008609294891357422, -0.0007764697074890137, -0.0006920099258422852, -0.0006075501441955566, -0.0005230903625488281, -0.0004386305809020996, -0.0003541707992553711, -0.0002697110176086426, -0.00018525123596191406, -0.00010079145431518555, -1.633167266845703e-05, 6.812810897827148e-05, 0.000152587890625, 0.00023704767227172852, 0.00032150745391845703, 0.00040596723556518555, 0.0004904270172119141, 0.0005748867988586426, 0.0006593465805053711, 0.0007438063621520996, 0.0008282661437988281, 0.0009127259254455566, 0.0009971857070922852, 0.0010816454887390137, 0.0011661052703857422, 0.0012505650520324707, 0.0013350248336791992, 0.0014194846153259277, 0.0015039443969726562, 0.0015884041786193848, 0.0016728639602661133, 0.0017573237419128418, 0.0018417835235595703, 0.0019262433052062988, 0.0020107030868530273, 0.002095162868499756, 0.0021796226501464844, 0.002264082431793213, 0.0023485422134399414, 0.00243300199508667, 0.0025174617767333984, 0.002601921558380127, 0.0026863813400268555, 0.002770841121673584, 0.0028553009033203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 14.0, 8.0, 13.0, 24.0, 34.0, 43.0, 77.0, 133.0, 191.0, 261.0, 430.0, 687.0, 1087.0, 1795.0, 2998.0, 5204.0, 9346.0, 17753.0, 36381.0, 79783.0, 183510.0, 326727.0, 206603.0, 90118.0, 40961.0, 20126.0, 10304.0, 5719.0, 3336.0, 1841.0, 1133.0, 670.0, 428.0, 272.0, 168.0, 113.0, 78.0, 46.0, 32.0, 31.0, 18.0, 13.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-24.3125, -23.517333984375, -22.72216796875, -21.927001953125, -21.1318359375, -20.336669921875, -19.54150390625, -18.746337890625, -17.951171875, -17.156005859375, -16.36083984375, -15.565673828125, -14.7705078125, -13.975341796875, -13.18017578125, -12.385009765625, -11.58984375, -10.794677734375, -9.99951171875, -9.204345703125, -8.4091796875, -7.614013671875, -6.81884765625, -6.023681640625, -5.228515625, -4.433349609375, -3.63818359375, -2.843017578125, -2.0478515625, -1.252685546875, -0.45751953125, 0.337646484375, 1.1328125, 1.927978515625, 2.72314453125, 3.518310546875, 4.3134765625, 5.108642578125, 5.90380859375, 6.698974609375, 7.494140625, 8.289306640625, 9.08447265625, 9.879638671875, 10.6748046875, 11.469970703125, 12.26513671875, 13.060302734375, 13.85546875, 14.650634765625, 15.44580078125, 16.240966796875, 17.0361328125, 17.831298828125, 18.62646484375, 19.421630859375, 20.216796875, 21.011962890625, 21.80712890625, 22.602294921875, 23.3974609375, 24.192626953125, 24.98779296875, 25.782958984375, 26.578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 12.0, 12.0, 21.0, 22.0, 25.0, 37.0, 36.0, 49.0, 43.0, 41.0, 52.0, 60.0, 72.0, 62.0, 63.0, 61.0, 53.0, 30.0, 45.0, 33.0, 29.0, 24.0, 19.0, 18.0, 11.0, 13.0, 6.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.372802734375, -5.17529296875, -4.977783203125, -4.7802734375, -4.582763671875, -4.38525390625, -4.187744140625, -3.990234375, -3.792724609375, -3.59521484375, -3.397705078125, -3.2001953125, -3.002685546875, -2.80517578125, -2.607666015625, -2.41015625, -2.212646484375, -2.01513671875, -1.817626953125, -1.6201171875, -1.422607421875, -1.22509765625, -1.027587890625, -0.830078125, -0.632568359375, -0.43505859375, -0.237548828125, -0.0400390625, 0.157470703125, 0.35498046875, 0.552490234375, 0.75, 0.947509765625, 1.14501953125, 1.342529296875, 1.5400390625, 1.737548828125, 1.93505859375, 2.132568359375, 2.330078125, 2.527587890625, 2.72509765625, 2.922607421875, 3.1201171875, 3.317626953125, 3.51513671875, 3.712646484375, 3.91015625, 4.107666015625, 4.30517578125, 4.502685546875, 4.7001953125, 4.897705078125, 5.09521484375, 5.292724609375, 5.490234375, 5.687744140625, 5.88525390625, 6.082763671875, 6.2802734375, 6.477783203125, 6.67529296875, 6.872802734375, 7.0703125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 13.0, 9.0, 16.0, 17.0, 16.0, 16.0, 29.0, 40.0, 60.0, 55.0, 63.0, 71.0, 80.0, 77.0, 59.0, 65.0, 58.0, 40.0, 34.0, 27.0, 20.0, 30.0, 22.0, 9.0, 16.0, 6.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.81684875488281, -39.41847229003906, -38.02009582519531, -36.62171936035156, -35.22334289550781, -33.82497024536133, -32.42659378051758, -31.028217315673828, -29.629840850830078, -28.231464385986328, -26.833087921142578, -25.43471336364746, -24.03633689880371, -22.63796043395996, -21.239585876464844, -19.841209411621094, -18.442832946777344, -17.044456481933594, -15.64608097076416, -14.247705459594727, -12.849328994750977, -11.450952529907227, -10.052577018737793, -8.65420150756836, -7.255825042724609, -5.857449054718018, -4.459073066711426, -3.060697078704834, -1.6623210906982422, -0.2639451026916504, 1.1344308853149414, 2.532806396484375, 3.931182861328125, 5.329558849334717, 6.727934837341309, 8.126310348510742, 9.524686813354492, 10.923063278198242, 12.321438789367676, 13.71981430053711, 15.11819076538086, 16.51656723022461, 17.91494369506836, 19.313318252563477, 20.711694717407227, 22.110071182250977, 23.508445739746094, 24.906822204589844, 26.305198669433594, 27.703575134277344, 29.101951599121094, 30.50032615661621, 31.89870262145996, 33.29707717895508, 34.69545364379883, 36.09383010864258, 37.49220657348633, 38.89058303833008, 40.28895950317383, 41.68733596801758, 43.08570861816406, 44.48408508300781, 45.88246154785156, 47.28083801269531, 48.67921447753906]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 15.0, 14.0, 14.0, 20.0, 22.0, 29.0, 15.0, 31.0, 44.0, 28.0, 34.0, 38.0, 52.0, 53.0, 43.0, 37.0, 56.0, 38.0, 46.0, 42.0, 32.0, 33.0, 26.0, 25.0, 31.0, 27.0, 19.0, 16.0, 12.0, 17.0, 13.0, 13.0, 6.0, 6.0, 4.0, 7.0, 6.0, 2.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.6596565246582, -39.28377151489258, -37.90788650512695, -36.53200149536133, -35.1561164855957, -33.78023147583008, -32.40434646606445, -31.028461456298828, -29.652576446533203, -28.276691436767578, -26.900806427001953, -25.524921417236328, -24.149036407470703, -22.773151397705078, -21.397266387939453, -20.021381378173828, -18.64549446105957, -17.269609451293945, -15.89372444152832, -14.517839431762695, -13.14195442199707, -11.766069412231445, -10.390183448791504, -9.014298439025879, -7.638413429260254, -6.262528419494629, -4.886643409729004, -3.5107579231262207, -2.1348729133605957, -0.7589879035949707, 0.6168975830078125, 1.9927825927734375, 3.3686676025390625, 4.7445526123046875, 6.1204376220703125, 7.496323108673096, 8.872207641601562, 10.248092651367188, 11.623978614807129, 12.999863624572754, 14.375748634338379, 15.751633644104004, 17.127519607543945, 18.50340461730957, 19.879289627075195, 21.25517463684082, 22.631059646606445, 24.00694465637207, 25.382829666137695, 26.75871467590332, 28.134599685668945, 29.51048469543457, 30.886369705200195, 32.26225662231445, 33.63814163208008, 35.0140266418457, 36.38991165161133, 37.76579666137695, 39.14168167114258, 40.5175666809082, 41.89345169067383, 43.26933670043945, 44.64522171020508, 46.0211067199707, 47.39699172973633]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 15.0, 13.0, 29.0, 42.0, 61.0, 67.0, 110.0, 150.0, 204.0, 344.0, 438.0, 617.0, 947.0, 1337.0, 2026.0, 3041.0, 4918.0, 7871.0, 13667.0, 25896.0, 58326.0, 183117.0, 746151.0, 1911021.0, 885868.0, 214148.0, 65864.0, 28619.0, 15027.0, 8524.0, 5234.0, 3274.0, 2254.0, 1468.0, 1078.0, 696.0, 502.0, 378.0, 255.0, 197.0, 134.0, 93.0, 79.0, 59.0, 31.0, 24.0, 19.0, 8.0, 14.0, 8.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-58.65625, -56.7978515625, -54.939453125, -53.0810546875, -51.22265625, -49.3642578125, -47.505859375, -45.6474609375, -43.7890625, -41.9306640625, -40.072265625, -38.2138671875, -36.35546875, -34.4970703125, -32.638671875, -30.7802734375, -28.921875, -27.0634765625, -25.205078125, -23.3466796875, -21.48828125, -19.6298828125, -17.771484375, -15.9130859375, -14.0546875, -12.1962890625, -10.337890625, -8.4794921875, -6.62109375, -4.7626953125, -2.904296875, -1.0458984375, 0.8125, 2.6708984375, 4.529296875, 6.3876953125, 8.24609375, 10.1044921875, 11.962890625, 13.8212890625, 15.6796875, 17.5380859375, 19.396484375, 21.2548828125, 23.11328125, 24.9716796875, 26.830078125, 28.6884765625, 30.546875, 32.4052734375, 34.263671875, 36.1220703125, 37.98046875, 39.8388671875, 41.697265625, 43.5556640625, 45.4140625, 47.2724609375, 49.130859375, 50.9892578125, 52.84765625, 54.7060546875, 56.564453125, 58.4228515625, 60.28125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 8.0, 12.0, 4.0, 12.0, 14.0, 14.0, 20.0, 24.0, 21.0, 18.0, 20.0, 31.0, 36.0, 25.0, 37.0, 34.0, 43.0, 47.0, 40.0, 45.0, 46.0, 46.0, 46.0, 36.0, 32.0, 25.0, 35.0, 32.0, 24.0, 25.0, 29.0, 15.0, 20.0, 8.0, 14.0, 12.0, 13.0, 11.0, 8.0, 3.0, 3.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.625, -32.53173828125, -31.4384765625, -30.34521484375, -29.251953125, -28.15869140625, -27.0654296875, -25.97216796875, -24.87890625, -23.78564453125, -22.6923828125, -21.59912109375, -20.505859375, -19.41259765625, -18.3193359375, -17.22607421875, -16.1328125, -15.03955078125, -13.9462890625, -12.85302734375, -11.759765625, -10.66650390625, -9.5732421875, -8.47998046875, -7.38671875, -6.29345703125, -5.2001953125, -4.10693359375, -3.013671875, -1.92041015625, -0.8271484375, 0.26611328125, 1.359375, 2.45263671875, 3.5458984375, 4.63916015625, 5.732421875, 6.82568359375, 7.9189453125, 9.01220703125, 10.10546875, 11.19873046875, 12.2919921875, 13.38525390625, 14.478515625, 15.57177734375, 16.6650390625, 17.75830078125, 18.8515625, 19.94482421875, 21.0380859375, 22.13134765625, 23.224609375, 24.31787109375, 25.4111328125, 26.50439453125, 27.59765625, 28.69091796875, 29.7841796875, 30.87744140625, 31.970703125, 33.06396484375, 34.1572265625, 35.25048828125, 36.34375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 14.0, 20.0, 13.0, 35.0, 53.0, 69.0, 105.0, 141.0, 203.0, 337.0, 442.0, 672.0, 1058.0, 1753.0, 2682.0, 4142.0, 7292.0, 13045.0, 24272.0, 49422.0, 111165.0, 291219.0, 1005586.0, 1829166.0, 523866.0, 177593.0, 72967.0, 34410.0, 17682.0, 9750.0, 5711.0, 3335.0, 2086.0, 1331.0, 886.0, 590.0, 372.0, 269.0, 172.0, 96.0, 77.0, 64.0, 38.0, 31.0, 13.0, 12.0, 9.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-60.40625, -58.40966796875, -56.4130859375, -54.41650390625, -52.419921875, -50.42333984375, -48.4267578125, -46.43017578125, -44.43359375, -42.43701171875, -40.4404296875, -38.44384765625, -36.447265625, -34.45068359375, -32.4541015625, -30.45751953125, -28.4609375, -26.46435546875, -24.4677734375, -22.47119140625, -20.474609375, -18.47802734375, -16.4814453125, -14.48486328125, -12.48828125, -10.49169921875, -8.4951171875, -6.49853515625, -4.501953125, -2.50537109375, -0.5087890625, 1.48779296875, 3.484375, 5.48095703125, 7.4775390625, 9.47412109375, 11.470703125, 13.46728515625, 15.4638671875, 17.46044921875, 19.45703125, 21.45361328125, 23.4501953125, 25.44677734375, 27.443359375, 29.43994140625, 31.4365234375, 33.43310546875, 35.4296875, 37.42626953125, 39.4228515625, 41.41943359375, 43.416015625, 45.41259765625, 47.4091796875, 49.40576171875, 51.40234375, 53.39892578125, 55.3955078125, 57.39208984375, 59.388671875, 61.38525390625, 63.3818359375, 65.37841796875, 67.375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 18.0, 15.0, 10.0, 26.0, 33.0, 30.0, 50.0, 54.0, 65.0, 79.0, 108.0, 125.0, 154.0, 196.0, 241.0, 326.0, 361.0, 373.0, 346.0, 274.0, 238.0, 164.0, 142.0, 129.0, 88.0, 72.0, 69.0, 46.0, 37.0, 32.0, 16.0, 19.0, 14.0, 15.0, 7.0, 9.0, 4.0, 14.0, 8.0, 4.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-15.3203125, -14.8148193359375, -14.309326171875, -13.8038330078125, -13.29833984375, -12.7928466796875, -12.287353515625, -11.7818603515625, -11.2763671875, -10.7708740234375, -10.265380859375, -9.7598876953125, -9.25439453125, -8.7489013671875, -8.243408203125, -7.7379150390625, -7.232421875, -6.7269287109375, -6.221435546875, -5.7159423828125, -5.21044921875, -4.7049560546875, -4.199462890625, -3.6939697265625, -3.1884765625, -2.6829833984375, -2.177490234375, -1.6719970703125, -1.16650390625, -0.6610107421875, -0.155517578125, 0.3499755859375, 0.85546875, 1.3609619140625, 1.866455078125, 2.3719482421875, 2.87744140625, 3.3829345703125, 3.888427734375, 4.3939208984375, 4.8994140625, 5.4049072265625, 5.910400390625, 6.4158935546875, 6.92138671875, 7.4268798828125, 7.932373046875, 8.4378662109375, 8.943359375, 9.4488525390625, 9.954345703125, 10.4598388671875, 10.96533203125, 11.4708251953125, 11.976318359375, 12.4818115234375, 12.9873046875, 13.4927978515625, 13.998291015625, 14.5037841796875, 15.00927734375, 15.5147705078125, 16.020263671875, 16.5257568359375, 17.03125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 3.0, 7.0, 7.0, 12.0, 20.0, 19.0, 33.0, 29.0, 57.0, 59.0, 46.0, 84.0, 95.0, 81.0, 69.0, 74.0, 66.0, 43.0, 44.0, 33.0, 25.0, 17.0, 12.0, 17.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.31568908691406, -45.760162353515625, -44.20463562011719, -42.64910888671875, -41.09358596801758, -39.53805923461914, -37.9825325012207, -36.427005767822266, -34.87147903442383, -33.31595230102539, -31.760427474975586, -30.20490074157715, -28.64937400817871, -27.093849182128906, -25.53832244873047, -23.98279571533203, -22.427270889282227, -20.87174415588379, -19.316219329833984, -17.760692596435547, -16.20516586303711, -14.649640083312988, -13.094114303588867, -11.53858757019043, -9.983061790466309, -8.427536010742188, -6.87200927734375, -5.316483497619629, -3.7609572410583496, -2.2054309844970703, -0.6499052047729492, 0.9056215286254883, 2.4611473083496094, 4.016673564910889, 5.572199821472168, 7.127725601196289, 8.683252334594727, 10.238778114318848, 11.794303894042969, 13.349830627441406, 14.905356407165527, 16.46088218688965, 18.016408920288086, 19.57193374633789, 21.127460479736328, 22.682987213134766, 24.238513946533203, 25.79404067993164, 27.349565505981445, 28.905092239379883, 30.460617065429688, 32.016143798828125, 33.57167053222656, 35.127197265625, 36.68272399902344, 38.238250732421875, 39.79377365112305, 41.349300384521484, 42.90482711791992, 44.460350036621094, 46.01587677001953, 47.57140350341797, 49.126930236816406, 50.682456970214844, 52.23798370361328]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 2.0, 6.0, 6.0, 6.0, 13.0, 9.0, 18.0, 22.0, 23.0, 22.0, 35.0, 25.0, 22.0, 31.0, 30.0, 35.0, 39.0, 59.0, 30.0, 48.0, 46.0, 49.0, 43.0, 47.0, 45.0, 36.0, 35.0, 21.0, 24.0, 25.0, 16.0, 23.0, 18.0, 21.0, 16.0, 8.0, 12.0, 7.0, 4.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.902496337890625, -31.659561157226562, -30.416627883911133, -29.173694610595703, -27.93075942993164, -26.687824249267578, -25.44489097595215, -24.20195770263672, -22.959022521972656, -21.716087341308594, -20.473154067993164, -19.230220794677734, -17.987285614013672, -16.74435043334961, -15.50141716003418, -14.258482933044434, -13.015548706054688, -11.772614479064941, -10.529680252075195, -9.28674602508545, -8.043811798095703, -6.800877571105957, -5.557943344116211, -4.315009117126465, -3.0720748901367188, -1.8291406631469727, -0.5862064361572266, 0.6567277908325195, 1.8996620178222656, 3.1425962448120117, 4.385530471801758, 5.628464698791504, 6.871402740478516, 8.114336967468262, 9.357271194458008, 10.600205421447754, 11.8431396484375, 13.086073875427246, 14.329008102416992, 15.571942329406738, 16.814876556396484, 18.057811737060547, 19.300745010375977, 20.543678283691406, 21.78661346435547, 23.02954864501953, 24.27248191833496, 25.51541519165039, 26.758350372314453, 28.001285552978516, 29.244218826293945, 30.487152099609375, 31.730087280273438, 32.9730224609375, 34.21595764160156, 35.45888900756836, 36.70182418823242, 37.944759368896484, 39.18769073486328, 40.430625915527344, 41.673561096191406, 42.91649627685547, 44.15943145751953, 45.40236282348633, 46.64529800415039]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 5.0, 13.0, 16.0, 24.0, 27.0, 42.0, 60.0, 89.0, 130.0, 229.0, 317.0, 518.0, 811.0, 1314.0, 2123.0, 3712.0, 6487.0, 11176.0, 20446.0, 38820.0, 78824.0, 173637.0, 315775.0, 204345.0, 92062.0, 44404.0, 23110.0, 12541.0, 6948.0, 4132.0, 2362.0, 1452.0, 898.0, 595.0, 381.0, 249.0, 139.0, 105.0, 65.0, 42.0, 27.0, 25.0, 13.0, 14.0, 14.0, 6.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.25, -17.690185546875, -17.13037109375, -16.570556640625, -16.0107421875, -15.450927734375, -14.89111328125, -14.331298828125, -13.771484375, -13.211669921875, -12.65185546875, -12.092041015625, -11.5322265625, -10.972412109375, -10.41259765625, -9.852783203125, -9.29296875, -8.733154296875, -8.17333984375, -7.613525390625, -7.0537109375, -6.493896484375, -5.93408203125, -5.374267578125, -4.814453125, -4.254638671875, -3.69482421875, -3.135009765625, -2.5751953125, -2.015380859375, -1.45556640625, -0.895751953125, -0.3359375, 0.223876953125, 0.78369140625, 1.343505859375, 1.9033203125, 2.463134765625, 3.02294921875, 3.582763671875, 4.142578125, 4.702392578125, 5.26220703125, 5.822021484375, 6.3818359375, 6.941650390625, 7.50146484375, 8.061279296875, 8.62109375, 9.180908203125, 9.74072265625, 10.300537109375, 10.8603515625, 11.420166015625, 11.97998046875, 12.539794921875, 13.099609375, 13.659423828125, 14.21923828125, 14.779052734375, 15.3388671875, 15.898681640625, 16.45849609375, 17.018310546875, 17.578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 6.0, 9.0, 11.0, 20.0, 13.0, 19.0, 18.0, 15.0, 34.0, 20.0, 18.0, 34.0, 28.0, 31.0, 36.0, 42.0, 39.0, 44.0, 38.0, 41.0, 48.0, 40.0, 38.0, 45.0, 32.0, 34.0, 31.0, 19.0, 23.0, 24.0, 24.0, 16.0, 13.0, 17.0, 19.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.875, -34.69775390625, -33.5205078125, -32.34326171875, -31.166015625, -29.98876953125, -28.8115234375, -27.63427734375, -26.45703125, -25.27978515625, -24.1025390625, -22.92529296875, -21.748046875, -20.57080078125, -19.3935546875, -18.21630859375, -17.0390625, -15.86181640625, -14.6845703125, -13.50732421875, -12.330078125, -11.15283203125, -9.9755859375, -8.79833984375, -7.62109375, -6.44384765625, -5.2666015625, -4.08935546875, -2.912109375, -1.73486328125, -0.5576171875, 0.61962890625, 1.796875, 2.97412109375, 4.1513671875, 5.32861328125, 6.505859375, 7.68310546875, 8.8603515625, 10.03759765625, 11.21484375, 12.39208984375, 13.5693359375, 14.74658203125, 15.923828125, 17.10107421875, 18.2783203125, 19.45556640625, 20.6328125, 21.81005859375, 22.9873046875, 24.16455078125, 25.341796875, 26.51904296875, 27.6962890625, 28.87353515625, 30.05078125, 31.22802734375, 32.4052734375, 33.58251953125, 34.759765625, 35.93701171875, 37.1142578125, 38.29150390625, 39.46875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 7.0, 3.0, 6.0, 7.0, 17.0, 14.0, 21.0, 27.0, 52.0, 74.0, 122.0, 236.0, 431.0, 826.0, 1669.0, 3635.0, 8360.0, 21701.0, 168678.0, 788722.0, 33316.0, 11337.0, 4845.0, 2171.0, 1033.0, 536.0, 279.0, 162.0, 86.0, 53.0, 43.0, 16.0, 16.0, 14.0, 10.0, 5.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-44.15625, -42.8642578125, -41.572265625, -40.2802734375, -38.98828125, -37.6962890625, -36.404296875, -35.1123046875, -33.8203125, -32.5283203125, -31.236328125, -29.9443359375, -28.65234375, -27.3603515625, -26.068359375, -24.7763671875, -23.484375, -22.1923828125, -20.900390625, -19.6083984375, -18.31640625, -17.0244140625, -15.732421875, -14.4404296875, -13.1484375, -11.8564453125, -10.564453125, -9.2724609375, -7.98046875, -6.6884765625, -5.396484375, -4.1044921875, -2.8125, -1.5205078125, -0.228515625, 1.0634765625, 2.35546875, 3.6474609375, 4.939453125, 6.2314453125, 7.5234375, 8.8154296875, 10.107421875, 11.3994140625, 12.69140625, 13.9833984375, 15.275390625, 16.5673828125, 17.859375, 19.1513671875, 20.443359375, 21.7353515625, 23.02734375, 24.3193359375, 25.611328125, 26.9033203125, 28.1953125, 29.4873046875, 30.779296875, 32.0712890625, 33.36328125, 34.6552734375, 35.947265625, 37.2392578125, 38.53125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 3.0, 9.0, 9.0, 7.0, 14.0, 9.0, 14.0, 11.0, 17.0, 17.0, 19.0, 11.0, 28.0, 23.0, 31.0, 26.0, 41.0, 40.0, 37.0, 36.0, 44.0, 40.0, 42.0, 38.0, 39.0, 35.0, 33.0, 34.0, 37.0, 37.0, 25.0, 23.0, 23.0, 21.0, 20.0, 11.0, 15.0, 9.0, 11.0, 13.0, 4.0, 13.0, 5.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.35986328125, -22.5791015625, -21.79833984375, -21.017578125, -20.23681640625, -19.4560546875, -18.67529296875, -17.89453125, -17.11376953125, -16.3330078125, -15.55224609375, -14.771484375, -13.99072265625, -13.2099609375, -12.42919921875, -11.6484375, -10.86767578125, -10.0869140625, -9.30615234375, -8.525390625, -7.74462890625, -6.9638671875, -6.18310546875, -5.40234375, -4.62158203125, -3.8408203125, -3.06005859375, -2.279296875, -1.49853515625, -0.7177734375, 0.06298828125, 0.84375, 1.62451171875, 2.4052734375, 3.18603515625, 3.966796875, 4.74755859375, 5.5283203125, 6.30908203125, 7.08984375, 7.87060546875, 8.6513671875, 9.43212890625, 10.212890625, 10.99365234375, 11.7744140625, 12.55517578125, 13.3359375, 14.11669921875, 14.8974609375, 15.67822265625, 16.458984375, 17.23974609375, 18.0205078125, 18.80126953125, 19.58203125, 20.36279296875, 21.1435546875, 21.92431640625, 22.705078125, 23.48583984375, 24.2666015625, 25.04736328125, 25.828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 23.0, 30.0, 43.0, 67.0, 89.0, 115.0, 204.0, 318.0, 532.0, 928.0, 1708.0, 3678.0, 8761.0, 26070.0, 678643.0, 290017.0, 22149.0, 7871.0, 3288.0, 1620.0, 926.0, 490.0, 312.0, 193.0, 138.0, 89.0, 64.0, 34.0, 25.0, 27.0, 23.0, 14.0, 6.0, 9.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.751953125, -3.626617431640625, -3.50128173828125, -3.375946044921875, -3.2506103515625, -3.125274658203125, -2.99993896484375, -2.874603271484375, -2.749267578125, -2.623931884765625, -2.49859619140625, -2.373260498046875, -2.2479248046875, -2.122589111328125, -1.99725341796875, -1.871917724609375, -1.74658203125, -1.621246337890625, -1.49591064453125, -1.370574951171875, -1.2452392578125, -1.119903564453125, -0.99456787109375, -0.869232177734375, -0.743896484375, -0.618560791015625, -0.49322509765625, -0.367889404296875, -0.2425537109375, -0.117218017578125, 0.00811767578125, 0.133453369140625, 0.2587890625, 0.384124755859375, 0.50946044921875, 0.634796142578125, 0.7601318359375, 0.885467529296875, 1.01080322265625, 1.136138916015625, 1.261474609375, 1.386810302734375, 1.51214599609375, 1.637481689453125, 1.7628173828125, 1.888153076171875, 2.01348876953125, 2.138824462890625, 2.26416015625, 2.389495849609375, 2.51483154296875, 2.640167236328125, 2.7655029296875, 2.890838623046875, 3.01617431640625, 3.141510009765625, 3.266845703125, 3.392181396484375, 3.51751708984375, 3.642852783203125, 3.7681884765625, 3.893524169921875, 4.01885986328125, 4.144195556640625, 4.26953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 11.0, 13.0, 19.0, 24.0, 37.0, 41.0, 54.0, 115.0, 129.0, 139.0, 122.0, 77.0, 53.0, 51.0, 34.0, 33.0, 9.0, 13.0, 7.0, 4.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005731582641601562, -0.0005593076348304749, -0.0005454570055007935, -0.0005316063761711121, -0.0005177557468414307, -0.0005039051175117493, -0.0004900544881820679, -0.0004762038588523865, -0.0004623532295227051, -0.0004485026001930237, -0.0004346519708633423, -0.0004208013415336609, -0.0004069507122039795, -0.0003931000828742981, -0.0003792494535446167, -0.0003653988242149353, -0.0003515481948852539, -0.0003376975655555725, -0.0003238469362258911, -0.0003099963068962097, -0.0002961456775665283, -0.0002822950482368469, -0.00026844441890716553, -0.00025459378957748413, -0.00024074316024780273, -0.00022689253091812134, -0.00021304190158843994, -0.00019919127225875854, -0.00018534064292907715, -0.00017149001359939575, -0.00015763938426971436, -0.00014378875494003296, -0.00012993812561035156, -0.00011608749628067017, -0.00010223686695098877, -8.838623762130737e-05, -7.453560829162598e-05, -6.068497896194458e-05, -4.6834349632263184e-05, -3.298372030258179e-05, -1.913309097290039e-05, -5.282461643218994e-06, 8.568167686462402e-06, 2.24187970161438e-05, 3.6269426345825195e-05, 5.012005567550659e-05, 6.397068500518799e-05, 7.782131433486938e-05, 9.167194366455078e-05, 0.00010552257299423218, 0.00011937320232391357, 0.00013322383165359497, 0.00014707446098327637, 0.00016092509031295776, 0.00017477571964263916, 0.00018862634897232056, 0.00020247697830200195, 0.00021632760763168335, 0.00023017823696136475, 0.00024402886629104614, 0.00025787949562072754, 0.00027173012495040894, 0.00028558075428009033, 0.00029943138360977173, 0.0003132820129394531]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 12.0, 17.0, 29.0, 33.0, 44.0, 92.0, 99.0, 153.0, 217.0, 327.0, 475.0, 720.0, 1118.0, 1706.0, 2522.0, 3947.0, 6447.0, 10731.0, 18287.0, 33631.0, 67960.0, 158767.0, 338785.0, 215670.0, 88827.0, 41959.0, 22062.0, 12638.0, 7738.0, 4825.0, 2991.0, 1935.0, 1262.0, 810.0, 570.0, 347.0, 246.0, 165.0, 112.0, 80.0, 53.0, 44.0, 24.0, 20.0, 11.0, 12.0, 8.0, 6.0, 8.0, 2.0, 1.0, 2.0, 4.0], "bins": [-3.626953125, -3.51922607421875, -3.4114990234375, -3.30377197265625, -3.196044921875, -3.08831787109375, -2.9805908203125, -2.87286376953125, -2.76513671875, -2.65740966796875, -2.5496826171875, -2.44195556640625, -2.334228515625, -2.22650146484375, -2.1187744140625, -2.01104736328125, -1.9033203125, -1.79559326171875, -1.6878662109375, -1.58013916015625, -1.472412109375, -1.36468505859375, -1.2569580078125, -1.14923095703125, -1.04150390625, -0.93377685546875, -0.8260498046875, -0.71832275390625, -0.610595703125, -0.50286865234375, -0.3951416015625, -0.28741455078125, -0.1796875, -0.07196044921875, 0.0357666015625, 0.14349365234375, 0.251220703125, 0.35894775390625, 0.4666748046875, 0.57440185546875, 0.68212890625, 0.78985595703125, 0.8975830078125, 1.00531005859375, 1.113037109375, 1.22076416015625, 1.3284912109375, 1.43621826171875, 1.5439453125, 1.65167236328125, 1.7593994140625, 1.86712646484375, 1.974853515625, 2.08258056640625, 2.1903076171875, 2.29803466796875, 2.40576171875, 2.51348876953125, 2.6212158203125, 2.72894287109375, 2.836669921875, 2.94439697265625, 3.0521240234375, 3.15985107421875, 3.267578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 12.0, 17.0, 10.0, 25.0, 35.0, 28.0, 28.0, 43.0, 55.0, 70.0, 59.0, 67.0, 82.0, 57.0, 59.0, 64.0, 42.0, 31.0, 42.0, 28.0, 21.0, 14.0, 13.0, 19.0, 10.0, 6.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0807647705078125, -1.047271728515625, -1.0137786865234375, -0.98028564453125, -0.9467926025390625, -0.913299560546875, -0.8798065185546875, -0.8463134765625, -0.8128204345703125, -0.779327392578125, -0.7458343505859375, -0.71234130859375, -0.6788482666015625, -0.645355224609375, -0.6118621826171875, -0.578369140625, -0.5448760986328125, -0.511383056640625, -0.4778900146484375, -0.44439697265625, -0.4109039306640625, -0.377410888671875, -0.3439178466796875, -0.3104248046875, -0.2769317626953125, -0.243438720703125, -0.2099456787109375, -0.17645263671875, -0.1429595947265625, -0.109466552734375, -0.0759735107421875, -0.04248046875, -0.0089874267578125, 0.024505615234375, 0.0579986572265625, 0.09149169921875, 0.1249847412109375, 0.158477783203125, 0.1919708251953125, 0.2254638671875, 0.2589569091796875, 0.292449951171875, 0.3259429931640625, 0.35943603515625, 0.3929290771484375, 0.426422119140625, 0.4599151611328125, 0.493408203125, 0.5269012451171875, 0.560394287109375, 0.5938873291015625, 0.62738037109375, 0.6608734130859375, 0.694366455078125, 0.7278594970703125, 0.7613525390625, 0.7948455810546875, 0.828338623046875, 0.8618316650390625, 0.89532470703125, 0.9288177490234375, 0.962310791015625, 0.9958038330078125, 1.029296875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 9.0, 14.0, 22.0, 22.0, 30.0, 45.0, 43.0, 64.0, 57.0, 79.0, 86.0, 78.0, 74.0, 69.0, 61.0, 51.0, 29.0, 36.0, 19.0, 17.0, 25.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.452972412109375, -41.96217727661133, -40.47138214111328, -38.9805908203125, -37.48979568481445, -35.999000549316406, -34.508209228515625, -33.01741409301758, -31.52661895751953, -30.035823822021484, -28.54503059387207, -27.054237365722656, -25.56344223022461, -24.072647094726562, -22.58185386657715, -21.091060638427734, -19.600265502929688, -18.10947036743164, -16.618677139282227, -15.127882957458496, -13.637088775634766, -12.146294593811035, -10.655500411987305, -9.164706230163574, -7.673912048339844, -6.183117866516113, -4.692323684692383, -3.2015295028686523, -1.7107353210449219, -0.2199411392211914, 1.270853042602539, 2.7616472244262695, 4.25244140625, 5.7432355880737305, 7.234029769897461, 8.724823951721191, 10.215618133544922, 11.706412315368652, 13.197206497192383, 14.688000679016113, 16.178794860839844, 17.66958999633789, 19.160383224487305, 20.65117645263672, 22.141971588134766, 23.632766723632812, 25.123559951782227, 26.61435317993164, 28.105148315429688, 29.595943450927734, 31.08673667907715, 32.57752990722656, 34.06832504272461, 35.559120178222656, 37.04991149902344, 38.540706634521484, 40.03150177001953, 41.52229690551758, 43.013092041015625, 44.503883361816406, 45.99467849731445, 47.4854736328125, 48.97626495361328, 50.46706008911133, 51.957855224609375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 1.0, 7.0, 6.0, 2.0, 13.0, 13.0, 16.0, 20.0, 23.0, 23.0, 31.0, 25.0, 28.0, 25.0, 29.0, 38.0, 40.0, 52.0, 39.0, 47.0, 42.0, 45.0, 49.0, 47.0, 45.0, 38.0, 33.0, 24.0, 21.0, 21.0, 23.0, 22.0, 16.0, 21.0, 21.0, 8.0, 9.0, 11.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65187072753906, -31.42336082458496, -30.19485092163086, -28.966341018676758, -27.737831115722656, -26.509321212768555, -25.280811309814453, -24.05230140686035, -22.82379150390625, -21.59528160095215, -20.366771697998047, -19.138261795043945, -17.909751892089844, -16.681241989135742, -15.45273208618164, -14.224222183227539, -12.995712280273438, -11.767202377319336, -10.538692474365234, -9.310182571411133, -8.081672668457031, -6.85316276550293, -5.624652862548828, -4.396142959594727, -3.167633056640625, -1.9391231536865234, -0.7106132507324219, 0.5178966522216797, 1.7464065551757812, 2.974916458129883, 4.203426361083984, 5.431936264038086, 6.660442352294922, 7.888952255249023, 9.117462158203125, 10.345972061157227, 11.574481964111328, 12.80299186706543, 14.031501770019531, 15.260011672973633, 16.488521575927734, 17.717031478881836, 18.945541381835938, 20.17405128479004, 21.40256118774414, 22.631071090698242, 23.859580993652344, 25.088090896606445, 26.316600799560547, 27.54511070251465, 28.77362060546875, 30.00213050842285, 31.230640411376953, 32.45915222167969, 33.687660217285156, 34.916168212890625, 36.14468002319336, 37.373191833496094, 38.60169982910156, 39.83020782470703, 41.058719635009766, 42.2872314453125, 43.51573944091797, 44.74424743652344, 45.97275924682617]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 10.0, 7.0, 33.0, 35.0, 64.0, 99.0, 167.0, 277.0, 435.0, 746.0, 1303.0, 2126.0, 4117.0, 7508.0, 14851.0, 30506.0, 66884.0, 154875.0, 322904.0, 243889.0, 105181.0, 46821.0, 22004.0, 10803.0, 5647.0, 3085.0, 1687.0, 1007.0, 575.0, 368.0, 197.0, 119.0, 81.0, 36.0, 26.0, 18.0, 14.0, 10.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-75.25, -73.20361328125, -71.1572265625, -69.11083984375, -67.064453125, -65.01806640625, -62.9716796875, -60.92529296875, -58.87890625, -56.83251953125, -54.7861328125, -52.73974609375, -50.693359375, -48.64697265625, -46.6005859375, -44.55419921875, -42.5078125, -40.46142578125, -38.4150390625, -36.36865234375, -34.322265625, -32.27587890625, -30.2294921875, -28.18310546875, -26.13671875, -24.09033203125, -22.0439453125, -19.99755859375, -17.951171875, -15.90478515625, -13.8583984375, -11.81201171875, -9.765625, -7.71923828125, -5.6728515625, -3.62646484375, -1.580078125, 0.46630859375, 2.5126953125, 4.55908203125, 6.60546875, 8.65185546875, 10.6982421875, 12.74462890625, 14.791015625, 16.83740234375, 18.8837890625, 20.93017578125, 22.9765625, 25.02294921875, 27.0693359375, 29.11572265625, 31.162109375, 33.20849609375, 35.2548828125, 37.30126953125, 39.34765625, 41.39404296875, 43.4404296875, 45.48681640625, 47.533203125, 49.57958984375, 51.6259765625, 53.67236328125, 55.71875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 6.0, 6.0, 10.0, 15.0, 12.0, 25.0, 22.0, 36.0, 18.0, 26.0, 22.0, 34.0, 44.0, 35.0, 42.0, 47.0, 43.0, 48.0, 51.0, 55.0, 51.0, 55.0, 32.0, 27.0, 26.0, 29.0, 21.0, 21.0, 14.0, 19.0, 20.0, 16.0, 9.0, 15.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.560546875, -32.30859375, -31.056640625, -29.8046875, -28.552734375, -27.30078125, -26.048828125, -24.796875, -23.544921875, -22.29296875, -21.041015625, -19.7890625, -18.537109375, -17.28515625, -16.033203125, -14.78125, -13.529296875, -12.27734375, -11.025390625, -9.7734375, -8.521484375, -7.26953125, -6.017578125, -4.765625, -3.513671875, -2.26171875, -1.009765625, 0.2421875, 1.494140625, 2.74609375, 3.998046875, 5.25, 6.501953125, 7.75390625, 9.005859375, 10.2578125, 11.509765625, 12.76171875, 14.013671875, 15.265625, 16.517578125, 17.76953125, 19.021484375, 20.2734375, 21.525390625, 22.77734375, 24.029296875, 25.28125, 26.533203125, 27.78515625, 29.037109375, 30.2890625, 31.541015625, 32.79296875, 34.044921875, 35.296875, 36.548828125, 37.80078125, 39.052734375, 40.3046875, 41.556640625, 42.80859375, 44.060546875, 45.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 10.0, 2.0, 13.0, 7.0, 34.0, 30.0, 47.0, 74.0, 98.0, 166.0, 239.0, 387.0, 567.0, 890.0, 1241.0, 1929.0, 3060.0, 4689.0, 7419.0, 11180.0, 17479.0, 28533.0, 46317.0, 76366.0, 125803.0, 189591.0, 192491.0, 130976.0, 79728.0, 48235.0, 29572.0, 18356.0, 11687.0, 7439.0, 4729.0, 3115.0, 2044.0, 1422.0, 878.0, 593.0, 384.0, 266.0, 153.0, 116.0, 59.0, 51.0, 30.0, 17.0, 17.0, 15.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.40625, -42.0078125, -40.609375, -39.2109375, -37.8125, -36.4140625, -35.015625, -33.6171875, -32.21875, -30.8203125, -29.421875, -28.0234375, -26.625, -25.2265625, -23.828125, -22.4296875, -21.03125, -19.6328125, -18.234375, -16.8359375, -15.4375, -14.0390625, -12.640625, -11.2421875, -9.84375, -8.4453125, -7.046875, -5.6484375, -4.25, -2.8515625, -1.453125, -0.0546875, 1.34375, 2.7421875, 4.140625, 5.5390625, 6.9375, 8.3359375, 9.734375, 11.1328125, 12.53125, 13.9296875, 15.328125, 16.7265625, 18.125, 19.5234375, 20.921875, 22.3203125, 23.71875, 25.1171875, 26.515625, 27.9140625, 29.3125, 30.7109375, 32.109375, 33.5078125, 34.90625, 36.3046875, 37.703125, 39.1015625, 40.5, 41.8984375, 43.296875, 44.6953125, 46.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 11.0, 8.0, 12.0, 14.0, 12.0, 19.0, 17.0, 20.0, 10.0, 25.0, 24.0, 28.0, 23.0, 33.0, 45.0, 49.0, 38.0, 32.0, 47.0, 36.0, 32.0, 46.0, 43.0, 49.0, 55.0, 35.0, 46.0, 24.0, 22.0, 27.0, 15.0, 20.0, 13.0, 15.0, 15.0, 10.0, 8.0, 10.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.07373046875, -21.2412109375, -20.40869140625, -19.576171875, -18.74365234375, -17.9111328125, -17.07861328125, -16.24609375, -15.41357421875, -14.5810546875, -13.74853515625, -12.916015625, -12.08349609375, -11.2509765625, -10.41845703125, -9.5859375, -8.75341796875, -7.9208984375, -7.08837890625, -6.255859375, -5.42333984375, -4.5908203125, -3.75830078125, -2.92578125, -2.09326171875, -1.2607421875, -0.42822265625, 0.404296875, 1.23681640625, 2.0693359375, 2.90185546875, 3.734375, 4.56689453125, 5.3994140625, 6.23193359375, 7.064453125, 7.89697265625, 8.7294921875, 9.56201171875, 10.39453125, 11.22705078125, 12.0595703125, 12.89208984375, 13.724609375, 14.55712890625, 15.3896484375, 16.22216796875, 17.0546875, 17.88720703125, 18.7197265625, 19.55224609375, 20.384765625, 21.21728515625, 22.0498046875, 22.88232421875, 23.71484375, 24.54736328125, 25.3798828125, 26.21240234375, 27.044921875, 27.87744140625, 28.7099609375, 29.54248046875, 30.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 11.0, 12.0, 37.0, 30.0, 46.0, 78.0, 106.0, 149.0, 185.0, 279.0, 386.0, 575.0, 857.0, 1222.0, 1706.0, 2488.0, 3879.0, 5850.0, 9197.0, 14498.0, 23772.0, 40249.0, 69437.0, 124735.0, 219383.0, 222902.0, 127704.0, 70843.0, 41071.0, 24380.0, 14971.0, 9238.0, 5989.0, 3979.0, 2632.0, 1760.0, 1234.0, 846.0, 564.0, 374.0, 273.0, 186.0, 143.0, 104.0, 75.0, 34.0, 36.0, 17.0, 12.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0], "bins": [-17.71875, -17.18212890625, -16.6455078125, -16.10888671875, -15.572265625, -15.03564453125, -14.4990234375, -13.96240234375, -13.42578125, -12.88916015625, -12.3525390625, -11.81591796875, -11.279296875, -10.74267578125, -10.2060546875, -9.66943359375, -9.1328125, -8.59619140625, -8.0595703125, -7.52294921875, -6.986328125, -6.44970703125, -5.9130859375, -5.37646484375, -4.83984375, -4.30322265625, -3.7666015625, -3.22998046875, -2.693359375, -2.15673828125, -1.6201171875, -1.08349609375, -0.546875, -0.01025390625, 0.5263671875, 1.06298828125, 1.599609375, 2.13623046875, 2.6728515625, 3.20947265625, 3.74609375, 4.28271484375, 4.8193359375, 5.35595703125, 5.892578125, 6.42919921875, 6.9658203125, 7.50244140625, 8.0390625, 8.57568359375, 9.1123046875, 9.64892578125, 10.185546875, 10.72216796875, 11.2587890625, 11.79541015625, 12.33203125, 12.86865234375, 13.4052734375, 13.94189453125, 14.478515625, 15.01513671875, 15.5517578125, 16.08837890625, 16.625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 13.0, 17.0, 19.0, 13.0, 34.0, 44.0, 60.0, 66.0, 70.0, 87.0, 92.0, 91.0, 77.0, 58.0, 48.0, 29.0, 23.0, 18.0, 26.0, 19.0, 13.0, 8.0, 17.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.001983642578125, -0.0019261986017227173, -0.0018687546253204346, -0.0018113106489181519, -0.0017538666725158691, -0.0016964226961135864, -0.0016389787197113037, -0.001581534743309021, -0.0015240907669067383, -0.0014666467905044556, -0.0014092028141021729, -0.0013517588376998901, -0.0012943148612976074, -0.0012368708848953247, -0.001179426908493042, -0.0011219829320907593, -0.0010645389556884766, -0.0010070949792861938, -0.0009496510028839111, -0.0008922070264816284, -0.0008347630500793457, -0.000777319073677063, -0.0007198750972747803, -0.0006624311208724976, -0.0006049871444702148, -0.0005475431680679321, -0.0004900991916656494, -0.0004326552152633667, -0.000375211238861084, -0.00031776726245880127, -0.00026032328605651855, -0.00020287930965423584, -0.00014543533325195312, -8.799135684967041e-05, -3.0547380447387695e-05, 2.689659595489502e-05, 8.434057235717773e-05, 0.00014178454875946045, 0.00019922852516174316, 0.0002566725015640259, 0.0003141164779663086, 0.0003715604543685913, 0.000429004430770874, 0.00048644840717315674, 0.0005438923835754395, 0.0006013363599777222, 0.0006587803363800049, 0.0007162243127822876, 0.0007736682891845703, 0.000831112265586853, 0.0008885562419891357, 0.0009460002183914185, 0.0010034441947937012, 0.0010608881711959839, 0.0011183321475982666, 0.0011757761240005493, 0.001233220100402832, 0.0012906640768051147, 0.0013481080532073975, 0.0014055520296096802, 0.0014629960060119629, 0.0015204399824142456, 0.0015778839588165283, 0.001635327935218811, 0.0016927719116210938]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 11.0, 18.0, 33.0, 40.0, 54.0, 83.0, 130.0, 198.0, 257.0, 390.0, 530.0, 745.0, 1139.0, 1624.0, 2386.0, 3608.0, 5544.0, 8858.0, 14470.0, 22705.0, 37390.0, 65170.0, 114721.0, 207505.0, 234563.0, 135806.0, 75393.0, 43949.0, 25900.0, 16053.0, 10165.0, 6343.0, 4095.0, 2758.0, 1825.0, 1352.0, 848.0, 553.0, 426.0, 269.0, 207.0, 121.0, 88.0, 72.0, 39.0, 28.0, 21.0, 18.0, 15.0, 5.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0], "bins": [-16.328125, -15.820068359375, -15.31201171875, -14.803955078125, -14.2958984375, -13.787841796875, -13.27978515625, -12.771728515625, -12.263671875, -11.755615234375, -11.24755859375, -10.739501953125, -10.2314453125, -9.723388671875, -9.21533203125, -8.707275390625, -8.19921875, -7.691162109375, -7.18310546875, -6.675048828125, -6.1669921875, -5.658935546875, -5.15087890625, -4.642822265625, -4.134765625, -3.626708984375, -3.11865234375, -2.610595703125, -2.1025390625, -1.594482421875, -1.08642578125, -0.578369140625, -0.0703125, 0.437744140625, 0.94580078125, 1.453857421875, 1.9619140625, 2.469970703125, 2.97802734375, 3.486083984375, 3.994140625, 4.502197265625, 5.01025390625, 5.518310546875, 6.0263671875, 6.534423828125, 7.04248046875, 7.550537109375, 8.05859375, 8.566650390625, 9.07470703125, 9.582763671875, 10.0908203125, 10.598876953125, 11.10693359375, 11.614990234375, 12.123046875, 12.631103515625, 13.13916015625, 13.647216796875, 14.1552734375, 14.663330078125, 15.17138671875, 15.679443359375, 16.1875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 12.0, 13.0, 7.0, 15.0, 15.0, 19.0, 17.0, 30.0, 33.0, 45.0, 30.0, 44.0, 38.0, 61.0, 65.0, 54.0, 63.0, 51.0, 55.0, 56.0, 39.0, 41.0, 37.0, 25.0, 21.0, 18.0, 21.0, 13.0, 12.0, 11.0, 0.0, 5.0, 2.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.70880126953125, -6.5113525390625, -6.31390380859375, -6.116455078125, -5.91900634765625, -5.7215576171875, -5.52410888671875, -5.32666015625, -5.12921142578125, -4.9317626953125, -4.73431396484375, -4.536865234375, -4.33941650390625, -4.1419677734375, -3.94451904296875, -3.7470703125, -3.54962158203125, -3.3521728515625, -3.15472412109375, -2.957275390625, -2.75982666015625, -2.5623779296875, -2.36492919921875, -2.16748046875, -1.97003173828125, -1.7725830078125, -1.57513427734375, -1.377685546875, -1.18023681640625, -0.9827880859375, -0.78533935546875, -0.587890625, -0.39044189453125, -0.1929931640625, 0.00445556640625, 0.201904296875, 0.39935302734375, 0.5968017578125, 0.79425048828125, 0.99169921875, 1.18914794921875, 1.3865966796875, 1.58404541015625, 1.781494140625, 1.97894287109375, 2.1763916015625, 2.37384033203125, 2.5712890625, 2.76873779296875, 2.9661865234375, 3.16363525390625, 3.361083984375, 3.55853271484375, 3.7559814453125, 3.95343017578125, 4.15087890625, 4.34832763671875, 4.5457763671875, 4.74322509765625, 4.940673828125, 5.13812255859375, 5.3355712890625, 5.53302001953125, 5.73046875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 7.0, 12.0, 16.0, 16.0, 11.0, 27.0, 26.0, 41.0, 48.0, 54.0, 58.0, 63.0, 57.0, 72.0, 67.0, 67.0, 52.0, 61.0, 56.0, 28.0, 33.0, 29.0, 13.0, 14.0, 15.0, 10.0, 7.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03135299682617, -37.67646408081055, -36.32157516479492, -34.9666862487793, -33.61180114746094, -32.25691223144531, -30.902023315429688, -29.547134399414062, -28.192245483398438, -26.837356567382812, -25.482467651367188, -24.127580642700195, -22.77269172668457, -21.417802810668945, -20.062915802001953, -18.708026885986328, -17.353137969970703, -15.998249053955078, -14.64336109161377, -13.288473129272461, -11.933584213256836, -10.578695297241211, -9.223807334899902, -7.868919372558594, -6.514030456542969, -5.159142017364502, -3.804253578186035, -2.4493651390075684, -1.0944766998291016, 0.26041173934936523, 1.615300178527832, 2.9701881408691406, 4.3250732421875, 5.679961681365967, 7.034850120544434, 8.389738082885742, 9.744626998901367, 11.099515914916992, 12.4544038772583, 13.80929183959961, 15.164180755615234, 16.51906967163086, 17.873958587646484, 19.228845596313477, 20.5837345123291, 21.938623428344727, 23.29351043701172, 24.648399353027344, 26.00328826904297, 27.358177185058594, 28.71306610107422, 30.06795310974121, 31.422842025756836, 32.77772903442383, 34.13261795043945, 35.48750686645508, 36.8423957824707, 38.19728469848633, 39.55217361450195, 40.90706253051758, 42.26194763183594, 43.61683654785156, 44.97172546386719, 46.32661437988281, 47.68150329589844]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 8.0, 8.0, 11.0, 14.0, 20.0, 23.0, 19.0, 25.0, 24.0, 22.0, 34.0, 43.0, 46.0, 41.0, 33.0, 55.0, 44.0, 49.0, 40.0, 43.0, 41.0, 43.0, 39.0, 41.0, 30.0, 26.0, 26.0, 22.0, 14.0, 14.0, 12.0, 13.0, 14.0, 7.0, 8.0, 10.0, 7.0, 2.0, 7.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6940803527832, -32.41613006591797, -31.138179779052734, -29.8602294921875, -28.582279205322266, -27.30432891845703, -26.026378631591797, -24.748428344726562, -23.470478057861328, -22.192527770996094, -20.91457748413086, -19.636627197265625, -18.35867691040039, -17.080726623535156, -15.802775382995605, -14.524825096130371, -13.24687385559082, -11.968923568725586, -10.690973281860352, -9.413022994995117, -8.135072708129883, -6.85712194442749, -5.579171180725098, -4.301220893859863, -3.023270606994629, -1.745320200920105, -0.46736979484558105, 0.8105807304382324, 2.088531017303467, 3.366481304168701, 4.644432067871094, 5.922382354736328, 7.2003326416015625, 8.478282928466797, 9.756233215332031, 11.034183502197266, 12.3121337890625, 13.590084075927734, 14.868035316467285, 16.145984649658203, 17.423934936523438, 18.701885223388672, 19.979835510253906, 21.25778579711914, 22.535736083984375, 23.81368637084961, 25.091636657714844, 26.369586944580078, 27.647539138793945, 28.92548942565918, 30.203439712524414, 31.48138999938965, 32.759342193603516, 34.03729248046875, 35.315242767333984, 36.59319305419922, 37.87114334106445, 39.14909362792969, 40.42704391479492, 41.704994201660156, 42.98294448852539, 44.260894775390625, 45.53884506225586, 46.816795349121094, 48.09474563598633]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 15.0, 10.0, 16.0, 30.0, 47.0, 54.0, 94.0, 118.0, 183.0, 271.0, 388.0, 546.0, 910.0, 1372.0, 2258.0, 3877.0, 6655.0, 12272.0, 24811.0, 55763.0, 170156.0, 673337.0, 1882934.0, 983074.0, 237535.0, 72358.0, 30041.0, 15019.0, 7973.0, 4540.0, 2740.0, 1664.0, 1062.0, 702.0, 467.0, 339.0, 212.0, 128.0, 100.0, 64.0, 42.0, 42.0, 20.0, 8.0, 9.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-62.28125, -60.4296875, -58.578125, -56.7265625, -54.875, -53.0234375, -51.171875, -49.3203125, -47.46875, -45.6171875, -43.765625, -41.9140625, -40.0625, -38.2109375, -36.359375, -34.5078125, -32.65625, -30.8046875, -28.953125, -27.1015625, -25.25, -23.3984375, -21.546875, -19.6953125, -17.84375, -15.9921875, -14.140625, -12.2890625, -10.4375, -8.5859375, -6.734375, -4.8828125, -3.03125, -1.1796875, 0.671875, 2.5234375, 4.375, 6.2265625, 8.078125, 9.9296875, 11.78125, 13.6328125, 15.484375, 17.3359375, 19.1875, 21.0390625, 22.890625, 24.7421875, 26.59375, 28.4453125, 30.296875, 32.1484375, 34.0, 35.8515625, 37.703125, 39.5546875, 41.40625, 43.2578125, 45.109375, 46.9609375, 48.8125, 50.6640625, 52.515625, 54.3671875, 56.21875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 12.0, 6.0, 12.0, 23.0, 27.0, 29.0, 24.0, 23.0, 32.0, 35.0, 40.0, 43.0, 56.0, 46.0, 57.0, 60.0, 56.0, 43.0, 39.0, 44.0, 46.0, 41.0, 35.0, 19.0, 28.0, 18.0, 17.0, 7.0, 12.0, 11.0, 11.0, 6.0, 11.0, 7.0, 0.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.170166015625, -28.98095703125, -27.791748046875, -26.6025390625, -25.413330078125, -24.22412109375, -23.034912109375, -21.845703125, -20.656494140625, -19.46728515625, -18.278076171875, -17.0888671875, -15.899658203125, -14.71044921875, -13.521240234375, -12.33203125, -11.142822265625, -9.95361328125, -8.764404296875, -7.5751953125, -6.385986328125, -5.19677734375, -4.007568359375, -2.818359375, -1.629150390625, -0.43994140625, 0.749267578125, 1.9384765625, 3.127685546875, 4.31689453125, 5.506103515625, 6.6953125, 7.884521484375, 9.07373046875, 10.262939453125, 11.4521484375, 12.641357421875, 13.83056640625, 15.019775390625, 16.208984375, 17.398193359375, 18.58740234375, 19.776611328125, 20.9658203125, 22.155029296875, 23.34423828125, 24.533447265625, 25.72265625, 26.911865234375, 28.10107421875, 29.290283203125, 30.4794921875, 31.668701171875, 32.85791015625, 34.047119140625, 35.236328125, 36.425537109375, 37.61474609375, 38.803955078125, 39.9931640625, 41.182373046875, 42.37158203125, 43.560791015625, 44.75]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 9.0, 12.0, 19.0, 21.0, 23.0, 46.0, 55.0, 67.0, 118.0, 155.0, 237.0, 341.0, 470.0, 807.0, 1080.0, 1692.0, 2515.0, 4055.0, 6663.0, 11179.0, 19277.0, 34181.0, 64264.0, 127191.0, 277685.0, 705874.0, 1558648.0, 780701.0, 303262.0, 137564.0, 68539.0, 36184.0, 20321.0, 11727.0, 6958.0, 4247.0, 2750.0, 1773.0, 1128.0, 760.0, 502.0, 349.0, 252.0, 165.0, 136.0, 76.0, 53.0, 54.0, 29.0, 24.0, 15.0, 15.0, 9.0, 3.0, 2.0, 2.0, 5.0], "bins": [-50.0625, -48.5703125, -47.078125, -45.5859375, -44.09375, -42.6015625, -41.109375, -39.6171875, -38.125, -36.6328125, -35.140625, -33.6484375, -32.15625, -30.6640625, -29.171875, -27.6796875, -26.1875, -24.6953125, -23.203125, -21.7109375, -20.21875, -18.7265625, -17.234375, -15.7421875, -14.25, -12.7578125, -11.265625, -9.7734375, -8.28125, -6.7890625, -5.296875, -3.8046875, -2.3125, -0.8203125, 0.671875, 2.1640625, 3.65625, 5.1484375, 6.640625, 8.1328125, 9.625, 11.1171875, 12.609375, 14.1015625, 15.59375, 17.0859375, 18.578125, 20.0703125, 21.5625, 23.0546875, 24.546875, 26.0390625, 27.53125, 29.0234375, 30.515625, 32.0078125, 33.5, 34.9921875, 36.484375, 37.9765625, 39.46875, 40.9609375, 42.453125, 43.9453125, 45.4375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 15.0, 16.0, 15.0, 22.0, 27.0, 35.0, 47.0, 43.0, 50.0, 58.0, 79.0, 99.0, 105.0, 150.0, 181.0, 216.0, 288.0, 351.0, 358.0, 338.0, 271.0, 236.0, 195.0, 155.0, 119.0, 107.0, 83.0, 79.0, 68.0, 45.0, 46.0, 31.0, 16.0, 30.0, 20.0, 15.0, 7.0, 10.0, 3.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.5703125, -15.1063232421875, -14.642333984375, -14.1783447265625, -13.71435546875, -13.2503662109375, -12.786376953125, -12.3223876953125, -11.8583984375, -11.3944091796875, -10.930419921875, -10.4664306640625, -10.00244140625, -9.5384521484375, -9.074462890625, -8.6104736328125, -8.146484375, -7.6824951171875, -7.218505859375, -6.7545166015625, -6.29052734375, -5.8265380859375, -5.362548828125, -4.8985595703125, -4.4345703125, -3.9705810546875, -3.506591796875, -3.0426025390625, -2.57861328125, -2.1146240234375, -1.650634765625, -1.1866455078125, -0.72265625, -0.2586669921875, 0.205322265625, 0.6693115234375, 1.13330078125, 1.5972900390625, 2.061279296875, 2.5252685546875, 2.9892578125, 3.4532470703125, 3.917236328125, 4.3812255859375, 4.84521484375, 5.3092041015625, 5.773193359375, 6.2371826171875, 6.701171875, 7.1651611328125, 7.629150390625, 8.0931396484375, 8.55712890625, 9.0211181640625, 9.485107421875, 9.9490966796875, 10.4130859375, 10.8770751953125, 11.341064453125, 11.8050537109375, 12.26904296875, 12.7330322265625, 13.197021484375, 13.6610107421875, 14.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 8.0, 10.0, 5.0, 15.0, 16.0, 28.0, 25.0, 30.0, 36.0, 54.0, 49.0, 52.0, 54.0, 58.0, 68.0, 67.0, 57.0, 47.0, 48.0, 35.0, 40.0, 25.0, 21.0, 31.0, 19.0, 12.0, 16.0, 9.0, 6.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.71540832519531, -33.58159255981445, -32.447776794433594, -31.313961029052734, -30.180145263671875, -29.046329498291016, -27.912513732910156, -26.778697967529297, -25.644882202148438, -24.511066436767578, -23.37725067138672, -22.24343490600586, -21.109619140625, -19.97580337524414, -18.84198760986328, -17.708171844482422, -16.574356079101562, -15.440540313720703, -14.306724548339844, -13.172908782958984, -12.039093017578125, -10.905277252197266, -9.771461486816406, -8.637645721435547, -7.5038299560546875, -6.370014190673828, -5.236198425292969, -4.102382659912109, -2.96856689453125, -1.8347511291503906, -0.7009353637695312, 0.4328804016113281, 1.5666961669921875, 2.700511932373047, 3.8343276977539062, 4.968143463134766, 6.101959228515625, 7.235774993896484, 8.369590759277344, 9.503406524658203, 10.637222290039062, 11.771038055419922, 12.904853820800781, 14.03866958618164, 15.1724853515625, 16.30630111694336, 17.44011688232422, 18.573932647705078, 19.707748413085938, 20.841564178466797, 21.975379943847656, 23.109195709228516, 24.243011474609375, 25.376827239990234, 26.510643005371094, 27.644458770751953, 28.778274536132812, 29.912090301513672, 31.04590606689453, 32.17972183227539, 33.31353759765625, 34.44735336303711, 35.58116912841797, 36.71498489379883, 37.84880065917969]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 14.0, 4.0, 14.0, 18.0, 13.0, 21.0, 19.0, 26.0, 27.0, 38.0, 31.0, 29.0, 39.0, 41.0, 39.0, 36.0, 48.0, 46.0, 43.0, 33.0, 41.0, 43.0, 31.0, 37.0, 28.0, 33.0, 24.0, 26.0, 20.0, 22.0, 12.0, 13.0, 14.0, 12.0, 6.0, 7.0, 3.0, 4.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75595474243164, -31.653465270996094, -30.550975799560547, -29.448486328125, -28.345996856689453, -27.243507385253906, -26.141016006469727, -25.03852653503418, -23.936037063598633, -22.833547592163086, -21.73105812072754, -20.628568649291992, -19.526077270507812, -18.423587799072266, -17.32109832763672, -16.218608856201172, -15.116119384765625, -14.013629913330078, -12.911140441894531, -11.808650016784668, -10.706160545349121, -9.603671073913574, -8.501180648803711, -7.398691177368164, -6.296201705932617, -5.19371223449707, -4.091222286224365, -2.9887325763702393, -1.8862428665161133, -0.7837533950805664, 0.31873655319213867, 1.4212265014648438, 2.5237159729003906, 3.6262056827545166, 4.728695392608643, 5.831185340881348, 6.9336748123168945, 8.036164283752441, 9.138654708862305, 10.241144180297852, 11.343633651733398, 12.446123123168945, 13.548612594604492, 14.651103019714355, 15.753592491149902, 16.856082916259766, 17.958572387695312, 19.06106185913086, 20.163551330566406, 21.266040802001953, 22.3685302734375, 23.471019744873047, 24.573509216308594, 25.67599868774414, 26.77849006652832, 27.880979537963867, 28.983469009399414, 30.08595848083496, 31.188447952270508, 32.29093933105469, 33.393428802490234, 34.49591827392578, 35.59840774536133, 36.700897216796875, 37.80338668823242]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 6.0, 10.0, 8.0, 28.0, 27.0, 52.0, 63.0, 82.0, 139.0, 171.0, 251.0, 351.0, 451.0, 713.0, 1007.0, 1336.0, 1984.0, 2834.0, 4151.0, 5975.0, 8587.0, 13076.0, 19378.0, 29539.0, 46727.0, 75129.0, 126231.0, 211514.0, 192758.0, 113088.0, 67511.0, 42345.0, 27286.0, 17657.0, 11840.0, 8156.0, 5422.0, 3792.0, 2609.0, 1825.0, 1329.0, 889.0, 635.0, 475.0, 335.0, 242.0, 156.0, 124.0, 79.0, 42.0, 44.0, 41.0, 18.0, 19.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-9.828125, -9.510009765625, -9.19189453125, -8.873779296875, -8.5556640625, -8.237548828125, -7.91943359375, -7.601318359375, -7.283203125, -6.965087890625, -6.64697265625, -6.328857421875, -6.0107421875, -5.692626953125, -5.37451171875, -5.056396484375, -4.73828125, -4.420166015625, -4.10205078125, -3.783935546875, -3.4658203125, -3.147705078125, -2.82958984375, -2.511474609375, -2.193359375, -1.875244140625, -1.55712890625, -1.239013671875, -0.9208984375, -0.602783203125, -0.28466796875, 0.033447265625, 0.3515625, 0.669677734375, 0.98779296875, 1.305908203125, 1.6240234375, 1.942138671875, 2.26025390625, 2.578369140625, 2.896484375, 3.214599609375, 3.53271484375, 3.850830078125, 4.1689453125, 4.487060546875, 4.80517578125, 5.123291015625, 5.44140625, 5.759521484375, 6.07763671875, 6.395751953125, 6.7138671875, 7.031982421875, 7.35009765625, 7.668212890625, 7.986328125, 8.304443359375, 8.62255859375, 8.940673828125, 9.2587890625, 9.576904296875, 9.89501953125, 10.213134765625, 10.53125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 11.0, 8.0, 21.0, 10.0, 11.0, 19.0, 20.0, 27.0, 29.0, 31.0, 37.0, 28.0, 41.0, 29.0, 36.0, 47.0, 43.0, 47.0, 42.0, 35.0, 47.0, 27.0, 41.0, 39.0, 28.0, 40.0, 30.0, 19.0, 23.0, 15.0, 20.0, 15.0, 7.0, 12.0, 4.0, 8.0, 7.0, 6.0, 6.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.625, -34.5029296875, -33.380859375, -32.2587890625, -31.13671875, -30.0146484375, -28.892578125, -27.7705078125, -26.6484375, -25.5263671875, -24.404296875, -23.2822265625, -22.16015625, -21.0380859375, -19.916015625, -18.7939453125, -17.671875, -16.5498046875, -15.427734375, -14.3056640625, -13.18359375, -12.0615234375, -10.939453125, -9.8173828125, -8.6953125, -7.5732421875, -6.451171875, -5.3291015625, -4.20703125, -3.0849609375, -1.962890625, -0.8408203125, 0.28125, 1.4033203125, 2.525390625, 3.6474609375, 4.76953125, 5.8916015625, 7.013671875, 8.1357421875, 9.2578125, 10.3798828125, 11.501953125, 12.6240234375, 13.74609375, 14.8681640625, 15.990234375, 17.1123046875, 18.234375, 19.3564453125, 20.478515625, 21.6005859375, 22.72265625, 23.8447265625, 24.966796875, 26.0888671875, 27.2109375, 28.3330078125, 29.455078125, 30.5771484375, 31.69921875, 32.8212890625, 33.943359375, 35.0654296875, 36.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 5.0, 6.0, 20.0, 21.0, 36.0, 40.0, 74.0, 100.0, 148.0, 193.0, 306.0, 454.0, 731.0, 1182.0, 2040.0, 3597.0, 6853.0, 13393.0, 32143.0, 527019.0, 401775.0, 30298.0, 12946.0, 6453.0, 3488.0, 1980.0, 1105.0, 699.0, 452.0, 292.0, 191.0, 135.0, 94.0, 80.0, 43.0, 29.0, 24.0, 28.0, 11.0, 9.0, 14.0, 7.0, 6.0, 2.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.296875, -25.474365234375, -24.65185546875, -23.829345703125, -23.0068359375, -22.184326171875, -21.36181640625, -20.539306640625, -19.716796875, -18.894287109375, -18.07177734375, -17.249267578125, -16.4267578125, -15.604248046875, -14.78173828125, -13.959228515625, -13.13671875, -12.314208984375, -11.49169921875, -10.669189453125, -9.8466796875, -9.024169921875, -8.20166015625, -7.379150390625, -6.556640625, -5.734130859375, -4.91162109375, -4.089111328125, -3.2666015625, -2.444091796875, -1.62158203125, -0.799072265625, 0.0234375, 0.845947265625, 1.66845703125, 2.490966796875, 3.3134765625, 4.135986328125, 4.95849609375, 5.781005859375, 6.603515625, 7.426025390625, 8.24853515625, 9.071044921875, 9.8935546875, 10.716064453125, 11.53857421875, 12.361083984375, 13.18359375, 14.006103515625, 14.82861328125, 15.651123046875, 16.4736328125, 17.296142578125, 18.11865234375, 18.941162109375, 19.763671875, 20.586181640625, 21.40869140625, 22.231201171875, 23.0537109375, 23.876220703125, 24.69873046875, 25.521240234375, 26.34375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 4.0, 9.0, 10.0, 18.0, 14.0, 5.0, 27.0, 24.0, 20.0, 30.0, 22.0, 43.0, 48.0, 28.0, 45.0, 34.0, 40.0, 38.0, 39.0, 29.0, 29.0, 40.0, 35.0, 44.0, 25.0, 32.0, 28.0, 34.0, 22.0, 28.0, 19.0, 17.0, 13.0, 16.0, 18.0, 10.0, 12.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-24.203125, -23.479248046875, -22.75537109375, -22.031494140625, -21.3076171875, -20.583740234375, -19.85986328125, -19.135986328125, -18.412109375, -17.688232421875, -16.96435546875, -16.240478515625, -15.5166015625, -14.792724609375, -14.06884765625, -13.344970703125, -12.62109375, -11.897216796875, -11.17333984375, -10.449462890625, -9.7255859375, -9.001708984375, -8.27783203125, -7.553955078125, -6.830078125, -6.106201171875, -5.38232421875, -4.658447265625, -3.9345703125, -3.210693359375, -2.48681640625, -1.762939453125, -1.0390625, -0.315185546875, 0.40869140625, 1.132568359375, 1.8564453125, 2.580322265625, 3.30419921875, 4.028076171875, 4.751953125, 5.475830078125, 6.19970703125, 6.923583984375, 7.6474609375, 8.371337890625, 9.09521484375, 9.819091796875, 10.54296875, 11.266845703125, 11.99072265625, 12.714599609375, 13.4384765625, 14.162353515625, 14.88623046875, 15.610107421875, 16.333984375, 17.057861328125, 17.78173828125, 18.505615234375, 19.2294921875, 19.953369140625, 20.67724609375, 21.401123046875, 22.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 6.0, 19.0, 22.0, 30.0, 44.0, 71.0, 62.0, 121.0, 146.0, 221.0, 365.0, 615.0, 1188.0, 2424.0, 5755.0, 15321.0, 67207.0, 892786.0, 40788.0, 12002.0, 4548.0, 2073.0, 1048.0, 624.0, 352.0, 248.0, 136.0, 87.0, 50.0, 43.0, 27.0, 26.0, 20.0, 15.0, 11.0, 13.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.709228515625, -2.61376953125, -2.518310546875, -2.4228515625, -2.327392578125, -2.23193359375, -2.136474609375, -2.041015625, -1.945556640625, -1.85009765625, -1.754638671875, -1.6591796875, -1.563720703125, -1.46826171875, -1.372802734375, -1.27734375, -1.181884765625, -1.08642578125, -0.990966796875, -0.8955078125, -0.800048828125, -0.70458984375, -0.609130859375, -0.513671875, -0.418212890625, -0.32275390625, -0.227294921875, -0.1318359375, -0.036376953125, 0.05908203125, 0.154541015625, 0.25, 0.345458984375, 0.44091796875, 0.536376953125, 0.6318359375, 0.727294921875, 0.82275390625, 0.918212890625, 1.013671875, 1.109130859375, 1.20458984375, 1.300048828125, 1.3955078125, 1.490966796875, 1.58642578125, 1.681884765625, 1.77734375, 1.872802734375, 1.96826171875, 2.063720703125, 2.1591796875, 2.254638671875, 2.35009765625, 2.445556640625, 2.541015625, 2.636474609375, 2.73193359375, 2.827392578125, 2.9228515625, 3.018310546875, 3.11376953125, 3.209228515625, 3.3046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 2.0, 14.0, 9.0, 13.0, 13.0, 26.0, 26.0, 33.0, 41.0, 41.0, 62.0, 63.0, 83.0, 65.0, 68.0, 67.0, 66.0, 56.0, 44.0, 23.0, 32.0, 20.0, 17.0, 19.0, 13.0, 16.0, 13.0, 11.0, 8.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016009807586669922, -0.00015516020357608795, -0.00015022233128547668, -0.00014528445899486542, -0.00014034658670425415, -0.00013540871441364288, -0.00013047084212303162, -0.00012553296983242035, -0.00012059509754180908, -0.00011565722525119781, -0.00011071935296058655, -0.00010578148066997528, -0.00010084360837936401, -9.590573608875275e-05, -9.096786379814148e-05, -8.602999150753021e-05, -8.109211921691895e-05, -7.615424692630768e-05, -7.121637463569641e-05, -6.627850234508514e-05, -6.134063005447388e-05, -5.640275776386261e-05, -5.146488547325134e-05, -4.6527013182640076e-05, -4.158914089202881e-05, -3.665126860141754e-05, -3.1713396310806274e-05, -2.6775524020195007e-05, -2.183765172958374e-05, -1.6899779438972473e-05, -1.1961907148361206e-05, -7.024034857749939e-06, -2.086162567138672e-06, 2.8517097234725952e-06, 7.789582014083862e-06, 1.272745430469513e-05, 1.7665326595306396e-05, 2.2603198885917664e-05, 2.754107117652893e-05, 3.24789434671402e-05, 3.7416815757751465e-05, 4.235468804836273e-05, 4.7292560338974e-05, 5.2230432629585266e-05, 5.716830492019653e-05, 6.21061772108078e-05, 6.704404950141907e-05, 7.198192179203033e-05, 7.69197940826416e-05, 8.185766637325287e-05, 8.679553866386414e-05, 9.17334109544754e-05, 9.667128324508667e-05, 0.00010160915553569794, 0.0001065470278263092, 0.00011148490011692047, 0.00011642277240753174, 0.000121360644698143, 0.00012629851698875427, 0.00013123638927936554, 0.0001361742615699768, 0.00014111213386058807, 0.00014605000615119934, 0.0001509878784418106, 0.00015592575073242188]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 16.0, 32.0, 28.0, 36.0, 78.0, 101.0, 154.0, 204.0, 312.0, 414.0, 611.0, 919.0, 1348.0, 1906.0, 2783.0, 4188.0, 6459.0, 10162.0, 16405.0, 27944.0, 51127.0, 104035.0, 237867.0, 295683.0, 134853.0, 63588.0, 33994.0, 19064.0, 11764.0, 7418.0, 4847.0, 3389.0, 2160.0, 1511.0, 988.0, 624.0, 456.0, 329.0, 234.0, 163.0, 118.0, 59.0, 50.0, 49.0, 31.0, 11.0, 12.0, 2.0, 4.0, 5.0, 6.0, 0.0, 3.0], "bins": [-2.93359375, -2.84771728515625, -2.7618408203125, -2.67596435546875, -2.590087890625, -2.50421142578125, -2.4183349609375, -2.33245849609375, -2.24658203125, -2.16070556640625, -2.0748291015625, -1.98895263671875, -1.903076171875, -1.81719970703125, -1.7313232421875, -1.64544677734375, -1.5595703125, -1.47369384765625, -1.3878173828125, -1.30194091796875, -1.216064453125, -1.13018798828125, -1.0443115234375, -0.95843505859375, -0.87255859375, -0.78668212890625, -0.7008056640625, -0.61492919921875, -0.529052734375, -0.44317626953125, -0.3572998046875, -0.27142333984375, -0.185546875, -0.09967041015625, -0.0137939453125, 0.07208251953125, 0.157958984375, 0.24383544921875, 0.3297119140625, 0.41558837890625, 0.50146484375, 0.58734130859375, 0.6732177734375, 0.75909423828125, 0.844970703125, 0.93084716796875, 1.0167236328125, 1.10260009765625, 1.1884765625, 1.27435302734375, 1.3602294921875, 1.44610595703125, 1.531982421875, 1.61785888671875, 1.7037353515625, 1.78961181640625, 1.87548828125, 1.96136474609375, 2.0472412109375, 2.13311767578125, 2.218994140625, 2.30487060546875, 2.3907470703125, 2.47662353515625, 2.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 4.0, 7.0, 7.0, 12.0, 12.0, 18.0, 25.0, 23.0, 37.0, 44.0, 63.0, 83.0, 111.0, 87.0, 96.0, 72.0, 47.0, 58.0, 41.0, 22.0, 27.0, 12.0, 12.0, 6.0, 9.0, 7.0, 4.0, 8.0, 6.0, 5.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0007476806640625, -0.965362548828125, -0.9299774169921875, -0.89459228515625, -0.8592071533203125, -0.823822021484375, -0.7884368896484375, -0.7530517578125, -0.7176666259765625, -0.682281494140625, -0.6468963623046875, -0.61151123046875, -0.5761260986328125, -0.540740966796875, -0.5053558349609375, -0.469970703125, -0.4345855712890625, -0.399200439453125, -0.3638153076171875, -0.32843017578125, -0.2930450439453125, -0.257659912109375, -0.2222747802734375, -0.1868896484375, -0.1515045166015625, -0.116119384765625, -0.0807342529296875, -0.04534912109375, -0.0099639892578125, 0.025421142578125, 0.0608062744140625, 0.09619140625, 0.1315765380859375, 0.166961669921875, 0.2023468017578125, 0.23773193359375, 0.2731170654296875, 0.308502197265625, 0.3438873291015625, 0.3792724609375, 0.4146575927734375, 0.450042724609375, 0.4854278564453125, 0.52081298828125, 0.5561981201171875, 0.591583251953125, 0.6269683837890625, 0.662353515625, 0.6977386474609375, 0.733123779296875, 0.7685089111328125, 0.80389404296875, 0.8392791748046875, 0.874664306640625, 0.9100494384765625, 0.9454345703125, 0.9808197021484375, 1.016204833984375, 1.0515899658203125, 1.08697509765625, 1.1223602294921875, 1.157745361328125, 1.1931304931640625, 1.228515625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 8.0, 8.0, 7.0, 11.0, 17.0, 30.0, 27.0, 30.0, 38.0, 47.0, 61.0, 60.0, 62.0, 63.0, 55.0, 72.0, 68.0, 54.0, 43.0, 39.0, 29.0, 22.0, 24.0, 23.0, 17.0, 15.0, 6.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.98853302001953, -34.8026237487793, -33.61671447753906, -32.43080520629883, -31.244897842407227, -30.058988571166992, -28.87308120727539, -27.687171936035156, -26.501262664794922, -25.315353393554688, -24.129444122314453, -22.94353675842285, -21.757627487182617, -20.571718215942383, -19.38581085205078, -18.199901580810547, -17.013992309570312, -15.828083038330078, -14.64217472076416, -13.456266403198242, -12.270357131958008, -11.084447860717773, -9.898539543151855, -8.712631225585938, -7.526721954345703, -6.340813159942627, -5.154904365539551, -3.9689955711364746, -2.7830867767333984, -1.5971779823303223, -0.4112691879272461, 0.7746391296386719, 1.9605522155761719, 3.146461009979248, 4.332369804382324, 5.5182785987854, 6.704187393188477, 7.890096187591553, 9.076004981994629, 10.261913299560547, 11.447822570800781, 12.633731842041016, 13.819640159606934, 15.005548477172852, 16.191457748413086, 17.37736701965332, 18.563274383544922, 19.749183654785156, 20.93509292602539, 22.121002197265625, 23.30691146850586, 24.49281883239746, 25.678728103637695, 26.86463737487793, 28.05054473876953, 29.236454010009766, 30.42236328125, 31.608272552490234, 32.79418182373047, 33.9800910949707, 35.16600036621094, 36.351905822753906, 37.53781509399414, 38.723724365234375, 39.90963363647461]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 3.0, 5.0, 8.0, 12.0, 3.0, 14.0, 17.0, 18.0, 20.0, 20.0, 28.0, 26.0, 37.0, 30.0, 29.0, 37.0, 45.0, 37.0, 37.0, 45.0, 46.0, 38.0, 40.0, 41.0, 39.0, 34.0, 32.0, 30.0, 33.0, 22.0, 28.0, 21.0, 22.0, 13.0, 14.0, 13.0, 9.0, 9.0, 6.0, 4.0, 3.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0479621887207, -30.97037124633789, -29.892780303955078, -28.815189361572266, -27.737598419189453, -26.66000747680664, -25.582416534423828, -24.504825592041016, -23.427234649658203, -22.34964370727539, -21.272052764892578, -20.194461822509766, -19.116870880126953, -18.03927993774414, -16.961688995361328, -15.884098052978516, -14.806507110595703, -13.72891616821289, -12.651325225830078, -11.573734283447266, -10.496143341064453, -9.41855239868164, -8.340961456298828, -7.263370513916016, -6.185779571533203, -5.108188629150391, -4.030597686767578, -2.9530067443847656, -1.8754158020019531, -0.7978248596191406, 0.2797660827636719, 1.3573570251464844, 2.4349517822265625, 3.512542724609375, 4.5901336669921875, 5.667724609375, 6.7453155517578125, 7.822906494140625, 8.900497436523438, 9.97808837890625, 11.055679321289062, 12.133270263671875, 13.210861206054688, 14.2884521484375, 15.366043090820312, 16.443634033203125, 17.521224975585938, 18.59881591796875, 19.676406860351562, 20.753997802734375, 21.831588745117188, 22.9091796875, 23.986770629882812, 25.064361572265625, 26.141952514648438, 27.21954345703125, 28.297134399414062, 29.374725341796875, 30.452316284179688, 31.5299072265625, 32.60749816894531, 33.685089111328125, 34.76268005371094, 35.84027099609375, 36.91786193847656]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 14.0, 24.0, 25.0, 55.0, 78.0, 108.0, 181.0, 320.0, 542.0, 806.0, 1169.0, 1992.0, 2976.0, 4706.0, 7568.0, 12784.0, 21044.0, 36227.0, 63725.0, 112983.0, 195324.0, 231253.0, 151071.0, 85556.0, 47987.0, 27550.0, 16320.0, 9937.0, 5910.0, 3628.0, 2413.0, 1496.0, 1006.0, 643.0, 437.0, 240.0, 153.0, 97.0, 85.0, 42.0, 25.0, 21.0, 14.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.625, -48.21728515625, -46.8095703125, -45.40185546875, -43.994140625, -42.58642578125, -41.1787109375, -39.77099609375, -38.36328125, -36.95556640625, -35.5478515625, -34.14013671875, -32.732421875, -31.32470703125, -29.9169921875, -28.50927734375, -27.1015625, -25.69384765625, -24.2861328125, -22.87841796875, -21.470703125, -20.06298828125, -18.6552734375, -17.24755859375, -15.83984375, -14.43212890625, -13.0244140625, -11.61669921875, -10.208984375, -8.80126953125, -7.3935546875, -5.98583984375, -4.578125, -3.17041015625, -1.7626953125, -0.35498046875, 1.052734375, 2.46044921875, 3.8681640625, 5.27587890625, 6.68359375, 8.09130859375, 9.4990234375, 10.90673828125, 12.314453125, 13.72216796875, 15.1298828125, 16.53759765625, 17.9453125, 19.35302734375, 20.7607421875, 22.16845703125, 23.576171875, 24.98388671875, 26.3916015625, 27.79931640625, 29.20703125, 30.61474609375, 32.0224609375, 33.43017578125, 34.837890625, 36.24560546875, 37.6533203125, 39.06103515625, 40.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 4.0, 5.0, 9.0, 14.0, 12.0, 17.0, 14.0, 19.0, 25.0, 33.0, 31.0, 26.0, 26.0, 40.0, 33.0, 51.0, 47.0, 54.0, 38.0, 42.0, 47.0, 28.0, 51.0, 38.0, 33.0, 30.0, 30.0, 29.0, 24.0, 19.0, 23.0, 16.0, 10.0, 11.0, 10.0, 9.0, 3.0, 10.0, 2.0, 3.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.296875, -29.207763671875, -28.11865234375, -27.029541015625, -25.9404296875, -24.851318359375, -23.76220703125, -22.673095703125, -21.583984375, -20.494873046875, -19.40576171875, -18.316650390625, -17.2275390625, -16.138427734375, -15.04931640625, -13.960205078125, -12.87109375, -11.781982421875, -10.69287109375, -9.603759765625, -8.5146484375, -7.425537109375, -6.33642578125, -5.247314453125, -4.158203125, -3.069091796875, -1.97998046875, -0.890869140625, 0.1982421875, 1.287353515625, 2.37646484375, 3.465576171875, 4.5546875, 5.643798828125, 6.73291015625, 7.822021484375, 8.9111328125, 10.000244140625, 11.08935546875, 12.178466796875, 13.267578125, 14.356689453125, 15.44580078125, 16.534912109375, 17.6240234375, 18.713134765625, 19.80224609375, 20.891357421875, 21.98046875, 23.069580078125, 24.15869140625, 25.247802734375, 26.3369140625, 27.426025390625, 28.51513671875, 29.604248046875, 30.693359375, 31.782470703125, 32.87158203125, 33.960693359375, 35.0498046875, 36.138916015625, 37.22802734375, 38.317138671875, 39.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 5.0, 10.0, 11.0, 25.0, 27.0, 41.0, 68.0, 85.0, 142.0, 162.0, 252.0, 392.0, 595.0, 894.0, 1332.0, 2003.0, 3028.0, 4697.0, 7156.0, 11090.0, 17479.0, 28178.0, 46157.0, 76520.0, 124968.0, 185068.0, 190530.0, 133524.0, 81537.0, 49319.0, 30399.0, 18855.0, 11763.0, 7711.0, 4899.0, 3253.0, 2141.0, 1379.0, 940.0, 635.0, 402.0, 255.0, 177.0, 143.0, 92.0, 62.0, 54.0, 39.0, 16.0, 12.0, 9.0, 5.0, 4.0, 5.0, 2.0, 4.0, 5.0], "bins": [-40.59375, -39.3662109375, -38.138671875, -36.9111328125, -35.68359375, -34.4560546875, -33.228515625, -32.0009765625, -30.7734375, -29.5458984375, -28.318359375, -27.0908203125, -25.86328125, -24.6357421875, -23.408203125, -22.1806640625, -20.953125, -19.7255859375, -18.498046875, -17.2705078125, -16.04296875, -14.8154296875, -13.587890625, -12.3603515625, -11.1328125, -9.9052734375, -8.677734375, -7.4501953125, -6.22265625, -4.9951171875, -3.767578125, -2.5400390625, -1.3125, -0.0849609375, 1.142578125, 2.3701171875, 3.59765625, 4.8251953125, 6.052734375, 7.2802734375, 8.5078125, 9.7353515625, 10.962890625, 12.1904296875, 13.41796875, 14.6455078125, 15.873046875, 17.1005859375, 18.328125, 19.5556640625, 20.783203125, 22.0107421875, 23.23828125, 24.4658203125, 25.693359375, 26.9208984375, 28.1484375, 29.3759765625, 30.603515625, 31.8310546875, 33.05859375, 34.2861328125, 35.513671875, 36.7412109375, 37.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 9.0, 11.0, 15.0, 11.0, 17.0, 21.0, 26.0, 14.0, 25.0, 32.0, 28.0, 33.0, 33.0, 33.0, 33.0, 50.0, 48.0, 35.0, 43.0, 43.0, 36.0, 37.0, 33.0, 45.0, 30.0, 31.0, 43.0, 17.0, 16.0, 13.0, 18.0, 23.0, 12.0, 9.0, 6.0, 11.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-20.5, -19.858642578125, -19.21728515625, -18.575927734375, -17.9345703125, -17.293212890625, -16.65185546875, -16.010498046875, -15.369140625, -14.727783203125, -14.08642578125, -13.445068359375, -12.8037109375, -12.162353515625, -11.52099609375, -10.879638671875, -10.23828125, -9.596923828125, -8.95556640625, -8.314208984375, -7.6728515625, -7.031494140625, -6.39013671875, -5.748779296875, -5.107421875, -4.466064453125, -3.82470703125, -3.183349609375, -2.5419921875, -1.900634765625, -1.25927734375, -0.617919921875, 0.0234375, 0.664794921875, 1.30615234375, 1.947509765625, 2.5888671875, 3.230224609375, 3.87158203125, 4.512939453125, 5.154296875, 5.795654296875, 6.43701171875, 7.078369140625, 7.7197265625, 8.361083984375, 9.00244140625, 9.643798828125, 10.28515625, 10.926513671875, 11.56787109375, 12.209228515625, 12.8505859375, 13.491943359375, 14.13330078125, 14.774658203125, 15.416015625, 16.057373046875, 16.69873046875, 17.340087890625, 17.9814453125, 18.622802734375, 19.26416015625, 19.905517578125, 20.546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 13.0, 21.0, 29.0, 40.0, 73.0, 88.0, 120.0, 150.0, 246.0, 308.0, 486.0, 674.0, 955.0, 1317.0, 1961.0, 2640.0, 4087.0, 6266.0, 9471.0, 14908.0, 24482.0, 42440.0, 77394.0, 146513.0, 253581.0, 204876.0, 108618.0, 58063.0, 33170.0, 19460.0, 12057.0, 7731.0, 5004.0, 3416.0, 2349.0, 1635.0, 1165.0, 814.0, 550.0, 419.0, 266.0, 199.0, 139.0, 100.0, 69.0, 57.0, 48.0, 24.0, 18.0, 13.0, 9.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-14.0234375, -13.58203125, -13.140625, -12.69921875, -12.2578125, -11.81640625, -11.375, -10.93359375, -10.4921875, -10.05078125, -9.609375, -9.16796875, -8.7265625, -8.28515625, -7.84375, -7.40234375, -6.9609375, -6.51953125, -6.078125, -5.63671875, -5.1953125, -4.75390625, -4.3125, -3.87109375, -3.4296875, -2.98828125, -2.546875, -2.10546875, -1.6640625, -1.22265625, -0.78125, -0.33984375, 0.1015625, 0.54296875, 0.984375, 1.42578125, 1.8671875, 2.30859375, 2.75, 3.19140625, 3.6328125, 4.07421875, 4.515625, 4.95703125, 5.3984375, 5.83984375, 6.28125, 6.72265625, 7.1640625, 7.60546875, 8.046875, 8.48828125, 8.9296875, 9.37109375, 9.8125, 10.25390625, 10.6953125, 11.13671875, 11.578125, 12.01953125, 12.4609375, 12.90234375, 13.34375, 13.78515625, 14.2265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 11.0, 14.0, 13.0, 26.0, 28.0, 45.0, 43.0, 70.0, 84.0, 108.0, 139.0, 105.0, 79.0, 55.0, 51.0, 32.0, 18.0, 16.0, 13.0, 9.0, 7.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002300262451171875, -0.002229154109954834, -0.002158045768737793, -0.002086937427520752, -0.002015829086303711, -0.00194472074508667, -0.001873612403869629, -0.0018025040626525879, -0.0017313957214355469, -0.0016602873802185059, -0.0015891790390014648, -0.0015180706977844238, -0.0014469623565673828, -0.0013758540153503418, -0.0013047456741333008, -0.0012336373329162598, -0.0011625289916992188, -0.0010914206504821777, -0.0010203123092651367, -0.0009492039680480957, -0.0008780956268310547, -0.0008069872856140137, -0.0007358789443969727, -0.0006647706031799316, -0.0005936622619628906, -0.0005225539207458496, -0.0004514455795288086, -0.0003803372383117676, -0.00030922889709472656, -0.00023812055587768555, -0.00016701221466064453, -9.590387344360352e-05, -2.47955322265625e-05, 4.6312808990478516e-05, 0.00011742115020751953, 0.00018852949142456055, 0.00025963783264160156, 0.0003307461738586426, 0.0004018545150756836, 0.0004729628562927246, 0.0005440711975097656, 0.0006151795387268066, 0.0006862878799438477, 0.0007573962211608887, 0.0008285045623779297, 0.0008996129035949707, 0.0009707212448120117, 0.0010418295860290527, 0.0011129379272460938, 0.0011840462684631348, 0.0012551546096801758, 0.0013262629508972168, 0.0013973712921142578, 0.0014684796333312988, 0.0015395879745483398, 0.0016106963157653809, 0.0016818046569824219, 0.0017529129981994629, 0.001824021339416504, 0.001895129680633545, 0.001966238021850586, 0.002037346363067627, 0.002108454704284668, 0.002179563045501709, 0.00225067138671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 0.0, 8.0, 10.0, 7.0, 9.0, 22.0, 32.0, 41.0, 63.0, 99.0, 124.0, 185.0, 285.0, 393.0, 609.0, 860.0, 1255.0, 1855.0, 2970.0, 4642.0, 7141.0, 11557.0, 18840.0, 32022.0, 57034.0, 106907.0, 207248.0, 261874.0, 148407.0, 77263.0, 42258.0, 24262.0, 14575.0, 9013.0, 5682.0, 3669.0, 2422.0, 1612.0, 1083.0, 670.0, 490.0, 344.0, 222.0, 148.0, 111.0, 83.0, 52.0, 28.0, 24.0, 16.0, 14.0, 6.0, 5.0, 5.0, 8.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.5703125, -14.10400390625, -13.6376953125, -13.17138671875, -12.705078125, -12.23876953125, -11.7724609375, -11.30615234375, -10.83984375, -10.37353515625, -9.9072265625, -9.44091796875, -8.974609375, -8.50830078125, -8.0419921875, -7.57568359375, -7.109375, -6.64306640625, -6.1767578125, -5.71044921875, -5.244140625, -4.77783203125, -4.3115234375, -3.84521484375, -3.37890625, -2.91259765625, -2.4462890625, -1.97998046875, -1.513671875, -1.04736328125, -0.5810546875, -0.11474609375, 0.3515625, 0.81787109375, 1.2841796875, 1.75048828125, 2.216796875, 2.68310546875, 3.1494140625, 3.61572265625, 4.08203125, 4.54833984375, 5.0146484375, 5.48095703125, 5.947265625, 6.41357421875, 6.8798828125, 7.34619140625, 7.8125, 8.27880859375, 8.7451171875, 9.21142578125, 9.677734375, 10.14404296875, 10.6103515625, 11.07666015625, 11.54296875, 12.00927734375, 12.4755859375, 12.94189453125, 13.408203125, 13.87451171875, 14.3408203125, 14.80712890625, 15.2734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 7.0, 11.0, 11.0, 16.0, 25.0, 16.0, 22.0, 31.0, 35.0, 72.0, 53.0, 80.0, 89.0, 79.0, 73.0, 55.0, 56.0, 55.0, 32.0, 18.0, 25.0, 24.0, 19.0, 17.0, 10.0, 5.0, 6.0, 10.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.05865478515625, -5.8555908203125, -5.65252685546875, -5.449462890625, -5.24639892578125, -5.0433349609375, -4.84027099609375, -4.63720703125, -4.43414306640625, -4.2310791015625, -4.02801513671875, -3.824951171875, -3.62188720703125, -3.4188232421875, -3.21575927734375, -3.0126953125, -2.80963134765625, -2.6065673828125, -2.40350341796875, -2.200439453125, -1.99737548828125, -1.7943115234375, -1.59124755859375, -1.38818359375, -1.18511962890625, -0.9820556640625, -0.77899169921875, -0.575927734375, -0.37286376953125, -0.1697998046875, 0.03326416015625, 0.236328125, 0.43939208984375, 0.6424560546875, 0.84552001953125, 1.048583984375, 1.25164794921875, 1.4547119140625, 1.65777587890625, 1.86083984375, 2.06390380859375, 2.2669677734375, 2.47003173828125, 2.673095703125, 2.87615966796875, 3.0792236328125, 3.28228759765625, 3.4853515625, 3.68841552734375, 3.8914794921875, 4.09454345703125, 4.297607421875, 4.50067138671875, 4.7037353515625, 4.90679931640625, 5.10986328125, 5.31292724609375, 5.5159912109375, 5.71905517578125, 5.922119140625, 6.12518310546875, 6.3282470703125, 6.53131103515625, 6.734375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 12.0, 13.0, 24.0, 23.0, 33.0, 50.0, 48.0, 69.0, 70.0, 67.0, 75.0, 96.0, 72.0, 58.0, 60.0, 49.0, 30.0, 23.0, 23.0, 22.0, 13.0, 17.0, 7.0, 7.0, 4.0, 2.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.99857711791992, -38.51227951049805, -37.02598571777344, -35.53968811035156, -34.05339431762695, -32.56709671020508, -31.080801010131836, -29.594505310058594, -28.10820770263672, -26.621912002563477, -25.135616302490234, -23.64931869506836, -22.163022994995117, -20.676727294921875, -19.190431594848633, -17.70413589477539, -16.21784019470215, -14.731544494628906, -13.245247840881348, -11.758952140808105, -10.272655487060547, -8.786359786987305, -7.3000640869140625, -5.813767433166504, -4.327471733093262, -2.8411755561828613, -1.35487961769104, 0.13141632080078125, 1.6177124977111816, 3.104008674621582, 4.590304374694824, 6.076601028442383, 7.562896728515625, 9.049192428588867, 10.535489082336426, 12.021784782409668, 13.508081436157227, 14.994377136230469, 16.48067283630371, 17.966968536376953, 19.453266143798828, 20.93956184387207, 22.425857543945312, 23.912155151367188, 25.39845085144043, 26.884746551513672, 28.371042251586914, 29.857337951660156, 31.3436336517334, 32.82992935180664, 34.316226959228516, 35.802520751953125, 37.288818359375, 38.775115966796875, 40.261409759521484, 41.74770736694336, 43.23400115966797, 44.720298767089844, 46.20659255981445, 47.69289016723633, 49.17918395996094, 50.66548156738281, 52.15177917480469, 53.6380729675293, 55.12437057495117]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 9.0, 12.0, 13.0, 12.0, 12.0, 17.0, 23.0, 20.0, 30.0, 24.0, 36.0, 34.0, 36.0, 29.0, 33.0, 43.0, 39.0, 47.0, 34.0, 41.0, 52.0, 46.0, 32.0, 30.0, 32.0, 32.0, 27.0, 20.0, 23.0, 21.0, 14.0, 15.0, 26.0, 12.0, 11.0, 4.0, 6.0, 6.0, 6.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.39145851135254, -28.269893646240234, -27.14832878112793, -26.026763916015625, -24.905197143554688, -23.783632278442383, -22.662067413330078, -21.540502548217773, -20.41893768310547, -19.297372817993164, -18.17580795288086, -17.054241180419922, -15.932676315307617, -14.811111450195312, -13.689546585083008, -12.567981719970703, -11.446414947509766, -10.324850082397461, -9.20328426361084, -8.081719398498535, -6.960154056549072, -5.838588714599609, -4.717023849487305, -3.595458507537842, -2.473893165588379, -1.3523279428482056, -0.23076272010803223, 0.8908023834228516, 2.0123677253723145, 3.1339330673217773, 4.255497932434082, 5.377063274383545, 6.498630523681641, 7.6201958656311035, 8.741761207580566, 9.863326072692871, 10.984891891479492, 12.106456756591797, 13.228021621704102, 14.349586486816406, 15.471152305603027, 16.59271812438965, 17.714282989501953, 18.835847854614258, 19.957412719726562, 21.0789794921875, 22.200542449951172, 23.32210922241211, 24.443674087524414, 25.56523895263672, 26.686803817749023, 27.808368682861328, 28.929935455322266, 30.05150032043457, 31.173065185546875, 32.29463195800781, 33.416194915771484, 34.53776168823242, 35.659324645996094, 36.78089141845703, 37.9024543762207, 39.02402114868164, 40.14558410644531, 41.26715087890625, 42.38871765136719]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 3.0, 10.0, 14.0, 17.0, 28.0, 54.0, 59.0, 111.0, 131.0, 240.0, 398.0, 649.0, 1057.0, 1780.0, 3201.0, 5966.0, 11605.0, 23979.0, 57151.0, 172535.0, 697435.0, 1882726.0, 964660.0, 232681.0, 73740.0, 30838.0, 15012.0, 7865.0, 4300.0, 2431.0, 1439.0, 829.0, 498.0, 299.0, 194.0, 107.0, 79.0, 58.0, 31.0, 23.0, 10.0, 9.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0], "bins": [-62.90625, -61.08935546875, -59.2724609375, -57.45556640625, -55.638671875, -53.82177734375, -52.0048828125, -50.18798828125, -48.37109375, -46.55419921875, -44.7373046875, -42.92041015625, -41.103515625, -39.28662109375, -37.4697265625, -35.65283203125, -33.8359375, -32.01904296875, -30.2021484375, -28.38525390625, -26.568359375, -24.75146484375, -22.9345703125, -21.11767578125, -19.30078125, -17.48388671875, -15.6669921875, -13.85009765625, -12.033203125, -10.21630859375, -8.3994140625, -6.58251953125, -4.765625, -2.94873046875, -1.1318359375, 0.68505859375, 2.501953125, 4.31884765625, 6.1357421875, 7.95263671875, 9.76953125, 11.58642578125, 13.4033203125, 15.22021484375, 17.037109375, 18.85400390625, 20.6708984375, 22.48779296875, 24.3046875, 26.12158203125, 27.9384765625, 29.75537109375, 31.572265625, 33.38916015625, 35.2060546875, 37.02294921875, 38.83984375, 40.65673828125, 42.4736328125, 44.29052734375, 46.107421875, 47.92431640625, 49.7412109375, 51.55810546875, 53.375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 6.0, 13.0, 9.0, 14.0, 11.0, 18.0, 15.0, 26.0, 22.0, 19.0, 30.0, 42.0, 38.0, 33.0, 35.0, 35.0, 47.0, 57.0, 47.0, 36.0, 45.0, 51.0, 36.0, 41.0, 29.0, 24.0, 33.0, 14.0, 23.0, 21.0, 18.0, 19.0, 12.0, 10.0, 15.0, 6.0, 10.0, 4.0, 3.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.609375, -25.604736328125, -24.60009765625, -23.595458984375, -22.5908203125, -21.586181640625, -20.58154296875, -19.576904296875, -18.572265625, -17.567626953125, -16.56298828125, -15.558349609375, -14.5537109375, -13.549072265625, -12.54443359375, -11.539794921875, -10.53515625, -9.530517578125, -8.52587890625, -7.521240234375, -6.5166015625, -5.511962890625, -4.50732421875, -3.502685546875, -2.498046875, -1.493408203125, -0.48876953125, 0.515869140625, 1.5205078125, 2.525146484375, 3.52978515625, 4.534423828125, 5.5390625, 6.543701171875, 7.54833984375, 8.552978515625, 9.5576171875, 10.562255859375, 11.56689453125, 12.571533203125, 13.576171875, 14.580810546875, 15.58544921875, 16.590087890625, 17.5947265625, 18.599365234375, 19.60400390625, 20.608642578125, 21.61328125, 22.617919921875, 23.62255859375, 24.627197265625, 25.6318359375, 26.636474609375, 27.64111328125, 28.645751953125, 29.650390625, 30.655029296875, 31.65966796875, 32.664306640625, 33.6689453125, 34.673583984375, 35.67822265625, 36.682861328125, 37.6875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 11.0, 18.0, 36.0, 37.0, 50.0, 110.0, 157.0, 239.0, 350.0, 545.0, 836.0, 1234.0, 2072.0, 3244.0, 5231.0, 8815.0, 15605.0, 27678.0, 52944.0, 108112.0, 238694.0, 588532.0, 1465872.0, 978704.0, 371943.0, 159102.0, 75622.0, 38080.0, 20755.0, 11826.0, 6758.0, 4001.0, 2492.0, 1606.0, 964.0, 678.0, 436.0, 282.0, 214.0, 132.0, 91.0, 59.0, 35.0, 33.0, 19.0, 9.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0], "bins": [-51.875, -50.38232421875, -48.8896484375, -47.39697265625, -45.904296875, -44.41162109375, -42.9189453125, -41.42626953125, -39.93359375, -38.44091796875, -36.9482421875, -35.45556640625, -33.962890625, -32.47021484375, -30.9775390625, -29.48486328125, -27.9921875, -26.49951171875, -25.0068359375, -23.51416015625, -22.021484375, -20.52880859375, -19.0361328125, -17.54345703125, -16.05078125, -14.55810546875, -13.0654296875, -11.57275390625, -10.080078125, -8.58740234375, -7.0947265625, -5.60205078125, -4.109375, -2.61669921875, -1.1240234375, 0.36865234375, 1.861328125, 3.35400390625, 4.8466796875, 6.33935546875, 7.83203125, 9.32470703125, 10.8173828125, 12.31005859375, 13.802734375, 15.29541015625, 16.7880859375, 18.28076171875, 19.7734375, 21.26611328125, 22.7587890625, 24.25146484375, 25.744140625, 27.23681640625, 28.7294921875, 30.22216796875, 31.71484375, 33.20751953125, 34.7001953125, 36.19287109375, 37.685546875, 39.17822265625, 40.6708984375, 42.16357421875, 43.65625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 5.0, 5.0, 13.0, 12.0, 28.0, 21.0, 26.0, 37.0, 62.0, 65.0, 97.0, 122.0, 149.0, 213.0, 248.0, 317.0, 373.0, 437.0, 376.0, 326.0, 248.0, 192.0, 147.0, 121.0, 107.0, 62.0, 60.0, 51.0, 47.0, 16.0, 23.0, 15.0, 17.0, 9.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.03125, -19.4810791015625, -18.930908203125, -18.3807373046875, -17.83056640625, -17.2803955078125, -16.730224609375, -16.1800537109375, -15.6298828125, -15.0797119140625, -14.529541015625, -13.9793701171875, -13.42919921875, -12.8790283203125, -12.328857421875, -11.7786865234375, -11.228515625, -10.6783447265625, -10.128173828125, -9.5780029296875, -9.02783203125, -8.4776611328125, -7.927490234375, -7.3773193359375, -6.8271484375, -6.2769775390625, -5.726806640625, -5.1766357421875, -4.62646484375, -4.0762939453125, -3.526123046875, -2.9759521484375, -2.42578125, -1.8756103515625, -1.325439453125, -0.7752685546875, -0.22509765625, 0.3250732421875, 0.875244140625, 1.4254150390625, 1.9755859375, 2.5257568359375, 3.075927734375, 3.6260986328125, 4.17626953125, 4.7264404296875, 5.276611328125, 5.8267822265625, 6.376953125, 6.9271240234375, 7.477294921875, 8.0274658203125, 8.57763671875, 9.1278076171875, 9.677978515625, 10.2281494140625, 10.7783203125, 11.3284912109375, 11.878662109375, 12.4288330078125, 12.97900390625, 13.5291748046875, 14.079345703125, 14.6295166015625, 15.1796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 7.0, 8.0, 11.0, 11.0, 9.0, 26.0, 22.0, 28.0, 30.0, 32.0, 39.0, 52.0, 87.0, 66.0, 60.0, 69.0, 64.0, 63.0, 55.0, 43.0, 34.0, 34.0, 33.0, 21.0, 26.0, 12.0, 14.0, 10.0, 10.0, 7.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.72513961791992, -40.499412536621094, -39.27368927001953, -38.0479621887207, -36.822235107421875, -35.59650802612305, -34.37078094482422, -33.145057678222656, -31.919330596923828, -30.693603515625, -29.467878341674805, -28.24215316772461, -27.01642608642578, -25.790699005126953, -24.564973831176758, -23.339248657226562, -22.113521575927734, -20.887794494628906, -19.66206932067871, -18.436344146728516, -17.210617065429688, -15.984890937805176, -14.759164810180664, -13.533438682556152, -12.30771255493164, -11.081986427307129, -9.856260299682617, -8.630534172058105, -7.404808044433594, -6.179081916809082, -4.95335578918457, -3.7276296615600586, -2.5019073486328125, -1.2761812210083008, -0.05045509338378906, 1.1752710342407227, 2.4009971618652344, 3.626723289489746, 4.852449417114258, 6.0781755447387695, 7.303901672363281, 8.529627799987793, 9.755353927612305, 10.981080055236816, 12.206806182861328, 13.43253231048584, 14.658258438110352, 15.883984565734863, 17.109710693359375, 18.335437774658203, 19.5611629486084, 20.786888122558594, 22.012615203857422, 23.23834228515625, 24.464067459106445, 25.68979263305664, 26.91551971435547, 28.141246795654297, 29.366971969604492, 30.592697143554688, 31.818424224853516, 33.044151306152344, 34.269874572753906, 35.495601654052734, 36.72132873535156]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 2.0, 11.0, 10.0, 9.0, 9.0, 15.0, 26.0, 14.0, 19.0, 22.0, 30.0, 24.0, 21.0, 33.0, 32.0, 38.0, 44.0, 41.0, 45.0, 42.0, 51.0, 37.0, 29.0, 37.0, 45.0, 32.0, 34.0, 22.0, 23.0, 34.0, 25.0, 22.0, 21.0, 14.0, 15.0, 11.0, 10.0, 7.0, 8.0, 9.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.4442024230957, -32.367523193359375, -31.290842056274414, -30.214160919189453, -29.137481689453125, -28.060800552368164, -26.984119415283203, -25.907440185546875, -24.830759048461914, -23.754077911376953, -22.677398681640625, -21.600717544555664, -20.524036407470703, -19.447357177734375, -18.370676040649414, -17.293994903564453, -16.217315673828125, -15.14063549041748, -14.063955307006836, -12.987274169921875, -11.91059398651123, -10.833913803100586, -9.757232666015625, -8.68055248260498, -7.603872299194336, -6.527192115783691, -5.450511455535889, -4.373830795288086, -3.2971506118774414, -2.220470428466797, -1.1437897682189941, -0.0671091079711914, 1.0095710754394531, 2.0862514972686768, 3.1629319190979004, 4.239612579345703, 5.316292762756348, 6.392972946166992, 7.469653606414795, 8.546334266662598, 9.623014450073242, 10.699694633483887, 11.776374816894531, 12.853055953979492, 13.929736137390137, 15.006416320800781, 16.083097457885742, 17.159778594970703, 18.23645782470703, 19.313138961791992, 20.38981819152832, 21.46649932861328, 22.54317855834961, 23.61985969543457, 24.69654083251953, 25.77322006225586, 26.84990119934082, 27.92658233642578, 29.00326156616211, 30.07994270324707, 31.15662384033203, 32.23330307006836, 33.30998229980469, 34.38666534423828, 35.46334457397461]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 12.0, 28.0, 43.0, 45.0, 61.0, 85.0, 146.0, 187.0, 264.0, 357.0, 563.0, 780.0, 1068.0, 1600.0, 2360.0, 3190.0, 4899.0, 6851.0, 10342.0, 15147.0, 22040.0, 33851.0, 52644.0, 89955.0, 167896.0, 259128.0, 148390.0, 80809.0, 48776.0, 31460.0, 20803.0, 14027.0, 9450.0, 6466.0, 4618.0, 3112.0, 2110.0, 1592.0, 1015.0, 736.0, 508.0, 346.0, 259.0, 166.0, 105.0, 82.0, 61.0, 41.0, 24.0, 17.0, 12.0, 6.0, 1.0, 4.0, 5.0, 4.0, 1.0], "bins": [-10.4921875, -10.16845703125, -9.8447265625, -9.52099609375, -9.197265625, -8.87353515625, -8.5498046875, -8.22607421875, -7.90234375, -7.57861328125, -7.2548828125, -6.93115234375, -6.607421875, -6.28369140625, -5.9599609375, -5.63623046875, -5.3125, -4.98876953125, -4.6650390625, -4.34130859375, -4.017578125, -3.69384765625, -3.3701171875, -3.04638671875, -2.72265625, -2.39892578125, -2.0751953125, -1.75146484375, -1.427734375, -1.10400390625, -0.7802734375, -0.45654296875, -0.1328125, 0.19091796875, 0.5146484375, 0.83837890625, 1.162109375, 1.48583984375, 1.8095703125, 2.13330078125, 2.45703125, 2.78076171875, 3.1044921875, 3.42822265625, 3.751953125, 4.07568359375, 4.3994140625, 4.72314453125, 5.046875, 5.37060546875, 5.6943359375, 6.01806640625, 6.341796875, 6.66552734375, 6.9892578125, 7.31298828125, 7.63671875, 7.96044921875, 8.2841796875, 8.60791015625, 8.931640625, 9.25537109375, 9.5791015625, 9.90283203125, 10.2265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 13.0, 7.0, 8.0, 14.0, 15.0, 17.0, 21.0, 25.0, 26.0, 26.0, 28.0, 32.0, 36.0, 37.0, 60.0, 32.0, 44.0, 37.0, 56.0, 48.0, 42.0, 37.0, 47.0, 27.0, 32.0, 25.0, 25.0, 39.0, 27.0, 19.0, 18.0, 7.0, 12.0, 13.0, 7.0, 7.0, 6.0, 10.0, 6.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.125, -35.939453125, -34.75390625, -33.568359375, -32.3828125, -31.197265625, -30.01171875, -28.826171875, -27.640625, -26.455078125, -25.26953125, -24.083984375, -22.8984375, -21.712890625, -20.52734375, -19.341796875, -18.15625, -16.970703125, -15.78515625, -14.599609375, -13.4140625, -12.228515625, -11.04296875, -9.857421875, -8.671875, -7.486328125, -6.30078125, -5.115234375, -3.9296875, -2.744140625, -1.55859375, -0.373046875, 0.8125, 1.998046875, 3.18359375, 4.369140625, 5.5546875, 6.740234375, 7.92578125, 9.111328125, 10.296875, 11.482421875, 12.66796875, 13.853515625, 15.0390625, 16.224609375, 17.41015625, 18.595703125, 19.78125, 20.966796875, 22.15234375, 23.337890625, 24.5234375, 25.708984375, 26.89453125, 28.080078125, 29.265625, 30.451171875, 31.63671875, 32.822265625, 34.0078125, 35.193359375, 36.37890625, 37.564453125, 38.75]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 9.0, 12.0, 27.0, 33.0, 37.0, 59.0, 74.0, 99.0, 151.0, 214.0, 317.0, 436.0, 561.0, 893.0, 1172.0, 1701.0, 2447.0, 3698.0, 5478.0, 8944.0, 16383.0, 43908.0, 325356.0, 535731.0, 53791.0, 18494.0, 9942.0, 5951.0, 3834.0, 2616.0, 1791.0, 1267.0, 909.0, 653.0, 463.0, 296.0, 236.0, 169.0, 112.0, 86.0, 55.0, 51.0, 15.0, 35.0, 17.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-15.1015625, -14.64501953125, -14.1884765625, -13.73193359375, -13.275390625, -12.81884765625, -12.3623046875, -11.90576171875, -11.44921875, -10.99267578125, -10.5361328125, -10.07958984375, -9.623046875, -9.16650390625, -8.7099609375, -8.25341796875, -7.796875, -7.34033203125, -6.8837890625, -6.42724609375, -5.970703125, -5.51416015625, -5.0576171875, -4.60107421875, -4.14453125, -3.68798828125, -3.2314453125, -2.77490234375, -2.318359375, -1.86181640625, -1.4052734375, -0.94873046875, -0.4921875, -0.03564453125, 0.4208984375, 0.87744140625, 1.333984375, 1.79052734375, 2.2470703125, 2.70361328125, 3.16015625, 3.61669921875, 4.0732421875, 4.52978515625, 4.986328125, 5.44287109375, 5.8994140625, 6.35595703125, 6.8125, 7.26904296875, 7.7255859375, 8.18212890625, 8.638671875, 9.09521484375, 9.5517578125, 10.00830078125, 10.46484375, 10.92138671875, 11.3779296875, 11.83447265625, 12.291015625, 12.74755859375, 13.2041015625, 13.66064453125, 14.1171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 8.0, 9.0, 10.0, 19.0, 14.0, 26.0, 14.0, 26.0, 22.0, 20.0, 25.0, 30.0, 41.0, 40.0, 41.0, 34.0, 33.0, 42.0, 47.0, 51.0, 34.0, 33.0, 41.0, 26.0, 28.0, 39.0, 36.0, 21.0, 25.0, 25.0, 20.0, 16.0, 15.0, 12.0, 14.0, 9.0, 4.0, 5.0, 10.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.953125, -23.225830078125, -22.49853515625, -21.771240234375, -21.0439453125, -20.316650390625, -19.58935546875, -18.862060546875, -18.134765625, -17.407470703125, -16.68017578125, -15.952880859375, -15.2255859375, -14.498291015625, -13.77099609375, -13.043701171875, -12.31640625, -11.589111328125, -10.86181640625, -10.134521484375, -9.4072265625, -8.679931640625, -7.95263671875, -7.225341796875, -6.498046875, -5.770751953125, -5.04345703125, -4.316162109375, -3.5888671875, -2.861572265625, -2.13427734375, -1.406982421875, -0.6796875, 0.047607421875, 0.77490234375, 1.502197265625, 2.2294921875, 2.956787109375, 3.68408203125, 4.411376953125, 5.138671875, 5.865966796875, 6.59326171875, 7.320556640625, 8.0478515625, 8.775146484375, 9.50244140625, 10.229736328125, 10.95703125, 11.684326171875, 12.41162109375, 13.138916015625, 13.8662109375, 14.593505859375, 15.32080078125, 16.048095703125, 16.775390625, 17.502685546875, 18.22998046875, 18.957275390625, 19.6845703125, 20.411865234375, 21.13916015625, 21.866455078125, 22.59375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 10.0, 15.0, 20.0, 33.0, 53.0, 91.0, 112.0, 194.0, 330.0, 668.0, 1188.0, 2726.0, 6881.0, 21547.0, 314818.0, 661284.0, 24870.0, 7757.0, 3002.0, 1327.0, 645.0, 394.0, 201.0, 129.0, 72.0, 51.0, 30.0, 29.0, 18.0, 18.0, 9.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.363800048828125, -2.27642822265625, -2.189056396484375, -2.1016845703125, -2.014312744140625, -1.92694091796875, -1.839569091796875, -1.752197265625, -1.664825439453125, -1.57745361328125, -1.490081787109375, -1.4027099609375, -1.315338134765625, -1.22796630859375, -1.140594482421875, -1.05322265625, -0.965850830078125, -0.87847900390625, -0.791107177734375, -0.7037353515625, -0.616363525390625, -0.52899169921875, -0.441619873046875, -0.354248046875, -0.266876220703125, -0.17950439453125, -0.092132568359375, -0.0047607421875, 0.082611083984375, 0.16998291015625, 0.257354736328125, 0.3447265625, 0.432098388671875, 0.51947021484375, 0.606842041015625, 0.6942138671875, 0.781585693359375, 0.86895751953125, 0.956329345703125, 1.043701171875, 1.131072998046875, 1.21844482421875, 1.305816650390625, 1.3931884765625, 1.480560302734375, 1.56793212890625, 1.655303955078125, 1.74267578125, 1.830047607421875, 1.91741943359375, 2.004791259765625, 2.0921630859375, 2.179534912109375, 2.26690673828125, 2.354278564453125, 2.441650390625, 2.529022216796875, 2.61639404296875, 2.703765869140625, 2.7911376953125, 2.878509521484375, 2.96588134765625, 3.053253173828125, 3.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 4.0, 4.0, 7.0, 15.0, 27.0, 25.0, 23.0, 31.0, 48.0, 51.0, 68.0, 85.0, 81.0, 88.0, 92.0, 68.0, 60.0, 46.0, 35.0, 24.0, 20.0, 20.0, 14.0, 11.0, 8.0, 13.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00017261505126953125, -0.00016794726252555847, -0.0001632794737815857, -0.00015861168503761292, -0.00015394389629364014, -0.00014927610754966736, -0.00014460831880569458, -0.0001399405300617218, -0.00013527274131774902, -0.00013060495257377625, -0.00012593716382980347, -0.00012126937508583069, -0.00011660158634185791, -0.00011193379759788513, -0.00010726600885391235, -0.00010259822010993958, -9.79304313659668e-05, -9.326264262199402e-05, -8.859485387802124e-05, -8.392706513404846e-05, -7.925927639007568e-05, -7.45914876461029e-05, -6.992369890213013e-05, -6.525591015815735e-05, -6.058812141418457e-05, -5.592033267021179e-05, -5.1252543926239014e-05, -4.6584755182266235e-05, -4.191696643829346e-05, -3.724917769432068e-05, -3.25813889503479e-05, -2.7913600206375122e-05, -2.3245811462402344e-05, -1.8578022718429565e-05, -1.3910233974456787e-05, -9.242445230484009e-06, -4.5746564865112305e-06, 9.313225746154785e-08, 4.760921001434326e-06, 9.428709745407104e-06, 1.4096498489379883e-05, 1.876428723335266e-05, 2.343207597732544e-05, 2.8099864721298218e-05, 3.2767653465270996e-05, 3.7435442209243774e-05, 4.210323095321655e-05, 4.677101969718933e-05, 5.143880844116211e-05, 5.610659718513489e-05, 6.0774385929107666e-05, 6.544217467308044e-05, 7.010996341705322e-05, 7.4777752161026e-05, 7.944554090499878e-05, 8.411332964897156e-05, 8.878111839294434e-05, 9.344890713691711e-05, 9.811669588088989e-05, 0.00010278448462486267, 0.00010745227336883545, 0.00011212006211280823, 0.000116787850856781, 0.00012145563960075378, 0.00012612342834472656]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 21.0, 26.0, 25.0, 45.0, 75.0, 101.0, 152.0, 205.0, 312.0, 547.0, 944.0, 1485.0, 2440.0, 4211.0, 7593.0, 13712.0, 26913.0, 55674.0, 121926.0, 261450.0, 286208.0, 137120.0, 62686.0, 29945.0, 15111.0, 8252.0, 4533.0, 2641.0, 1567.0, 907.0, 578.0, 386.0, 234.0, 189.0, 114.0, 66.0, 54.0, 29.0, 24.0, 12.0, 10.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.871368408203125, -1.80914306640625, -1.746917724609375, -1.6846923828125, -1.622467041015625, -1.56024169921875, -1.498016357421875, -1.435791015625, -1.373565673828125, -1.31134033203125, -1.249114990234375, -1.1868896484375, -1.124664306640625, -1.06243896484375, -1.000213623046875, -0.93798828125, -0.875762939453125, -0.81353759765625, -0.751312255859375, -0.6890869140625, -0.626861572265625, -0.56463623046875, -0.502410888671875, -0.440185546875, -0.377960205078125, -0.31573486328125, -0.253509521484375, -0.1912841796875, -0.129058837890625, -0.06683349609375, -0.004608154296875, 0.0576171875, 0.119842529296875, 0.18206787109375, 0.244293212890625, 0.3065185546875, 0.368743896484375, 0.43096923828125, 0.493194580078125, 0.555419921875, 0.617645263671875, 0.67987060546875, 0.742095947265625, 0.8043212890625, 0.866546630859375, 0.92877197265625, 0.990997314453125, 1.05322265625, 1.115447998046875, 1.17767333984375, 1.239898681640625, 1.3021240234375, 1.364349365234375, 1.42657470703125, 1.488800048828125, 1.551025390625, 1.613250732421875, 1.67547607421875, 1.737701416015625, 1.7999267578125, 1.862152099609375, 1.92437744140625, 1.986602783203125, 2.048828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 7.0, 8.0, 6.0, 10.0, 13.0, 12.0, 13.0, 28.0, 28.0, 41.0, 43.0, 49.0, 53.0, 57.0, 60.0, 68.0, 51.0, 56.0, 61.0, 45.0, 52.0, 49.0, 41.0, 29.0, 36.0, 20.0, 16.0, 11.0, 10.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.431121826171875, -0.41351318359375, -0.395904541015625, -0.3782958984375, -0.360687255859375, -0.34307861328125, -0.325469970703125, -0.307861328125, -0.290252685546875, -0.27264404296875, -0.255035400390625, -0.2374267578125, -0.219818115234375, -0.20220947265625, -0.184600830078125, -0.1669921875, -0.149383544921875, -0.13177490234375, -0.114166259765625, -0.0965576171875, -0.078948974609375, -0.06134033203125, -0.043731689453125, -0.026123046875, -0.008514404296875, 0.00909423828125, 0.026702880859375, 0.0443115234375, 0.061920166015625, 0.07952880859375, 0.097137451171875, 0.11474609375, 0.132354736328125, 0.14996337890625, 0.167572021484375, 0.1851806640625, 0.202789306640625, 0.22039794921875, 0.238006591796875, 0.255615234375, 0.273223876953125, 0.29083251953125, 0.308441162109375, 0.3260498046875, 0.343658447265625, 0.36126708984375, 0.378875732421875, 0.396484375, 0.414093017578125, 0.43170166015625, 0.449310302734375, 0.4669189453125, 0.484527587890625, 0.50213623046875, 0.519744873046875, 0.537353515625, 0.554962158203125, 0.57257080078125, 0.590179443359375, 0.6077880859375, 0.625396728515625, 0.64300537109375, 0.660614013671875, 0.67822265625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 3.0, 6.0, 13.0, 10.0, 15.0, 15.0, 19.0, 34.0, 29.0, 27.0, 45.0, 44.0, 73.0, 74.0, 54.0, 73.0, 61.0, 61.0, 57.0, 53.0, 38.0, 36.0, 27.0, 24.0, 25.0, 22.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.68342590332031, -40.505332946777344, -39.327239990234375, -38.149147033691406, -36.97105407714844, -35.79296112060547, -34.6148681640625, -33.436771392822266, -32.2586784362793, -31.080585479736328, -29.90249252319336, -28.72439956665039, -27.54630470275879, -26.36821174621582, -25.19011878967285, -24.01202392578125, -22.833932876586914, -21.655839920043945, -20.477746963500977, -19.299652099609375, -18.121559143066406, -16.943466186523438, -15.765373229980469, -14.587279319763184, -13.409186363220215, -12.231093406677246, -11.052999496459961, -9.874906539916992, -8.696813583374023, -7.518719673156738, -6.3406267166137695, -5.162532806396484, -3.9844398498535156, -2.8063464164733887, -1.6282532215118408, -0.45016002655029297, 0.727933406829834, 1.906026840209961, 3.0841197967529297, 4.262213706970215, 5.440306663513184, 6.6184000968933105, 7.7964935302734375, 8.974586486816406, 10.152679443359375, 11.33077335357666, 12.508866310119629, 13.686960220336914, 14.865053176879883, 16.04314613342285, 17.22123908996582, 18.399333953857422, 19.57742691040039, 20.75551986694336, 21.933612823486328, 23.111705780029297, 24.289798736572266, 25.467891693115234, 26.645984649658203, 27.824077606201172, 29.002172470092773, 30.180265426635742, 31.35835838317871, 32.53645324707031, 33.71454620361328]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 8.0, 3.0, 10.0, 7.0, 13.0, 8.0, 18.0, 23.0, 15.0, 20.0, 21.0, 30.0, 22.0, 24.0, 29.0, 36.0, 38.0, 45.0, 42.0, 44.0, 43.0, 51.0, 34.0, 31.0, 40.0, 41.0, 36.0, 33.0, 19.0, 27.0, 30.0, 25.0, 22.0, 21.0, 12.0, 16.0, 12.0, 9.0, 8.0, 6.0, 10.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.25746536254883, -32.19170379638672, -31.125944137573242, -30.060182571411133, -28.994422912597656, -27.928661346435547, -26.862899780273438, -25.797138214111328, -24.73137855529785, -23.665616989135742, -22.599857330322266, -21.534095764160156, -20.468334197998047, -19.40257453918457, -18.33681297302246, -17.271053314208984, -16.205291748046875, -15.139531135559082, -14.073770523071289, -13.00800895690918, -11.942248344421387, -10.876487731933594, -9.810726165771484, -8.744965553283691, -7.679204940795898, -6.6134443283081055, -5.547683238983154, -4.481922149658203, -3.41616153717041, -2.350400924682617, -1.284639835357666, -0.21887874603271484, 0.8468818664550781, 1.9126427173614502, 2.9784035682678223, 4.044164657592773, 5.109925270080566, 6.175685882568359, 7.2414469718933105, 8.307208061218262, 9.372968673706055, 10.438729286193848, 11.50448989868164, 12.57025146484375, 13.636012077331543, 14.701772689819336, 15.767534255981445, 16.833293914794922, 17.89905548095703, 18.96481704711914, 20.030576705932617, 21.096338272094727, 22.162097930908203, 23.227859497070312, 24.293621063232422, 25.35938262939453, 26.425142288208008, 27.490903854370117, 28.556663513183594, 29.622425079345703, 30.688186645507812, 31.75394630432129, 32.819705963134766, 33.885467529296875, 34.951229095458984]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 10.0, 23.0, 32.0, 38.0, 53.0, 67.0, 110.0, 156.0, 259.0, 379.0, 543.0, 809.0, 1284.0, 2078.0, 2982.0, 4781.0, 7460.0, 11775.0, 18716.0, 29679.0, 48776.0, 80301.0, 131647.0, 195806.0, 189278.0, 123607.0, 75086.0, 45860.0, 28325.0, 17684.0, 11063.0, 7063.0, 4359.0, 2944.0, 1880.0, 1214.0, 788.0, 561.0, 357.0, 238.0, 151.0, 105.0, 64.0, 50.0, 31.0, 31.0, 13.0, 11.0, 8.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.78125, -36.56005859375, -35.3388671875, -34.11767578125, -32.896484375, -31.67529296875, -30.4541015625, -29.23291015625, -28.01171875, -26.79052734375, -25.5693359375, -24.34814453125, -23.126953125, -21.90576171875, -20.6845703125, -19.46337890625, -18.2421875, -17.02099609375, -15.7998046875, -14.57861328125, -13.357421875, -12.13623046875, -10.9150390625, -9.69384765625, -8.47265625, -7.25146484375, -6.0302734375, -4.80908203125, -3.587890625, -2.36669921875, -1.1455078125, 0.07568359375, 1.296875, 2.51806640625, 3.7392578125, 4.96044921875, 6.181640625, 7.40283203125, 8.6240234375, 9.84521484375, 11.06640625, 12.28759765625, 13.5087890625, 14.72998046875, 15.951171875, 17.17236328125, 18.3935546875, 19.61474609375, 20.8359375, 22.05712890625, 23.2783203125, 24.49951171875, 25.720703125, 26.94189453125, 28.1630859375, 29.38427734375, 30.60546875, 31.82666015625, 33.0478515625, 34.26904296875, 35.490234375, 36.71142578125, 37.9326171875, 39.15380859375, 40.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 9.0, 14.0, 17.0, 18.0, 18.0, 18.0, 20.0, 32.0, 23.0, 29.0, 31.0, 33.0, 35.0, 43.0, 41.0, 47.0, 38.0, 48.0, 42.0, 49.0, 38.0, 48.0, 43.0, 35.0, 29.0, 26.0, 24.0, 20.0, 24.0, 17.0, 14.0, 8.0, 11.0, 7.0, 8.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.53125, -34.4287109375, -33.326171875, -32.2236328125, -31.12109375, -30.0185546875, -28.916015625, -27.8134765625, -26.7109375, -25.6083984375, -24.505859375, -23.4033203125, -22.30078125, -21.1982421875, -20.095703125, -18.9931640625, -17.890625, -16.7880859375, -15.685546875, -14.5830078125, -13.48046875, -12.3779296875, -11.275390625, -10.1728515625, -9.0703125, -7.9677734375, -6.865234375, -5.7626953125, -4.66015625, -3.5576171875, -2.455078125, -1.3525390625, -0.25, 0.8525390625, 1.955078125, 3.0576171875, 4.16015625, 5.2626953125, 6.365234375, 7.4677734375, 8.5703125, 9.6728515625, 10.775390625, 11.8779296875, 12.98046875, 14.0830078125, 15.185546875, 16.2880859375, 17.390625, 18.4931640625, 19.595703125, 20.6982421875, 21.80078125, 22.9033203125, 24.005859375, 25.1083984375, 26.2109375, 27.3134765625, 28.416015625, 29.5185546875, 30.62109375, 31.7236328125, 32.826171875, 33.9287109375, 35.03125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 20.0, 15.0, 29.0, 48.0, 79.0, 125.0, 215.0, 361.0, 549.0, 1014.0, 1725.0, 2846.0, 4721.0, 8072.0, 13563.0, 23207.0, 39727.0, 66573.0, 110994.0, 176970.0, 210911.0, 154943.0, 94981.0, 55834.0, 33490.0, 19159.0, 11608.0, 6909.0, 3992.0, 2421.0, 1373.0, 851.0, 469.0, 316.0, 165.0, 112.0, 58.0, 37.0, 22.0, 15.0, 11.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.2568359375, -36.857421875, -35.4580078125, -34.05859375, -32.6591796875, -31.259765625, -29.8603515625, -28.4609375, -27.0615234375, -25.662109375, -24.2626953125, -22.86328125, -21.4638671875, -20.064453125, -18.6650390625, -17.265625, -15.8662109375, -14.466796875, -13.0673828125, -11.66796875, -10.2685546875, -8.869140625, -7.4697265625, -6.0703125, -4.6708984375, -3.271484375, -1.8720703125, -0.47265625, 0.9267578125, 2.326171875, 3.7255859375, 5.125, 6.5244140625, 7.923828125, 9.3232421875, 10.72265625, 12.1220703125, 13.521484375, 14.9208984375, 16.3203125, 17.7197265625, 19.119140625, 20.5185546875, 21.91796875, 23.3173828125, 24.716796875, 26.1162109375, 27.515625, 28.9150390625, 30.314453125, 31.7138671875, 33.11328125, 34.5126953125, 35.912109375, 37.3115234375, 38.7109375, 40.1103515625, 41.509765625, 42.9091796875, 44.30859375, 45.7080078125, 47.107421875, 48.5068359375, 49.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 9.0, 6.0, 7.0, 10.0, 14.0, 18.0, 12.0, 26.0, 17.0, 17.0, 22.0, 20.0, 29.0, 23.0, 29.0, 33.0, 34.0, 37.0, 28.0, 30.0, 21.0, 24.0, 32.0, 28.0, 34.0, 41.0, 36.0, 39.0, 39.0, 38.0, 29.0, 27.0, 22.0, 23.0, 20.0, 19.0, 17.0, 14.0, 11.0, 8.0, 6.0, 7.0, 8.0, 3.0, 9.0, 7.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0], "bins": [-19.796875, -19.20751953125, -18.6181640625, -18.02880859375, -17.439453125, -16.85009765625, -16.2607421875, -15.67138671875, -15.08203125, -14.49267578125, -13.9033203125, -13.31396484375, -12.724609375, -12.13525390625, -11.5458984375, -10.95654296875, -10.3671875, -9.77783203125, -9.1884765625, -8.59912109375, -8.009765625, -7.42041015625, -6.8310546875, -6.24169921875, -5.65234375, -5.06298828125, -4.4736328125, -3.88427734375, -3.294921875, -2.70556640625, -2.1162109375, -1.52685546875, -0.9375, -0.34814453125, 0.2412109375, 0.83056640625, 1.419921875, 2.00927734375, 2.5986328125, 3.18798828125, 3.77734375, 4.36669921875, 4.9560546875, 5.54541015625, 6.134765625, 6.72412109375, 7.3134765625, 7.90283203125, 8.4921875, 9.08154296875, 9.6708984375, 10.26025390625, 10.849609375, 11.43896484375, 12.0283203125, 12.61767578125, 13.20703125, 13.79638671875, 14.3857421875, 14.97509765625, 15.564453125, 16.15380859375, 16.7431640625, 17.33251953125, 17.921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 18.0, 14.0, 16.0, 43.0, 48.0, 63.0, 124.0, 201.0, 276.0, 449.0, 648.0, 1215.0, 1803.0, 2890.0, 4934.0, 8529.0, 15266.0, 28317.0, 54122.0, 109481.0, 212633.0, 269052.0, 164224.0, 81927.0, 41280.0, 21710.0, 11869.0, 6807.0, 4105.0, 2418.0, 1516.0, 913.0, 551.0, 373.0, 261.0, 170.0, 88.0, 69.0, 30.0, 22.0, 26.0, 13.0, 8.0, 11.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-16.296875, -15.792236328125, -15.28759765625, -14.782958984375, -14.2783203125, -13.773681640625, -13.26904296875, -12.764404296875, -12.259765625, -11.755126953125, -11.25048828125, -10.745849609375, -10.2412109375, -9.736572265625, -9.23193359375, -8.727294921875, -8.22265625, -7.718017578125, -7.21337890625, -6.708740234375, -6.2041015625, -5.699462890625, -5.19482421875, -4.690185546875, -4.185546875, -3.680908203125, -3.17626953125, -2.671630859375, -2.1669921875, -1.662353515625, -1.15771484375, -0.653076171875, -0.1484375, 0.356201171875, 0.86083984375, 1.365478515625, 1.8701171875, 2.374755859375, 2.87939453125, 3.384033203125, 3.888671875, 4.393310546875, 4.89794921875, 5.402587890625, 5.9072265625, 6.411865234375, 6.91650390625, 7.421142578125, 7.92578125, 8.430419921875, 8.93505859375, 9.439697265625, 9.9443359375, 10.448974609375, 10.95361328125, 11.458251953125, 11.962890625, 12.467529296875, 12.97216796875, 13.476806640625, 13.9814453125, 14.486083984375, 14.99072265625, 15.495361328125, 16.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 16.0, 20.0, 25.0, 34.0, 55.0, 71.0, 106.0, 137.0, 134.0, 123.0, 89.0, 62.0, 40.0, 28.0, 23.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028667449951171875, -0.0027831196784973145, -0.0026994943618774414, -0.0026158690452575684, -0.0025322437286376953, -0.0024486184120178223, -0.0023649930953979492, -0.002281367778778076, -0.002197742462158203, -0.00211411714553833, -0.002030491828918457, -0.001946866512298584, -0.001863241195678711, -0.0017796158790588379, -0.0016959905624389648, -0.0016123652458190918, -0.0015287399291992188, -0.0014451146125793457, -0.0013614892959594727, -0.0012778639793395996, -0.0011942386627197266, -0.0011106133460998535, -0.0010269880294799805, -0.0009433627128601074, -0.0008597373962402344, -0.0007761120796203613, -0.0006924867630004883, -0.0006088614463806152, -0.0005252361297607422, -0.00044161081314086914, -0.0003579854965209961, -0.00027436017990112305, -0.00019073486328125, -0.00010710954666137695, -2.3484230041503906e-05, 6.014108657836914e-05, 0.0001437664031982422, 0.00022739171981811523, 0.0003110170364379883, 0.00039464235305786133, 0.0004782676696777344, 0.0005618929862976074, 0.0006455183029174805, 0.0007291436195373535, 0.0008127689361572266, 0.0008963942527770996, 0.0009800195693969727, 0.0010636448860168457, 0.0011472702026367188, 0.0012308955192565918, 0.0013145208358764648, 0.0013981461524963379, 0.001481771469116211, 0.001565396785736084, 0.001649022102355957, 0.00173264741897583, 0.0018162727355957031, 0.0018998980522155762, 0.0019835233688354492, 0.0020671486854553223, 0.0021507740020751953, 0.0022343993186950684, 0.0023180246353149414, 0.0024016499519348145, 0.0024852752685546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 11.0, 14.0, 14.0, 18.0, 34.0, 49.0, 94.0, 136.0, 176.0, 299.0, 476.0, 889.0, 1398.0, 2365.0, 4209.0, 7195.0, 13135.0, 24536.0, 47046.0, 92638.0, 184090.0, 279658.0, 189629.0, 95699.0, 48234.0, 25263.0, 13455.0, 7481.0, 4198.0, 2382.0, 1452.0, 873.0, 528.0, 325.0, 214.0, 115.0, 81.0, 50.0, 38.0, 18.0, 14.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.59375, -18.0390625, -17.484375, -16.9296875, -16.375, -15.8203125, -15.265625, -14.7109375, -14.15625, -13.6015625, -13.046875, -12.4921875, -11.9375, -11.3828125, -10.828125, -10.2734375, -9.71875, -9.1640625, -8.609375, -8.0546875, -7.5, -6.9453125, -6.390625, -5.8359375, -5.28125, -4.7265625, -4.171875, -3.6171875, -3.0625, -2.5078125, -1.953125, -1.3984375, -0.84375, -0.2890625, 0.265625, 0.8203125, 1.375, 1.9296875, 2.484375, 3.0390625, 3.59375, 4.1484375, 4.703125, 5.2578125, 5.8125, 6.3671875, 6.921875, 7.4765625, 8.03125, 8.5859375, 9.140625, 9.6953125, 10.25, 10.8046875, 11.359375, 11.9140625, 12.46875, 13.0234375, 13.578125, 14.1328125, 14.6875, 15.2421875, 15.796875, 16.3515625, 16.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 5.0, 12.0, 13.0, 16.0, 25.0, 24.0, 18.0, 35.0, 42.0, 37.0, 54.0, 60.0, 54.0, 65.0, 62.0, 52.0, 70.0, 41.0, 39.0, 37.0, 27.0, 28.0, 29.0, 24.0, 27.0, 13.0, 13.0, 7.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.58251953125, -4.4306640625, -4.27880859375, -4.126953125, -3.97509765625, -3.8232421875, -3.67138671875, -3.51953125, -3.36767578125, -3.2158203125, -3.06396484375, -2.912109375, -2.76025390625, -2.6083984375, -2.45654296875, -2.3046875, -2.15283203125, -2.0009765625, -1.84912109375, -1.697265625, -1.54541015625, -1.3935546875, -1.24169921875, -1.08984375, -0.93798828125, -0.7861328125, -0.63427734375, -0.482421875, -0.33056640625, -0.1787109375, -0.02685546875, 0.125, 0.27685546875, 0.4287109375, 0.58056640625, 0.732421875, 0.88427734375, 1.0361328125, 1.18798828125, 1.33984375, 1.49169921875, 1.6435546875, 1.79541015625, 1.947265625, 2.09912109375, 2.2509765625, 2.40283203125, 2.5546875, 2.70654296875, 2.8583984375, 3.01025390625, 3.162109375, 3.31396484375, 3.4658203125, 3.61767578125, 3.76953125, 3.92138671875, 4.0732421875, 4.22509765625, 4.376953125, 4.52880859375, 4.6806640625, 4.83251953125, 4.984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 3.0, 9.0, 14.0, 12.0, 8.0, 13.0, 26.0, 20.0, 33.0, 37.0, 35.0, 45.0, 68.0, 56.0, 50.0, 69.0, 69.0, 46.0, 47.0, 54.0, 40.0, 38.0, 29.0, 23.0, 25.0, 18.0, 21.0, 17.0, 14.0, 4.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.427425384521484, -34.3779411315918, -33.32845687866211, -32.278968811035156, -31.2294864654541, -30.18000030517578, -29.130516052246094, -28.081031799316406, -27.03154754638672, -25.98206329345703, -24.93257713317871, -23.883092880249023, -22.833608627319336, -21.784122467041016, -20.734638214111328, -19.68515396118164, -18.63566780090332, -17.586183547973633, -16.536697387695312, -15.487213134765625, -14.437728881835938, -13.388243675231934, -12.33875846862793, -11.289274215698242, -10.239789009094238, -9.190303802490234, -8.140819549560547, -7.091334342956543, -6.041849613189697, -4.992364883422852, -3.9428796768188477, -2.893394947052002, -1.843912124633789, -0.7944272756576538, 0.25505757331848145, 1.3045425415039062, 2.354027271270752, 3.4035120010375977, 4.452997207641602, 5.502481937408447, 6.551966667175293, 7.601451396942139, 8.650936126708984, 9.700421333312988, 10.749906539916992, 11.79939079284668, 12.848875999450684, 13.898361206054688, 14.947845458984375, 15.997330665588379, 17.046815872192383, 18.09630012512207, 19.145784378051758, 20.195270538330078, 21.244754791259766, 22.294239044189453, 23.34372329711914, 24.393207550048828, 25.44269371032715, 26.492177963256836, 27.541662216186523, 28.591148376464844, 29.64063262939453, 30.69011688232422, 31.73960304260254]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 10.0, 4.0, 5.0, 7.0, 8.0, 12.0, 13.0, 13.0, 24.0, 19.0, 26.0, 26.0, 30.0, 29.0, 24.0, 39.0, 36.0, 43.0, 46.0, 26.0, 44.0, 54.0, 36.0, 49.0, 44.0, 27.0, 45.0, 28.0, 29.0, 29.0, 26.0, 23.0, 27.0, 17.0, 11.0, 12.0, 13.0, 10.0, 8.0, 5.0, 8.0, 1.0, 8.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.69272232055664, -34.54065704345703, -33.38859176635742, -32.23652648925781, -31.084461212158203, -29.932395935058594, -28.780332565307617, -27.628267288208008, -26.4762020111084, -25.32413673400879, -24.17207145690918, -23.02000617980957, -21.867942810058594, -20.715877532958984, -19.563812255859375, -18.411746978759766, -17.259681701660156, -16.107616424560547, -14.955551147460938, -13.803486824035645, -12.651421546936035, -11.499356269836426, -10.347291946411133, -9.195226669311523, -8.043161392211914, -6.891096115112305, -5.7390313148498535, -4.586966514587402, -3.434901237487793, -2.2828359603881836, -1.1307711601257324, 0.02129364013671875, 1.1733627319335938, 2.325427770614624, 3.4774928092956543, 4.6295576095581055, 5.781622886657715, 6.933688163757324, 8.085752487182617, 9.237817764282227, 10.389883041381836, 11.541948318481445, 12.694013595581055, 13.846077919006348, 14.998143196105957, 16.15020751953125, 17.30227279663086, 18.45433807373047, 19.606403350830078, 20.758468627929688, 21.910533905029297, 23.062599182128906, 24.214664459228516, 25.366729736328125, 26.5187931060791, 27.67085838317871, 28.82292366027832, 29.97498893737793, 31.12705421447754, 32.279117584228516, 33.431182861328125, 34.583248138427734, 35.735313415527344, 36.88737869262695, 38.03944396972656]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [6.0, 4.0, 1.0, 6.0, 10.0, 9.0, 9.0, 19.0, 19.0, 33.0, 49.0, 69.0, 92.0, 174.0, 243.0, 373.0, 595.0, 895.0, 1286.0, 2006.0, 3065.0, 4840.0, 8058.0, 14009.0, 24995.0, 50342.0, 118007.0, 335318.0, 944276.0, 1478702.0, 754540.0, 258088.0, 95391.0, 42832.0, 22583.0, 12591.0, 7594.0, 4630.0, 2943.0, 1893.0, 1278.0, 833.0, 525.0, 352.0, 221.0, 165.0, 108.0, 68.0, 54.0, 23.0, 19.0, 15.0, 14.0, 8.0, 10.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.375, -38.03515625, -36.6953125, -35.35546875, -34.015625, -32.67578125, -31.3359375, -29.99609375, -28.65625, -27.31640625, -25.9765625, -24.63671875, -23.296875, -21.95703125, -20.6171875, -19.27734375, -17.9375, -16.59765625, -15.2578125, -13.91796875, -12.578125, -11.23828125, -9.8984375, -8.55859375, -7.21875, -5.87890625, -4.5390625, -3.19921875, -1.859375, -0.51953125, 0.8203125, 2.16015625, 3.5, 4.83984375, 6.1796875, 7.51953125, 8.859375, 10.19921875, 11.5390625, 12.87890625, 14.21875, 15.55859375, 16.8984375, 18.23828125, 19.578125, 20.91796875, 22.2578125, 23.59765625, 24.9375, 26.27734375, 27.6171875, 28.95703125, 30.296875, 31.63671875, 32.9765625, 34.31640625, 35.65625, 36.99609375, 38.3359375, 39.67578125, 41.015625, 42.35546875, 43.6953125, 45.03515625, 46.375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 3.0, 7.0, 6.0, 10.0, 8.0, 5.0, 14.0, 19.0, 13.0, 26.0, 26.0, 26.0, 25.0, 26.0, 27.0, 31.0, 37.0, 41.0, 47.0, 47.0, 44.0, 46.0, 45.0, 42.0, 46.0, 50.0, 36.0, 24.0, 29.0, 31.0, 24.0, 22.0, 18.0, 18.0, 11.0, 16.0, 13.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.5, -32.45068359375, -31.4013671875, -30.35205078125, -29.302734375, -28.25341796875, -27.2041015625, -26.15478515625, -25.10546875, -24.05615234375, -23.0068359375, -21.95751953125, -20.908203125, -19.85888671875, -18.8095703125, -17.76025390625, -16.7109375, -15.66162109375, -14.6123046875, -13.56298828125, -12.513671875, -11.46435546875, -10.4150390625, -9.36572265625, -8.31640625, -7.26708984375, -6.2177734375, -5.16845703125, -4.119140625, -3.06982421875, -2.0205078125, -0.97119140625, 0.078125, 1.12744140625, 2.1767578125, 3.22607421875, 4.275390625, 5.32470703125, 6.3740234375, 7.42333984375, 8.47265625, 9.52197265625, 10.5712890625, 11.62060546875, 12.669921875, 13.71923828125, 14.7685546875, 15.81787109375, 16.8671875, 17.91650390625, 18.9658203125, 20.01513671875, 21.064453125, 22.11376953125, 23.1630859375, 24.21240234375, 25.26171875, 26.31103515625, 27.3603515625, 28.40966796875, 29.458984375, 30.50830078125, 31.5576171875, 32.60693359375, 33.65625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 23.0, 17.0, 35.0, 46.0, 90.0, 123.0, 179.0, 268.0, 415.0, 691.0, 1131.0, 1746.0, 2961.0, 5265.0, 8998.0, 16391.0, 31611.0, 63654.0, 134770.0, 316016.0, 841564.0, 1580156.0, 688738.0, 265503.0, 116633.0, 55129.0, 27653.0, 14738.0, 8049.0, 4574.0, 2725.0, 1616.0, 1015.0, 606.0, 391.0, 242.0, 166.0, 111.0, 84.0, 56.0, 27.0, 17.0, 12.0, 13.0, 11.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-54.125, -52.5517578125, -50.978515625, -49.4052734375, -47.83203125, -46.2587890625, -44.685546875, -43.1123046875, -41.5390625, -39.9658203125, -38.392578125, -36.8193359375, -35.24609375, -33.6728515625, -32.099609375, -30.5263671875, -28.953125, -27.3798828125, -25.806640625, -24.2333984375, -22.66015625, -21.0869140625, -19.513671875, -17.9404296875, -16.3671875, -14.7939453125, -13.220703125, -11.6474609375, -10.07421875, -8.5009765625, -6.927734375, -5.3544921875, -3.78125, -2.2080078125, -0.634765625, 0.9384765625, 2.51171875, 4.0849609375, 5.658203125, 7.2314453125, 8.8046875, 10.3779296875, 11.951171875, 13.5244140625, 15.09765625, 16.6708984375, 18.244140625, 19.8173828125, 21.390625, 22.9638671875, 24.537109375, 26.1103515625, 27.68359375, 29.2568359375, 30.830078125, 32.4033203125, 33.9765625, 35.5498046875, 37.123046875, 38.6962890625, 40.26953125, 41.8427734375, 43.416015625, 44.9892578125, 46.5625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 7.0, 6.0, 9.0, 15.0, 12.0, 10.0, 20.0, 21.0, 29.0, 44.0, 52.0, 61.0, 86.0, 98.0, 113.0, 167.0, 182.0, 215.0, 281.0, 314.0, 351.0, 354.0, 309.0, 234.0, 233.0, 161.0, 138.0, 119.0, 100.0, 67.0, 59.0, 49.0, 34.0, 30.0, 23.0, 17.0, 19.0, 12.0, 11.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-18.09375, -17.6011962890625, -17.108642578125, -16.6160888671875, -16.12353515625, -15.6309814453125, -15.138427734375, -14.6458740234375, -14.1533203125, -13.6607666015625, -13.168212890625, -12.6756591796875, -12.18310546875, -11.6905517578125, -11.197998046875, -10.7054443359375, -10.212890625, -9.7203369140625, -9.227783203125, -8.7352294921875, -8.24267578125, -7.7501220703125, -7.257568359375, -6.7650146484375, -6.2724609375, -5.7799072265625, -5.287353515625, -4.7947998046875, -4.30224609375, -3.8096923828125, -3.317138671875, -2.8245849609375, -2.33203125, -1.8394775390625, -1.346923828125, -0.8543701171875, -0.36181640625, 0.1307373046875, 0.623291015625, 1.1158447265625, 1.6083984375, 2.1009521484375, 2.593505859375, 3.0860595703125, 3.57861328125, 4.0711669921875, 4.563720703125, 5.0562744140625, 5.548828125, 6.0413818359375, 6.533935546875, 7.0264892578125, 7.51904296875, 8.0115966796875, 8.504150390625, 8.9967041015625, 9.4892578125, 9.9818115234375, 10.474365234375, 10.9669189453125, 11.45947265625, 11.9520263671875, 12.444580078125, 12.9371337890625, 13.4296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 9.0, 6.0, 10.0, 7.0, 9.0, 14.0, 12.0, 14.0, 19.0, 29.0, 42.0, 43.0, 44.0, 64.0, 72.0, 74.0, 73.0, 64.0, 60.0, 50.0, 48.0, 41.0, 29.0, 25.0, 38.0, 19.0, 18.0, 18.0, 9.0, 5.0, 8.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.86423110961914, -39.64664840698242, -38.42906188964844, -37.21147918701172, -35.993896484375, -34.77631378173828, -33.5587272644043, -32.34114456176758, -31.123559951782227, -29.905975341796875, -28.688392639160156, -27.470808029174805, -26.253223419189453, -25.035640716552734, -23.818056106567383, -22.60047149658203, -21.382888793945312, -20.16530418395996, -18.947721481323242, -17.73013687133789, -16.512554168701172, -15.29496955871582, -14.077384948730469, -12.859801292419434, -11.642217636108398, -10.424633979797363, -9.207050323486328, -7.989465713500977, -6.771882057189941, -5.554298400878906, -4.336714267730713, -3.1191301345825195, -1.9015426635742188, -0.6839587688446045, 0.5336251258850098, 1.751209020614624, 2.9687929153442383, 4.186376571655273, 5.403960704803467, 6.62154483795166, 7.839128494262695, 9.05671215057373, 10.274295806884766, 11.491880416870117, 12.709464073181152, 13.927047729492188, 15.144632339477539, 16.36221694946289, 17.57979965209961, 18.79738426208496, 20.01496696472168, 21.23255157470703, 22.45013427734375, 23.6677188873291, 24.885303497314453, 26.102886199951172, 27.320470809936523, 28.538055419921875, 29.755638122558594, 30.973222732543945, 32.1908073425293, 33.408390045166016, 34.625972747802734, 35.84355926513672, 37.06114196777344]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 10.0, 18.0, 19.0, 32.0, 19.0, 27.0, 33.0, 29.0, 26.0, 37.0, 30.0, 40.0, 46.0, 41.0, 43.0, 41.0, 37.0, 51.0, 37.0, 44.0, 40.0, 27.0, 31.0, 43.0, 21.0, 30.0, 17.0, 16.0, 19.0, 15.0, 7.0, 14.0, 10.0, 4.0, 3.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.64574432373047, -41.444091796875, -40.24243927001953, -39.04078674316406, -37.839134216308594, -36.63748550415039, -35.43583297729492, -34.23418045043945, -33.032527923583984, -31.830875396728516, -30.629222869873047, -29.42757225036621, -28.225919723510742, -27.024267196655273, -25.822616577148438, -24.62096405029297, -23.4193115234375, -22.21765899658203, -21.016006469726562, -19.814355850219727, -18.612703323364258, -17.41105079650879, -16.209400177001953, -15.007747650146484, -13.806095123291016, -12.604442596435547, -11.402791023254395, -10.201139450073242, -8.999486923217773, -7.797834873199463, -6.596182823181152, -5.39453125, -4.192882537841797, -2.9912304878234863, -1.7895784378051758, -0.5879263877868652, 0.6137256622314453, 1.8153777122497559, 3.0170297622680664, 4.218681335449219, 5.4203338623046875, 6.621985912322998, 7.823637962341309, 9.025289535522461, 10.22694206237793, 11.428594589233398, 12.63024616241455, 13.831897735595703, 15.033550262451172, 16.23520278930664, 17.43685531616211, 18.638505935668945, 19.840158462524414, 21.041810989379883, 22.24346160888672, 23.445114135742188, 24.646766662597656, 25.848419189453125, 27.050071716308594, 28.25172233581543, 29.4533748626709, 30.655027389526367, 31.856678009033203, 33.05833053588867, 34.25998306274414]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 11.0, 16.0, 22.0, 27.0, 28.0, 48.0, 89.0, 122.0, 177.0, 284.0, 360.0, 544.0, 813.0, 1276.0, 1832.0, 2682.0, 4327.0, 6478.0, 9975.0, 15518.0, 24432.0, 39346.0, 67176.0, 128860.0, 295937.0, 210478.0, 95300.0, 53253.0, 31746.0, 20216.0, 12879.0, 8318.0, 5354.0, 3552.0, 2350.0, 1562.0, 1010.0, 692.0, 474.0, 342.0, 217.0, 152.0, 95.0, 63.0, 44.0, 35.0, 15.0, 13.0, 11.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.25, -11.8387451171875, -11.427490234375, -11.0162353515625, -10.60498046875, -10.1937255859375, -9.782470703125, -9.3712158203125, -8.9599609375, -8.5487060546875, -8.137451171875, -7.7261962890625, -7.31494140625, -6.9036865234375, -6.492431640625, -6.0811767578125, -5.669921875, -5.2586669921875, -4.847412109375, -4.4361572265625, -4.02490234375, -3.6136474609375, -3.202392578125, -2.7911376953125, -2.3798828125, -1.9686279296875, -1.557373046875, -1.1461181640625, -0.73486328125, -0.3236083984375, 0.087646484375, 0.4989013671875, 0.91015625, 1.3214111328125, 1.732666015625, 2.1439208984375, 2.55517578125, 2.9664306640625, 3.377685546875, 3.7889404296875, 4.2001953125, 4.6114501953125, 5.022705078125, 5.4339599609375, 5.84521484375, 6.2564697265625, 6.667724609375, 7.0789794921875, 7.490234375, 7.9014892578125, 8.312744140625, 8.7239990234375, 9.13525390625, 9.5465087890625, 9.957763671875, 10.3690185546875, 10.7802734375, 11.1915283203125, 11.602783203125, 12.0140380859375, 12.42529296875, 12.8365478515625, 13.247802734375, 13.6590576171875, 14.0703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 8.0, 4.0, 5.0, 7.0, 7.0, 13.0, 23.0, 18.0, 26.0, 21.0, 34.0, 27.0, 30.0, 32.0, 33.0, 37.0, 52.0, 47.0, 42.0, 47.0, 47.0, 47.0, 47.0, 30.0, 44.0, 29.0, 31.0, 34.0, 33.0, 20.0, 26.0, 20.0, 15.0, 10.0, 6.0, 13.0, 12.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-44.8125, -43.5634765625, -42.314453125, -41.0654296875, -39.81640625, -38.5673828125, -37.318359375, -36.0693359375, -34.8203125, -33.5712890625, -32.322265625, -31.0732421875, -29.82421875, -28.5751953125, -27.326171875, -26.0771484375, -24.828125, -23.5791015625, -22.330078125, -21.0810546875, -19.83203125, -18.5830078125, -17.333984375, -16.0849609375, -14.8359375, -13.5869140625, -12.337890625, -11.0888671875, -9.83984375, -8.5908203125, -7.341796875, -6.0927734375, -4.84375, -3.5947265625, -2.345703125, -1.0966796875, 0.15234375, 1.4013671875, 2.650390625, 3.8994140625, 5.1484375, 6.3974609375, 7.646484375, 8.8955078125, 10.14453125, 11.3935546875, 12.642578125, 13.8916015625, 15.140625, 16.3896484375, 17.638671875, 18.8876953125, 20.13671875, 21.3857421875, 22.634765625, 23.8837890625, 25.1328125, 26.3818359375, 27.630859375, 28.8798828125, 30.12890625, 31.3779296875, 32.626953125, 33.8759765625, 35.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 12.0, 11.0, 12.0, 32.0, 50.0, 59.0, 96.0, 129.0, 199.0, 288.0, 414.0, 613.0, 798.0, 1133.0, 1679.0, 2429.0, 3723.0, 5706.0, 9704.0, 18688.0, 59409.0, 621852.0, 246602.0, 36917.0, 14574.0, 8017.0, 5032.0, 3252.0, 2215.0, 1476.0, 1023.0, 740.0, 529.0, 357.0, 258.0, 181.0, 115.0, 79.0, 54.0, 30.0, 19.0, 18.0, 13.0, 9.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1875, -14.678466796875, -14.16943359375, -13.660400390625, -13.1513671875, -12.642333984375, -12.13330078125, -11.624267578125, -11.115234375, -10.606201171875, -10.09716796875, -9.588134765625, -9.0791015625, -8.570068359375, -8.06103515625, -7.552001953125, -7.04296875, -6.533935546875, -6.02490234375, -5.515869140625, -5.0068359375, -4.497802734375, -3.98876953125, -3.479736328125, -2.970703125, -2.461669921875, -1.95263671875, -1.443603515625, -0.9345703125, -0.425537109375, 0.08349609375, 0.592529296875, 1.1015625, 1.610595703125, 2.11962890625, 2.628662109375, 3.1376953125, 3.646728515625, 4.15576171875, 4.664794921875, 5.173828125, 5.682861328125, 6.19189453125, 6.700927734375, 7.2099609375, 7.718994140625, 8.22802734375, 8.737060546875, 9.24609375, 9.755126953125, 10.26416015625, 10.773193359375, 11.2822265625, 11.791259765625, 12.30029296875, 12.809326171875, 13.318359375, 13.827392578125, 14.33642578125, 14.845458984375, 15.3544921875, 15.863525390625, 16.37255859375, 16.881591796875, 17.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 9.0, 11.0, 3.0, 14.0, 11.0, 14.0, 12.0, 16.0, 20.0, 28.0, 28.0, 26.0, 25.0, 35.0, 32.0, 32.0, 39.0, 40.0, 43.0, 42.0, 49.0, 44.0, 29.0, 37.0, 40.0, 33.0, 39.0, 29.0, 26.0, 39.0, 15.0, 28.0, 10.0, 19.0, 19.0, 14.0, 12.0, 11.0, 9.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.810546875, -22.99609375, -22.181640625, -21.3671875, -20.552734375, -19.73828125, -18.923828125, -18.109375, -17.294921875, -16.48046875, -15.666015625, -14.8515625, -14.037109375, -13.22265625, -12.408203125, -11.59375, -10.779296875, -9.96484375, -9.150390625, -8.3359375, -7.521484375, -6.70703125, -5.892578125, -5.078125, -4.263671875, -3.44921875, -2.634765625, -1.8203125, -1.005859375, -0.19140625, 0.623046875, 1.4375, 2.251953125, 3.06640625, 3.880859375, 4.6953125, 5.509765625, 6.32421875, 7.138671875, 7.953125, 8.767578125, 9.58203125, 10.396484375, 11.2109375, 12.025390625, 12.83984375, 13.654296875, 14.46875, 15.283203125, 16.09765625, 16.912109375, 17.7265625, 18.541015625, 19.35546875, 20.169921875, 20.984375, 21.798828125, 22.61328125, 23.427734375, 24.2421875, 25.056640625, 25.87109375, 26.685546875, 27.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 19.0, 21.0, 38.0, 62.0, 66.0, 105.0, 166.0, 266.0, 403.0, 643.0, 1162.0, 2042.0, 3844.0, 8198.0, 19319.0, 78904.0, 850255.0, 52076.0, 16106.0, 7026.0, 3387.0, 1750.0, 1024.0, 561.0, 408.0, 213.0, 159.0, 102.0, 53.0, 48.0, 40.0, 20.0, 21.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3671875, -2.300323486328125, -2.23345947265625, -2.166595458984375, -2.0997314453125, -2.032867431640625, -1.96600341796875, -1.899139404296875, -1.832275390625, -1.765411376953125, -1.69854736328125, -1.631683349609375, -1.5648193359375, -1.497955322265625, -1.43109130859375, -1.364227294921875, -1.29736328125, -1.230499267578125, -1.16363525390625, -1.096771240234375, -1.0299072265625, -0.963043212890625, -0.89617919921875, -0.829315185546875, -0.762451171875, -0.695587158203125, -0.62872314453125, -0.561859130859375, -0.4949951171875, -0.428131103515625, -0.36126708984375, -0.294403076171875, -0.2275390625, -0.160675048828125, -0.09381103515625, -0.026947021484375, 0.0399169921875, 0.106781005859375, 0.17364501953125, 0.240509033203125, 0.307373046875, 0.374237060546875, 0.44110107421875, 0.507965087890625, 0.5748291015625, 0.641693115234375, 0.70855712890625, 0.775421142578125, 0.84228515625, 0.909149169921875, 0.97601318359375, 1.042877197265625, 1.1097412109375, 1.176605224609375, 1.24346923828125, 1.310333251953125, 1.377197265625, 1.444061279296875, 1.51092529296875, 1.577789306640625, 1.6446533203125, 1.711517333984375, 1.77838134765625, 1.845245361328125, 1.912109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 8.0, 6.0, 6.0, 10.0, 15.0, 16.0, 24.0, 30.0, 39.0, 44.0, 45.0, 55.0, 55.0, 57.0, 57.0, 68.0, 61.0, 67.0, 46.0, 56.0, 30.0, 33.0, 31.0, 27.0, 17.0, 13.0, 17.0, 15.0, 7.0, 2.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010657310485839844, -0.00010285340249538422, -9.913370013237e-05, -9.541399776935577e-05, -9.169429540634155e-05, -8.797459304332733e-05, -8.425489068031311e-05, -8.053518831729889e-05, -7.681548595428467e-05, -7.309578359127045e-05, -6.937608122825623e-05, -6.5656378865242e-05, -6.193667650222778e-05, -5.821697413921356e-05, -5.449727177619934e-05, -5.077756941318512e-05, -4.70578670501709e-05, -4.333816468715668e-05, -3.9618462324142456e-05, -3.5898759961128235e-05, -3.2179057598114014e-05, -2.8459355235099792e-05, -2.473965287208557e-05, -2.101995050907135e-05, -1.730024814605713e-05, -1.3580545783042908e-05, -9.860843420028687e-06, -6.141141057014465e-06, -2.421438694000244e-06, 1.298263669013977e-06, 5.017966032028198e-06, 8.73766839504242e-06, 1.245737075805664e-05, 1.6177073121070862e-05, 1.9896775484085083e-05, 2.3616477847099304e-05, 2.7336180210113525e-05, 3.1055882573127747e-05, 3.477558493614197e-05, 3.849528729915619e-05, 4.221498966217041e-05, 4.593469202518463e-05, 4.965439438819885e-05, 5.3374096751213074e-05, 5.7093799114227295e-05, 6.0813501477241516e-05, 6.453320384025574e-05, 6.825290620326996e-05, 7.197260856628418e-05, 7.56923109292984e-05, 7.941201329231262e-05, 8.313171565532684e-05, 8.685141801834106e-05, 9.057112038135529e-05, 9.429082274436951e-05, 9.801052510738373e-05, 0.00010173022747039795, 0.00010544992983341217, 0.00010916963219642639, 0.00011288933455944061, 0.00011660903692245483, 0.00012032873928546906, 0.00012404844164848328, 0.0001277681440114975, 0.00013148784637451172]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 10.0, 7.0, 14.0, 21.0, 33.0, 57.0, 69.0, 101.0, 175.0, 284.0, 389.0, 588.0, 910.0, 1406.0, 2179.0, 3305.0, 5198.0, 8086.0, 12698.0, 20802.0, 35033.0, 62811.0, 115887.0, 212500.0, 240877.0, 141461.0, 76049.0, 42261.0, 24416.0, 15040.0, 9361.0, 5685.0, 3701.0, 2439.0, 1545.0, 1097.0, 713.0, 492.0, 295.0, 191.0, 130.0, 87.0, 48.0, 33.0, 28.0, 21.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.197265625, -1.1600341796875, -1.122802734375, -1.0855712890625, -1.04833984375, -1.0111083984375, -0.973876953125, -0.9366455078125, -0.8994140625, -0.8621826171875, -0.824951171875, -0.7877197265625, -0.75048828125, -0.7132568359375, -0.676025390625, -0.6387939453125, -0.6015625, -0.5643310546875, -0.527099609375, -0.4898681640625, -0.45263671875, -0.4154052734375, -0.378173828125, -0.3409423828125, -0.3037109375, -0.2664794921875, -0.229248046875, -0.1920166015625, -0.15478515625, -0.1175537109375, -0.080322265625, -0.0430908203125, -0.005859375, 0.0313720703125, 0.068603515625, 0.1058349609375, 0.14306640625, 0.1802978515625, 0.217529296875, 0.2547607421875, 0.2919921875, 0.3292236328125, 0.366455078125, 0.4036865234375, 0.44091796875, 0.4781494140625, 0.515380859375, 0.5526123046875, 0.58984375, 0.6270751953125, 0.664306640625, 0.7015380859375, 0.73876953125, 0.7760009765625, 0.813232421875, 0.8504638671875, 0.8876953125, 0.9249267578125, 0.962158203125, 0.9993896484375, 1.03662109375, 1.0738525390625, 1.111083984375, 1.1483154296875, 1.185546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 10.0, 5.0, 10.0, 10.0, 12.0, 16.0, 11.0, 19.0, 28.0, 21.0, 40.0, 26.0, 39.0, 45.0, 61.0, 60.0, 55.0, 66.0, 47.0, 64.0, 40.0, 43.0, 35.0, 39.0, 24.0, 30.0, 18.0, 14.0, 18.0, 15.0, 15.0, 8.0, 11.0, 12.0, 4.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.416015625, -0.40087890625, -0.3857421875, -0.37060546875, -0.35546875, -0.34033203125, -0.3251953125, -0.31005859375, -0.294921875, -0.27978515625, -0.2646484375, -0.24951171875, -0.234375, -0.21923828125, -0.2041015625, -0.18896484375, -0.173828125, -0.15869140625, -0.1435546875, -0.12841796875, -0.11328125, -0.09814453125, -0.0830078125, -0.06787109375, -0.052734375, -0.03759765625, -0.0224609375, -0.00732421875, 0.0078125, 0.02294921875, 0.0380859375, 0.05322265625, 0.068359375, 0.08349609375, 0.0986328125, 0.11376953125, 0.12890625, 0.14404296875, 0.1591796875, 0.17431640625, 0.189453125, 0.20458984375, 0.2197265625, 0.23486328125, 0.25, 0.26513671875, 0.2802734375, 0.29541015625, 0.310546875, 0.32568359375, 0.3408203125, 0.35595703125, 0.37109375, 0.38623046875, 0.4013671875, 0.41650390625, 0.431640625, 0.44677734375, 0.4619140625, 0.47705078125, 0.4921875, 0.50732421875, 0.5224609375, 0.53759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 6.0, 7.0, 11.0, 15.0, 18.0, 19.0, 28.0, 25.0, 48.0, 60.0, 59.0, 75.0, 73.0, 72.0, 56.0, 67.0, 62.0, 45.0, 32.0, 40.0, 32.0, 32.0, 18.0, 20.0, 15.0, 12.0, 6.0, 6.0, 9.0, 8.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.30769729614258, -44.071327209472656, -42.834957122802734, -41.59859085083008, -40.362220764160156, -39.125850677490234, -37.88948059082031, -36.65311050415039, -35.41674041748047, -34.18037033081055, -32.944000244140625, -31.707632064819336, -30.471263885498047, -29.234893798828125, -27.998523712158203, -26.76215362548828, -25.525787353515625, -24.289417266845703, -23.053049087524414, -21.816679000854492, -20.580310821533203, -19.34394073486328, -18.10757064819336, -16.871200561523438, -15.634832382202148, -14.398463249206543, -13.162094116210938, -11.925724029541016, -10.68935489654541, -9.452985763549805, -8.216615676879883, -6.980246543884277, -5.743877410888672, -4.507508277893066, -3.2711386680603027, -2.034769296646118, -0.7983999252319336, 0.4379692077636719, 1.6743388175964355, 2.910708427429199, 4.147077560424805, 5.38344669342041, 6.619816303253174, 7.8561859130859375, 9.092555046081543, 10.328924179077148, 11.56529426574707, 12.801663398742676, 14.038032531738281, 15.274401664733887, 16.510770797729492, 17.747140884399414, 18.983509063720703, 20.219879150390625, 21.456249237060547, 22.69261932373047, 23.928987503051758, 25.16535758972168, 26.40172576904297, 27.63809585571289, 28.874465942382812, 30.1108341217041, 31.347204208374023, 32.58357238769531, 33.819942474365234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 11.0, 8.0, 9.0, 16.0, 22.0, 31.0, 21.0, 25.0, 35.0, 27.0, 27.0, 37.0, 27.0, 39.0, 49.0, 42.0, 40.0, 45.0, 35.0, 48.0, 41.0, 42.0, 43.0, 25.0, 32.0, 42.0, 23.0, 25.0, 23.0, 15.0, 17.0, 15.0, 11.0, 11.0, 10.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.921695709228516, -40.73655319213867, -39.55141067504883, -38.36627197265625, -37.181129455566406, -35.99598693847656, -34.81084442138672, -33.625701904296875, -32.44055938720703, -31.255416870117188, -30.070276260375977, -28.885133743286133, -27.699993133544922, -26.514850616455078, -25.329708099365234, -24.14456558227539, -22.959426879882812, -21.77428436279297, -20.589143753051758, -19.404001235961914, -18.218860626220703, -17.03371810913086, -15.848575592041016, -14.663434028625488, -13.478292465209961, -12.293150901794434, -11.108009338378906, -9.922866821289062, -8.737725257873535, -7.552583694458008, -6.367441654205322, -5.182299613952637, -3.9971580505371094, -2.812016248703003, -1.6268744468688965, -0.44173264503479004, 0.7434091567993164, 1.9285507202148438, 3.1136927604675293, 4.298834800720215, 5.483976364135742, 6.6691179275512695, 7.854259967803955, 9.03940200805664, 10.224543571472168, 11.409685134887695, 12.594827651977539, 13.779969215393066, 14.965110778808594, 16.150253295898438, 17.33539390563965, 18.520536422729492, 19.705677032470703, 20.890819549560547, 22.07596206665039, 23.261104583740234, 24.446245193481445, 25.63138771057129, 26.8165283203125, 28.001670837402344, 29.186813354492188, 30.3719539642334, 31.557096481323242, 32.74223709106445, 33.9273796081543]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 11.0, 28.0, 30.0, 46.0, 86.0, 103.0, 153.0, 284.0, 450.0, 749.0, 1223.0, 1894.0, 3098.0, 5300.0, 9160.0, 15612.0, 27023.0, 47604.0, 84836.0, 149208.0, 225623.0, 198985.0, 119578.0, 67377.0, 37616.0, 21401.0, 12438.0, 7308.0, 4448.0, 2627.0, 1613.0, 945.0, 606.0, 393.0, 245.0, 159.0, 107.0, 64.0, 31.0, 43.0, 15.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-52.5625, -51.09423828125, -49.6259765625, -48.15771484375, -46.689453125, -45.22119140625, -43.7529296875, -42.28466796875, -40.81640625, -39.34814453125, -37.8798828125, -36.41162109375, -34.943359375, -33.47509765625, -32.0068359375, -30.53857421875, -29.0703125, -27.60205078125, -26.1337890625, -24.66552734375, -23.197265625, -21.72900390625, -20.2607421875, -18.79248046875, -17.32421875, -15.85595703125, -14.3876953125, -12.91943359375, -11.451171875, -9.98291015625, -8.5146484375, -7.04638671875, -5.578125, -4.10986328125, -2.6416015625, -1.17333984375, 0.294921875, 1.76318359375, 3.2314453125, 4.69970703125, 6.16796875, 7.63623046875, 9.1044921875, 10.57275390625, 12.041015625, 13.50927734375, 14.9775390625, 16.44580078125, 17.9140625, 19.38232421875, 20.8505859375, 22.31884765625, 23.787109375, 25.25537109375, 26.7236328125, 28.19189453125, 29.66015625, 31.12841796875, 32.5966796875, 34.06494140625, 35.533203125, 37.00146484375, 38.4697265625, 39.93798828125, 41.40625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 14.0, 19.0, 21.0, 29.0, 21.0, 31.0, 27.0, 34.0, 42.0, 31.0, 41.0, 53.0, 43.0, 50.0, 42.0, 33.0, 52.0, 46.0, 45.0, 47.0, 27.0, 33.0, 28.0, 33.0, 27.0, 20.0, 15.0, 13.0, 10.0, 16.0, 10.0, 5.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-44.40625, -43.1826171875, -41.958984375, -40.7353515625, -39.51171875, -38.2880859375, -37.064453125, -35.8408203125, -34.6171875, -33.3935546875, -32.169921875, -30.9462890625, -29.72265625, -28.4990234375, -27.275390625, -26.0517578125, -24.828125, -23.6044921875, -22.380859375, -21.1572265625, -19.93359375, -18.7099609375, -17.486328125, -16.2626953125, -15.0390625, -13.8154296875, -12.591796875, -11.3681640625, -10.14453125, -8.9208984375, -7.697265625, -6.4736328125, -5.25, -4.0263671875, -2.802734375, -1.5791015625, -0.35546875, 0.8681640625, 2.091796875, 3.3154296875, 4.5390625, 5.7626953125, 6.986328125, 8.2099609375, 9.43359375, 10.6572265625, 11.880859375, 13.1044921875, 14.328125, 15.5517578125, 16.775390625, 17.9990234375, 19.22265625, 20.4462890625, 21.669921875, 22.8935546875, 24.1171875, 25.3408203125, 26.564453125, 27.7880859375, 29.01171875, 30.2353515625, 31.458984375, 32.6826171875, 33.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 10.0, 16.0, 22.0, 31.0, 54.0, 70.0, 123.0, 175.0, 286.0, 418.0, 762.0, 1185.0, 2068.0, 3155.0, 5330.0, 8860.0, 14698.0, 25547.0, 43898.0, 75236.0, 128402.0, 202312.0, 208056.0, 135677.0, 79535.0, 46112.0, 26705.0, 15945.0, 9351.0, 5766.0, 3419.0, 2060.0, 1287.0, 748.0, 488.0, 272.0, 166.0, 118.0, 71.0, 42.0, 34.0, 18.0, 10.0, 11.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.21875, -46.71435546875, -45.2099609375, -43.70556640625, -42.201171875, -40.69677734375, -39.1923828125, -37.68798828125, -36.18359375, -34.67919921875, -33.1748046875, -31.67041015625, -30.166015625, -28.66162109375, -27.1572265625, -25.65283203125, -24.1484375, -22.64404296875, -21.1396484375, -19.63525390625, -18.130859375, -16.62646484375, -15.1220703125, -13.61767578125, -12.11328125, -10.60888671875, -9.1044921875, -7.60009765625, -6.095703125, -4.59130859375, -3.0869140625, -1.58251953125, -0.078125, 1.42626953125, 2.9306640625, 4.43505859375, 5.939453125, 7.44384765625, 8.9482421875, 10.45263671875, 11.95703125, 13.46142578125, 14.9658203125, 16.47021484375, 17.974609375, 19.47900390625, 20.9833984375, 22.48779296875, 23.9921875, 25.49658203125, 27.0009765625, 28.50537109375, 30.009765625, 31.51416015625, 33.0185546875, 34.52294921875, 36.02734375, 37.53173828125, 39.0361328125, 40.54052734375, 42.044921875, 43.54931640625, 45.0537109375, 46.55810546875, 48.0625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 4.0, 5.0, 13.0, 11.0, 12.0, 20.0, 19.0, 23.0, 22.0, 31.0, 29.0, 39.0, 36.0, 36.0, 46.0, 35.0, 48.0, 41.0, 51.0, 43.0, 40.0, 47.0, 43.0, 39.0, 43.0, 30.0, 31.0, 26.0, 22.0, 18.0, 19.0, 13.0, 9.0, 8.0, 8.0, 5.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.046875, -24.247314453125, -23.44775390625, -22.648193359375, -21.8486328125, -21.049072265625, -20.24951171875, -19.449951171875, -18.650390625, -17.850830078125, -17.05126953125, -16.251708984375, -15.4521484375, -14.652587890625, -13.85302734375, -13.053466796875, -12.25390625, -11.454345703125, -10.65478515625, -9.855224609375, -9.0556640625, -8.256103515625, -7.45654296875, -6.656982421875, -5.857421875, -5.057861328125, -4.25830078125, -3.458740234375, -2.6591796875, -1.859619140625, -1.06005859375, -0.260498046875, 0.5390625, 1.338623046875, 2.13818359375, 2.937744140625, 3.7373046875, 4.536865234375, 5.33642578125, 6.135986328125, 6.935546875, 7.735107421875, 8.53466796875, 9.334228515625, 10.1337890625, 10.933349609375, 11.73291015625, 12.532470703125, 13.33203125, 14.131591796875, 14.93115234375, 15.730712890625, 16.5302734375, 17.329833984375, 18.12939453125, 18.928955078125, 19.728515625, 20.528076171875, 21.32763671875, 22.127197265625, 22.9267578125, 23.726318359375, 24.52587890625, 25.325439453125, 26.125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 7.0, 15.0, 14.0, 12.0, 34.0, 41.0, 82.0, 117.0, 134.0, 233.0, 335.0, 496.0, 784.0, 1164.0, 1878.0, 2988.0, 4936.0, 8175.0, 13709.0, 24187.0, 42858.0, 78231.0, 145393.0, 243020.0, 212395.0, 117993.0, 64116.0, 35448.0, 19949.0, 11413.0, 7003.0, 4056.0, 2606.0, 1584.0, 1101.0, 682.0, 443.0, 288.0, 195.0, 136.0, 102.0, 59.0, 34.0, 38.0, 22.0, 21.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-16.28125, -15.800048828125, -15.31884765625, -14.837646484375, -14.3564453125, -13.875244140625, -13.39404296875, -12.912841796875, -12.431640625, -11.950439453125, -11.46923828125, -10.988037109375, -10.5068359375, -10.025634765625, -9.54443359375, -9.063232421875, -8.58203125, -8.100830078125, -7.61962890625, -7.138427734375, -6.6572265625, -6.176025390625, -5.69482421875, -5.213623046875, -4.732421875, -4.251220703125, -3.77001953125, -3.288818359375, -2.8076171875, -2.326416015625, -1.84521484375, -1.364013671875, -0.8828125, -0.401611328125, 0.07958984375, 0.560791015625, 1.0419921875, 1.523193359375, 2.00439453125, 2.485595703125, 2.966796875, 3.447998046875, 3.92919921875, 4.410400390625, 4.8916015625, 5.372802734375, 5.85400390625, 6.335205078125, 6.81640625, 7.297607421875, 7.77880859375, 8.260009765625, 8.7412109375, 9.222412109375, 9.70361328125, 10.184814453125, 10.666015625, 11.147216796875, 11.62841796875, 12.109619140625, 12.5908203125, 13.072021484375, 13.55322265625, 14.034423828125, 14.515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 10.0, 9.0, 28.0, 37.0, 24.0, 54.0, 61.0, 83.0, 101.0, 131.0, 123.0, 74.0, 62.0, 39.0, 45.0, 24.0, 26.0, 13.0, 10.0, 6.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00222015380859375, -0.0021537840366363525, -0.002087414264678955, -0.0020210444927215576, -0.00195467472076416, -0.0018883049488067627, -0.0018219351768493652, -0.0017555654048919678, -0.0016891956329345703, -0.0016228258609771729, -0.0015564560890197754, -0.001490086317062378, -0.0014237165451049805, -0.001357346773147583, -0.0012909770011901855, -0.001224607229232788, -0.0011582374572753906, -0.0010918676853179932, -0.0010254979133605957, -0.0009591281414031982, -0.0008927583694458008, -0.0008263885974884033, -0.0007600188255310059, -0.0006936490535736084, -0.0006272792816162109, -0.0005609095096588135, -0.000494539737701416, -0.00042816996574401855, -0.0003618001937866211, -0.00029543042182922363, -0.00022906064987182617, -0.0001626908779144287, -9.632110595703125e-05, -2.995133399963379e-05, 3.641843795776367e-05, 0.00010278820991516113, 0.0001691579818725586, 0.00023552775382995605, 0.0003018975257873535, 0.000368267297744751, 0.00043463706970214844, 0.0005010068416595459, 0.0005673766136169434, 0.0006337463855743408, 0.0007001161575317383, 0.0007664859294891357, 0.0008328557014465332, 0.0008992254734039307, 0.0009655952453613281, 0.0010319650173187256, 0.001098334789276123, 0.0011647045612335205, 0.001231074333190918, 0.0012974441051483154, 0.0013638138771057129, 0.0014301836490631104, 0.0014965534210205078, 0.0015629231929779053, 0.0016292929649353027, 0.0016956627368927002, 0.0017620325088500977, 0.0018284022808074951, 0.0018947720527648926, 0.00196114182472229, 0.0020275115966796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 8.0, 11.0, 15.0, 19.0, 32.0, 56.0, 92.0, 123.0, 134.0, 208.0, 345.0, 441.0, 683.0, 972.0, 1431.0, 2027.0, 3102.0, 4467.0, 6479.0, 9991.0, 14856.0, 23054.0, 36585.0, 58885.0, 96033.0, 151804.0, 195102.0, 161571.0, 104013.0, 63434.0, 39148.0, 25054.0, 15894.0, 10520.0, 7157.0, 4816.0, 3151.0, 2089.0, 1517.0, 1065.0, 693.0, 467.0, 314.0, 203.0, 158.0, 114.0, 79.0, 42.0, 28.0, 20.0, 17.0, 15.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.2578125, -11.8433837890625, -11.428955078125, -11.0145263671875, -10.60009765625, -10.1856689453125, -9.771240234375, -9.3568115234375, -8.9423828125, -8.5279541015625, -8.113525390625, -7.6990966796875, -7.28466796875, -6.8702392578125, -6.455810546875, -6.0413818359375, -5.626953125, -5.2125244140625, -4.798095703125, -4.3836669921875, -3.96923828125, -3.5548095703125, -3.140380859375, -2.7259521484375, -2.3115234375, -1.8970947265625, -1.482666015625, -1.0682373046875, -0.65380859375, -0.2393798828125, 0.175048828125, 0.5894775390625, 1.00390625, 1.4183349609375, 1.832763671875, 2.2471923828125, 2.66162109375, 3.0760498046875, 3.490478515625, 3.9049072265625, 4.3193359375, 4.7337646484375, 5.148193359375, 5.5626220703125, 5.97705078125, 6.3914794921875, 6.805908203125, 7.2203369140625, 7.634765625, 8.0491943359375, 8.463623046875, 8.8780517578125, 9.29248046875, 9.7069091796875, 10.121337890625, 10.5357666015625, 10.9501953125, 11.3646240234375, 11.779052734375, 12.1934814453125, 12.60791015625, 13.0223388671875, 13.436767578125, 13.8511962890625, 14.265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 5.0, 8.0, 18.0, 10.0, 20.0, 22.0, 25.0, 23.0, 27.0, 31.0, 44.0, 53.0, 48.0, 48.0, 36.0, 55.0, 40.0, 62.0, 54.0, 44.0, 34.0, 52.0, 33.0, 31.0, 29.0, 20.0, 25.0, 14.0, 15.0, 9.0, 6.0, 8.0, 10.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.10687255859375, -4.9364013671875, -4.76593017578125, -4.595458984375, -4.42498779296875, -4.2545166015625, -4.08404541015625, -3.91357421875, -3.74310302734375, -3.5726318359375, -3.40216064453125, -3.231689453125, -3.06121826171875, -2.8907470703125, -2.72027587890625, -2.5498046875, -2.37933349609375, -2.2088623046875, -2.03839111328125, -1.867919921875, -1.69744873046875, -1.5269775390625, -1.35650634765625, -1.18603515625, -1.01556396484375, -0.8450927734375, -0.67462158203125, -0.504150390625, -0.33367919921875, -0.1632080078125, 0.00726318359375, 0.177734375, 0.34820556640625, 0.5186767578125, 0.68914794921875, 0.859619140625, 1.03009033203125, 1.2005615234375, 1.37103271484375, 1.54150390625, 1.71197509765625, 1.8824462890625, 2.05291748046875, 2.223388671875, 2.39385986328125, 2.5643310546875, 2.73480224609375, 2.9052734375, 3.07574462890625, 3.2462158203125, 3.41668701171875, 3.587158203125, 3.75762939453125, 3.9281005859375, 4.09857177734375, 4.26904296875, 4.43951416015625, 4.6099853515625, 4.78045654296875, 4.950927734375, 5.12139892578125, 5.2918701171875, 5.46234130859375, 5.6328125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 8.0, 6.0, 8.0, 6.0, 12.0, 15.0, 18.0, 27.0, 43.0, 39.0, 39.0, 42.0, 61.0, 61.0, 53.0, 72.0, 70.0, 50.0, 50.0, 48.0, 45.0, 31.0, 40.0, 32.0, 20.0, 17.0, 13.0, 12.0, 9.0, 9.0, 10.0, 4.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-41.44779968261719, -40.31585693359375, -39.18391418457031, -38.051971435546875, -36.9200325012207, -35.788089752197266, -34.65614700317383, -33.52420425415039, -32.39226150512695, -31.260318756103516, -30.12837791442871, -28.996435165405273, -27.864492416381836, -26.73255157470703, -25.600608825683594, -24.468666076660156, -23.33672523498535, -22.204782485961914, -21.07284164428711, -19.940898895263672, -18.808956146240234, -17.677013397216797, -16.545072555541992, -15.413129806518555, -14.281188011169434, -13.149246215820312, -12.017303466796875, -10.885361671447754, -9.753419876098633, -8.621477127075195, -7.489535331726074, -6.357593059539795, -5.225648880004883, -4.0937066078186035, -2.9617645740509033, -1.8298225402832031, -0.6978802680969238, 0.43406200408935547, 1.5660037994384766, 2.697946071624756, 3.829888343811035, 4.9618306159973145, 6.093772888183594, 7.225714683532715, 8.357656478881836, 9.489599227905273, 10.621541023254395, 11.753482818603516, 12.885425567626953, 14.017367362976074, 15.149310111999512, 16.281251907348633, 17.41319465637207, 18.545135498046875, 19.677078247070312, 20.80902099609375, 21.940963745117188, 23.072906494140625, 24.20484733581543, 25.336790084838867, 26.468732833862305, 27.60067367553711, 28.732616424560547, 29.864559173583984, 30.99650001525879]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 0.0, 6.0, 8.0, 7.0, 14.0, 10.0, 14.0, 14.0, 22.0, 21.0, 20.0, 27.0, 26.0, 43.0, 40.0, 33.0, 36.0, 47.0, 36.0, 42.0, 37.0, 49.0, 26.0, 43.0, 39.0, 40.0, 44.0, 30.0, 27.0, 31.0, 21.0, 22.0, 20.0, 20.0, 15.0, 7.0, 11.0, 14.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0], "bins": [-44.825984954833984, -43.59872055053711, -42.3714599609375, -41.144195556640625, -39.91693115234375, -38.689666748046875, -37.46240234375, -36.23514175415039, -35.007877349853516, -33.78061294555664, -32.55335235595703, -31.326087951660156, -30.09882354736328, -28.871559143066406, -27.644296646118164, -26.417034149169922, -25.189769744873047, -23.962505340576172, -22.73524284362793, -21.507980346679688, -20.280715942382812, -19.053451538085938, -17.826189041137695, -16.598926544189453, -15.371662139892578, -14.14439868927002, -12.917135238647461, -11.689871788024902, -10.462608337402344, -9.235344886779785, -8.008081436157227, -6.780817985534668, -5.553554534912109, -4.326291084289551, -3.099027633666992, -1.8717641830444336, -0.644500732421875, 0.5827627182006836, 1.8100261688232422, 3.037289619445801, 4.264553070068359, 5.491816520690918, 6.719079971313477, 7.946343421936035, 9.173606872558594, 10.400870323181152, 11.628133773803711, 12.85539722442627, 14.082660675048828, 15.309924125671387, 16.537187576293945, 17.764450073242188, 18.991714477539062, 20.218978881835938, 21.44624137878418, 22.673503875732422, 23.900768280029297, 25.128032684326172, 26.355295181274414, 27.582557678222656, 28.80982208251953, 30.037086486816406, 31.26434898376465, 32.49161148071289, 33.718875885009766]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 14.0, 26.0, 29.0, 60.0, 80.0, 148.0, 197.0, 313.0, 540.0, 907.0, 1627.0, 2678.0, 4898.0, 9039.0, 17128.0, 33968.0, 74075.0, 198409.0, 624795.0, 1512840.0, 1116349.0, 370514.0, 122305.0, 51243.0, 24210.0, 12264.0, 6486.0, 3693.0, 2086.0, 1214.0, 748.0, 483.0, 299.0, 206.0, 116.0, 97.0, 49.0, 30.0, 30.0, 14.0, 14.0, 10.0, 12.0, 5.0, 1.0, 2.0, 0.0, 3.0], "bins": [-55.84375, -54.28271484375, -52.7216796875, -51.16064453125, -49.599609375, -48.03857421875, -46.4775390625, -44.91650390625, -43.35546875, -41.79443359375, -40.2333984375, -38.67236328125, -37.111328125, -35.55029296875, -33.9892578125, -32.42822265625, -30.8671875, -29.30615234375, -27.7451171875, -26.18408203125, -24.623046875, -23.06201171875, -21.5009765625, -19.93994140625, -18.37890625, -16.81787109375, -15.2568359375, -13.69580078125, -12.134765625, -10.57373046875, -9.0126953125, -7.45166015625, -5.890625, -4.32958984375, -2.7685546875, -1.20751953125, 0.353515625, 1.91455078125, 3.4755859375, 5.03662109375, 6.59765625, 8.15869140625, 9.7197265625, 11.28076171875, 12.841796875, 14.40283203125, 15.9638671875, 17.52490234375, 19.0859375, 20.64697265625, 22.2080078125, 23.76904296875, 25.330078125, 26.89111328125, 28.4521484375, 30.01318359375, 31.57421875, 33.13525390625, 34.6962890625, 36.25732421875, 37.818359375, 39.37939453125, 40.9404296875, 42.50146484375, 44.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 11.0, 8.0, 14.0, 11.0, 19.0, 15.0, 19.0, 23.0, 27.0, 35.0, 36.0, 42.0, 26.0, 43.0, 44.0, 55.0, 36.0, 37.0, 40.0, 50.0, 44.0, 46.0, 36.0, 40.0, 29.0, 25.0, 18.0, 30.0, 22.0, 19.0, 8.0, 15.0, 13.0, 10.0, 9.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0], "bins": [-41.90625, -40.759765625, -39.61328125, -38.466796875, -37.3203125, -36.173828125, -35.02734375, -33.880859375, -32.734375, -31.587890625, -30.44140625, -29.294921875, -28.1484375, -27.001953125, -25.85546875, -24.708984375, -23.5625, -22.416015625, -21.26953125, -20.123046875, -18.9765625, -17.830078125, -16.68359375, -15.537109375, -14.390625, -13.244140625, -12.09765625, -10.951171875, -9.8046875, -8.658203125, -7.51171875, -6.365234375, -5.21875, -4.072265625, -2.92578125, -1.779296875, -0.6328125, 0.513671875, 1.66015625, 2.806640625, 3.953125, 5.099609375, 6.24609375, 7.392578125, 8.5390625, 9.685546875, 10.83203125, 11.978515625, 13.125, 14.271484375, 15.41796875, 16.564453125, 17.7109375, 18.857421875, 20.00390625, 21.150390625, 22.296875, 23.443359375, 24.58984375, 25.736328125, 26.8828125, 28.029296875, 29.17578125, 30.322265625, 31.46875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 5.0, 5.0, 6.0, 11.0, 13.0, 20.0, 31.0, 41.0, 56.0, 85.0, 123.0, 149.0, 234.0, 361.0, 461.0, 691.0, 1043.0, 1515.0, 2126.0, 3273.0, 4918.0, 7572.0, 11573.0, 18861.0, 30677.0, 51646.0, 88587.0, 160155.0, 302681.0, 604025.0, 1131380.0, 847756.0, 419416.0, 216546.0, 117259.0, 66427.0, 39167.0, 23342.0, 14690.0, 9328.0, 5910.0, 3900.0, 2585.0, 1753.0, 1168.0, 831.0, 583.0, 382.0, 279.0, 211.0, 138.0, 88.0, 68.0, 38.0, 35.0, 25.0, 19.0, 15.0, 6.0, 9.0, 1.0, 2.0, 2.0], "bins": [-37.90625, -36.7119140625, -35.517578125, -34.3232421875, -33.12890625, -31.9345703125, -30.740234375, -29.5458984375, -28.3515625, -27.1572265625, -25.962890625, -24.7685546875, -23.57421875, -22.3798828125, -21.185546875, -19.9912109375, -18.796875, -17.6025390625, -16.408203125, -15.2138671875, -14.01953125, -12.8251953125, -11.630859375, -10.4365234375, -9.2421875, -8.0478515625, -6.853515625, -5.6591796875, -4.46484375, -3.2705078125, -2.076171875, -0.8818359375, 0.3125, 1.5068359375, 2.701171875, 3.8955078125, 5.08984375, 6.2841796875, 7.478515625, 8.6728515625, 9.8671875, 11.0615234375, 12.255859375, 13.4501953125, 14.64453125, 15.8388671875, 17.033203125, 18.2275390625, 19.421875, 20.6162109375, 21.810546875, 23.0048828125, 24.19921875, 25.3935546875, 26.587890625, 27.7822265625, 28.9765625, 30.1708984375, 31.365234375, 32.5595703125, 33.75390625, 34.9482421875, 36.142578125, 37.3369140625, 38.53125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 6.0, 13.0, 17.0, 23.0, 39.0, 50.0, 66.0, 58.0, 86.0, 97.0, 106.0, 174.0, 184.0, 230.0, 269.0, 302.0, 339.0, 335.0, 296.0, 258.0, 220.0, 185.0, 149.0, 115.0, 79.0, 75.0, 52.0, 50.0, 38.0, 31.0, 29.0, 13.0, 19.0, 16.0, 6.0, 7.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.40625, -15.877197265625, -15.34814453125, -14.819091796875, -14.2900390625, -13.760986328125, -13.23193359375, -12.702880859375, -12.173828125, -11.644775390625, -11.11572265625, -10.586669921875, -10.0576171875, -9.528564453125, -8.99951171875, -8.470458984375, -7.94140625, -7.412353515625, -6.88330078125, -6.354248046875, -5.8251953125, -5.296142578125, -4.76708984375, -4.238037109375, -3.708984375, -3.179931640625, -2.65087890625, -2.121826171875, -1.5927734375, -1.063720703125, -0.53466796875, -0.005615234375, 0.5234375, 1.052490234375, 1.58154296875, 2.110595703125, 2.6396484375, 3.168701171875, 3.69775390625, 4.226806640625, 4.755859375, 5.284912109375, 5.81396484375, 6.343017578125, 6.8720703125, 7.401123046875, 7.93017578125, 8.459228515625, 8.98828125, 9.517333984375, 10.04638671875, 10.575439453125, 11.1044921875, 11.633544921875, 12.16259765625, 12.691650390625, 13.220703125, 13.749755859375, 14.27880859375, 14.807861328125, 15.3369140625, 15.865966796875, 16.39501953125, 16.924072265625, 17.453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 7.0, 19.0, 20.0, 24.0, 24.0, 54.0, 43.0, 54.0, 73.0, 78.0, 74.0, 69.0, 72.0, 69.0, 56.0, 43.0, 43.0, 42.0, 25.0, 21.0, 19.0, 14.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03807830810547, -48.57343292236328, -47.108787536621094, -45.64413833618164, -44.17949295043945, -42.714847564697266, -41.25020217895508, -39.785552978515625, -38.32090759277344, -36.85626220703125, -35.39161682128906, -33.92696762084961, -32.46232223510742, -30.997676849365234, -29.533031463623047, -28.068384170532227, -26.60373878479004, -25.13909339904785, -23.67444610595703, -22.209800720214844, -20.745153427124023, -19.280508041381836, -17.815860748291016, -16.351215362548828, -14.886569023132324, -13.42192268371582, -11.957276344299316, -10.492630004882812, -9.027984619140625, -7.563337802886963, -6.098691940307617, -4.634045600891113, -3.1693992614746094, -1.704753041267395, -0.24010682106018066, 1.2245392799377441, 2.689185619354248, 4.153831958770752, 5.618477821350098, 7.083124160766602, 8.547770500183105, 10.01241683959961, 11.477063179016113, 12.941709518432617, 14.406354904174805, 15.871002197265625, 17.335647583007812, 18.80029296875, 20.26494026184082, 21.729585647583008, 23.194232940673828, 24.658878326416016, 26.123525619506836, 27.588171005249023, 29.052818298339844, 30.51746368408203, 31.98210906982422, 33.446754455566406, 34.911399841308594, 36.37604904174805, 37.840694427490234, 39.30533981323242, 40.76998519897461, 42.23463439941406, 43.69927978515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 4.0, 5.0, 7.0, 11.0, 12.0, 20.0, 27.0, 17.0, 24.0, 23.0, 36.0, 30.0, 34.0, 51.0, 40.0, 49.0, 47.0, 35.0, 44.0, 53.0, 31.0, 44.0, 41.0, 32.0, 37.0, 39.0, 25.0, 31.0, 21.0, 16.0, 25.0, 12.0, 13.0, 13.0, 6.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.723575592041016, -45.40193176269531, -44.080284118652344, -42.75864028930664, -41.43699645996094, -40.11534881591797, -38.793704986572266, -37.47206115722656, -36.150413513183594, -34.82876968383789, -33.50712203979492, -32.18547821044922, -30.863832473754883, -29.542186737060547, -28.220542907714844, -26.898897171020508, -25.577251434326172, -24.255605697631836, -22.9339599609375, -21.612316131591797, -20.29067039489746, -18.969024658203125, -17.647380828857422, -16.325735092163086, -15.00408935546875, -13.682443618774414, -12.360798835754395, -11.039154052734375, -9.717508316040039, -8.395862579345703, -7.074217796325684, -5.752573013305664, -4.430927276611328, -3.1092820167541504, -1.7876367568969727, -0.4659914970397949, 0.8556537628173828, 2.1772990226745605, 3.4989442825317383, 4.820589065551758, 6.142234802246094, 7.4638800621032715, 8.78552532196045, 10.107170104980469, 11.428815841674805, 12.75046157836914, 14.07210636138916, 15.39375114440918, 16.715396881103516, 18.03704261779785, 19.358688354492188, 20.68033218383789, 22.001977920532227, 23.323623657226562, 24.645267486572266, 25.9669132232666, 27.288558959960938, 28.610204696655273, 29.93185043334961, 31.253494262695312, 32.57514190673828, 33.896785736083984, 35.21842956542969, 36.540077209472656, 37.86172103881836]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 25.0, 42.0, 46.0, 84.0, 113.0, 184.0, 274.0, 356.0, 562.0, 839.0, 1156.0, 1726.0, 2677.0, 3825.0, 6068.0, 9015.0, 13955.0, 21518.0, 34111.0, 56055.0, 97308.0, 200437.0, 281695.0, 128603.0, 70444.0, 41743.0, 26286.0, 16918.0, 11019.0, 7100.0, 4709.0, 3232.0, 2114.0, 1396.0, 955.0, 640.0, 407.0, 280.0, 204.0, 153.0, 83.0, 48.0, 47.0, 32.0, 21.0, 10.0, 10.0, 12.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.8984375, -13.467041015625, -13.03564453125, -12.604248046875, -12.1728515625, -11.741455078125, -11.31005859375, -10.878662109375, -10.447265625, -10.015869140625, -9.58447265625, -9.153076171875, -8.7216796875, -8.290283203125, -7.85888671875, -7.427490234375, -6.99609375, -6.564697265625, -6.13330078125, -5.701904296875, -5.2705078125, -4.839111328125, -4.40771484375, -3.976318359375, -3.544921875, -3.113525390625, -2.68212890625, -2.250732421875, -1.8193359375, -1.387939453125, -0.95654296875, -0.525146484375, -0.09375, 0.337646484375, 0.76904296875, 1.200439453125, 1.6318359375, 2.063232421875, 2.49462890625, 2.926025390625, 3.357421875, 3.788818359375, 4.22021484375, 4.651611328125, 5.0830078125, 5.514404296875, 5.94580078125, 6.377197265625, 6.80859375, 7.239990234375, 7.67138671875, 8.102783203125, 8.5341796875, 8.965576171875, 9.39697265625, 9.828369140625, 10.259765625, 10.691162109375, 11.12255859375, 11.553955078125, 11.9853515625, 12.416748046875, 12.84814453125, 13.279541015625, 13.7109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 11.0, 8.0, 12.0, 9.0, 22.0, 14.0, 21.0, 30.0, 31.0, 26.0, 33.0, 48.0, 50.0, 39.0, 37.0, 47.0, 44.0, 53.0, 43.0, 37.0, 44.0, 39.0, 33.0, 33.0, 32.0, 30.0, 23.0, 27.0, 15.0, 13.0, 30.0, 8.0, 9.0, 14.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -43.150390625, -41.80078125, -40.451171875, -39.1015625, -37.751953125, -36.40234375, -35.052734375, -33.703125, -32.353515625, -31.00390625, -29.654296875, -28.3046875, -26.955078125, -25.60546875, -24.255859375, -22.90625, -21.556640625, -20.20703125, -18.857421875, -17.5078125, -16.158203125, -14.80859375, -13.458984375, -12.109375, -10.759765625, -9.41015625, -8.060546875, -6.7109375, -5.361328125, -4.01171875, -2.662109375, -1.3125, 0.037109375, 1.38671875, 2.736328125, 4.0859375, 5.435546875, 6.78515625, 8.134765625, 9.484375, 10.833984375, 12.18359375, 13.533203125, 14.8828125, 16.232421875, 17.58203125, 18.931640625, 20.28125, 21.630859375, 22.98046875, 24.330078125, 25.6796875, 27.029296875, 28.37890625, 29.728515625, 31.078125, 32.427734375, 33.77734375, 35.126953125, 36.4765625, 37.826171875, 39.17578125, 40.525390625, 41.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 13.0, 24.0, 31.0, 35.0, 58.0, 78.0, 125.0, 186.0, 245.0, 367.0, 525.0, 733.0, 1113.0, 1473.0, 2089.0, 3191.0, 4721.0, 7489.0, 13357.0, 31792.0, 191990.0, 675553.0, 65966.0, 19531.0, 9653.0, 5928.0, 3753.0, 2610.0, 1790.0, 1235.0, 832.0, 596.0, 464.0, 281.0, 228.0, 160.0, 106.0, 58.0, 41.0, 39.0, 21.0, 13.0, 13.0, 8.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.1875, -17.62353515625, -17.0595703125, -16.49560546875, -15.931640625, -15.36767578125, -14.8037109375, -14.23974609375, -13.67578125, -13.11181640625, -12.5478515625, -11.98388671875, -11.419921875, -10.85595703125, -10.2919921875, -9.72802734375, -9.1640625, -8.60009765625, -8.0361328125, -7.47216796875, -6.908203125, -6.34423828125, -5.7802734375, -5.21630859375, -4.65234375, -4.08837890625, -3.5244140625, -2.96044921875, -2.396484375, -1.83251953125, -1.2685546875, -0.70458984375, -0.140625, 0.42333984375, 0.9873046875, 1.55126953125, 2.115234375, 2.67919921875, 3.2431640625, 3.80712890625, 4.37109375, 4.93505859375, 5.4990234375, 6.06298828125, 6.626953125, 7.19091796875, 7.7548828125, 8.31884765625, 8.8828125, 9.44677734375, 10.0107421875, 10.57470703125, 11.138671875, 11.70263671875, 12.2666015625, 12.83056640625, 13.39453125, 13.95849609375, 14.5224609375, 15.08642578125, 15.650390625, 16.21435546875, 16.7783203125, 17.34228515625, 17.90625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 13.0, 15.0, 19.0, 17.0, 29.0, 24.0, 19.0, 39.0, 25.0, 38.0, 29.0, 26.0, 40.0, 42.0, 51.0, 54.0, 45.0, 48.0, 38.0, 46.0, 46.0, 45.0, 29.0, 40.0, 15.0, 33.0, 23.0, 16.0, 13.0, 15.0, 15.0, 8.0, 7.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.719482421875, -32.75146484375, -31.783447265625, -30.8154296875, -29.847412109375, -28.87939453125, -27.911376953125, -26.943359375, -25.975341796875, -25.00732421875, -24.039306640625, -23.0712890625, -22.103271484375, -21.13525390625, -20.167236328125, -19.19921875, -18.231201171875, -17.26318359375, -16.295166015625, -15.3271484375, -14.359130859375, -13.39111328125, -12.423095703125, -11.455078125, -10.487060546875, -9.51904296875, -8.551025390625, -7.5830078125, -6.614990234375, -5.64697265625, -4.678955078125, -3.7109375, -2.742919921875, -1.77490234375, -0.806884765625, 0.1611328125, 1.129150390625, 2.09716796875, 3.065185546875, 4.033203125, 5.001220703125, 5.96923828125, 6.937255859375, 7.9052734375, 8.873291015625, 9.84130859375, 10.809326171875, 11.77734375, 12.745361328125, 13.71337890625, 14.681396484375, 15.6494140625, 16.617431640625, 17.58544921875, 18.553466796875, 19.521484375, 20.489501953125, 21.45751953125, 22.425537109375, 23.3935546875, 24.361572265625, 25.32958984375, 26.297607421875, 27.265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 9.0, 14.0, 23.0, 21.0, 38.0, 64.0, 99.0, 126.0, 163.0, 251.0, 413.0, 721.0, 1159.0, 1961.0, 3722.0, 7814.0, 20096.0, 126214.0, 824091.0, 38130.0, 11957.0, 5081.0, 2701.0, 1416.0, 806.0, 518.0, 311.0, 193.0, 119.0, 111.0, 61.0, 27.0, 34.0, 14.0, 14.0, 10.0, 9.0, 10.0, 3.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.517578125, -3.408477783203125, -3.29937744140625, -3.190277099609375, -3.0811767578125, -2.972076416015625, -2.86297607421875, -2.753875732421875, -2.644775390625, -2.535675048828125, -2.42657470703125, -2.317474365234375, -2.2083740234375, -2.099273681640625, -1.99017333984375, -1.881072998046875, -1.77197265625, -1.662872314453125, -1.55377197265625, -1.444671630859375, -1.3355712890625, -1.226470947265625, -1.11737060546875, -1.008270263671875, -0.899169921875, -0.790069580078125, -0.68096923828125, -0.571868896484375, -0.4627685546875, -0.353668212890625, -0.24456787109375, -0.135467529296875, -0.0263671875, 0.082733154296875, 0.19183349609375, 0.300933837890625, 0.4100341796875, 0.519134521484375, 0.62823486328125, 0.737335205078125, 0.846435546875, 0.955535888671875, 1.06463623046875, 1.173736572265625, 1.2828369140625, 1.391937255859375, 1.50103759765625, 1.610137939453125, 1.71923828125, 1.828338623046875, 1.93743896484375, 2.046539306640625, 2.1556396484375, 2.264739990234375, 2.37384033203125, 2.482940673828125, 2.592041015625, 2.701141357421875, 2.81024169921875, 2.919342041015625, 3.0284423828125, 3.137542724609375, 3.24664306640625, 3.355743408203125, 3.46484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 10.0, 9.0, 4.0, 9.0, 22.0, 20.0, 38.0, 43.0, 36.0, 54.0, 79.0, 85.0, 90.0, 87.0, 81.0, 77.0, 58.0, 41.0, 39.0, 27.0, 17.0, 18.0, 5.0, 14.0, 6.0, 5.0, 2.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019788742065429688, -0.0001916550099849701, -0.0001854225993156433, -0.00017919018864631653, -0.00017295777797698975, -0.00016672536730766296, -0.00016049295663833618, -0.0001542605459690094, -0.00014802813529968262, -0.00014179572463035583, -0.00013556331396102905, -0.00012933090329170227, -0.0001230984926223755, -0.0001168660819530487, -0.00011063367128372192, -0.00010440126061439514, -9.816884994506836e-05, -9.193643927574158e-05, -8.57040286064148e-05, -7.947161793708801e-05, -7.323920726776123e-05, -6.700679659843445e-05, -6.0774385929107666e-05, -5.4541975259780884e-05, -4.83095645904541e-05, -4.207715392112732e-05, -3.584474325180054e-05, -2.9612332582473755e-05, -2.3379921913146973e-05, -1.714751124382019e-05, -1.0915100574493408e-05, -4.682689905166626e-06, 1.5497207641601562e-06, 7.782131433486938e-06, 1.401454210281372e-05, 2.0246952772140503e-05, 2.6479363441467285e-05, 3.271177411079407e-05, 3.894418478012085e-05, 4.517659544944763e-05, 5.1409006118774414e-05, 5.7641416788101196e-05, 6.387382745742798e-05, 7.010623812675476e-05, 7.633864879608154e-05, 8.257105946540833e-05, 8.880347013473511e-05, 9.503588080406189e-05, 0.00010126829147338867, 0.00010750070214271545, 0.00011373311281204224, 0.00011996552348136902, 0.0001261979341506958, 0.00013243034482002258, 0.00013866275548934937, 0.00014489516615867615, 0.00015112757682800293, 0.0001573599874973297, 0.0001635923981666565, 0.00016982480883598328, 0.00017605721950531006, 0.00018228963017463684, 0.00018852204084396362, 0.0001947544515132904, 0.0002009868621826172]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 8.0, 15.0, 23.0, 34.0, 44.0, 71.0, 90.0, 136.0, 197.0, 283.0, 440.0, 566.0, 844.0, 1170.0, 1743.0, 2607.0, 4139.0, 6503.0, 10932.0, 18743.0, 34814.0, 69799.0, 155098.0, 305974.0, 224936.0, 99869.0, 47487.0, 24759.0, 13782.0, 8351.0, 5129.0, 3224.0, 2162.0, 1373.0, 995.0, 649.0, 500.0, 313.0, 240.0, 150.0, 109.0, 83.0, 58.0, 45.0, 18.0, 12.0, 12.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7236328125, -1.6693115234375, -1.614990234375, -1.5606689453125, -1.50634765625, -1.4520263671875, -1.397705078125, -1.3433837890625, -1.2890625, -1.2347412109375, -1.180419921875, -1.1260986328125, -1.07177734375, -1.0174560546875, -0.963134765625, -0.9088134765625, -0.8544921875, -0.8001708984375, -0.745849609375, -0.6915283203125, -0.63720703125, -0.5828857421875, -0.528564453125, -0.4742431640625, -0.419921875, -0.3656005859375, -0.311279296875, -0.2569580078125, -0.20263671875, -0.1483154296875, -0.093994140625, -0.0396728515625, 0.0146484375, 0.0689697265625, 0.123291015625, 0.1776123046875, 0.23193359375, 0.2862548828125, 0.340576171875, 0.3948974609375, 0.44921875, 0.5035400390625, 0.557861328125, 0.6121826171875, 0.66650390625, 0.7208251953125, 0.775146484375, 0.8294677734375, 0.8837890625, 0.9381103515625, 0.992431640625, 1.0467529296875, 1.10107421875, 1.1553955078125, 1.209716796875, 1.2640380859375, 1.318359375, 1.3726806640625, 1.427001953125, 1.4813232421875, 1.53564453125, 1.5899658203125, 1.644287109375, 1.6986083984375, 1.7529296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 6.0, 4.0, 6.0, 4.0, 9.0, 14.0, 10.0, 14.0, 25.0, 29.0, 28.0, 38.0, 45.0, 62.0, 98.0, 87.0, 86.0, 73.0, 61.0, 54.0, 46.0, 37.0, 29.0, 25.0, 14.0, 15.0, 7.0, 5.0, 8.0, 9.0, 3.0, 2.0, 0.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5869140625, -0.5678863525390625, -0.548858642578125, -0.5298309326171875, -0.51080322265625, -0.4917755126953125, -0.472747802734375, -0.4537200927734375, -0.4346923828125, -0.4156646728515625, -0.396636962890625, -0.3776092529296875, -0.35858154296875, -0.3395538330078125, -0.320526123046875, -0.3014984130859375, -0.282470703125, -0.2634429931640625, -0.244415283203125, -0.2253875732421875, -0.20635986328125, -0.1873321533203125, -0.168304443359375, -0.1492767333984375, -0.1302490234375, -0.1112213134765625, -0.092193603515625, -0.0731658935546875, -0.05413818359375, -0.0351104736328125, -0.016082763671875, 0.0029449462890625, 0.02197265625, 0.0410003662109375, 0.060028076171875, 0.0790557861328125, 0.09808349609375, 0.1171112060546875, 0.136138916015625, 0.1551666259765625, 0.1741943359375, 0.1932220458984375, 0.212249755859375, 0.2312774658203125, 0.25030517578125, 0.2693328857421875, 0.288360595703125, 0.3073883056640625, 0.326416015625, 0.3454437255859375, 0.364471435546875, 0.3834991455078125, 0.40252685546875, 0.4215545654296875, 0.440582275390625, 0.4596099853515625, 0.4786376953125, 0.4976654052734375, 0.516693115234375, 0.5357208251953125, 0.55474853515625, 0.5737762451171875, 0.592803955078125, 0.6118316650390625, 0.630859375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 6.0, 8.0, 13.0, 10.0, 24.0, 20.0, 29.0, 41.0, 52.0, 57.0, 67.0, 65.0, 89.0, 75.0, 74.0, 73.0, 38.0, 56.0, 49.0, 47.0, 18.0, 16.0, 15.0, 16.0, 10.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.29299545288086, -48.8133430480957, -47.33369064331055, -45.85403823852539, -44.3743896484375, -42.894737243652344, -41.41508483886719, -39.93543243408203, -38.455780029296875, -36.97612762451172, -35.49647521972656, -34.016822814941406, -32.53717041015625, -31.057519912719727, -29.577869415283203, -28.098217010498047, -26.61856460571289, -25.138912200927734, -23.659259796142578, -22.179609298706055, -20.6999568939209, -19.220304489135742, -17.74065399169922, -16.261001586914062, -14.781349182128906, -13.30169677734375, -11.82204532623291, -10.34239387512207, -8.862741470336914, -7.383089542388916, -5.903437614440918, -4.423786163330078, -2.9441299438476562, -1.4644780158996582, 0.015173912048339844, 1.494825839996338, 2.974477767944336, 4.454129695892334, 5.933781623840332, 7.413433074951172, 8.893085479736328, 10.372737884521484, 11.852389335632324, 13.332040786743164, 14.81169319152832, 16.291345596313477, 17.77099609375, 19.250648498535156, 20.730300903320312, 22.20995330810547, 23.689605712890625, 25.16925621032715, 26.648908615112305, 28.12856101989746, 29.608211517333984, 31.08786392211914, 32.5675163269043, 34.04716873168945, 35.52682113647461, 37.006473541259766, 38.486122131347656, 39.96577453613281, 41.44542694091797, 42.925079345703125, 44.40473175048828]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 3.0, 7.0, 6.0, 12.0, 16.0, 15.0, 32.0, 14.0, 22.0, 27.0, 36.0, 33.0, 30.0, 50.0, 42.0, 50.0, 47.0, 35.0, 45.0, 48.0, 35.0, 42.0, 42.0, 27.0, 42.0, 39.0, 26.0, 28.0, 20.0, 15.0, 24.0, 13.0, 13.0, 13.0, 5.0, 8.0, 6.0, 8.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.716773986816406, -44.41510009765625, -43.11343002319336, -41.8117561340332, -40.51008605957031, -39.208412170410156, -37.906742095947266, -36.60506820678711, -35.30339813232422, -34.00172424316406, -32.70005416870117, -31.39838218688965, -30.096710205078125, -28.79503631591797, -27.493364334106445, -26.191692352294922, -24.890018463134766, -23.588346481323242, -22.28667449951172, -20.985002517700195, -19.683330535888672, -18.381656646728516, -17.079984664916992, -15.778312683105469, -14.476640701293945, -13.174968719482422, -11.873296737670898, -10.571623802185059, -9.269951820373535, -7.968279838562012, -6.66660737991333, -5.364934921264648, -4.063266754150391, -2.761594533920288, -1.4599223136901855, -0.158250093460083, 1.1434221267700195, 2.445094108581543, 3.7467665672302246, 5.048439025878906, 6.35011100769043, 7.651782989501953, 8.953454971313477, 10.255127906799316, 11.55679988861084, 12.858471870422363, 14.160144805908203, 15.461816787719727, 16.76348876953125, 18.065160751342773, 19.366832733154297, 20.66850471496582, 21.970176696777344, 23.2718505859375, 24.573522567749023, 25.875194549560547, 27.17686653137207, 28.478538513183594, 29.780210494995117, 31.08188247680664, 32.3835563659668, 33.68522644042969, 34.986900329589844, 36.28857421875, 37.59024429321289]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 13.0, 17.0, 27.0, 62.0, 74.0, 109.0, 168.0, 216.0, 371.0, 515.0, 757.0, 1153.0, 1754.0, 2619.0, 3931.0, 6070.0, 9270.0, 14060.0, 21993.0, 33861.0, 52554.0, 81888.0, 124907.0, 173497.0, 171500.0, 122420.0, 79538.0, 50797.0, 32959.0, 21097.0, 13755.0, 9133.0, 5828.0, 3899.0, 2632.0, 1640.0, 1176.0, 765.0, 504.0, 341.0, 217.0, 142.0, 111.0, 68.0, 49.0, 28.0, 21.0, 12.0, 6.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.03125, -35.83544921875, -34.6396484375, -33.44384765625, -32.248046875, -31.05224609375, -29.8564453125, -28.66064453125, -27.46484375, -26.26904296875, -25.0732421875, -23.87744140625, -22.681640625, -21.48583984375, -20.2900390625, -19.09423828125, -17.8984375, -16.70263671875, -15.5068359375, -14.31103515625, -13.115234375, -11.91943359375, -10.7236328125, -9.52783203125, -8.33203125, -7.13623046875, -5.9404296875, -4.74462890625, -3.548828125, -2.35302734375, -1.1572265625, 0.03857421875, 1.234375, 2.43017578125, 3.6259765625, 4.82177734375, 6.017578125, 7.21337890625, 8.4091796875, 9.60498046875, 10.80078125, 11.99658203125, 13.1923828125, 14.38818359375, 15.583984375, 16.77978515625, 17.9755859375, 19.17138671875, 20.3671875, 21.56298828125, 22.7587890625, 23.95458984375, 25.150390625, 26.34619140625, 27.5419921875, 28.73779296875, 29.93359375, 31.12939453125, 32.3251953125, 33.52099609375, 34.716796875, 35.91259765625, 37.1083984375, 38.30419921875, 39.5]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 2.0, 7.0, 3.0, 12.0, 11.0, 11.0, 14.0, 14.0, 14.0, 27.0, 18.0, 31.0, 35.0, 34.0, 40.0, 39.0, 31.0, 49.0, 43.0, 43.0, 49.0, 51.0, 38.0, 37.0, 38.0, 25.0, 33.0, 38.0, 37.0, 23.0, 24.0, 19.0, 12.0, 24.0, 16.0, 10.0, 9.0, 7.0, 8.0, 2.0, 6.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-43.65625, -42.4814453125, -41.306640625, -40.1318359375, -38.95703125, -37.7822265625, -36.607421875, -35.4326171875, -34.2578125, -33.0830078125, -31.908203125, -30.7333984375, -29.55859375, -28.3837890625, -27.208984375, -26.0341796875, -24.859375, -23.6845703125, -22.509765625, -21.3349609375, -20.16015625, -18.9853515625, -17.810546875, -16.6357421875, -15.4609375, -14.2861328125, -13.111328125, -11.9365234375, -10.76171875, -9.5869140625, -8.412109375, -7.2373046875, -6.0625, -4.8876953125, -3.712890625, -2.5380859375, -1.36328125, -0.1884765625, 0.986328125, 2.1611328125, 3.3359375, 4.5107421875, 5.685546875, 6.8603515625, 8.03515625, 9.2099609375, 10.384765625, 11.5595703125, 12.734375, 13.9091796875, 15.083984375, 16.2587890625, 17.43359375, 18.6083984375, 19.783203125, 20.9580078125, 22.1328125, 23.3076171875, 24.482421875, 25.6572265625, 26.83203125, 28.0068359375, 29.181640625, 30.3564453125, 31.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 12.0, 17.0, 26.0, 32.0, 59.0, 94.0, 150.0, 227.0, 280.0, 501.0, 617.0, 1071.0, 1510.0, 2258.0, 3380.0, 4949.0, 7716.0, 11658.0, 17576.0, 27036.0, 41552.0, 64477.0, 98818.0, 144514.0, 175056.0, 148534.0, 103082.0, 67525.0, 43488.0, 28000.0, 18402.0, 11843.0, 7944.0, 5378.0, 3574.0, 2429.0, 1545.0, 1038.0, 731.0, 514.0, 325.0, 201.0, 136.0, 94.0, 74.0, 38.0, 18.0, 24.0, 17.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-44.65625, -43.3251953125, -41.994140625, -40.6630859375, -39.33203125, -38.0009765625, -36.669921875, -35.3388671875, -34.0078125, -32.6767578125, -31.345703125, -30.0146484375, -28.68359375, -27.3525390625, -26.021484375, -24.6904296875, -23.359375, -22.0283203125, -20.697265625, -19.3662109375, -18.03515625, -16.7041015625, -15.373046875, -14.0419921875, -12.7109375, -11.3798828125, -10.048828125, -8.7177734375, -7.38671875, -6.0556640625, -4.724609375, -3.3935546875, -2.0625, -0.7314453125, 0.599609375, 1.9306640625, 3.26171875, 4.5927734375, 5.923828125, 7.2548828125, 8.5859375, 9.9169921875, 11.248046875, 12.5791015625, 13.91015625, 15.2412109375, 16.572265625, 17.9033203125, 19.234375, 20.5654296875, 21.896484375, 23.2275390625, 24.55859375, 25.8896484375, 27.220703125, 28.5517578125, 29.8828125, 31.2138671875, 32.544921875, 33.8759765625, 35.20703125, 36.5380859375, 37.869140625, 39.2001953125, 40.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 8.0, 1.0, 7.0, 7.0, 12.0, 18.0, 12.0, 19.0, 16.0, 19.0, 21.0, 32.0, 24.0, 32.0, 43.0, 41.0, 34.0, 47.0, 38.0, 45.0, 49.0, 45.0, 35.0, 39.0, 30.0, 28.0, 47.0, 32.0, 29.0, 29.0, 17.0, 17.0, 24.0, 17.0, 14.0, 16.0, 13.0, 13.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-25.25, -24.47705078125, -23.7041015625, -22.93115234375, -22.158203125, -21.38525390625, -20.6123046875, -19.83935546875, -19.06640625, -18.29345703125, -17.5205078125, -16.74755859375, -15.974609375, -15.20166015625, -14.4287109375, -13.65576171875, -12.8828125, -12.10986328125, -11.3369140625, -10.56396484375, -9.791015625, -9.01806640625, -8.2451171875, -7.47216796875, -6.69921875, -5.92626953125, -5.1533203125, -4.38037109375, -3.607421875, -2.83447265625, -2.0615234375, -1.28857421875, -0.515625, 0.25732421875, 1.0302734375, 1.80322265625, 2.576171875, 3.34912109375, 4.1220703125, 4.89501953125, 5.66796875, 6.44091796875, 7.2138671875, 7.98681640625, 8.759765625, 9.53271484375, 10.3056640625, 11.07861328125, 11.8515625, 12.62451171875, 13.3974609375, 14.17041015625, 14.943359375, 15.71630859375, 16.4892578125, 17.26220703125, 18.03515625, 18.80810546875, 19.5810546875, 20.35400390625, 21.126953125, 21.89990234375, 22.6728515625, 23.44580078125, 24.21875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 9.0, 18.0, 16.0, 38.0, 55.0, 71.0, 99.0, 109.0, 199.0, 303.0, 424.0, 726.0, 954.0, 1564.0, 2464.0, 3856.0, 6246.0, 10394.0, 17899.0, 32796.0, 62548.0, 125794.0, 244406.0, 254918.0, 133708.0, 66270.0, 34733.0, 19134.0, 10890.0, 6554.0, 3963.0, 2515.0, 1599.0, 1099.0, 701.0, 470.0, 332.0, 198.0, 149.0, 90.0, 80.0, 42.0, 36.0, 29.0, 20.0, 11.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-25.703125, -24.92529296875, -24.1474609375, -23.36962890625, -22.591796875, -21.81396484375, -21.0361328125, -20.25830078125, -19.48046875, -18.70263671875, -17.9248046875, -17.14697265625, -16.369140625, -15.59130859375, -14.8134765625, -14.03564453125, -13.2578125, -12.47998046875, -11.7021484375, -10.92431640625, -10.146484375, -9.36865234375, -8.5908203125, -7.81298828125, -7.03515625, -6.25732421875, -5.4794921875, -4.70166015625, -3.923828125, -3.14599609375, -2.3681640625, -1.59033203125, -0.8125, -0.03466796875, 0.7431640625, 1.52099609375, 2.298828125, 3.07666015625, 3.8544921875, 4.63232421875, 5.41015625, 6.18798828125, 6.9658203125, 7.74365234375, 8.521484375, 9.29931640625, 10.0771484375, 10.85498046875, 11.6328125, 12.41064453125, 13.1884765625, 13.96630859375, 14.744140625, 15.52197265625, 16.2998046875, 17.07763671875, 17.85546875, 18.63330078125, 19.4111328125, 20.18896484375, 20.966796875, 21.74462890625, 22.5224609375, 23.30029296875, 24.078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 14.0, 20.0, 15.0, 28.0, 46.0, 52.0, 81.0, 118.0, 131.0, 151.0, 97.0, 81.0, 42.0, 29.0, 18.0, 14.0, 10.0, 6.0, 4.0, 2.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004204541444778442, -0.00408703088760376, -0.003969520330429077, -0.0038520097732543945, -0.003734499216079712, -0.0036169886589050293, -0.0034994781017303467, -0.003381967544555664, -0.0032644569873809814, -0.003146946430206299, -0.003029435873031616, -0.0029119253158569336, -0.002794414758682251, -0.0026769042015075684, -0.0025593936443328857, -0.002441883087158203, -0.0023243725299835205, -0.002206861972808838, -0.0020893514156341553, -0.0019718408584594727, -0.00185433030128479, -0.0017368197441101074, -0.0016193091869354248, -0.0015017986297607422, -0.0013842880725860596, -0.001266777515411377, -0.0011492669582366943, -0.0010317564010620117, -0.0009142458438873291, -0.0007967352867126465, -0.0006792247295379639, -0.0005617141723632812, -0.00044420361518859863, -0.000326693058013916, -0.0002091825008392334, -9.167194366455078e-05, 2.5838613510131836e-05, 0.00014334917068481445, 0.00026085972785949707, 0.0003783702850341797, 0.0004958808422088623, 0.0006133913993835449, 0.0007309019565582275, 0.0008484125137329102, 0.0009659230709075928, 0.0010834336280822754, 0.001200944185256958, 0.0013184547424316406, 0.0014359652996063232, 0.0015534758567810059, 0.0016709864139556885, 0.001788496971130371, 0.0019060075283050537, 0.0020235180854797363, 0.002141028642654419, 0.0022585391998291016, 0.002376049757003784, 0.002493560314178467, 0.0026110708713531494, 0.002728581428527832, 0.0028460919857025146, 0.0029636025428771973, 0.00308111310005188, 0.0031986236572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 15.0, 11.0, 25.0, 41.0, 48.0, 64.0, 107.0, 146.0, 226.0, 316.0, 502.0, 756.0, 1224.0, 1670.0, 2751.0, 4186.0, 6598.0, 10827.0, 18028.0, 31444.0, 57096.0, 107765.0, 206597.0, 262466.0, 151374.0, 79394.0, 42589.0, 24149.0, 14105.0, 8718.0, 5441.0, 3466.0, 2206.0, 1403.0, 959.0, 599.0, 392.0, 281.0, 180.0, 136.0, 79.0, 53.0, 38.0, 29.0, 17.0, 12.0, 4.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-25.203125, -24.467529296875, -23.73193359375, -22.996337890625, -22.2607421875, -21.525146484375, -20.78955078125, -20.053955078125, -19.318359375, -18.582763671875, -17.84716796875, -17.111572265625, -16.3759765625, -15.640380859375, -14.90478515625, -14.169189453125, -13.43359375, -12.697998046875, -11.96240234375, -11.226806640625, -10.4912109375, -9.755615234375, -9.02001953125, -8.284423828125, -7.548828125, -6.813232421875, -6.07763671875, -5.342041015625, -4.6064453125, -3.870849609375, -3.13525390625, -2.399658203125, -1.6640625, -0.928466796875, -0.19287109375, 0.542724609375, 1.2783203125, 2.013916015625, 2.74951171875, 3.485107421875, 4.220703125, 4.956298828125, 5.69189453125, 6.427490234375, 7.1630859375, 7.898681640625, 8.63427734375, 9.369873046875, 10.10546875, 10.841064453125, 11.57666015625, 12.312255859375, 13.0478515625, 13.783447265625, 14.51904296875, 15.254638671875, 15.990234375, 16.725830078125, 17.46142578125, 18.197021484375, 18.9326171875, 19.668212890625, 20.40380859375, 21.139404296875, 21.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 4.0, 11.0, 19.0, 13.0, 16.0, 27.0, 32.0, 25.0, 36.0, 56.0, 63.0, 70.0, 75.0, 63.0, 66.0, 81.0, 60.0, 58.0, 51.0, 37.0, 28.0, 16.0, 15.0, 10.0, 18.0, 12.0, 6.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.5443115234375, -9.213623046875, -8.8829345703125, -8.55224609375, -8.2215576171875, -7.890869140625, -7.5601806640625, -7.2294921875, -6.8988037109375, -6.568115234375, -6.2374267578125, -5.90673828125, -5.5760498046875, -5.245361328125, -4.9146728515625, -4.583984375, -4.2532958984375, -3.922607421875, -3.5919189453125, -3.26123046875, -2.9305419921875, -2.599853515625, -2.2691650390625, -1.9384765625, -1.6077880859375, -1.277099609375, -0.9464111328125, -0.61572265625, -0.2850341796875, 0.045654296875, 0.3763427734375, 0.70703125, 1.0377197265625, 1.368408203125, 1.6990966796875, 2.02978515625, 2.3604736328125, 2.691162109375, 3.0218505859375, 3.3525390625, 3.6832275390625, 4.013916015625, 4.3446044921875, 4.67529296875, 5.0059814453125, 5.336669921875, 5.6673583984375, 5.998046875, 6.3287353515625, 6.659423828125, 6.9901123046875, 7.32080078125, 7.6514892578125, 7.982177734375, 8.3128662109375, 8.6435546875, 8.9742431640625, 9.304931640625, 9.6356201171875, 9.96630859375, 10.2969970703125, 10.627685546875, 10.9583740234375, 11.2890625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 17.0, 16.0, 12.0, 23.0, 24.0, 34.0, 28.0, 31.0, 40.0, 50.0, 57.0, 61.0, 55.0, 78.0, 70.0, 60.0, 53.0, 42.0, 44.0, 36.0, 26.0, 25.0, 23.0, 16.0, 9.0, 10.0, 11.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.91347885131836, -45.59896469116211, -44.284454345703125, -42.969940185546875, -41.655426025390625, -40.34091567993164, -39.02640151977539, -37.711891174316406, -36.397377014160156, -35.082862854003906, -33.76835250854492, -32.45383834838867, -31.139326095581055, -29.824813842773438, -28.510299682617188, -27.19578742980957, -25.881275177001953, -24.566762924194336, -23.25225067138672, -21.93773651123047, -20.62322425842285, -19.308712005615234, -17.994197845458984, -16.679685592651367, -15.36517333984375, -14.050661087036133, -12.7361478805542, -11.421634674072266, -10.107122421264648, -8.792610168457031, -7.478096961975098, -6.163583755493164, -4.849067687988281, -3.534554958343506, -2.2200422286987305, -0.9055294990539551, 0.4089832305908203, 1.7234959602355957, 3.038008689880371, 4.352521896362305, 5.667034149169922, 6.981546878814697, 8.296059608459473, 9.610572814941406, 10.925085067749023, 12.23959732055664, 13.554110527038574, 14.868623733520508, 16.183135986328125, 17.497648239135742, 18.81216049194336, 20.12667465209961, 21.441186904907227, 22.755699157714844, 24.070213317871094, 25.38472557067871, 26.699237823486328, 28.013750076293945, 29.328262329101562, 30.642776489257812, 31.95728874206543, 33.27180099487305, 34.5863151550293, 35.90082550048828, 37.21533966064453]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 4.0, 10.0, 9.0, 17.0, 15.0, 19.0, 22.0, 21.0, 21.0, 39.0, 35.0, 38.0, 38.0, 32.0, 43.0, 48.0, 32.0, 45.0, 45.0, 49.0, 45.0, 33.0, 41.0, 34.0, 22.0, 36.0, 32.0, 17.0, 30.0, 16.0, 16.0, 14.0, 12.0, 10.0, 8.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.423152923583984, -44.04756546020508, -42.67197799682617, -41.296390533447266, -39.92080307006836, -38.54521560668945, -37.16962814331055, -35.79404067993164, -34.418453216552734, -33.04286575317383, -31.667278289794922, -30.291690826416016, -28.91610336303711, -27.540515899658203, -26.164928436279297, -24.78934097290039, -23.413755416870117, -22.03816795349121, -20.662580490112305, -19.2869930267334, -17.911405563354492, -16.535818099975586, -15.160231590270996, -13.78464412689209, -12.409056663513184, -11.033469200134277, -9.657881736755371, -8.282295227050781, -6.906707286834717, -5.5311198234558105, -4.1555328369140625, -2.7799453735351562, -1.40435791015625, -0.0287705659866333, 1.3468167781829834, 2.7224040031433105, 4.097991466522217, 5.473578929901123, 6.849165916442871, 8.224753379821777, 9.600340843200684, 10.97592830657959, 12.351515769958496, 13.727102279663086, 15.102689743041992, 16.4782772064209, 17.853864669799805, 19.22945213317871, 20.605039596557617, 21.980627059936523, 23.35621452331543, 24.731801986694336, 26.107389450073242, 27.48297691345215, 28.858562469482422, 30.234149932861328, 31.609737396240234, 32.98532485961914, 34.36091232299805, 35.73649978637695, 37.11208724975586, 38.487674713134766, 39.86326217651367, 41.23884963989258, 42.614437103271484]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 9.0, 8.0, 16.0, 17.0, 16.0, 28.0, 26.0, 25.0, 41.0, 53.0, 63.0, 85.0, 100.0, 134.0, 166.0, 202.0, 286.0, 359.0, 450.0, 589.0, 697.0, 1043945.0, 730.0, 582.0, 455.0, 347.0, 225.0, 197.0, 147.0, 109.0, 96.0, 78.0, 61.0, 58.0, 50.0, 25.0, 28.0, 26.0, 26.0, 7.0, 4.0, 7.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-714.0451049804688, -691.9876708984375, -669.9302368164062, -647.872802734375, -625.8153686523438, -603.7579345703125, -581.7005004882812, -559.64306640625, -537.5856323242188, -515.5281982421875, -493.47076416015625, -471.413330078125, -449.35589599609375, -427.2984619140625, -405.24102783203125, -383.18359375, -361.12615966796875, -339.0687255859375, -317.01129150390625, -294.953857421875, -272.89642333984375, -250.8389892578125, -228.78155517578125, -206.72412109375, -184.66668701171875, -162.6092529296875, -140.55181884765625, -118.494384765625, -96.43695068359375, -74.3795166015625, -52.32208251953125, -30.2646484375, -8.207275390625, 13.85015869140625, 35.9075927734375, 57.96502685546875, 80.0224609375, 102.07989501953125, 124.1373291015625, 146.19476318359375, 168.252197265625, 190.30963134765625, 212.3670654296875, 234.42449951171875, 256.48193359375, 278.53936767578125, 300.5968017578125, 322.65423583984375, 344.711669921875, 366.76910400390625, 388.8265380859375, 410.88397216796875, 432.94140625, 454.99884033203125, 477.0562744140625, 499.11370849609375, 521.171142578125, 543.2285766601562, 565.2860107421875, 587.3434448242188, 609.40087890625, 631.4583129882812, 653.5157470703125, 675.5731811523438, 697.630615234375]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 1.0, 7.0, 7.0, 14.0, 18.0, 13.0, 17.0, 35.0, 27.0, 48.0, 57.0, 54.0, 78.0, 85.0, 121.0, 143.0, 154.0, 176.0, 230.0, 241.0, 380.0, 625.0, 1301.0, 51318996.0, 144589.0, 1306.0, 646.0, 394.0, 290.0, 221.0, 193.0, 155.0, 106.0, 118.0, 75.0, 81.0, 53.0, 48.0, 45.0, 41.0, 24.0, 26.0, 21.0, 13.0, 14.0, 4.0, 6.0, 7.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1786.1605224609375, -1730.3333740234375, -1674.5062255859375, -1618.6790771484375, -1562.8519287109375, -1507.0247802734375, -1451.1976318359375, -1395.3704833984375, -1339.5433349609375, -1283.7161865234375, -1227.8890380859375, -1172.0618896484375, -1116.2347412109375, -1060.4075927734375, -1004.5804443359375, -948.7532958984375, -892.9261474609375, -837.0989990234375, -781.2718505859375, -725.4447021484375, -669.6175537109375, -613.7904052734375, -557.9632568359375, -502.1361083984375, -446.3089599609375, -390.4818115234375, -334.6546630859375, -278.8275146484375, -223.0003662109375, -167.1732177734375, -111.3460693359375, -55.5189208984375, 0.308349609375, 56.135498046875, 111.962646484375, 167.789794921875, 223.616943359375, 279.444091796875, 335.271240234375, 391.098388671875, 446.925537109375, 502.752685546875, 558.579833984375, 614.406982421875, 670.234130859375, 726.061279296875, 781.888427734375, 837.715576171875, 893.542724609375, 949.369873046875, 1005.197021484375, 1061.024169921875, 1116.851318359375, 1172.678466796875, 1228.505615234375, 1284.332763671875, 1340.159912109375, 1395.987060546875, 1451.814208984375, 1507.641357421875, 1563.468505859375, 1619.295654296875, 1675.122802734375, 1730.949951171875, 1786.777099609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 6.0, 11.0, 10.0, 20.0, 22.0, 21.0, 28.0, 35.0, 51.0, 73.0, 127.0, 123.0, 100.0, 78.0, 62.0, 47.0, 31.0, 33.0, 18.0, 14.0, 12.0, 12.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1279.698486328125, -1233.0745849609375, -1186.4508056640625, -1139.826904296875, -1093.203125, -1046.5792236328125, -999.955322265625, -953.3314819335938, -906.7076416015625, -860.0838012695312, -813.4599609375, -766.8360595703125, -720.2122192382812, -673.58837890625, -626.9644775390625, -580.3406372070312, -533.716796875, -487.09295654296875, -440.4690856933594, -393.84521484375, -347.22137451171875, -300.5975341796875, -253.97366333007812, -207.34979248046875, -160.7259521484375, -114.10209655761719, -67.47824096679688, -20.854385375976562, 25.76947021484375, 72.39332580566406, 119.01718139648438, 165.64105224609375, 212.2647705078125, 258.88861083984375, 305.5124816894531, 352.1363525390625, 398.76019287109375, 445.384033203125, 492.0079040527344, 538.6317749023438, 585.255615234375, 631.8794555664062, 678.5032958984375, 725.127197265625, 771.7510375976562, 818.3748779296875, 864.998779296875, 911.6226196289062, 958.2464599609375, 1004.8703002929688, 1051.494140625, 1098.1180419921875, 1144.741943359375, 1191.36572265625, 1237.9896240234375, 1284.613525390625, 1331.2373046875, 1377.8612060546875, 1424.4849853515625, 1471.10888671875, 1517.732666015625, 1564.3565673828125, 1610.98046875, 1657.604248046875, 1704.2281494140625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 14.0, 15.0, 16.0, 20.0, 26.0, 23.0, 39.0, 27.0, 30.0, 38.0, 46.0, 55.0, 75.0, 64.0, 62.0, 55.0, 65.0, 38.0, 30.0, 31.0, 23.0, 24.0, 20.0, 24.0, 16.0, 15.0, 21.0, 7.0, 11.0, 7.0, 8.0, 9.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1612.0467529296875, -1564.2908935546875, -1516.534912109375, -1468.779052734375, -1421.023193359375, -1373.267333984375, -1325.511474609375, -1277.7554931640625, -1229.9996337890625, -1182.2437744140625, -1134.48779296875, -1086.73193359375, -1038.97607421875, -991.22021484375, -943.4642944335938, -895.7083740234375, -847.9525146484375, -800.1966552734375, -752.4407348632812, -704.684814453125, -656.928955078125, -609.173095703125, -561.4171752929688, -513.6612548828125, -465.9053955078125, -418.1495056152344, -370.39361572265625, -322.6377258300781, -274.8818359375, -227.12594604492188, -179.37005615234375, -131.61416625976562, -83.858154296875, -36.102264404296875, 11.65362548828125, 59.409515380859375, 107.1654052734375, 154.92129516601562, 202.67718505859375, 250.43307495117188, 298.18896484375, 345.9448547363281, 393.70074462890625, 441.4566345214844, 489.2125244140625, 536.9683837890625, 584.7243041992188, 632.480224609375, 680.236083984375, 727.991943359375, 775.7478637695312, 823.5037841796875, 871.2596435546875, 919.0155029296875, 966.7714233398438, 1014.52734375, 1062.283203125, 1110.0390625, 1157.794921875, 1205.5509033203125, 1253.3067626953125, 1301.0626220703125, 1348.818603515625, 1396.574462890625, 1444.330322265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 12.0, 26.0, 34.0, 66.0, 92.0, 108.0, 177.0, 281.0, 415.0, 580.0, 932.0, 1343.0, 2071.0, 3285.0, 4980.0, 8122.0, 13395.0, 23531.0, 43091.0, 85659.0, 197450.0, 777587.0, 2531208.0, 270571.0, 105972.0, 51615.0, 28025.0, 15711.0, 9598.0, 6047.0, 3863.0, 2543.0, 1789.0, 1216.0, 827.0, 569.0, 410.0, 316.0, 211.0, 144.0, 116.0, 88.0, 52.0, 45.0, 30.0, 18.0, 20.0, 11.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.578125, -25.634521484375, -24.69091796875, -23.747314453125, -22.8037109375, -21.860107421875, -20.91650390625, -19.972900390625, -19.029296875, -18.085693359375, -17.14208984375, -16.198486328125, -15.2548828125, -14.311279296875, -13.36767578125, -12.424072265625, -11.48046875, -10.536865234375, -9.59326171875, -8.649658203125, -7.7060546875, -6.762451171875, -5.81884765625, -4.875244140625, -3.931640625, -2.988037109375, -2.04443359375, -1.100830078125, -0.1572265625, 0.786376953125, 1.72998046875, 2.673583984375, 3.6171875, 4.560791015625, 5.50439453125, 6.447998046875, 7.3916015625, 8.335205078125, 9.27880859375, 10.222412109375, 11.166015625, 12.109619140625, 13.05322265625, 13.996826171875, 14.9404296875, 15.884033203125, 16.82763671875, 17.771240234375, 18.71484375, 19.658447265625, 20.60205078125, 21.545654296875, 22.4892578125, 23.432861328125, 24.37646484375, 25.320068359375, 26.263671875, 27.207275390625, 28.15087890625, 29.094482421875, 30.0380859375, 30.981689453125, 31.92529296875, 32.868896484375, 33.8125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 4.0, 7.0, 9.0, 8.0, 12.0, 12.0, 18.0, 25.0, 25.0, 32.0, 39.0, 53.0, 60.0, 48.0, 65.0, 74.0, 73.0, 72.0, 55.0, 45.0, 56.0, 40.0, 36.0, 29.0, 16.0, 13.0, 15.0, 10.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.617706298828125, -2.52056884765625, -2.423431396484375, -2.3262939453125, -2.229156494140625, -2.13201904296875, -2.034881591796875, -1.937744140625, -1.840606689453125, -1.74346923828125, -1.646331787109375, -1.5491943359375, -1.452056884765625, -1.35491943359375, -1.257781982421875, -1.16064453125, -1.063507080078125, -0.96636962890625, -0.869232177734375, -0.7720947265625, -0.674957275390625, -0.57781982421875, -0.480682373046875, -0.383544921875, -0.286407470703125, -0.18927001953125, -0.092132568359375, 0.0050048828125, 0.102142333984375, 0.19927978515625, 0.296417236328125, 0.3935546875, 0.490692138671875, 0.58782958984375, 0.684967041015625, 0.7821044921875, 0.879241943359375, 0.97637939453125, 1.073516845703125, 1.170654296875, 1.267791748046875, 1.36492919921875, 1.462066650390625, 1.5592041015625, 1.656341552734375, 1.75347900390625, 1.850616455078125, 1.94775390625, 2.044891357421875, 2.14202880859375, 2.239166259765625, 2.3363037109375, 2.433441162109375, 2.53057861328125, 2.627716064453125, 2.724853515625, 2.821990966796875, 2.91912841796875, 3.016265869140625, 3.1134033203125, 3.210540771484375, 3.30767822265625, 3.404815673828125, 3.501953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 11.0, 21.0, 19.0, 20.0, 49.0, 66.0, 102.0, 256.0, 387.0, 670.0, 1250.0, 2367.0, 4601.0, 9543.0, 20680.0, 48211.0, 121742.0, 389460.0, 2598060.0, 699974.0, 177450.0, 66995.0, 27795.0, 12508.0, 5726.0, 2896.0, 1482.0, 843.0, 433.0, 257.0, 152.0, 103.0, 49.0, 35.0, 23.0, 19.0, 7.0, 14.0, 3.0, 1.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.18310546875, -21.4599609375, -20.73681640625, -20.013671875, -19.29052734375, -18.5673828125, -17.84423828125, -17.12109375, -16.39794921875, -15.6748046875, -14.95166015625, -14.228515625, -13.50537109375, -12.7822265625, -12.05908203125, -11.3359375, -10.61279296875, -9.8896484375, -9.16650390625, -8.443359375, -7.72021484375, -6.9970703125, -6.27392578125, -5.55078125, -4.82763671875, -4.1044921875, -3.38134765625, -2.658203125, -1.93505859375, -1.2119140625, -0.48876953125, 0.234375, 0.95751953125, 1.6806640625, 2.40380859375, 3.126953125, 3.85009765625, 4.5732421875, 5.29638671875, 6.01953125, 6.74267578125, 7.4658203125, 8.18896484375, 8.912109375, 9.63525390625, 10.3583984375, 11.08154296875, 11.8046875, 12.52783203125, 13.2509765625, 13.97412109375, 14.697265625, 15.42041015625, 16.1435546875, 16.86669921875, 17.58984375, 18.31298828125, 19.0361328125, 19.75927734375, 20.482421875, 21.20556640625, 21.9287109375, 22.65185546875, 23.375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 9.0, 13.0, 13.0, 19.0, 29.0, 26.0, 31.0, 43.0, 50.0, 62.0, 80.0, 85.0, 100.0, 144.0, 182.0, 270.0, 489.0, 902.0, 387.0, 241.0, 174.0, 144.0, 93.0, 92.0, 74.0, 68.0, 54.0, 43.0, 52.0, 28.0, 17.0, 11.0, 15.0, 14.0, 4.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.353515625, -6.13671875, -5.919921875, -5.703125, -5.486328125, -5.26953125, -5.052734375, -4.8359375, -4.619140625, -4.40234375, -4.185546875, -3.96875, -3.751953125, -3.53515625, -3.318359375, -3.1015625, -2.884765625, -2.66796875, -2.451171875, -2.234375, -2.017578125, -1.80078125, -1.583984375, -1.3671875, -1.150390625, -0.93359375, -0.716796875, -0.5, -0.283203125, -0.06640625, 0.150390625, 0.3671875, 0.583984375, 0.80078125, 1.017578125, 1.234375, 1.451171875, 1.66796875, 1.884765625, 2.1015625, 2.318359375, 2.53515625, 2.751953125, 2.96875, 3.185546875, 3.40234375, 3.619140625, 3.8359375, 4.052734375, 4.26953125, 4.486328125, 4.703125, 4.919921875, 5.13671875, 5.353515625, 5.5703125, 5.787109375, 6.00390625, 6.220703125, 6.4375, 6.654296875, 6.87109375, 7.087890625, 7.3046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 20.0, 36.0, 56.0, 100.0, 157.0, 213.0, 152.0, 111.0, 51.0, 42.0, 18.0, 9.0, 9.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.82499694824219, -104.59039306640625, -101.35578155517578, -98.12117767333984, -94.88656616210938, -91.65196228027344, -88.4173583984375, -85.18275451660156, -81.9481430053711, -78.71353912353516, -75.47892761230469, -72.24432373046875, -69.00971984863281, -65.77510833740234, -62.540504455566406, -59.3058967590332, -56.0712890625, -52.8366813659668, -49.602073669433594, -46.367469787597656, -43.13286209106445, -39.89825439453125, -36.66365051269531, -33.42904281616211, -30.194435119628906, -26.959827423095703, -23.725221633911133, -20.490615844726562, -17.25600814819336, -14.021400451660156, -10.786794662475586, -7.552188873291016, -4.3175811767578125, -1.0829744338989258, 2.151632308959961, 5.386239051818848, 8.620845794677734, 11.855453491210938, 15.090059280395508, 18.324665069580078, 21.55927276611328, 24.793880462646484, 28.028486251831055, 31.263092041015625, 34.49769973754883, 37.73230743408203, 40.96691131591797, 44.20151901245117, 47.436126708984375, 50.67073440551758, 53.90534210205078, 57.13994598388672, 60.37455368041992, 63.609161376953125, 66.84376525878906, 70.078369140625, 73.31298065185547, 76.5475845336914, 79.78219604492188, 83.01679992675781, 86.25140380859375, 89.48601531982422, 92.72061920166016, 95.95523071289062, 99.18983459472656]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 13.0, 8.0, 15.0, 18.0, 11.0, 25.0, 29.0, 26.0, 36.0, 41.0, 45.0, 40.0, 50.0, 44.0, 58.0, 54.0, 60.0, 54.0, 46.0, 63.0, 50.0, 33.0, 33.0, 29.0, 25.0, 11.0, 15.0, 17.0, 12.0, 6.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.41141128540039, -38.95561218261719, -37.499813079833984, -36.04401397705078, -34.58821487426758, -33.132415771484375, -31.676616668701172, -30.22081756591797, -28.765018463134766, -27.309219360351562, -25.85342025756836, -24.397621154785156, -22.941822052001953, -21.48602294921875, -20.030223846435547, -18.574424743652344, -17.11862564086914, -15.662826538085938, -14.207027435302734, -12.751228332519531, -11.295429229736328, -9.839630126953125, -8.383831024169922, -6.928031921386719, -5.472232818603516, -4.0164337158203125, -2.5606346130371094, -1.1048355102539062, 0.3509635925292969, 1.8067626953125, 3.262561798095703, 4.718360900878906, 6.174163818359375, 7.629962921142578, 9.085762023925781, 10.541561126708984, 11.997360229492188, 13.45315933227539, 14.908958435058594, 16.364757537841797, 17.820556640625, 19.276355743408203, 20.732154846191406, 22.18795394897461, 23.643753051757812, 25.099552154541016, 26.55535125732422, 28.011150360107422, 29.466949462890625, 30.922748565673828, 32.37854766845703, 33.834346771240234, 35.29014587402344, 36.74594497680664, 38.201744079589844, 39.65754318237305, 41.11334228515625, 42.56914138793945, 44.024940490722656, 45.48073959350586, 46.93653869628906, 48.392337799072266, 49.84813690185547, 51.30393600463867, 52.759735107421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 8.0, 9.0, 17.0, 19.0, 20.0, 37.0, 47.0, 68.0, 88.0, 109.0, 172.0, 238.0, 340.0, 538.0, 817.0, 1243.0, 2010.0, 3153.0, 5321.0, 9482.0, 17515.0, 34945.0, 74938.0, 206868.0, 435783.0, 137241.0, 56600.0, 27080.0, 14057.0, 7682.0, 4527.0, 2677.0, 1634.0, 1068.0, 682.0, 465.0, 312.0, 208.0, 146.0, 117.0, 65.0, 56.0, 51.0, 26.0, 22.0, 14.0, 14.0, 6.0, 4.0, 12.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.29931640625, -11.8798828125, -11.46044921875, -11.041015625, -10.62158203125, -10.2021484375, -9.78271484375, -9.36328125, -8.94384765625, -8.5244140625, -8.10498046875, -7.685546875, -7.26611328125, -6.8466796875, -6.42724609375, -6.0078125, -5.58837890625, -5.1689453125, -4.74951171875, -4.330078125, -3.91064453125, -3.4912109375, -3.07177734375, -2.65234375, -2.23291015625, -1.8134765625, -1.39404296875, -0.974609375, -0.55517578125, -0.1357421875, 0.28369140625, 0.703125, 1.12255859375, 1.5419921875, 1.96142578125, 2.380859375, 2.80029296875, 3.2197265625, 3.63916015625, 4.05859375, 4.47802734375, 4.8974609375, 5.31689453125, 5.736328125, 6.15576171875, 6.5751953125, 6.99462890625, 7.4140625, 7.83349609375, 8.2529296875, 8.67236328125, 9.091796875, 9.51123046875, 9.9306640625, 10.35009765625, 10.76953125, 11.18896484375, 11.6083984375, 12.02783203125, 12.447265625, 12.86669921875, 13.2861328125, 13.70556640625, 14.125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 11.0, 10.0, 13.0, 11.0, 30.0, 22.0, 33.0, 49.0, 32.0, 39.0, 68.0, 53.0, 63.0, 65.0, 74.0, 74.0, 59.0, 40.0, 54.0, 37.0, 29.0, 22.0, 23.0, 26.0, 7.0, 6.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.053375244140625, -2.94659423828125, -2.839813232421875, -2.7330322265625, -2.626251220703125, -2.51947021484375, -2.412689208984375, -2.305908203125, -2.199127197265625, -2.09234619140625, -1.985565185546875, -1.8787841796875, -1.772003173828125, -1.66522216796875, -1.558441162109375, -1.45166015625, -1.344879150390625, -1.23809814453125, -1.131317138671875, -1.0245361328125, -0.917755126953125, -0.81097412109375, -0.704193115234375, -0.597412109375, -0.490631103515625, -0.38385009765625, -0.277069091796875, -0.1702880859375, -0.063507080078125, 0.04327392578125, 0.150054931640625, 0.2568359375, 0.363616943359375, 0.47039794921875, 0.577178955078125, 0.6839599609375, 0.790740966796875, 0.89752197265625, 1.004302978515625, 1.111083984375, 1.217864990234375, 1.32464599609375, 1.431427001953125, 1.5382080078125, 1.644989013671875, 1.75177001953125, 1.858551025390625, 1.96533203125, 2.072113037109375, 2.17889404296875, 2.285675048828125, 2.3924560546875, 2.499237060546875, 2.60601806640625, 2.712799072265625, 2.819580078125, 2.926361083984375, 3.03314208984375, 3.139923095703125, 3.2467041015625, 3.353485107421875, 3.46026611328125, 3.567047119140625, 3.673828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 11.0, 13.0, 21.0, 20.0, 23.0, 36.0, 64.0, 83.0, 156.0, 297.0, 728.0, 1693.0, 5409.0, 22065.0, 161376.0, 763423.0, 74016.0, 13141.0, 3522.0, 1315.0, 499.0, 243.0, 126.0, 85.0, 49.0, 41.0, 18.0, 18.0, 11.0, 11.0, 8.0, 3.0, 6.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-31.34375, -30.374267578125, -29.40478515625, -28.435302734375, -27.4658203125, -26.496337890625, -25.52685546875, -24.557373046875, -23.587890625, -22.618408203125, -21.64892578125, -20.679443359375, -19.7099609375, -18.740478515625, -17.77099609375, -16.801513671875, -15.83203125, -14.862548828125, -13.89306640625, -12.923583984375, -11.9541015625, -10.984619140625, -10.01513671875, -9.045654296875, -8.076171875, -7.106689453125, -6.13720703125, -5.167724609375, -4.1982421875, -3.228759765625, -2.25927734375, -1.289794921875, -0.3203125, 0.649169921875, 1.61865234375, 2.588134765625, 3.5576171875, 4.527099609375, 5.49658203125, 6.466064453125, 7.435546875, 8.405029296875, 9.37451171875, 10.343994140625, 11.3134765625, 12.282958984375, 13.25244140625, 14.221923828125, 15.19140625, 16.160888671875, 17.13037109375, 18.099853515625, 19.0693359375, 20.038818359375, 21.00830078125, 21.977783203125, 22.947265625, 23.916748046875, 24.88623046875, 25.855712890625, 26.8251953125, 27.794677734375, 28.76416015625, 29.733642578125, 30.703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 6.0, 3.0, 10.0, 13.0, 6.0, 9.0, 16.0, 13.0, 12.0, 17.0, 25.0, 20.0, 19.0, 37.0, 24.0, 31.0, 46.0, 45.0, 46.0, 35.0, 44.0, 43.0, 36.0, 46.0, 40.0, 44.0, 40.0, 30.0, 34.0, 22.0, 24.0, 21.0, 22.0, 26.0, 21.0, 12.0, 13.0, 10.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3203125, -10.96435546875, -10.6083984375, -10.25244140625, -9.896484375, -9.54052734375, -9.1845703125, -8.82861328125, -8.47265625, -8.11669921875, -7.7607421875, -7.40478515625, -7.048828125, -6.69287109375, -6.3369140625, -5.98095703125, -5.625, -5.26904296875, -4.9130859375, -4.55712890625, -4.201171875, -3.84521484375, -3.4892578125, -3.13330078125, -2.77734375, -2.42138671875, -2.0654296875, -1.70947265625, -1.353515625, -0.99755859375, -0.6416015625, -0.28564453125, 0.0703125, 0.42626953125, 0.7822265625, 1.13818359375, 1.494140625, 1.85009765625, 2.2060546875, 2.56201171875, 2.91796875, 3.27392578125, 3.6298828125, 3.98583984375, 4.341796875, 4.69775390625, 5.0537109375, 5.40966796875, 5.765625, 6.12158203125, 6.4775390625, 6.83349609375, 7.189453125, 7.54541015625, 7.9013671875, 8.25732421875, 8.61328125, 8.96923828125, 9.3251953125, 9.68115234375, 10.037109375, 10.39306640625, 10.7490234375, 11.10498046875, 11.4609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 10.0, 9.0, 22.0, 30.0, 38.0, 91.0, 132.0, 326.0, 786.0, 2562.0, 15816.0, 771468.0, 244392.0, 9695.0, 1934.0, 625.0, 276.0, 124.0, 78.0, 43.0, 28.0, 19.0, 11.0, 15.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.27734375, -39.7421875, -38.20703125, -36.671875, -35.13671875, -33.6015625, -32.06640625, -30.53125, -28.99609375, -27.4609375, -25.92578125, -24.390625, -22.85546875, -21.3203125, -19.78515625, -18.25, -16.71484375, -15.1796875, -13.64453125, -12.109375, -10.57421875, -9.0390625, -7.50390625, -5.96875, -4.43359375, -2.8984375, -1.36328125, 0.171875, 1.70703125, 3.2421875, 4.77734375, 6.3125, 7.84765625, 9.3828125, 10.91796875, 12.453125, 13.98828125, 15.5234375, 17.05859375, 18.59375, 20.12890625, 21.6640625, 23.19921875, 24.734375, 26.26953125, 27.8046875, 29.33984375, 30.875, 32.41015625, 33.9453125, 35.48046875, 37.015625, 38.55078125, 40.0859375, 41.62109375, 43.15625, 44.69140625, 46.2265625, 47.76171875, 49.296875, 50.83203125, 52.3671875, 53.90234375, 55.4375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 5.0, 15.0, 9.0, 5.0, 17.0, 18.0, 28.0, 42.0, 30.0, 54.0, 70.0, 64.0, 88.0, 84.0, 81.0, 73.0, 50.0, 69.0, 32.0, 30.0, 23.0, 23.0, 11.0, 8.0, 10.0, 3.0, 6.0, 10.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008544921875, -0.0008272528648376465, -0.000800013542175293, -0.0007727742195129395, -0.0007455348968505859, -0.0007182955741882324, -0.0006910562515258789, -0.0006638169288635254, -0.0006365776062011719, -0.0006093382835388184, -0.0005820989608764648, -0.0005548596382141113, -0.0005276203155517578, -0.0005003809928894043, -0.0004731416702270508, -0.00044590234756469727, -0.00041866302490234375, -0.00039142370223999023, -0.0003641843795776367, -0.0003369450569152832, -0.0003097057342529297, -0.00028246641159057617, -0.00025522708892822266, -0.00022798776626586914, -0.00020074844360351562, -0.0001735091209411621, -0.0001462697982788086, -0.00011903047561645508, -9.179115295410156e-05, -6.455183029174805e-05, -3.731250762939453e-05, -1.0073184967041016e-05, 1.71661376953125e-05, 4.4405460357666016e-05, 7.164478302001953e-05, 9.888410568237305e-05, 0.00012612342834472656, 0.00015336275100708008, 0.0001806020736694336, 0.0002078413963317871, 0.00023508071899414062, 0.00026232004165649414, 0.00028955936431884766, 0.00031679868698120117, 0.0003440380096435547, 0.0003712773323059082, 0.0003985166549682617, 0.00042575597763061523, 0.00045299530029296875, 0.00048023462295532227, 0.0005074739456176758, 0.0005347132682800293, 0.0005619525909423828, 0.0005891919136047363, 0.0006164312362670898, 0.0006436705589294434, 0.0006709098815917969, 0.0006981492042541504, 0.0007253885269165039, 0.0007526278495788574, 0.0007798671722412109, 0.0008071064949035645, 0.000834345817565918, 0.0008615851402282715, 0.000888824462890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 13.0, 17.0, 25.0, 22.0, 41.0, 52.0, 78.0, 130.0, 198.0, 310.0, 487.0, 807.0, 1364.0, 2474.0, 4792.0, 10393.0, 26000.0, 87835.0, 505057.0, 310596.0, 60742.0, 19642.0, 8292.0, 3913.0, 2083.0, 1214.0, 738.0, 421.0, 264.0, 166.0, 121.0, 72.0, 61.0, 39.0, 27.0, 15.0, 13.0, 7.0, 10.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.234375, -15.7550048828125, -15.275634765625, -14.7962646484375, -14.31689453125, -13.8375244140625, -13.358154296875, -12.8787841796875, -12.3994140625, -11.9200439453125, -11.440673828125, -10.9613037109375, -10.48193359375, -10.0025634765625, -9.523193359375, -9.0438232421875, -8.564453125, -8.0850830078125, -7.605712890625, -7.1263427734375, -6.64697265625, -6.1676025390625, -5.688232421875, -5.2088623046875, -4.7294921875, -4.2501220703125, -3.770751953125, -3.2913818359375, -2.81201171875, -2.3326416015625, -1.853271484375, -1.3739013671875, -0.89453125, -0.4151611328125, 0.064208984375, 0.5435791015625, 1.02294921875, 1.5023193359375, 1.981689453125, 2.4610595703125, 2.9404296875, 3.4197998046875, 3.899169921875, 4.3785400390625, 4.85791015625, 5.3372802734375, 5.816650390625, 6.2960205078125, 6.775390625, 7.2547607421875, 7.734130859375, 8.2135009765625, 8.69287109375, 9.1722412109375, 9.651611328125, 10.1309814453125, 10.6103515625, 11.0897216796875, 11.569091796875, 12.0484619140625, 12.52783203125, 13.0072021484375, 13.486572265625, 13.9659423828125, 14.4453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 5.0, 2.0, 7.0, 10.0, 12.0, 10.0, 13.0, 20.0, 21.0, 27.0, 38.0, 36.0, 42.0, 50.0, 43.0, 60.0, 68.0, 64.0, 64.0, 63.0, 52.0, 55.0, 47.0, 28.0, 30.0, 21.0, 11.0, 18.0, 8.0, 9.0, 12.0, 9.0, 8.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.76953125, -7.52935791015625, -7.2891845703125, -7.04901123046875, -6.808837890625, -6.56866455078125, -6.3284912109375, -6.08831787109375, -5.84814453125, -5.60797119140625, -5.3677978515625, -5.12762451171875, -4.887451171875, -4.64727783203125, -4.4071044921875, -4.16693115234375, -3.9267578125, -3.68658447265625, -3.4464111328125, -3.20623779296875, -2.966064453125, -2.72589111328125, -2.4857177734375, -2.24554443359375, -2.00537109375, -1.76519775390625, -1.5250244140625, -1.28485107421875, -1.044677734375, -0.80450439453125, -0.5643310546875, -0.32415771484375, -0.083984375, 0.15618896484375, 0.3963623046875, 0.63653564453125, 0.876708984375, 1.11688232421875, 1.3570556640625, 1.59722900390625, 1.83740234375, 2.07757568359375, 2.3177490234375, 2.55792236328125, 2.798095703125, 3.03826904296875, 3.2784423828125, 3.51861572265625, 3.7587890625, 3.99896240234375, 4.2391357421875, 4.47930908203125, 4.719482421875, 4.95965576171875, 5.1998291015625, 5.44000244140625, 5.68017578125, 5.92034912109375, 6.1605224609375, 6.40069580078125, 6.640869140625, 6.88104248046875, 7.1212158203125, 7.36138916015625, 7.6015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 9.0, 8.0, 9.0, 18.0, 35.0, 57.0, 137.0, 234.0, 227.0, 136.0, 61.0, 26.0, 17.0, 14.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.1457824707031, -249.74057006835938, -243.33535766601562, -236.93014526367188, -230.52491760253906, -224.1197052001953, -217.71449279785156, -211.3092803955078, -204.904052734375, -198.49884033203125, -192.0936279296875, -185.68841552734375, -179.28318786621094, -172.8779754638672, -166.47276306152344, -160.0675506591797, -153.66233825683594, -147.2571258544922, -140.85191345214844, -134.44668579101562, -128.04147338867188, -121.63626098632812, -115.23104858398438, -108.82583618164062, -102.42061614990234, -96.0154037475586, -89.61018371582031, -83.20497131347656, -76.79975891113281, -70.39453887939453, -63.98932647705078, -57.584110260009766, -51.17890930175781, -44.7736930847168, -38.36847686767578, -31.96326446533203, -25.558048248291016, -19.15283203125, -12.74761962890625, -6.342403411865234, 0.06281280517578125, 6.4680280685424805, 12.87324333190918, 19.278457641601562, 25.683673858642578, 32.088890075683594, 38.494102478027344, 44.89931869506836, 51.304534912109375, 57.70975112915039, 64.1149673461914, 70.52017974853516, 76.92539978027344, 83.33061218261719, 89.73582458496094, 96.14103698730469, 102.54625701904297, 108.95146942138672, 115.356689453125, 121.76190185546875, 128.1671142578125, 134.57232666015625, 140.9775390625, 147.3827667236328, 153.78797912597656]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 9.0, 4.0, 9.0, 10.0, 12.0, 32.0, 42.0, 74.0, 88.0, 110.0, 137.0, 127.0, 99.0, 73.0, 48.0, 38.0, 16.0, 15.0, 5.0, 6.0, 5.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-273.7947692871094, -266.71441650390625, -259.6340637207031, -252.55369567871094, -245.47332763671875, -238.39297485351562, -231.31260681152344, -224.2322540283203, -217.15188598632812, -210.071533203125, -202.9911651611328, -195.9108123779297, -188.8304443359375, -181.75009155273438, -174.6697235107422, -167.58937072753906, -160.50900268554688, -153.42864990234375, -146.34828186035156, -139.26792907714844, -132.18756103515625, -125.10720825195312, -118.02684020996094, -110.94648742675781, -103.86613464355469, -96.78577423095703, -89.70541381835938, -82.62505340576172, -75.54469299316406, -68.46434020996094, -61.383975982666016, -54.30361557006836, -47.22325134277344, -40.14289093017578, -33.062530517578125, -25.9821720123291, -18.901811599731445, -11.821453094482422, -4.741092681884766, 2.3392677307128906, 9.419628143310547, 16.499988555908203, 23.58034896850586, 30.660707473754883, 37.741065979003906, 44.82142639160156, 51.90178680419922, 58.982147216796875, 66.06250762939453, 73.14286804199219, 80.22322845458984, 87.3035888671875, 94.38394927978516, 101.46430969238281, 108.54466247558594, 115.62503051757812, 122.70538330078125, 129.78573608398438, 136.86610412597656, 143.9464569091797, 151.02682495117188, 158.107177734375, 165.1875457763672, 172.2678985595703, 179.3482666015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 18.0, 12.0, 16.0, 38.0, 46.0, 58.0, 95.0, 153.0, 252.0, 461.0, 793.0, 1527.0, 3276.0, 7821.0, 22855.0, 97458.0, 3759496.0, 241640.0, 36912.0, 11739.0, 4654.0, 2159.0, 1094.0, 641.0, 351.0, 210.0, 164.0, 105.0, 70.0, 43.0, 27.0, 18.0, 16.0, 18.0, 9.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-72.0625, -69.71484375, -67.3671875, -65.01953125, -62.671875, -60.32421875, -57.9765625, -55.62890625, -53.28125, -50.93359375, -48.5859375, -46.23828125, -43.890625, -41.54296875, -39.1953125, -36.84765625, -34.5, -32.15234375, -29.8046875, -27.45703125, -25.109375, -22.76171875, -20.4140625, -18.06640625, -15.71875, -13.37109375, -11.0234375, -8.67578125, -6.328125, -3.98046875, -1.6328125, 0.71484375, 3.0625, 5.41015625, 7.7578125, 10.10546875, 12.453125, 14.80078125, 17.1484375, 19.49609375, 21.84375, 24.19140625, 26.5390625, 28.88671875, 31.234375, 33.58203125, 35.9296875, 38.27734375, 40.625, 42.97265625, 45.3203125, 47.66796875, 50.015625, 52.36328125, 54.7109375, 57.05859375, 59.40625, 61.75390625, 64.1015625, 66.44921875, 68.796875, 71.14453125, 73.4921875, 75.83984375, 78.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 10.0, 8.0, 5.0, 10.0, 16.0, 14.0, 20.0, 33.0, 42.0, 29.0, 38.0, 50.0, 48.0, 56.0, 64.0, 52.0, 68.0, 67.0, 61.0, 37.0, 48.0, 30.0, 32.0, 31.0, 25.0, 18.0, 11.0, 17.0, 7.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.01953125, -2.920623779296875, -2.82171630859375, -2.722808837890625, -2.6239013671875, -2.524993896484375, -2.42608642578125, -2.327178955078125, -2.228271484375, -2.129364013671875, -2.03045654296875, -1.931549072265625, -1.8326416015625, -1.733734130859375, -1.63482666015625, -1.535919189453125, -1.43701171875, -1.338104248046875, -1.23919677734375, -1.140289306640625, -1.0413818359375, -0.942474365234375, -0.84356689453125, -0.744659423828125, -0.645751953125, -0.546844482421875, -0.44793701171875, -0.349029541015625, -0.2501220703125, -0.151214599609375, -0.05230712890625, 0.046600341796875, 0.1455078125, 0.244415283203125, 0.34332275390625, 0.442230224609375, 0.5411376953125, 0.640045166015625, 0.73895263671875, 0.837860107421875, 0.936767578125, 1.035675048828125, 1.13458251953125, 1.233489990234375, 1.3323974609375, 1.431304931640625, 1.53021240234375, 1.629119873046875, 1.72802734375, 1.826934814453125, 1.92584228515625, 2.024749755859375, 2.1236572265625, 2.222564697265625, 2.32147216796875, 2.420379638671875, 2.519287109375, 2.618194580078125, 2.71710205078125, 2.816009521484375, 2.9149169921875, 3.013824462890625, 3.11273193359375, 3.211639404296875, 3.310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 9.0, 12.0, 7.0, 27.0, 42.0, 55.0, 81.0, 139.0, 205.0, 344.0, 502.0, 829.0, 1393.0, 2390.0, 4198.0, 7750.0, 14968.0, 31671.0, 78155.0, 297245.0, 3331789.0, 282929.0, 76400.0, 30783.0, 14610.0, 7694.0, 4100.0, 2391.0, 1363.0, 812.0, 521.0, 327.0, 174.0, 122.0, 77.0, 61.0, 29.0, 25.0, 20.0, 9.0, 6.0, 8.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.03125, -33.84326171875, -32.6552734375, -31.46728515625, -30.279296875, -29.09130859375, -27.9033203125, -26.71533203125, -25.52734375, -24.33935546875, -23.1513671875, -21.96337890625, -20.775390625, -19.58740234375, -18.3994140625, -17.21142578125, -16.0234375, -14.83544921875, -13.6474609375, -12.45947265625, -11.271484375, -10.08349609375, -8.8955078125, -7.70751953125, -6.51953125, -5.33154296875, -4.1435546875, -2.95556640625, -1.767578125, -0.57958984375, 0.6083984375, 1.79638671875, 2.984375, 4.17236328125, 5.3603515625, 6.54833984375, 7.736328125, 8.92431640625, 10.1123046875, 11.30029296875, 12.48828125, 13.67626953125, 14.8642578125, 16.05224609375, 17.240234375, 18.42822265625, 19.6162109375, 20.80419921875, 21.9921875, 23.18017578125, 24.3681640625, 25.55615234375, 26.744140625, 27.93212890625, 29.1201171875, 30.30810546875, 31.49609375, 32.68408203125, 33.8720703125, 35.06005859375, 36.248046875, 37.43603515625, 38.6240234375, 39.81201171875, 41.0]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 6.0, 3.0, 9.0, 8.0, 10.0, 22.0, 6.0, 11.0, 21.0, 30.0, 28.0, 50.0, 60.0, 77.0, 116.0, 188.0, 334.0, 2009.0, 411.0, 196.0, 111.0, 73.0, 43.0, 51.0, 39.0, 26.0, 20.0, 21.0, 21.0, 8.0, 9.0, 8.0, 11.0, 7.0, 5.0, 10.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.29412841796875, -5.1156005859375, -4.93707275390625, -4.758544921875, -4.58001708984375, -4.4014892578125, -4.22296142578125, -4.04443359375, -3.86590576171875, -3.6873779296875, -3.50885009765625, -3.330322265625, -3.15179443359375, -2.9732666015625, -2.79473876953125, -2.6162109375, -2.43768310546875, -2.2591552734375, -2.08062744140625, -1.902099609375, -1.72357177734375, -1.5450439453125, -1.36651611328125, -1.18798828125, -1.00946044921875, -0.8309326171875, -0.65240478515625, -0.473876953125, -0.29534912109375, -0.1168212890625, 0.06170654296875, 0.240234375, 0.41876220703125, 0.5972900390625, 0.77581787109375, 0.954345703125, 1.13287353515625, 1.3114013671875, 1.48992919921875, 1.66845703125, 1.84698486328125, 2.0255126953125, 2.20404052734375, 2.382568359375, 2.56109619140625, 2.7396240234375, 2.91815185546875, 3.0966796875, 3.27520751953125, 3.4537353515625, 3.63226318359375, 3.810791015625, 3.98931884765625, 4.1678466796875, 4.34637451171875, 4.52490234375, 4.70343017578125, 4.8819580078125, 5.06048583984375, 5.239013671875, 5.41754150390625, 5.5960693359375, 5.77459716796875, 5.953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 3.0, 12.0, 25.0, 50.0, 85.0, 130.0, 201.0, 201.0, 140.0, 70.0, 34.0, 22.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.876670837402344, -35.98329162597656, -34.08991241455078, -32.196533203125, -30.303150177001953, -28.409770965576172, -26.51639175415039, -24.62301254272461, -22.729631423950195, -20.836252212524414, -18.94287109375, -17.04949188232422, -15.156111717224121, -13.262731552124023, -11.369352340698242, -9.475972175598145, -7.582592010498047, -5.689211845397949, -3.7958321571350098, -1.9024524688720703, -0.009072303771972656, 1.884307861328125, 3.7776870727539062, 5.671067237854004, 7.564447402954102, 9.4578275680542, 11.351207733154297, 13.244586944580078, 15.137967109680176, 17.031347274780273, 18.924726486206055, 20.81810760498047, 22.71148681640625, 24.60486602783203, 26.498247146606445, 28.391626358032227, 30.28500747680664, 32.17838668823242, 34.0717658996582, 35.965145111083984, 37.85852813720703, 39.75190734863281, 41.645286560058594, 43.538665771484375, 45.43204879760742, 47.3254280090332, 49.218807220458984, 51.112186431884766, 53.00556564331055, 54.89894485473633, 56.79232406616211, 58.685707092285156, 60.57908630371094, 62.47246551513672, 64.3658447265625, 66.25922393798828, 68.15260314941406, 70.04598236083984, 71.93936157226562, 73.8327407836914, 75.72611999511719, 77.6195068359375, 79.51287841796875, 81.40626525878906, 83.29964447021484]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 6.0, 7.0, 11.0, 10.0, 11.0, 17.0, 18.0, 21.0, 36.0, 26.0, 30.0, 41.0, 36.0, 37.0, 46.0, 45.0, 55.0, 51.0, 42.0, 50.0, 40.0, 54.0, 40.0, 43.0, 27.0, 31.0, 31.0, 24.0, 20.0, 22.0, 18.0, 8.0, 6.0, 4.0, 3.0, 9.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.90411949157715, -18.21017837524414, -17.516237258911133, -16.822296142578125, -16.128353118896484, -15.434412956237793, -14.740470886230469, -14.046529769897461, -13.352588653564453, -12.658647537231445, -11.964706420898438, -11.270764350891113, -10.576823234558105, -9.882882118225098, -9.188940048217773, -8.494998931884766, -7.801057815551758, -7.10711669921875, -6.413175106048584, -5.719233512878418, -5.02529239654541, -4.331351280212402, -3.6374096870422363, -2.9434680938720703, -2.2495269775390625, -1.5555856227874756, -0.8616442680358887, -0.16770291328430176, 0.5262384414672852, 1.220179796218872, 1.914121150970459, 2.608062744140625, 3.302003860473633, 3.9959452152252197, 4.689886569976807, 5.383828163146973, 6.0777692794799805, 6.771710395812988, 7.465651988983154, 8.15959358215332, 8.853534698486328, 9.547475814819336, 10.241416931152344, 10.935359001159668, 11.629300117492676, 12.323241233825684, 13.017183303833008, 13.711124420166016, 14.405065536499023, 15.099006652832031, 15.792947769165039, 16.486888885498047, 17.180831909179688, 17.874773025512695, 18.568714141845703, 19.26265525817871, 19.95659637451172, 20.650537490844727, 21.344478607177734, 22.038419723510742, 22.73236083984375, 23.42630386352539, 24.1202449798584, 24.814186096191406, 25.508127212524414]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 9.0, 9.0, 9.0, 23.0, 14.0, 31.0, 61.0, 77.0, 98.0, 132.0, 243.0, 372.0, 639.0, 1041.0, 1825.0, 3468.0, 6497.0, 13271.0, 29266.0, 68498.0, 208904.0, 462752.0, 149587.0, 54525.0, 23738.0, 10975.0, 5549.0, 2899.0, 1535.0, 950.0, 546.0, 343.0, 243.0, 140.0, 99.0, 67.0, 34.0, 24.0, 17.0, 10.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.3125, -28.279296875, -27.24609375, -26.212890625, -25.1796875, -24.146484375, -23.11328125, -22.080078125, -21.046875, -20.013671875, -18.98046875, -17.947265625, -16.9140625, -15.880859375, -14.84765625, -13.814453125, -12.78125, -11.748046875, -10.71484375, -9.681640625, -8.6484375, -7.615234375, -6.58203125, -5.548828125, -4.515625, -3.482421875, -2.44921875, -1.416015625, -0.3828125, 0.650390625, 1.68359375, 2.716796875, 3.75, 4.783203125, 5.81640625, 6.849609375, 7.8828125, 8.916015625, 9.94921875, 10.982421875, 12.015625, 13.048828125, 14.08203125, 15.115234375, 16.1484375, 17.181640625, 18.21484375, 19.248046875, 20.28125, 21.314453125, 22.34765625, 23.380859375, 24.4140625, 25.447265625, 26.48046875, 27.513671875, 28.546875, 29.580078125, 30.61328125, 31.646484375, 32.6796875, 33.712890625, 34.74609375, 35.779296875, 36.8125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 6.0, 9.0, 5.0, 6.0, 6.0, 13.0, 13.0, 21.0, 22.0, 29.0, 28.0, 33.0, 39.0, 42.0, 32.0, 60.0, 59.0, 64.0, 67.0, 57.0, 52.0, 57.0, 47.0, 34.0, 25.0, 31.0, 24.0, 26.0, 20.0, 23.0, 8.0, 7.0, 12.0, 13.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.79296875, -2.693695068359375, -2.59442138671875, -2.495147705078125, -2.3958740234375, -2.296600341796875, -2.19732666015625, -2.098052978515625, -1.998779296875, -1.899505615234375, -1.80023193359375, -1.700958251953125, -1.6016845703125, -1.502410888671875, -1.40313720703125, -1.303863525390625, -1.20458984375, -1.105316162109375, -1.00604248046875, -0.906768798828125, -0.8074951171875, -0.708221435546875, -0.60894775390625, -0.509674072265625, -0.410400390625, -0.311126708984375, -0.21185302734375, -0.112579345703125, -0.0133056640625, 0.085968017578125, 0.18524169921875, 0.284515380859375, 0.3837890625, 0.483062744140625, 0.58233642578125, 0.681610107421875, 0.7808837890625, 0.880157470703125, 0.97943115234375, 1.078704833984375, 1.177978515625, 1.277252197265625, 1.37652587890625, 1.475799560546875, 1.5750732421875, 1.674346923828125, 1.77362060546875, 1.872894287109375, 1.97216796875, 2.071441650390625, 2.17071533203125, 2.269989013671875, 2.3692626953125, 2.468536376953125, 2.56781005859375, 2.667083740234375, 2.766357421875, 2.865631103515625, 2.96490478515625, 3.064178466796875, 3.1634521484375, 3.262725830078125, 3.36199951171875, 3.461273193359375, 3.560546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 11.0, 11.0, 20.0, 15.0, 36.0, 46.0, 66.0, 102.0, 131.0, 187.0, 299.0, 498.0, 860.0, 1506.0, 2996.0, 6423.0, 14908.0, 39402.0, 123822.0, 493835.0, 253832.0, 66643.0, 23659.0, 9687.0, 4401.0, 2153.0, 1158.0, 677.0, 386.0, 221.0, 164.0, 107.0, 75.0, 57.0, 46.0, 27.0, 29.0, 14.0, 9.0, 3.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-31.375, -30.4453125, -29.515625, -28.5859375, -27.65625, -26.7265625, -25.796875, -24.8671875, -23.9375, -23.0078125, -22.078125, -21.1484375, -20.21875, -19.2890625, -18.359375, -17.4296875, -16.5, -15.5703125, -14.640625, -13.7109375, -12.78125, -11.8515625, -10.921875, -9.9921875, -9.0625, -8.1328125, -7.203125, -6.2734375, -5.34375, -4.4140625, -3.484375, -2.5546875, -1.625, -0.6953125, 0.234375, 1.1640625, 2.09375, 3.0234375, 3.953125, 4.8828125, 5.8125, 6.7421875, 7.671875, 8.6015625, 9.53125, 10.4609375, 11.390625, 12.3203125, 13.25, 14.1796875, 15.109375, 16.0390625, 16.96875, 17.8984375, 18.828125, 19.7578125, 20.6875, 21.6171875, 22.546875, 23.4765625, 24.40625, 25.3359375, 26.265625, 27.1953125, 28.125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 7.0, 7.0, 10.0, 29.0, 22.0, 34.0, 48.0, 51.0, 43.0, 48.0, 55.0, 63.0, 59.0, 72.0, 69.0, 71.0, 53.0, 48.0, 41.0, 40.0, 20.0, 24.0, 24.0, 10.0, 9.0, 11.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.200439453125, -16.60400390625, -16.007568359375, -15.4111328125, -14.814697265625, -14.21826171875, -13.621826171875, -13.025390625, -12.428955078125, -11.83251953125, -11.236083984375, -10.6396484375, -10.043212890625, -9.44677734375, -8.850341796875, -8.25390625, -7.657470703125, -7.06103515625, -6.464599609375, -5.8681640625, -5.271728515625, -4.67529296875, -4.078857421875, -3.482421875, -2.885986328125, -2.28955078125, -1.693115234375, -1.0966796875, -0.500244140625, 0.09619140625, 0.692626953125, 1.2890625, 1.885498046875, 2.48193359375, 3.078369140625, 3.6748046875, 4.271240234375, 4.86767578125, 5.464111328125, 6.060546875, 6.656982421875, 7.25341796875, 7.849853515625, 8.4462890625, 9.042724609375, 9.63916015625, 10.235595703125, 10.83203125, 11.428466796875, 12.02490234375, 12.621337890625, 13.2177734375, 13.814208984375, 14.41064453125, 15.007080078125, 15.603515625, 16.199951171875, 16.79638671875, 17.392822265625, 17.9892578125, 18.585693359375, 19.18212890625, 19.778564453125, 20.375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 15.0, 21.0, 24.0, 44.0, 88.0, 160.0, 335.0, 830.0, 2244.0, 7429.0, 36664.0, 523613.0, 434304.0, 32318.0, 6910.0, 2114.0, 723.0, 353.0, 141.0, 81.0, 49.0, 32.0, 14.0, 13.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-59.40625, -57.919921875, -56.43359375, -54.947265625, -53.4609375, -51.974609375, -50.48828125, -49.001953125, -47.515625, -46.029296875, -44.54296875, -43.056640625, -41.5703125, -40.083984375, -38.59765625, -37.111328125, -35.625, -34.138671875, -32.65234375, -31.166015625, -29.6796875, -28.193359375, -26.70703125, -25.220703125, -23.734375, -22.248046875, -20.76171875, -19.275390625, -17.7890625, -16.302734375, -14.81640625, -13.330078125, -11.84375, -10.357421875, -8.87109375, -7.384765625, -5.8984375, -4.412109375, -2.92578125, -1.439453125, 0.046875, 1.533203125, 3.01953125, 4.505859375, 5.9921875, 7.478515625, 8.96484375, 10.451171875, 11.9375, 13.423828125, 14.91015625, 16.396484375, 17.8828125, 19.369140625, 20.85546875, 22.341796875, 23.828125, 25.314453125, 26.80078125, 28.287109375, 29.7734375, 31.259765625, 32.74609375, 34.232421875, 35.71875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 10.0, 11.0, 11.0, 24.0, 22.0, 42.0, 65.0, 93.0, 134.0, 145.0, 148.0, 90.0, 52.0, 32.0, 23.0, 17.0, 13.0, 12.0, 11.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031375885009765625, -0.003019005060195923, -0.002900421619415283, -0.0027818381786346436, -0.002663254737854004, -0.0025446712970733643, -0.0024260878562927246, -0.002307504415512085, -0.0021889209747314453, -0.0020703375339508057, -0.001951754093170166, -0.0018331706523895264, -0.0017145872116088867, -0.001596003770828247, -0.0014774203300476074, -0.0013588368892669678, -0.0012402534484863281, -0.0011216700077056885, -0.0010030865669250488, -0.0008845031261444092, -0.0007659196853637695, -0.0006473362445831299, -0.0005287528038024902, -0.0004101693630218506, -0.00029158592224121094, -0.0001730024814605713, -5.441904067993164e-05, 6.416440010070801e-05, 0.00018274784088134766, 0.0003013312816619873, 0.00041991472244262695, 0.0005384981632232666, 0.0006570816040039062, 0.0007756650447845459, 0.0008942484855651855, 0.0010128319263458252, 0.0011314153671264648, 0.0012499988079071045, 0.0013685822486877441, 0.0014871656894683838, 0.0016057491302490234, 0.001724332571029663, 0.0018429160118103027, 0.0019614994525909424, 0.002080082893371582, 0.0021986663341522217, 0.0023172497749328613, 0.002435833215713501, 0.0025544166564941406, 0.0026730000972747803, 0.00279158353805542, 0.0029101669788360596, 0.0030287504196166992, 0.003147333860397339, 0.0032659173011779785, 0.003384500741958618, 0.003503084182739258, 0.0036216676235198975, 0.003740251064300537, 0.0038588345050811768, 0.003977417945861816, 0.004096001386642456, 0.004214584827423096, 0.004333168268203735, 0.004451751708984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 18.0, 19.0, 32.0, 35.0, 72.0, 84.0, 153.0, 246.0, 443.0, 815.0, 1517.0, 3084.0, 6899.0, 18638.0, 65528.0, 362233.0, 468622.0, 83452.0, 21955.0, 7858.0, 3379.0, 1543.0, 802.0, 470.0, 235.0, 145.0, 95.0, 64.0, 36.0, 25.0, 11.0, 13.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.734375, -25.92626953125, -25.1181640625, -24.31005859375, -23.501953125, -22.69384765625, -21.8857421875, -21.07763671875, -20.26953125, -19.46142578125, -18.6533203125, -17.84521484375, -17.037109375, -16.22900390625, -15.4208984375, -14.61279296875, -13.8046875, -12.99658203125, -12.1884765625, -11.38037109375, -10.572265625, -9.76416015625, -8.9560546875, -8.14794921875, -7.33984375, -6.53173828125, -5.7236328125, -4.91552734375, -4.107421875, -3.29931640625, -2.4912109375, -1.68310546875, -0.875, -0.06689453125, 0.7412109375, 1.54931640625, 2.357421875, 3.16552734375, 3.9736328125, 4.78173828125, 5.58984375, 6.39794921875, 7.2060546875, 8.01416015625, 8.822265625, 9.63037109375, 10.4384765625, 11.24658203125, 12.0546875, 12.86279296875, 13.6708984375, 14.47900390625, 15.287109375, 16.09521484375, 16.9033203125, 17.71142578125, 18.51953125, 19.32763671875, 20.1357421875, 20.94384765625, 21.751953125, 22.56005859375, 23.3681640625, 24.17626953125, 24.984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 15.0, 15.0, 17.0, 20.0, 27.0, 30.0, 59.0, 56.0, 64.0, 74.0, 79.0, 73.0, 87.0, 74.0, 63.0, 49.0, 43.0, 27.0, 26.0, 20.0, 9.0, 19.0, 3.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6796875, -13.3135986328125, -12.947509765625, -12.5814208984375, -12.21533203125, -11.8492431640625, -11.483154296875, -11.1170654296875, -10.7509765625, -10.3848876953125, -10.018798828125, -9.6527099609375, -9.28662109375, -8.9205322265625, -8.554443359375, -8.1883544921875, -7.822265625, -7.4561767578125, -7.090087890625, -6.7239990234375, -6.35791015625, -5.9918212890625, -5.625732421875, -5.2596435546875, -4.8935546875, -4.5274658203125, -4.161376953125, -3.7952880859375, -3.42919921875, -3.0631103515625, -2.697021484375, -2.3309326171875, -1.96484375, -1.5987548828125, -1.232666015625, -0.8665771484375, -0.50048828125, -0.1343994140625, 0.231689453125, 0.5977783203125, 0.9638671875, 1.3299560546875, 1.696044921875, 2.0621337890625, 2.42822265625, 2.7943115234375, 3.160400390625, 3.5264892578125, 3.892578125, 4.2586669921875, 4.624755859375, 4.9908447265625, 5.35693359375, 5.7230224609375, 6.089111328125, 6.4552001953125, 6.8212890625, 7.1873779296875, 7.553466796875, 7.9195556640625, 8.28564453125, 8.6517333984375, 9.017822265625, 9.3839111328125, 9.75]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 12.0, 16.0, 21.0, 61.0, 130.0, 285.0, 246.0, 101.0, 61.0, 30.0, 14.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.111572265625, -253.68032836914062, -244.24908447265625, -234.81784057617188, -225.3865966796875, -215.95535278320312, -206.52410888671875, -197.09286499023438, -187.66162109375, -178.23037719726562, -168.79913330078125, -159.36788940429688, -149.9366455078125, -140.50540161132812, -131.07415771484375, -121.64290618896484, -112.21165466308594, -102.78041076660156, -93.34916687011719, -83.91792297363281, -74.48667907714844, -65.05543518066406, -55.624183654785156, -46.19293975830078, -36.761695861816406, -27.33045196533203, -17.899206161499023, -8.467960357666016, 0.9632835388183594, 10.394527435302734, 19.825775146484375, 29.25701904296875, 38.688262939453125, 48.1195068359375, 57.550750732421875, 66.98199462890625, 76.41323852539062, 85.844482421875, 95.2757339477539, 104.70697784423828, 114.13822174072266, 123.56946563720703, 133.00071716308594, 142.4319610595703, 151.8632049560547, 161.29444885253906, 170.72569274902344, 180.1569366455078, 189.5881805419922, 199.01942443847656, 208.45066833496094, 217.8819122314453, 227.3131561279297, 236.74440002441406, 246.1756591796875, 255.60690307617188, 265.03814697265625, 274.4693908691406, 283.900634765625, 293.3318786621094, 302.76312255859375, 312.1943664550781, 321.6256103515625, 331.0568542480469, 340.48809814453125]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 4.0, 11.0, 18.0, 18.0, 23.0, 40.0, 45.0, 44.0, 58.0, 64.0, 55.0, 65.0, 77.0, 69.0, 69.0, 49.0, 50.0, 50.0, 47.0, 32.0, 16.0, 16.0, 12.0, 14.0, 11.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-147.695556640625, -143.18995666503906, -138.68435668945312, -134.1787567138672, -129.67315673828125, -125.16755676269531, -120.66195678710938, -116.15635681152344, -111.6507568359375, -107.14515686035156, -102.63955688476562, -98.13395690917969, -93.62835693359375, -89.12275695800781, -84.61715698242188, -80.11155700683594, -75.60596466064453, -71.1003646850586, -66.59476470947266, -62.08916473388672, -57.58356475830078, -53.077964782714844, -48.57236862182617, -44.066768646240234, -39.5611686706543, -35.05556869506836, -30.549968719482422, -26.044370651245117, -21.53877067565918, -17.033170700073242, -12.527572631835938, -8.02197265625, -3.5163726806640625, 0.9892268180847168, 5.494826316833496, 10.000425338745117, 14.506025314331055, 19.011625289916992, 23.517223358154297, 28.022823333740234, 32.52842330932617, 37.03402328491211, 41.53962326049805, 46.04521942138672, 50.550819396972656, 55.056419372558594, 59.56201934814453, 64.06761932373047, 68.5732192993164, 73.07881927490234, 77.58441925048828, 82.09001922607422, 86.59561920166016, 91.1012191772461, 95.6068115234375, 100.11241149902344, 104.61801147460938, 109.12361145019531, 113.62921142578125, 118.13481140136719, 122.64041137695312, 127.14601135253906, 131.651611328125, 136.15721130371094, 140.66281127929688]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 2.0, 7.0, 8.0, 20.0, 24.0, 38.0, 57.0, 91.0, 170.0, 250.0, 417.0, 739.0, 1304.0, 2416.0, 4483.0, 8787.0, 18481.0, 45212.0, 161359.0, 3551847.0, 291888.0, 60603.0, 22537.0, 10469.0, 5368.0, 2867.0, 1713.0, 965.0, 636.0, 433.0, 295.0, 203.0, 144.0, 110.0, 61.0, 63.0, 54.0, 32.0, 26.0, 21.0, 13.0, 27.0, 7.0, 4.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-51.28125, -49.11279296875, -46.9443359375, -44.77587890625, -42.607421875, -40.43896484375, -38.2705078125, -36.10205078125, -33.93359375, -31.76513671875, -29.5966796875, -27.42822265625, -25.259765625, -23.09130859375, -20.9228515625, -18.75439453125, -16.5859375, -14.41748046875, -12.2490234375, -10.08056640625, -7.912109375, -5.74365234375, -3.5751953125, -1.40673828125, 0.76171875, 2.93017578125, 5.0986328125, 7.26708984375, 9.435546875, 11.60400390625, 13.7724609375, 15.94091796875, 18.109375, 20.27783203125, 22.4462890625, 24.61474609375, 26.783203125, 28.95166015625, 31.1201171875, 33.28857421875, 35.45703125, 37.62548828125, 39.7939453125, 41.96240234375, 44.130859375, 46.29931640625, 48.4677734375, 50.63623046875, 52.8046875, 54.97314453125, 57.1416015625, 59.31005859375, 61.478515625, 63.64697265625, 65.8154296875, 67.98388671875, 70.15234375, 72.32080078125, 74.4892578125, 76.65771484375, 78.826171875, 80.99462890625, 83.1630859375, 85.33154296875, 87.5]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 12.0, 14.0, 21.0, 20.0, 32.0, 48.0, 51.0, 56.0, 69.0, 83.0, 94.0, 90.0, 72.0, 81.0, 54.0, 52.0, 52.0, 32.0, 18.0, 18.0, 13.0, 7.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.5091552734375, -3.350341796875, -3.1915283203125, -3.03271484375, -2.8739013671875, -2.715087890625, -2.5562744140625, -2.3974609375, -2.2386474609375, -2.079833984375, -1.9210205078125, -1.76220703125, -1.6033935546875, -1.444580078125, -1.2857666015625, -1.126953125, -0.9681396484375, -0.809326171875, -0.6505126953125, -0.49169921875, -0.3328857421875, -0.174072265625, -0.0152587890625, 0.1435546875, 0.3023681640625, 0.461181640625, 0.6199951171875, 0.77880859375, 0.9376220703125, 1.096435546875, 1.2552490234375, 1.4140625, 1.5728759765625, 1.731689453125, 1.8905029296875, 2.04931640625, 2.2081298828125, 2.366943359375, 2.5257568359375, 2.6845703125, 2.8433837890625, 3.002197265625, 3.1610107421875, 3.31982421875, 3.4786376953125, 3.637451171875, 3.7962646484375, 3.955078125, 4.1138916015625, 4.272705078125, 4.4315185546875, 4.59033203125, 4.7491455078125, 4.907958984375, 5.0667724609375, 5.2255859375, 5.3843994140625, 5.543212890625, 5.7020263671875, 5.86083984375, 6.0196533203125, 6.178466796875, 6.3372802734375, 6.49609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 20.0, 23.0, 31.0, 50.0, 105.0, 189.0, 346.0, 897.0, 2348.0, 7774.0, 34785.0, 348887.0, 3681356.0, 94429.0, 16271.0, 4238.0, 1412.0, 525.0, 247.0, 123.0, 61.0, 42.0, 33.0, 13.0, 7.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.4375, -99.3427734375, -95.248046875, -91.1533203125, -87.05859375, -82.9638671875, -78.869140625, -74.7744140625, -70.6796875, -66.5849609375, -62.490234375, -58.3955078125, -54.30078125, -50.2060546875, -46.111328125, -42.0166015625, -37.921875, -33.8271484375, -29.732421875, -25.6376953125, -21.54296875, -17.4482421875, -13.353515625, -9.2587890625, -5.1640625, -1.0693359375, 3.025390625, 7.1201171875, 11.21484375, 15.3095703125, 19.404296875, 23.4990234375, 27.59375, 31.6884765625, 35.783203125, 39.8779296875, 43.97265625, 48.0673828125, 52.162109375, 56.2568359375, 60.3515625, 64.4462890625, 68.541015625, 72.6357421875, 76.73046875, 80.8251953125, 84.919921875, 89.0146484375, 93.109375, 97.2041015625, 101.298828125, 105.3935546875, 109.48828125, 113.5830078125, 117.677734375, 121.7724609375, 125.8671875, 129.9619140625, 134.056640625, 138.1513671875, 142.24609375, 146.3408203125, 150.435546875, 154.5302734375, 158.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 3.0, 8.0, 18.0, 15.0, 17.0, 22.0, 45.0, 38.0, 49.0, 84.0, 113.0, 185.0, 424.0, 1924.0, 469.0, 204.0, 125.0, 81.0, 54.0, 43.0, 30.0, 22.0, 20.0, 12.0, 14.0, 9.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.328125, -12.9730224609375, -12.617919921875, -12.2628173828125, -11.90771484375, -11.5526123046875, -11.197509765625, -10.8424072265625, -10.4873046875, -10.1322021484375, -9.777099609375, -9.4219970703125, -9.06689453125, -8.7117919921875, -8.356689453125, -8.0015869140625, -7.646484375, -7.2913818359375, -6.936279296875, -6.5811767578125, -6.22607421875, -5.8709716796875, -5.515869140625, -5.1607666015625, -4.8056640625, -4.4505615234375, -4.095458984375, -3.7403564453125, -3.38525390625, -3.0301513671875, -2.675048828125, -2.3199462890625, -1.96484375, -1.6097412109375, -1.254638671875, -0.8995361328125, -0.54443359375, -0.1893310546875, 0.165771484375, 0.5208740234375, 0.8759765625, 1.2310791015625, 1.586181640625, 1.9412841796875, 2.29638671875, 2.6514892578125, 3.006591796875, 3.3616943359375, 3.716796875, 4.0718994140625, 4.427001953125, 4.7821044921875, 5.13720703125, 5.4923095703125, 5.847412109375, 6.2025146484375, 6.5576171875, 6.9127197265625, 7.267822265625, 7.6229248046875, 7.97802734375, 8.3331298828125, 8.688232421875, 9.0433349609375, 9.3984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 11.0, 20.0, 34.0, 67.0, 128.0, 209.0, 225.0, 120.0, 70.0, 36.0, 22.0, 19.0, 15.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.61849594116211, -58.402278900146484, -55.186065673828125, -51.9698486328125, -48.753631591796875, -45.53741455078125, -42.32120132446289, -39.104984283447266, -35.888771057128906, -32.67255401611328, -29.45633888244629, -26.240123748779297, -23.023906707763672, -19.80769157409668, -16.591476440429688, -13.375259399414062, -10.159042358398438, -6.942826271057129, -3.7266106605529785, -0.5103950500488281, 2.7058210372924805, 5.922037124633789, 9.138252258300781, 12.354469299316406, 15.570684432983398, 18.78689956665039, 22.003116607666016, 25.219331741333008, 28.435546875, 31.651763916015625, 34.86798095703125, 38.084197998046875, 41.30040740966797, 44.516624450683594, 47.73283767700195, 50.94905471801758, 54.1652717590332, 57.38148498535156, 60.59770202636719, 63.81391906738281, 67.03013610839844, 70.24635314941406, 73.46257019042969, 76.67878723144531, 79.8949966430664, 83.11121368408203, 86.32743072509766, 89.54364776611328, 92.75985717773438, 95.97607421875, 99.19229125976562, 102.40850830078125, 105.62471771240234, 108.84093475341797, 112.0571517944336, 115.27336883544922, 118.48958587646484, 121.70580291748047, 124.9220199584961, 128.1382293701172, 131.3544464111328, 134.57066345214844, 137.78688049316406, 141.0030975341797, 144.2193145751953]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 9.0, 13.0, 13.0, 16.0, 26.0, 29.0, 40.0, 43.0, 49.0, 39.0, 46.0, 48.0, 45.0, 40.0, 59.0, 62.0, 43.0, 47.0, 48.0, 43.0, 39.0, 29.0, 37.0, 30.0, 20.0, 19.0, 13.0, 14.0, 11.0, 6.0, 2.0, 7.0, 2.0, 2.0], "bins": [-67.78295135498047, -66.23178100585938, -64.68061828613281, -63.12944793701172, -61.578277587890625, -60.02710723876953, -58.4759407043457, -56.924774169921875, -55.37360382080078, -53.82243347167969, -52.27126693725586, -50.72010040283203, -49.16893005371094, -47.617759704589844, -46.066593170166016, -44.51542663574219, -42.964256286621094, -41.4130859375, -39.86191940307617, -38.310752868652344, -36.75958251953125, -35.208412170410156, -33.65724563598633, -32.1060791015625, -30.554908752441406, -29.003740310668945, -27.452571868896484, -25.901403427124023, -24.350234985351562, -22.7990665435791, -21.24789810180664, -19.69672966003418, -18.14556121826172, -16.594392776489258, -15.043224334716797, -13.492055892944336, -11.940887451171875, -10.389719009399414, -8.838550567626953, -7.287382125854492, -5.736213684082031, -4.18504524230957, -2.6338768005371094, -1.0827083587646484, 0.4684600830078125, 2.0196285247802734, 3.5707969665527344, 5.121965408325195, 6.673133850097656, 8.224302291870117, 9.775470733642578, 11.326639175415039, 12.8778076171875, 14.428976058959961, 15.980144500732422, 17.531312942504883, 19.082481384277344, 20.633649826049805, 22.184818267822266, 23.735986709594727, 25.287155151367188, 26.83832359313965, 28.38949203491211, 29.94066047668457, 31.49182891845703]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 14.0, 22.0, 31.0, 46.0, 50.0, 79.0, 112.0, 170.0, 278.0, 434.0, 663.0, 1080.0, 1748.0, 2998.0, 4979.0, 8993.0, 17210.0, 33552.0, 69483.0, 157766.0, 333117.0, 225723.0, 95642.0, 44482.0, 22300.0, 11601.0, 6476.0, 3563.0, 2251.0, 1306.0, 822.0, 509.0, 339.0, 205.0, 136.0, 93.0, 69.0, 46.0, 36.0, 28.0, 19.0, 12.0, 14.0, 9.0, 4.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.32470703125, -29.3681640625, -28.41162109375, -27.455078125, -26.49853515625, -25.5419921875, -24.58544921875, -23.62890625, -22.67236328125, -21.7158203125, -20.75927734375, -19.802734375, -18.84619140625, -17.8896484375, -16.93310546875, -15.9765625, -15.02001953125, -14.0634765625, -13.10693359375, -12.150390625, -11.19384765625, -10.2373046875, -9.28076171875, -8.32421875, -7.36767578125, -6.4111328125, -5.45458984375, -4.498046875, -3.54150390625, -2.5849609375, -1.62841796875, -0.671875, 0.28466796875, 1.2412109375, 2.19775390625, 3.154296875, 4.11083984375, 5.0673828125, 6.02392578125, 6.98046875, 7.93701171875, 8.8935546875, 9.85009765625, 10.806640625, 11.76318359375, 12.7197265625, 13.67626953125, 14.6328125, 15.58935546875, 16.5458984375, 17.50244140625, 18.458984375, 19.41552734375, 20.3720703125, 21.32861328125, 22.28515625, 23.24169921875, 24.1982421875, 25.15478515625, 26.111328125, 27.06787109375, 28.0244140625, 28.98095703125, 29.9375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 6.0, 5.0, 19.0, 21.0, 26.0, 23.0, 38.0, 33.0, 39.0, 48.0, 45.0, 58.0, 54.0, 58.0, 45.0, 50.0, 51.0, 60.0, 54.0, 47.0, 36.0, 27.0, 31.0, 23.0, 19.0, 17.0, 13.0, 8.0, 11.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.568359375, -3.450469970703125, -3.33258056640625, -3.214691162109375, -3.0968017578125, -2.978912353515625, -2.86102294921875, -2.743133544921875, -2.625244140625, -2.507354736328125, -2.38946533203125, -2.271575927734375, -2.1536865234375, -2.035797119140625, -1.91790771484375, -1.800018310546875, -1.68212890625, -1.564239501953125, -1.44635009765625, -1.328460693359375, -1.2105712890625, -1.092681884765625, -0.97479248046875, -0.856903076171875, -0.739013671875, -0.621124267578125, -0.50323486328125, -0.385345458984375, -0.2674560546875, -0.149566650390625, -0.03167724609375, 0.086212158203125, 0.2041015625, 0.321990966796875, 0.43988037109375, 0.557769775390625, 0.6756591796875, 0.793548583984375, 0.91143798828125, 1.029327392578125, 1.147216796875, 1.265106201171875, 1.38299560546875, 1.500885009765625, 1.6187744140625, 1.736663818359375, 1.85455322265625, 1.972442626953125, 2.09033203125, 2.208221435546875, 2.32611083984375, 2.444000244140625, 2.5618896484375, 2.679779052734375, 2.79766845703125, 2.915557861328125, 3.033447265625, 3.151336669921875, 3.26922607421875, 3.387115478515625, 3.5050048828125, 3.622894287109375, 3.74078369140625, 3.858673095703125, 3.9765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 14.0, 34.0, 23.0, 35.0, 58.0, 79.0, 130.0, 199.0, 309.0, 569.0, 1181.0, 2152.0, 4854.0, 11649.0, 31397.0, 104597.0, 480432.0, 301607.0, 70087.0, 22683.0, 8738.0, 3729.0, 1815.0, 907.0, 438.0, 283.0, 182.0, 107.0, 75.0, 45.0, 33.0, 24.0, 24.0, 10.0, 10.0, 9.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-51.25, -49.58837890625, -47.9267578125, -46.26513671875, -44.603515625, -42.94189453125, -41.2802734375, -39.61865234375, -37.95703125, -36.29541015625, -34.6337890625, -32.97216796875, -31.310546875, -29.64892578125, -27.9873046875, -26.32568359375, -24.6640625, -23.00244140625, -21.3408203125, -19.67919921875, -18.017578125, -16.35595703125, -14.6943359375, -13.03271484375, -11.37109375, -9.70947265625, -8.0478515625, -6.38623046875, -4.724609375, -3.06298828125, -1.4013671875, 0.26025390625, 1.921875, 3.58349609375, 5.2451171875, 6.90673828125, 8.568359375, 10.22998046875, 11.8916015625, 13.55322265625, 15.21484375, 16.87646484375, 18.5380859375, 20.19970703125, 21.861328125, 23.52294921875, 25.1845703125, 26.84619140625, 28.5078125, 30.16943359375, 31.8310546875, 33.49267578125, 35.154296875, 36.81591796875, 38.4775390625, 40.13916015625, 41.80078125, 43.46240234375, 45.1240234375, 46.78564453125, 48.447265625, 50.10888671875, 51.7705078125, 53.43212890625, 55.09375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 15.0, 6.0, 11.0, 4.0, 16.0, 15.0, 25.0, 24.0, 23.0, 32.0, 41.0, 42.0, 45.0, 47.0, 49.0, 52.0, 54.0, 56.0, 44.0, 66.0, 41.0, 33.0, 40.0, 50.0, 27.0, 18.0, 22.0, 8.0, 14.0, 23.0, 11.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.46875, -21.705322265625, -20.94189453125, -20.178466796875, -19.4150390625, -18.651611328125, -17.88818359375, -17.124755859375, -16.361328125, -15.597900390625, -14.83447265625, -14.071044921875, -13.3076171875, -12.544189453125, -11.78076171875, -11.017333984375, -10.25390625, -9.490478515625, -8.72705078125, -7.963623046875, -7.2001953125, -6.436767578125, -5.67333984375, -4.909912109375, -4.146484375, -3.383056640625, -2.61962890625, -1.856201171875, -1.0927734375, -0.329345703125, 0.43408203125, 1.197509765625, 1.9609375, 2.724365234375, 3.48779296875, 4.251220703125, 5.0146484375, 5.778076171875, 6.54150390625, 7.304931640625, 8.068359375, 8.831787109375, 9.59521484375, 10.358642578125, 11.1220703125, 11.885498046875, 12.64892578125, 13.412353515625, 14.17578125, 14.939208984375, 15.70263671875, 16.466064453125, 17.2294921875, 17.992919921875, 18.75634765625, 19.519775390625, 20.283203125, 21.046630859375, 21.81005859375, 22.573486328125, 23.3369140625, 24.100341796875, 24.86376953125, 25.627197265625, 26.390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 16.0, 32.0, 35.0, 61.0, 90.0, 151.0, 257.0, 434.0, 879.0, 1670.0, 3308.0, 7394.0, 18929.0, 56520.0, 228179.0, 512420.0, 150862.0, 40918.0, 14502.0, 5977.0, 2804.0, 1420.0, 701.0, 382.0, 208.0, 124.0, 83.0, 53.0, 42.0, 24.0, 17.0, 11.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.5625, -26.65478515625, -25.7470703125, -24.83935546875, -23.931640625, -23.02392578125, -22.1162109375, -21.20849609375, -20.30078125, -19.39306640625, -18.4853515625, -17.57763671875, -16.669921875, -15.76220703125, -14.8544921875, -13.94677734375, -13.0390625, -12.13134765625, -11.2236328125, -10.31591796875, -9.408203125, -8.50048828125, -7.5927734375, -6.68505859375, -5.77734375, -4.86962890625, -3.9619140625, -3.05419921875, -2.146484375, -1.23876953125, -0.3310546875, 0.57666015625, 1.484375, 2.39208984375, 3.2998046875, 4.20751953125, 5.115234375, 6.02294921875, 6.9306640625, 7.83837890625, 8.74609375, 9.65380859375, 10.5615234375, 11.46923828125, 12.376953125, 13.28466796875, 14.1923828125, 15.10009765625, 16.0078125, 16.91552734375, 17.8232421875, 18.73095703125, 19.638671875, 20.54638671875, 21.4541015625, 22.36181640625, 23.26953125, 24.17724609375, 25.0849609375, 25.99267578125, 26.900390625, 27.80810546875, 28.7158203125, 29.62353515625, 30.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 17.0, 8.0, 20.0, 19.0, 31.0, 48.0, 79.0, 102.0, 122.0, 140.0, 113.0, 79.0, 45.0, 53.0, 24.0, 18.0, 14.0, 13.0, 7.0, 7.0, 7.0, 3.0, 7.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00626373291015625, -0.006099998950958252, -0.005936264991760254, -0.005772531032562256, -0.005608797073364258, -0.00544506311416626, -0.005281329154968262, -0.005117595195770264, -0.004953861236572266, -0.004790127277374268, -0.0046263933181762695, -0.0044626593589782715, -0.0042989253997802734, -0.004135191440582275, -0.003971457481384277, -0.0038077235221862793, -0.0036439895629882812, -0.003480255603790283, -0.003316521644592285, -0.003152787685394287, -0.002989053726196289, -0.002825319766998291, -0.002661585807800293, -0.002497851848602295, -0.002334117889404297, -0.002170383930206299, -0.0020066499710083008, -0.0018429160118103027, -0.0016791820526123047, -0.0015154480934143066, -0.0013517141342163086, -0.0011879801750183105, -0.0010242462158203125, -0.0008605122566223145, -0.0006967782974243164, -0.0005330443382263184, -0.0003693103790283203, -0.00020557641983032227, -4.184246063232422e-05, 0.00012189149856567383, 0.0002856254577636719, 0.0004493594169616699, 0.000613093376159668, 0.000776827335357666, 0.0009405612945556641, 0.0011042952537536621, 0.0012680292129516602, 0.0014317631721496582, 0.0015954971313476562, 0.0017592310905456543, 0.0019229650497436523, 0.0020866990089416504, 0.0022504329681396484, 0.0024141669273376465, 0.0025779008865356445, 0.0027416348457336426, 0.0029053688049316406, 0.0030691027641296387, 0.0032328367233276367, 0.0033965706825256348, 0.003560304641723633, 0.003724038600921631, 0.003887772560119629, 0.004051506519317627, 0.004215240478515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 7.0, 7.0, 8.0, 27.0, 22.0, 51.0, 52.0, 74.0, 88.0, 178.0, 258.0, 487.0, 922.0, 1789.0, 3825.0, 8999.0, 23856.0, 76512.0, 310262.0, 448964.0, 116729.0, 33715.0, 12092.0, 4969.0, 2208.0, 1015.0, 548.0, 337.0, 185.0, 117.0, 68.0, 55.0, 40.0, 20.0, 16.0, 13.0, 10.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.03125, -29.152099609375, -28.27294921875, -27.393798828125, -26.5146484375, -25.635498046875, -24.75634765625, -23.877197265625, -22.998046875, -22.118896484375, -21.23974609375, -20.360595703125, -19.4814453125, -18.602294921875, -17.72314453125, -16.843994140625, -15.96484375, -15.085693359375, -14.20654296875, -13.327392578125, -12.4482421875, -11.569091796875, -10.68994140625, -9.810791015625, -8.931640625, -8.052490234375, -7.17333984375, -6.294189453125, -5.4150390625, -4.535888671875, -3.65673828125, -2.777587890625, -1.8984375, -1.019287109375, -0.14013671875, 0.739013671875, 1.6181640625, 2.497314453125, 3.37646484375, 4.255615234375, 5.134765625, 6.013916015625, 6.89306640625, 7.772216796875, 8.6513671875, 9.530517578125, 10.40966796875, 11.288818359375, 12.16796875, 13.047119140625, 13.92626953125, 14.805419921875, 15.6845703125, 16.563720703125, 17.44287109375, 18.322021484375, 19.201171875, 20.080322265625, 20.95947265625, 21.838623046875, 22.7177734375, 23.596923828125, 24.47607421875, 25.355224609375, 26.234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 6.0, 7.0, 9.0, 9.0, 11.0, 26.0, 20.0, 20.0, 28.0, 38.0, 43.0, 57.0, 51.0, 52.0, 53.0, 62.0, 53.0, 39.0, 55.0, 49.0, 51.0, 45.0, 46.0, 27.0, 18.0, 18.0, 9.0, 13.0, 19.0, 9.0, 8.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.75, -11.392578125, -11.03515625, -10.677734375, -10.3203125, -9.962890625, -9.60546875, -9.248046875, -8.890625, -8.533203125, -8.17578125, -7.818359375, -7.4609375, -7.103515625, -6.74609375, -6.388671875, -6.03125, -5.673828125, -5.31640625, -4.958984375, -4.6015625, -4.244140625, -3.88671875, -3.529296875, -3.171875, -2.814453125, -2.45703125, -2.099609375, -1.7421875, -1.384765625, -1.02734375, -0.669921875, -0.3125, 0.044921875, 0.40234375, 0.759765625, 1.1171875, 1.474609375, 1.83203125, 2.189453125, 2.546875, 2.904296875, 3.26171875, 3.619140625, 3.9765625, 4.333984375, 4.69140625, 5.048828125, 5.40625, 5.763671875, 6.12109375, 6.478515625, 6.8359375, 7.193359375, 7.55078125, 7.908203125, 8.265625, 8.623046875, 8.98046875, 9.337890625, 9.6953125, 10.052734375, 10.41015625, 10.767578125, 11.125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 7.0, 11.0, 13.0, 23.0, 26.0, 52.0, 75.0, 110.0, 153.0, 148.0, 133.0, 83.0, 54.0, 37.0, 23.0, 14.0, 7.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-220.2195587158203, -211.78562927246094, -203.3516845703125, -194.91775512695312, -186.48382568359375, -178.04989624023438, -169.615966796875, -161.18202209472656, -152.7480926513672, -144.3141632080078, -135.88021850585938, -127.4462890625, -119.01235961914062, -110.57843017578125, -102.14449310302734, -93.71055603027344, -85.27662658691406, -76.84269714355469, -68.40876007080078, -59.97482681274414, -51.5408935546875, -43.10696029663086, -34.67302703857422, -26.239093780517578, -17.805160522460938, -9.371227264404297, -0.9372940063476562, 7.496639251708984, 15.930572509765625, 24.364505767822266, 32.798439025878906, 41.23237228393555, 49.66632080078125, 58.10025405883789, 66.53418731689453, 74.96812438964844, 83.40205383300781, 91.83598327636719, 100.2699203491211, 108.703857421875, 117.13778686523438, 125.57171630859375, 134.00564575195312, 142.43959045410156, 150.87351989746094, 159.3074493408203, 167.74139404296875, 176.17532348632812, 184.6092529296875, 193.04318237304688, 201.47711181640625, 209.9110565185547, 218.34498596191406, 226.77891540527344, 235.21286010742188, 243.64678955078125, 252.08071899414062, 260.5146484375, 268.9485778808594, 277.38250732421875, 285.81646728515625, 294.2503967285156, 302.684326171875, 311.1182556152344, 319.55218505859375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 16.0, 26.0, 20.0, 21.0, 26.0, 29.0, 33.0, 42.0, 52.0, 48.0, 48.0, 64.0, 46.0, 68.0, 47.0, 46.0, 55.0, 44.0, 38.0, 34.0, 22.0, 28.0, 29.0, 13.0, 10.0, 10.0, 7.0, 9.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-193.78839111328125, -187.7338409423828, -181.6792755126953, -175.62472534179688, -169.57017517089844, -163.515625, -157.4610595703125, -151.40650939941406, -145.35195922851562, -139.2974090576172, -133.2428436279297, -127.18829345703125, -121.13374328613281, -115.07918548583984, -109.02462768554688, -102.97007751464844, -96.91551208496094, -90.86095428466797, -84.80640411376953, -78.75184631347656, -72.69729614257812, -66.64273834228516, -60.58818054199219, -54.533626556396484, -48.47907257080078, -42.42451858520508, -36.369964599609375, -30.315406799316406, -24.260852813720703, -18.206298828125, -12.151741027832031, -6.097187042236328, -0.0426483154296875, 6.011906623840332, 12.066461563110352, 18.121017456054688, 24.17557144165039, 30.230125427246094, 36.28468322753906, 42.339237213134766, 48.39379119873047, 54.44834518432617, 60.502899169921875, 66.55745697021484, 72.61201477050781, 78.66656494140625, 84.72112274169922, 90.77568054199219, 96.83023071289062, 102.8847885131836, 108.93933868408203, 114.993896484375, 121.04844665527344, 127.1030044555664, 133.15756225585938, 139.2121124267578, 145.26666259765625, 151.3212127685547, 157.3757781982422, 163.43032836914062, 169.48487854003906, 175.5394287109375, 181.593994140625, 187.64854431152344, 193.70310974121094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 12.0, 11.0, 18.0, 27.0, 36.0, 49.0, 67.0, 85.0, 129.0, 182.0, 263.0, 431.0, 747.0, 1235.0, 2362.0, 4338.0, 9233.0, 21611.0, 61188.0, 313240.0, 3540044.0, 164641.0, 42470.0, 16342.0, 7225.0, 3539.0, 1930.0, 1032.0, 618.0, 391.0, 249.0, 166.0, 93.0, 81.0, 46.0, 32.0, 24.0, 15.0, 19.0, 10.0, 6.0, 5.0, 5.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-78.3125, -75.9638671875, -73.615234375, -71.2666015625, -68.91796875, -66.5693359375, -64.220703125, -61.8720703125, -59.5234375, -57.1748046875, -54.826171875, -52.4775390625, -50.12890625, -47.7802734375, -45.431640625, -43.0830078125, -40.734375, -38.3857421875, -36.037109375, -33.6884765625, -31.33984375, -28.9912109375, -26.642578125, -24.2939453125, -21.9453125, -19.5966796875, -17.248046875, -14.8994140625, -12.55078125, -10.2021484375, -7.853515625, -5.5048828125, -3.15625, -0.8076171875, 1.541015625, 3.8896484375, 6.23828125, 8.5869140625, 10.935546875, 13.2841796875, 15.6328125, 17.9814453125, 20.330078125, 22.6787109375, 25.02734375, 27.3759765625, 29.724609375, 32.0732421875, 34.421875, 36.7705078125, 39.119140625, 41.4677734375, 43.81640625, 46.1650390625, 48.513671875, 50.8623046875, 53.2109375, 55.5595703125, 57.908203125, 60.2568359375, 62.60546875, 64.9541015625, 67.302734375, 69.6513671875, 72.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 5.0, 6.0, 19.0, 23.0, 22.0, 26.0, 39.0, 48.0, 60.0, 65.0, 54.0, 70.0, 71.0, 68.0, 53.0, 61.0, 56.0, 44.0, 50.0, 33.0, 30.0, 22.0, 17.0, 15.0, 4.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.67578125, -5.4912109375, -5.306640625, -5.1220703125, -4.9375, -4.7529296875, -4.568359375, -4.3837890625, -4.19921875, -4.0146484375, -3.830078125, -3.6455078125, -3.4609375, -3.2763671875, -3.091796875, -2.9072265625, -2.72265625, -2.5380859375, -2.353515625, -2.1689453125, -1.984375, -1.7998046875, -1.615234375, -1.4306640625, -1.24609375, -1.0615234375, -0.876953125, -0.6923828125, -0.5078125, -0.3232421875, -0.138671875, 0.0458984375, 0.23046875, 0.4150390625, 0.599609375, 0.7841796875, 0.96875, 1.1533203125, 1.337890625, 1.5224609375, 1.70703125, 1.8916015625, 2.076171875, 2.2607421875, 2.4453125, 2.6298828125, 2.814453125, 2.9990234375, 3.18359375, 3.3681640625, 3.552734375, 3.7373046875, 3.921875, 4.1064453125, 4.291015625, 4.4755859375, 4.66015625, 4.8447265625, 5.029296875, 5.2138671875, 5.3984375, 5.5830078125, 5.767578125, 5.9521484375, 6.13671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 10.0, 14.0, 9.0, 19.0, 28.0, 34.0, 46.0, 80.0, 130.0, 264.0, 710.0, 2404.0, 12377.0, 135029.0, 3906469.0, 121727.0, 11303.0, 2300.0, 735.0, 259.0, 125.0, 66.0, 36.0, 24.0, 25.0, 16.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0], "bins": [-229.625, -223.658203125, -217.69140625, -211.724609375, -205.7578125, -199.791015625, -193.82421875, -187.857421875, -181.890625, -175.923828125, -169.95703125, -163.990234375, -158.0234375, -152.056640625, -146.08984375, -140.123046875, -134.15625, -128.189453125, -122.22265625, -116.255859375, -110.2890625, -104.322265625, -98.35546875, -92.388671875, -86.421875, -80.455078125, -74.48828125, -68.521484375, -62.5546875, -56.587890625, -50.62109375, -44.654296875, -38.6875, -32.720703125, -26.75390625, -20.787109375, -14.8203125, -8.853515625, -2.88671875, 3.080078125, 9.046875, 15.013671875, 20.98046875, 26.947265625, 32.9140625, 38.880859375, 44.84765625, 50.814453125, 56.78125, 62.748046875, 68.71484375, 74.681640625, 80.6484375, 86.615234375, 92.58203125, 98.548828125, 104.515625, 110.482421875, 116.44921875, 122.416015625, 128.3828125, 134.349609375, 140.31640625, 146.283203125, 152.25]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 14.0, 20.0, 32.0, 45.0, 76.0, 127.0, 245.0, 989.0, 1902.0, 270.0, 137.0, 86.0, 52.0, 24.0, 14.0, 16.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.674560546875, -33.78662109375, -32.898681640625, -32.0107421875, -31.122802734375, -30.23486328125, -29.346923828125, -28.458984375, -27.571044921875, -26.68310546875, -25.795166015625, -24.9072265625, -24.019287109375, -23.13134765625, -22.243408203125, -21.35546875, -20.467529296875, -19.57958984375, -18.691650390625, -17.8037109375, -16.915771484375, -16.02783203125, -15.139892578125, -14.251953125, -13.364013671875, -12.47607421875, -11.588134765625, -10.7001953125, -9.812255859375, -8.92431640625, -8.036376953125, -7.1484375, -6.260498046875, -5.37255859375, -4.484619140625, -3.5966796875, -2.708740234375, -1.82080078125, -0.932861328125, -0.044921875, 0.843017578125, 1.73095703125, 2.618896484375, 3.5068359375, 4.394775390625, 5.28271484375, 6.170654296875, 7.05859375, 7.946533203125, 8.83447265625, 9.722412109375, 10.6103515625, 11.498291015625, 12.38623046875, 13.274169921875, 14.162109375, 15.050048828125, 15.93798828125, 16.825927734375, 17.7138671875, 18.601806640625, 19.48974609375, 20.377685546875, 21.265625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 10.0, 15.0, 14.0, 26.0, 46.0, 88.0, 117.0, 192.0, 187.0, 143.0, 64.0, 34.0, 24.0, 15.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.19717407226562, -184.57598876953125, -179.95480346679688, -175.33363342285156, -170.7124481201172, -166.0912628173828, -161.47007751464844, -156.84890747070312, -152.22772216796875, -147.60653686523438, -142.9853515625, -138.3641815185547, -133.7429962158203, -129.12181091308594, -124.50062561035156, -119.87944793701172, -115.25826263427734, -110.63707733154297, -106.01589965820312, -101.39471435546875, -96.7735366821289, -92.15235137939453, -87.53117370605469, -82.90998840332031, -78.28880310058594, -73.66761779785156, -69.04644012451172, -64.42525482177734, -59.8040771484375, -55.182891845703125, -50.561710357666016, -45.940528869628906, -41.31934356689453, -36.69816207885742, -32.07698059082031, -27.45579719543457, -22.83461570739746, -18.21343421936035, -13.59225082397461, -8.9710693359375, -4.349887847900391, 0.27129411697387695, 4.8924760818481445, 9.51365852355957, 14.13484001159668, 18.75602149963379, 23.37720489501953, 27.99838638305664, 32.61956787109375, 37.24074935913086, 41.86193084716797, 46.483116149902344, 51.10429382324219, 55.72547912597656, 60.34666061401367, 64.96784210205078, 69.58901977539062, 74.210205078125, 78.83138275146484, 83.45256805419922, 88.07374572753906, 92.69493103027344, 97.31611633300781, 101.93729400634766, 106.55847930908203]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 12.0, 19.0, 13.0, 24.0, 24.0, 31.0, 27.0, 44.0, 45.0, 48.0, 52.0, 62.0, 67.0, 61.0, 53.0, 53.0, 48.0, 41.0, 45.0, 40.0, 24.0, 27.0, 19.0, 24.0, 17.0, 18.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.23884582519531, -61.92860412597656, -59.61836624145508, -57.30812454223633, -54.997886657714844, -52.687644958496094, -50.377403259277344, -48.06716537475586, -45.756927490234375, -43.446685791015625, -41.13644790649414, -38.82620620727539, -36.515968322753906, -34.205726623535156, -31.89548683166504, -29.585247039794922, -27.275005340576172, -24.964765548706055, -22.654525756835938, -20.344284057617188, -18.034046173095703, -15.72380542755127, -13.413564682006836, -11.103324890136719, -8.793085098266602, -6.482845306396484, -4.172605037689209, -1.8623647689819336, 0.4478750228881836, 2.758114814758301, 5.068355560302734, 7.378595352172852, 9.688835144042969, 11.999074935913086, 14.309314727783203, 16.619556427001953, 18.929794311523438, 21.240036010742188, 23.550275802612305, 25.860515594482422, 28.17075538635254, 30.480995178222656, 32.791236877441406, 35.10147476196289, 37.41171646118164, 39.721954345703125, 42.032196044921875, 44.342437744140625, 46.65267562866211, 48.96291732788086, 51.273155212402344, 53.583396911621094, 55.89363479614258, 58.20387649536133, 60.51411437988281, 62.82435607910156, 65.13459777832031, 67.44483947753906, 69.75508117675781, 72.06531524658203, 74.37555694580078, 76.68579864501953, 78.99604034423828, 81.3062744140625, 83.61651611328125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 18.0, 22.0, 22.0, 48.0, 53.0, 61.0, 91.0, 164.0, 248.0, 378.0, 607.0, 1041.0, 1806.0, 3371.0, 6296.0, 13200.0, 30055.0, 78474.0, 231757.0, 413005.0, 164919.0, 57597.0, 23030.0, 10364.0, 5231.0, 2783.0, 1497.0, 871.0, 521.0, 346.0, 193.0, 141.0, 91.0, 61.0, 42.0, 36.0, 28.0, 16.0, 12.0, 10.0, 11.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.71875, -41.35595703125, -39.9931640625, -38.63037109375, -37.267578125, -35.90478515625, -34.5419921875, -33.17919921875, -31.81640625, -30.45361328125, -29.0908203125, -27.72802734375, -26.365234375, -25.00244140625, -23.6396484375, -22.27685546875, -20.9140625, -19.55126953125, -18.1884765625, -16.82568359375, -15.462890625, -14.10009765625, -12.7373046875, -11.37451171875, -10.01171875, -8.64892578125, -7.2861328125, -5.92333984375, -4.560546875, -3.19775390625, -1.8349609375, -0.47216796875, 0.890625, 2.25341796875, 3.6162109375, 4.97900390625, 6.341796875, 7.70458984375, 9.0673828125, 10.43017578125, 11.79296875, 13.15576171875, 14.5185546875, 15.88134765625, 17.244140625, 18.60693359375, 19.9697265625, 21.33251953125, 22.6953125, 24.05810546875, 25.4208984375, 26.78369140625, 28.146484375, 29.50927734375, 30.8720703125, 32.23486328125, 33.59765625, 34.96044921875, 36.3232421875, 37.68603515625, 39.048828125, 40.41162109375, 41.7744140625, 43.13720703125, 44.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 12.0, 16.0, 16.0, 17.0, 23.0, 32.0, 45.0, 54.0, 43.0, 55.0, 57.0, 85.0, 79.0, 59.0, 62.0, 62.0, 53.0, 52.0, 38.0, 24.0, 22.0, 23.0, 14.0, 8.0, 8.0, 10.0, 6.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.85394287109375, -6.6414794921875, -6.42901611328125, -6.216552734375, -6.00408935546875, -5.7916259765625, -5.57916259765625, -5.36669921875, -5.15423583984375, -4.9417724609375, -4.72930908203125, -4.516845703125, -4.30438232421875, -4.0919189453125, -3.87945556640625, -3.6669921875, -3.45452880859375, -3.2420654296875, -3.02960205078125, -2.817138671875, -2.60467529296875, -2.3922119140625, -2.17974853515625, -1.96728515625, -1.75482177734375, -1.5423583984375, -1.32989501953125, -1.117431640625, -0.90496826171875, -0.6925048828125, -0.48004150390625, -0.267578125, -0.05511474609375, 0.1573486328125, 0.36981201171875, 0.582275390625, 0.79473876953125, 1.0072021484375, 1.21966552734375, 1.43212890625, 1.64459228515625, 1.8570556640625, 2.06951904296875, 2.281982421875, 2.49444580078125, 2.7069091796875, 2.91937255859375, 3.1318359375, 3.34429931640625, 3.5567626953125, 3.76922607421875, 3.981689453125, 4.19415283203125, 4.4066162109375, 4.61907958984375, 4.83154296875, 5.04400634765625, 5.2564697265625, 5.46893310546875, 5.681396484375, 5.89385986328125, 6.1063232421875, 6.31878662109375, 6.53125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 12.0, 10.0, 18.0, 9.0, 13.0, 19.0, 36.0, 43.0, 61.0, 116.0, 119.0, 210.0, 334.0, 543.0, 971.0, 1737.0, 3297.0, 6617.0, 14642.0, 36731.0, 110571.0, 393290.0, 330548.0, 92059.0, 31317.0, 12744.0, 5808.0, 2957.0, 1529.0, 842.0, 508.0, 282.0, 175.0, 106.0, 73.0, 54.0, 38.0, 28.0, 28.0, 18.0, 14.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.53125, -52.875, -51.21875, -49.5625, -47.90625, -46.25, -44.59375, -42.9375, -41.28125, -39.625, -37.96875, -36.3125, -34.65625, -33.0, -31.34375, -29.6875, -28.03125, -26.375, -24.71875, -23.0625, -21.40625, -19.75, -18.09375, -16.4375, -14.78125, -13.125, -11.46875, -9.8125, -8.15625, -6.5, -4.84375, -3.1875, -1.53125, 0.125, 1.78125, 3.4375, 5.09375, 6.75, 8.40625, 10.0625, 11.71875, 13.375, 15.03125, 16.6875, 18.34375, 20.0, 21.65625, 23.3125, 24.96875, 26.625, 28.28125, 29.9375, 31.59375, 33.25, 34.90625, 36.5625, 38.21875, 39.875, 41.53125, 43.1875, 44.84375, 46.5, 48.15625, 49.8125, 51.46875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 17.0, 12.0, 12.0, 23.0, 20.0, 31.0, 34.0, 33.0, 43.0, 34.0, 47.0, 44.0, 39.0, 33.0, 43.0, 41.0, 53.0, 52.0, 38.0, 38.0, 31.0, 39.0, 35.0, 31.0, 18.0, 23.0, 9.0, 10.0, 16.0, 7.0, 11.0, 9.0, 2.0, 9.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.4423828125, -29.478515625, -28.5146484375, -27.55078125, -26.5869140625, -25.623046875, -24.6591796875, -23.6953125, -22.7314453125, -21.767578125, -20.8037109375, -19.83984375, -18.8759765625, -17.912109375, -16.9482421875, -15.984375, -15.0205078125, -14.056640625, -13.0927734375, -12.12890625, -11.1650390625, -10.201171875, -9.2373046875, -8.2734375, -7.3095703125, -6.345703125, -5.3818359375, -4.41796875, -3.4541015625, -2.490234375, -1.5263671875, -0.5625, 0.4013671875, 1.365234375, 2.3291015625, 3.29296875, 4.2568359375, 5.220703125, 6.1845703125, 7.1484375, 8.1123046875, 9.076171875, 10.0400390625, 11.00390625, 11.9677734375, 12.931640625, 13.8955078125, 14.859375, 15.8232421875, 16.787109375, 17.7509765625, 18.71484375, 19.6787109375, 20.642578125, 21.6064453125, 22.5703125, 23.5341796875, 24.498046875, 25.4619140625, 26.42578125, 27.3896484375, 28.353515625, 29.3173828125, 30.28125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 20.0, 31.0, 49.0, 44.0, 67.0, 106.0, 153.0, 232.0, 324.0, 457.0, 695.0, 1035.0, 1460.0, 2100.0, 3271.0, 5364.0, 9288.0, 20146.0, 60397.0, 291035.0, 487473.0, 104811.0, 29304.0, 12501.0, 6425.0, 3953.0, 2465.0, 1744.0, 1118.0, 762.0, 506.0, 380.0, 260.0, 171.0, 128.0, 96.0, 64.0, 34.0, 33.0, 13.0, 13.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.109375, -24.21875, -23.328125, -22.4375, -21.546875, -20.65625, -19.765625, -18.875, -17.984375, -17.09375, -16.203125, -15.3125, -14.421875, -13.53125, -12.640625, -11.75, -10.859375, -9.96875, -9.078125, -8.1875, -7.296875, -6.40625, -5.515625, -4.625, -3.734375, -2.84375, -1.953125, -1.0625, -0.171875, 0.71875, 1.609375, 2.5, 3.390625, 4.28125, 5.171875, 6.0625, 6.953125, 7.84375, 8.734375, 9.625, 10.515625, 11.40625, 12.296875, 13.1875, 14.078125, 14.96875, 15.859375, 16.75, 17.640625, 18.53125, 19.421875, 20.3125, 21.203125, 22.09375, 22.984375, 23.875, 24.765625, 25.65625, 26.546875, 27.4375, 28.328125, 29.21875, 30.109375, 31.0, 31.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 7.0, 18.0, 20.0, 25.0, 53.0, 113.0, 162.0, 201.0, 156.0, 86.0, 54.0, 26.0, 20.0, 11.0, 11.0, 6.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00714111328125, -0.006860613822937012, -0.0065801143646240234, -0.006299614906311035, -0.006019115447998047, -0.005738615989685059, -0.00545811653137207, -0.005177617073059082, -0.004897117614746094, -0.0046166181564331055, -0.004336118698120117, -0.004055619239807129, -0.0037751197814941406, -0.0034946203231811523, -0.003214120864868164, -0.0029336214065551758, -0.0026531219482421875, -0.0023726224899291992, -0.002092123031616211, -0.0018116235733032227, -0.0015311241149902344, -0.001250624656677246, -0.0009701251983642578, -0.0006896257400512695, -0.00040912628173828125, -0.00012862682342529297, 0.0001518726348876953, 0.0004323720932006836, 0.0007128715515136719, 0.0009933710098266602, 0.0012738704681396484, 0.0015543699264526367, 0.001834869384765625, 0.0021153688430786133, 0.0023958683013916016, 0.00267636775970459, 0.002956867218017578, 0.0032373666763305664, 0.0035178661346435547, 0.003798365592956543, 0.004078865051269531, 0.0043593645095825195, 0.004639863967895508, 0.004920363426208496, 0.005200862884521484, 0.005481362342834473, 0.005761861801147461, 0.006042361259460449, 0.0063228607177734375, 0.006603360176086426, 0.006883859634399414, 0.007164359092712402, 0.007444858551025391, 0.007725358009338379, 0.008005857467651367, 0.008286356925964355, 0.008566856384277344, 0.008847355842590332, 0.00912785530090332, 0.009408354759216309, 0.009688854217529297, 0.009969353675842285, 0.010249853134155273, 0.010530352592468262, 0.01081085205078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 9.0, 13.0, 13.0, 13.0, 24.0, 42.0, 46.0, 93.0, 120.0, 201.0, 409.0, 640.0, 1258.0, 2463.0, 5335.0, 14037.0, 68065.0, 754202.0, 165265.0, 22428.0, 7191.0, 3109.0, 1591.0, 825.0, 480.0, 251.0, 160.0, 88.0, 50.0, 42.0, 23.0, 24.0, 10.0, 5.0, 4.0, 3.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.40625, -58.5576171875, -56.708984375, -54.8603515625, -53.01171875, -51.1630859375, -49.314453125, -47.4658203125, -45.6171875, -43.7685546875, -41.919921875, -40.0712890625, -38.22265625, -36.3740234375, -34.525390625, -32.6767578125, -30.828125, -28.9794921875, -27.130859375, -25.2822265625, -23.43359375, -21.5849609375, -19.736328125, -17.8876953125, -16.0390625, -14.1904296875, -12.341796875, -10.4931640625, -8.64453125, -6.7958984375, -4.947265625, -3.0986328125, -1.25, 0.5986328125, 2.447265625, 4.2958984375, 6.14453125, 7.9931640625, 9.841796875, 11.6904296875, 13.5390625, 15.3876953125, 17.236328125, 19.0849609375, 20.93359375, 22.7822265625, 24.630859375, 26.4794921875, 28.328125, 30.1767578125, 32.025390625, 33.8740234375, 35.72265625, 37.5712890625, 39.419921875, 41.2685546875, 43.1171875, 44.9658203125, 46.814453125, 48.6630859375, 50.51171875, 52.3603515625, 54.208984375, 56.0576171875, 57.90625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 2.0, 13.0, 15.0, 27.0, 46.0, 64.0, 92.0, 158.0, 144.0, 139.0, 80.0, 54.0, 30.0, 18.0, 12.0, 13.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.890625, -28.9658203125, -28.041015625, -27.1162109375, -26.19140625, -25.2666015625, -24.341796875, -23.4169921875, -22.4921875, -21.5673828125, -20.642578125, -19.7177734375, -18.79296875, -17.8681640625, -16.943359375, -16.0185546875, -15.09375, -14.1689453125, -13.244140625, -12.3193359375, -11.39453125, -10.4697265625, -9.544921875, -8.6201171875, -7.6953125, -6.7705078125, -5.845703125, -4.9208984375, -3.99609375, -3.0712890625, -2.146484375, -1.2216796875, -0.296875, 0.6279296875, 1.552734375, 2.4775390625, 3.40234375, 4.3271484375, 5.251953125, 6.1767578125, 7.1015625, 8.0263671875, 8.951171875, 9.8759765625, 10.80078125, 11.7255859375, 12.650390625, 13.5751953125, 14.5, 15.4248046875, 16.349609375, 17.2744140625, 18.19921875, 19.1240234375, 20.048828125, 20.9736328125, 21.8984375, 22.8232421875, 23.748046875, 24.6728515625, 25.59765625, 26.5224609375, 27.447265625, 28.3720703125, 29.296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 8.0, 5.0, 10.0, 14.0, 36.0, 44.0, 92.0, 101.0, 141.0, 186.0, 126.0, 71.0, 55.0, 39.0, 16.0, 14.0, 19.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.50390625, -284.24200439453125, -271.9801330566406, -259.7182312011719, -247.4563446044922, -235.1944580078125, -222.93255615234375, -210.67066955566406, -198.40878295898438, -186.1468963623047, -173.88499450683594, -161.62310791015625, -149.36122131347656, -137.09933471679688, -124.83743286132812, -112.57554626464844, -100.31364440917969, -88.05175018310547, -75.78986358642578, -63.52796936035156, -51.26607894897461, -39.004188537597656, -26.742294311523438, -14.48040771484375, -2.2185134887695312, 10.043377876281738, 22.305269241333008, 34.567161560058594, 46.82905197143555, 59.0909423828125, 71.35283660888672, 83.6147232055664, 95.87661743164062, 108.13851165771484, 120.40039825439453, 132.66229248046875, 144.92417907714844, 157.18606567382812, 169.44796752929688, 181.70985412597656, 193.97174072265625, 206.23362731933594, 218.4955291748047, 230.75741577148438, 243.01930236816406, 255.28118896484375, 267.5430908203125, 279.80499267578125, 292.06689453125, 304.32879638671875, 316.5906677246094, 328.8525695800781, 341.1144714355469, 353.3763427734375, 365.63824462890625, 377.900146484375, 390.1620178222656, 402.4239196777344, 414.685791015625, 426.94769287109375, 439.2095947265625, 451.4714660644531, 463.7333679199219, 475.9952392578125, 488.25714111328125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 7.0, 11.0, 6.0, 11.0, 9.0, 12.0, 14.0, 19.0, 13.0, 28.0, 26.0, 31.0, 26.0, 32.0, 35.0, 28.0, 41.0, 51.0, 46.0, 36.0, 34.0, 41.0, 51.0, 48.0, 41.0, 42.0, 34.0, 29.0, 35.0, 33.0, 14.0, 27.0, 14.0, 9.0, 16.0, 16.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-254.588623046875, -247.61636352539062, -240.64410400390625, -233.67184448242188, -226.69956970214844, -219.72731018066406, -212.7550506591797, -205.7827911376953, -198.81051635742188, -191.8382568359375, -184.86599731445312, -177.89373779296875, -170.9214630126953, -163.94920349121094, -156.97694396972656, -150.0046844482422, -143.0324249267578, -136.06016540527344, -129.08790588378906, -122.11563873291016, -115.14337158203125, -108.17111206054688, -101.1988525390625, -94.22659301757812, -87.25432586669922, -80.28206634521484, -73.30979919433594, -66.33753967285156, -59.36527633666992, -52.39301300048828, -45.420753479003906, -38.448490142822266, -31.476242065429688, -24.503978729248047, -17.53171730041504, -10.559455871582031, -3.5871925354003906, 3.38507080078125, 10.357330322265625, 17.329593658447266, 24.301856994628906, 31.274120330810547, 38.24638366699219, 45.21864318847656, 52.1909065246582, 59.163169860839844, 66.13542938232422, 73.10769653320312, 80.0799560546875, 87.05221557617188, 94.02448272705078, 100.99674224853516, 107.96900939941406, 114.94126892089844, 121.91352844238281, 128.8857879638672, 135.85806274414062, 142.830322265625, 149.80258178710938, 156.77484130859375, 163.7471160888672, 170.71937561035156, 177.69163513183594, 184.6638946533203, 191.6361541748047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 5.0, 3.0, 7.0, 6.0, 9.0, 15.0, 22.0, 17.0, 47.0, 61.0, 79.0, 104.0, 180.0, 262.0, 416.0, 730.0, 1196.0, 2180.0, 4479.0, 10078.0, 26491.0, 97076.0, 3627172.0, 341345.0, 50854.0, 16644.0, 6961.0, 3430.0, 1742.0, 993.0, 619.0, 350.0, 229.0, 152.0, 103.0, 70.0, 49.0, 36.0, 19.0, 10.0, 9.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-68.6875, -66.5263671875, -64.365234375, -62.2041015625, -60.04296875, -57.8818359375, -55.720703125, -53.5595703125, -51.3984375, -49.2373046875, -47.076171875, -44.9150390625, -42.75390625, -40.5927734375, -38.431640625, -36.2705078125, -34.109375, -31.9482421875, -29.787109375, -27.6259765625, -25.46484375, -23.3037109375, -21.142578125, -18.9814453125, -16.8203125, -14.6591796875, -12.498046875, -10.3369140625, -8.17578125, -6.0146484375, -3.853515625, -1.6923828125, 0.46875, 2.6298828125, 4.791015625, 6.9521484375, 9.11328125, 11.2744140625, 13.435546875, 15.5966796875, 17.7578125, 19.9189453125, 22.080078125, 24.2412109375, 26.40234375, 28.5634765625, 30.724609375, 32.8857421875, 35.046875, 37.2080078125, 39.369140625, 41.5302734375, 43.69140625, 45.8525390625, 48.013671875, 50.1748046875, 52.3359375, 54.4970703125, 56.658203125, 58.8193359375, 60.98046875, 63.1416015625, 65.302734375, 67.4638671875, 69.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 8.0, 13.0, 12.0, 23.0, 29.0, 36.0, 36.0, 30.0, 49.0, 50.0, 56.0, 65.0, 57.0, 59.0, 54.0, 61.0, 43.0, 43.0, 35.0, 50.0, 32.0, 33.0, 27.0, 17.0, 13.0, 9.0, 9.0, 10.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.825927734375, -5.60498046875, -5.384033203125, -5.1630859375, -4.942138671875, -4.72119140625, -4.500244140625, -4.279296875, -4.058349609375, -3.83740234375, -3.616455078125, -3.3955078125, -3.174560546875, -2.95361328125, -2.732666015625, -2.51171875, -2.290771484375, -2.06982421875, -1.848876953125, -1.6279296875, -1.406982421875, -1.18603515625, -0.965087890625, -0.744140625, -0.523193359375, -0.30224609375, -0.081298828125, 0.1396484375, 0.360595703125, 0.58154296875, 0.802490234375, 1.0234375, 1.244384765625, 1.46533203125, 1.686279296875, 1.9072265625, 2.128173828125, 2.34912109375, 2.570068359375, 2.791015625, 3.011962890625, 3.23291015625, 3.453857421875, 3.6748046875, 3.895751953125, 4.11669921875, 4.337646484375, 4.55859375, 4.779541015625, 5.00048828125, 5.221435546875, 5.4423828125, 5.663330078125, 5.88427734375, 6.105224609375, 6.326171875, 6.547119140625, 6.76806640625, 6.989013671875, 7.2099609375, 7.430908203125, 7.65185546875, 7.872802734375, 8.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 8.0, 18.0, 35.0, 23.0, 36.0, 40.0, 75.0, 112.0, 205.0, 343.0, 651.0, 1324.0, 2777.0, 6446.0, 18874.0, 83110.0, 3353880.0, 644200.0, 57770.0, 14358.0, 5254.0, 2252.0, 1094.0, 581.0, 287.0, 179.0, 105.0, 69.0, 52.0, 38.0, 22.0, 22.0, 10.0, 9.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.25, -90.4150390625, -87.580078125, -84.7451171875, -81.91015625, -79.0751953125, -76.240234375, -73.4052734375, -70.5703125, -67.7353515625, -64.900390625, -62.0654296875, -59.23046875, -56.3955078125, -53.560546875, -50.7255859375, -47.890625, -45.0556640625, -42.220703125, -39.3857421875, -36.55078125, -33.7158203125, -30.880859375, -28.0458984375, -25.2109375, -22.3759765625, -19.541015625, -16.7060546875, -13.87109375, -11.0361328125, -8.201171875, -5.3662109375, -2.53125, 0.3037109375, 3.138671875, 5.9736328125, 8.80859375, 11.6435546875, 14.478515625, 17.3134765625, 20.1484375, 22.9833984375, 25.818359375, 28.6533203125, 31.48828125, 34.3232421875, 37.158203125, 39.9931640625, 42.828125, 45.6630859375, 48.498046875, 51.3330078125, 54.16796875, 57.0029296875, 59.837890625, 62.6728515625, 65.5078125, 68.3427734375, 71.177734375, 74.0126953125, 76.84765625, 79.6826171875, 82.517578125, 85.3525390625, 88.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 12.0, 12.0, 15.0, 19.0, 27.0, 53.0, 79.0, 157.0, 415.0, 2587.0, 327.0, 156.0, 81.0, 40.0, 34.0, 15.0, 12.0, 7.0, 6.0, 2.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5625, -27.732666015625, -26.90283203125, -26.072998046875, -25.2431640625, -24.413330078125, -23.58349609375, -22.753662109375, -21.923828125, -21.093994140625, -20.26416015625, -19.434326171875, -18.6044921875, -17.774658203125, -16.94482421875, -16.114990234375, -15.28515625, -14.455322265625, -13.62548828125, -12.795654296875, -11.9658203125, -11.135986328125, -10.30615234375, -9.476318359375, -8.646484375, -7.816650390625, -6.98681640625, -6.156982421875, -5.3271484375, -4.497314453125, -3.66748046875, -2.837646484375, -2.0078125, -1.177978515625, -0.34814453125, 0.481689453125, 1.3115234375, 2.141357421875, 2.97119140625, 3.801025390625, 4.630859375, 5.460693359375, 6.29052734375, 7.120361328125, 7.9501953125, 8.780029296875, 9.60986328125, 10.439697265625, 11.26953125, 12.099365234375, 12.92919921875, 13.759033203125, 14.5888671875, 15.418701171875, 16.24853515625, 17.078369140625, 17.908203125, 18.738037109375, 19.56787109375, 20.397705078125, 21.2275390625, 22.057373046875, 22.88720703125, 23.717041015625, 24.546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 11.0, 22.0, 27.0, 36.0, 61.0, 104.0, 132.0, 155.0, 143.0, 125.0, 70.0, 45.0, 25.0, 19.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.69446563720703, -111.07264709472656, -107.45083618164062, -103.82901763916016, -100.20720672607422, -96.58538818359375, -92.96357727050781, -89.34175872802734, -85.7199478149414, -82.09812927246094, -78.476318359375, -74.85449981689453, -71.2326889038086, -67.61087036132812, -63.98905944824219, -60.36724090576172, -56.745426177978516, -53.12361145019531, -49.50179672241211, -45.879981994628906, -42.2581672668457, -38.6363525390625, -35.01453399658203, -31.39272117614746, -27.770906448364258, -24.149091720581055, -20.52727699279785, -16.905460357666016, -13.283646583557129, -9.66183090209961, -6.040016174316406, -2.418201446533203, 1.20361328125, 4.825428009033203, 8.447242736816406, 12.069058418273926, 15.690873146057129, 19.31268882751465, 22.93450355529785, 26.556318283081055, 30.178133010864258, 33.799949645996094, 37.4217643737793, 41.0435791015625, 44.6653938293457, 48.287208557128906, 51.90902328491211, 55.53083801269531, 59.152652740478516, 62.77446746826172, 66.39628601074219, 70.01809692382812, 73.6399154663086, 77.26172637939453, 80.883544921875, 84.50535583496094, 88.1271743774414, 91.74899291992188, 95.37080383300781, 98.99262237548828, 102.61443328857422, 106.23625183105469, 109.85806274414062, 113.4798812866211, 117.10169219970703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 18.0, 16.0, 18.0, 23.0, 28.0, 25.0, 22.0, 21.0, 34.0, 31.0, 38.0, 38.0, 37.0, 39.0, 34.0, 41.0, 27.0, 38.0, 41.0, 51.0, 35.0, 30.0, 38.0, 21.0, 29.0, 27.0, 17.0, 28.0, 26.0, 17.0, 10.0, 16.0, 12.0, 12.0, 6.0, 4.0, 2.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.5582389831543, -44.98756408691406, -43.41688537597656, -41.84620666503906, -40.27553176879883, -38.704856872558594, -37.134178161621094, -35.563499450683594, -33.99282455444336, -32.422149658203125, -30.851470947265625, -29.280794143676758, -27.71011734008789, -26.139440536499023, -24.568763732910156, -22.99808692932129, -21.427410125732422, -19.856733322143555, -18.286056518554688, -16.71537971496582, -15.144702911376953, -13.574026107788086, -12.003349304199219, -10.432672500610352, -8.861995697021484, -7.291318893432617, -5.72064208984375, -4.149965286254883, -2.5792884826660156, -1.0086116790771484, 0.5620651245117188, 2.132741928100586, 3.7034225463867188, 5.274099349975586, 6.844776153564453, 8.41545295715332, 9.986129760742188, 11.556806564331055, 13.127483367919922, 14.698160171508789, 16.268836975097656, 17.839513778686523, 19.41019058227539, 20.980867385864258, 22.551544189453125, 24.122220993041992, 25.69289779663086, 27.263574600219727, 28.834251403808594, 30.40492820739746, 31.975605010986328, 33.54627990722656, 35.11695861816406, 36.68763732910156, 38.2583122253418, 39.82898712158203, 41.39966583251953, 42.97034454345703, 44.541019439697266, 46.1116943359375, 47.682373046875, 49.2530517578125, 50.823726654052734, 52.39440155029297, 53.96508026123047]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 0.0, 7.0, 9.0, 13.0, 22.0, 34.0, 35.0, 55.0, 100.0, 102.0, 233.0, 366.0, 566.0, 926.0, 1650.0, 2944.0, 5763.0, 11578.0, 24762.0, 57560.0, 148383.0, 368619.0, 255669.0, 94931.0, 39032.0, 17239.0, 8284.0, 4204.0, 2244.0, 1198.0, 752.0, 459.0, 278.0, 169.0, 122.0, 74.0, 50.0, 38.0, 24.0, 16.0, 17.0, 14.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.125, -34.91162109375, -33.6982421875, -32.48486328125, -31.271484375, -30.05810546875, -28.8447265625, -27.63134765625, -26.41796875, -25.20458984375, -23.9912109375, -22.77783203125, -21.564453125, -20.35107421875, -19.1376953125, -17.92431640625, -16.7109375, -15.49755859375, -14.2841796875, -13.07080078125, -11.857421875, -10.64404296875, -9.4306640625, -8.21728515625, -7.00390625, -5.79052734375, -4.5771484375, -3.36376953125, -2.150390625, -0.93701171875, 0.2763671875, 1.48974609375, 2.703125, 3.91650390625, 5.1298828125, 6.34326171875, 7.556640625, 8.77001953125, 9.9833984375, 11.19677734375, 12.41015625, 13.62353515625, 14.8369140625, 16.05029296875, 17.263671875, 18.47705078125, 19.6904296875, 20.90380859375, 22.1171875, 23.33056640625, 24.5439453125, 25.75732421875, 26.970703125, 28.18408203125, 29.3974609375, 30.61083984375, 31.82421875, 33.03759765625, 34.2509765625, 35.46435546875, 36.677734375, 37.89111328125, 39.1044921875, 40.31787109375, 41.53125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 10.0, 8.0, 13.0, 28.0, 38.0, 40.0, 40.0, 47.0, 70.0, 68.0, 59.0, 66.0, 72.0, 62.0, 54.0, 66.0, 50.0, 36.0, 29.0, 33.0, 23.0, 16.0, 14.0, 8.0, 15.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4537353515625, -8.188720703125, -7.9237060546875, -7.65869140625, -7.3936767578125, -7.128662109375, -6.8636474609375, -6.5986328125, -6.3336181640625, -6.068603515625, -5.8035888671875, -5.53857421875, -5.2735595703125, -5.008544921875, -4.7435302734375, -4.478515625, -4.2135009765625, -3.948486328125, -3.6834716796875, -3.41845703125, -3.1534423828125, -2.888427734375, -2.6234130859375, -2.3583984375, -2.0933837890625, -1.828369140625, -1.5633544921875, -1.29833984375, -1.0333251953125, -0.768310546875, -0.5032958984375, -0.23828125, 0.0267333984375, 0.291748046875, 0.5567626953125, 0.82177734375, 1.0867919921875, 1.351806640625, 1.6168212890625, 1.8818359375, 2.1468505859375, 2.411865234375, 2.6768798828125, 2.94189453125, 3.2069091796875, 3.471923828125, 3.7369384765625, 4.001953125, 4.2669677734375, 4.531982421875, 4.7969970703125, 5.06201171875, 5.3270263671875, 5.592041015625, 5.8570556640625, 6.1220703125, 6.3870849609375, 6.652099609375, 6.9171142578125, 7.18212890625, 7.4471435546875, 7.712158203125, 7.9771728515625, 8.2421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 8.0, 16.0, 28.0, 34.0, 42.0, 67.0, 117.0, 194.0, 280.0, 458.0, 818.0, 1335.0, 2284.0, 4323.0, 8027.0, 16583.0, 36610.0, 96332.0, 310286.0, 372038.0, 117124.0, 42833.0, 18752.0, 8981.0, 4652.0, 2597.0, 1429.0, 819.0, 512.0, 349.0, 180.0, 133.0, 100.0, 58.0, 39.0, 27.0, 18.0, 17.0, 12.0, 13.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.75, -43.3974609375, -42.044921875, -40.6923828125, -39.33984375, -37.9873046875, -36.634765625, -35.2822265625, -33.9296875, -32.5771484375, -31.224609375, -29.8720703125, -28.51953125, -27.1669921875, -25.814453125, -24.4619140625, -23.109375, -21.7568359375, -20.404296875, -19.0517578125, -17.69921875, -16.3466796875, -14.994140625, -13.6416015625, -12.2890625, -10.9365234375, -9.583984375, -8.2314453125, -6.87890625, -5.5263671875, -4.173828125, -2.8212890625, -1.46875, -0.1162109375, 1.236328125, 2.5888671875, 3.94140625, 5.2939453125, 6.646484375, 7.9990234375, 9.3515625, 10.7041015625, 12.056640625, 13.4091796875, 14.76171875, 16.1142578125, 17.466796875, 18.8193359375, 20.171875, 21.5244140625, 22.876953125, 24.2294921875, 25.58203125, 26.9345703125, 28.287109375, 29.6396484375, 30.9921875, 32.3447265625, 33.697265625, 35.0498046875, 36.40234375, 37.7548828125, 39.107421875, 40.4599609375, 41.8125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 6.0, 7.0, 9.0, 10.0, 13.0, 19.0, 16.0, 23.0, 39.0, 32.0, 37.0, 46.0, 51.0, 50.0, 52.0, 57.0, 42.0, 53.0, 54.0, 48.0, 38.0, 40.0, 36.0, 29.0, 26.0, 25.0, 22.0, 24.0, 16.0, 10.0, 14.0, 15.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.78125, -42.5419921875, -41.302734375, -40.0634765625, -38.82421875, -37.5849609375, -36.345703125, -35.1064453125, -33.8671875, -32.6279296875, -31.388671875, -30.1494140625, -28.91015625, -27.6708984375, -26.431640625, -25.1923828125, -23.953125, -22.7138671875, -21.474609375, -20.2353515625, -18.99609375, -17.7568359375, -16.517578125, -15.2783203125, -14.0390625, -12.7998046875, -11.560546875, -10.3212890625, -9.08203125, -7.8427734375, -6.603515625, -5.3642578125, -4.125, -2.8857421875, -1.646484375, -0.4072265625, 0.83203125, 2.0712890625, 3.310546875, 4.5498046875, 5.7890625, 7.0283203125, 8.267578125, 9.5068359375, 10.74609375, 11.9853515625, 13.224609375, 14.4638671875, 15.703125, 16.9423828125, 18.181640625, 19.4208984375, 20.66015625, 21.8994140625, 23.138671875, 24.3779296875, 25.6171875, 26.8564453125, 28.095703125, 29.3349609375, 30.57421875, 31.8134765625, 33.052734375, 34.2919921875, 35.53125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 14.0, 17.0, 17.0, 22.0, 17.0, 40.0, 70.0, 109.0, 131.0, 145.0, 222.0, 365.0, 493.0, 721.0, 1161.0, 1887.0, 3991.0, 11952.0, 76858.0, 765024.0, 156605.0, 17371.0, 5159.0, 2313.0, 1262.0, 818.0, 557.0, 352.0, 263.0, 182.0, 111.0, 84.0, 52.0, 46.0, 40.0, 32.0, 9.0, 17.0, 4.0, 4.0, 3.0, 6.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.4375, -39.990234375, -38.54296875, -37.095703125, -35.6484375, -34.201171875, -32.75390625, -31.306640625, -29.859375, -28.412109375, -26.96484375, -25.517578125, -24.0703125, -22.623046875, -21.17578125, -19.728515625, -18.28125, -16.833984375, -15.38671875, -13.939453125, -12.4921875, -11.044921875, -9.59765625, -8.150390625, -6.703125, -5.255859375, -3.80859375, -2.361328125, -0.9140625, 0.533203125, 1.98046875, 3.427734375, 4.875, 6.322265625, 7.76953125, 9.216796875, 10.6640625, 12.111328125, 13.55859375, 15.005859375, 16.453125, 17.900390625, 19.34765625, 20.794921875, 22.2421875, 23.689453125, 25.13671875, 26.583984375, 28.03125, 29.478515625, 30.92578125, 32.373046875, 33.8203125, 35.267578125, 36.71484375, 38.162109375, 39.609375, 41.056640625, 42.50390625, 43.951171875, 45.3984375, 46.845703125, 48.29296875, 49.740234375, 51.1875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 21.0, 30.0, 121.0, 446.0, 253.0, 72.0, 24.0, 16.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.0263746976852417, -0.0257718563079834, -0.025169014930725098, -0.024566173553466797, -0.023963332176208496, -0.023360490798950195, -0.022757649421691895, -0.022154808044433594, -0.021551966667175293, -0.020949125289916992, -0.02034628391265869, -0.01974344253540039, -0.01914060115814209, -0.01853775978088379, -0.01793491840362549, -0.017332077026367188, -0.016729235649108887, -0.016126394271850586, -0.015523552894592285, -0.014920711517333984, -0.014317870140075684, -0.013715028762817383, -0.013112187385559082, -0.012509346008300781, -0.01190650463104248, -0.01130366325378418, -0.010700821876525879, -0.010097980499267578, -0.009495139122009277, -0.008892297744750977, -0.008289456367492676, -0.007686614990234375, -0.007083773612976074, -0.0064809322357177734, -0.005878090858459473, -0.005275249481201172, -0.004672408103942871, -0.00406956672668457, -0.0034667253494262695, -0.0028638839721679688, -0.002261042594909668, -0.0016582012176513672, -0.0010553598403930664, -0.0004525184631347656, 0.00015032291412353516, 0.0007531642913818359, 0.0013560056686401367, 0.0019588470458984375, 0.0025616884231567383, 0.003164529800415039, 0.00376737117767334, 0.004370212554931641, 0.004973053932189941, 0.005575895309448242, 0.006178736686706543, 0.006781578063964844, 0.0073844194412231445, 0.007987260818481445, 0.008590102195739746, 0.009192943572998047, 0.009795784950256348, 0.010398626327514648, 0.01100146770477295, 0.01160430908203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 32.0, 33.0, 35.0, 52.0, 69.0, 103.0, 164.0, 264.0, 379.0, 594.0, 934.0, 1616.0, 3179.0, 8660.0, 45211.0, 661392.0, 289432.0, 24171.0, 5950.0, 2449.0, 1415.0, 854.0, 493.0, 342.0, 209.0, 163.0, 106.0, 65.0, 52.0, 28.0, 24.0, 11.0, 16.0, 7.0, 6.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-56.09375, -54.611328125, -53.12890625, -51.646484375, -50.1640625, -48.681640625, -47.19921875, -45.716796875, -44.234375, -42.751953125, -41.26953125, -39.787109375, -38.3046875, -36.822265625, -35.33984375, -33.857421875, -32.375, -30.892578125, -29.41015625, -27.927734375, -26.4453125, -24.962890625, -23.48046875, -21.998046875, -20.515625, -19.033203125, -17.55078125, -16.068359375, -14.5859375, -13.103515625, -11.62109375, -10.138671875, -8.65625, -7.173828125, -5.69140625, -4.208984375, -2.7265625, -1.244140625, 0.23828125, 1.720703125, 3.203125, 4.685546875, 6.16796875, 7.650390625, 9.1328125, 10.615234375, 12.09765625, 13.580078125, 15.0625, 16.544921875, 18.02734375, 19.509765625, 20.9921875, 22.474609375, 23.95703125, 25.439453125, 26.921875, 28.404296875, 29.88671875, 31.369140625, 32.8515625, 34.333984375, 35.81640625, 37.298828125, 38.78125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 4.0, 11.0, 19.0, 27.0, 46.0, 66.0, 112.0, 168.0, 176.0, 132.0, 85.0, 54.0, 24.0, 22.0, 17.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-38.09375, -37.0986328125, -36.103515625, -35.1083984375, -34.11328125, -33.1181640625, -32.123046875, -31.1279296875, -30.1328125, -29.1376953125, -28.142578125, -27.1474609375, -26.15234375, -25.1572265625, -24.162109375, -23.1669921875, -22.171875, -21.1767578125, -20.181640625, -19.1865234375, -18.19140625, -17.1962890625, -16.201171875, -15.2060546875, -14.2109375, -13.2158203125, -12.220703125, -11.2255859375, -10.23046875, -9.2353515625, -8.240234375, -7.2451171875, -6.25, -5.2548828125, -4.259765625, -3.2646484375, -2.26953125, -1.2744140625, -0.279296875, 0.7158203125, 1.7109375, 2.7060546875, 3.701171875, 4.6962890625, 5.69140625, 6.6865234375, 7.681640625, 8.6767578125, 9.671875, 10.6669921875, 11.662109375, 12.6572265625, 13.65234375, 14.6474609375, 15.642578125, 16.6376953125, 17.6328125, 18.6279296875, 19.623046875, 20.6181640625, 21.61328125, 22.6083984375, 23.603515625, 24.5986328125, 25.59375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 7.0, 8.0, 9.0, 14.0, 18.0, 21.0, 38.0, 35.0, 48.0, 62.0, 87.0, 103.0, 91.0, 93.0, 76.0, 68.0, 56.0, 40.0, 25.0, 25.0, 25.0, 13.0, 9.0, 7.0, 2.0, 6.0, 3.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-176.0668182373047, -168.53146362304688, -160.99612426757812, -153.4607696533203, -145.9254150390625, -138.39007568359375, -130.85472106933594, -123.31936645507812, -115.78401947021484, -108.24867248535156, -100.71331787109375, -93.17797088623047, -85.64262390136719, -78.10726928710938, -70.5719223022461, -63.03657150268555, -55.501220703125, -47.96586990356445, -40.430519104003906, -32.895172119140625, -25.359821319580078, -17.82447052001953, -10.28912353515625, -2.753772735595703, 4.781578063964844, 12.316927909851074, 19.852277755737305, 27.38762664794922, 34.922977447509766, 42.45832824707031, 49.993675231933594, 57.52902603149414, 65.06439208984375, 72.59973907470703, 80.13509368896484, 87.67044067382812, 95.20579528808594, 102.74114227294922, 110.2764892578125, 117.81184387207031, 125.3471908569336, 132.88253784179688, 140.4178924560547, 147.9532470703125, 155.48858642578125, 163.02394104003906, 170.55929565429688, 178.09463500976562, 185.62998962402344, 193.16534423828125, 200.70068359375, 208.2360382080078, 215.77139282226562, 223.30673217773438, 230.8420867919922, 238.37744140625, 245.91278076171875, 253.44813537597656, 260.9834899902344, 268.5188293457031, 276.0541687011719, 283.58953857421875, 291.1248779296875, 298.66021728515625, 306.1955871582031]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 18.0, 12.0, 22.0, 22.0, 21.0, 29.0, 31.0, 38.0, 46.0, 32.0, 36.0, 47.0, 39.0, 58.0, 45.0, 59.0, 31.0, 37.0, 32.0, 51.0, 32.0, 35.0, 30.0, 21.0, 30.0, 19.0, 17.0, 13.0, 13.0, 5.0, 5.0, 12.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-201.77781677246094, -195.5265350341797, -189.27525329589844, -183.0239715576172, -176.77268981933594, -170.52142333984375, -164.2701416015625, -158.01885986328125, -151.767578125, -145.51629638671875, -139.2650146484375, -133.01373291015625, -126.76245880126953, -120.51117706298828, -114.25989532470703, -108.00862121582031, -101.75733184814453, -95.50605010986328, -89.25476837158203, -83.00349426269531, -76.75221252441406, -70.50093078613281, -64.24964904785156, -57.99837112426758, -51.74708938598633, -45.49580764770508, -39.244529724121094, -32.993247985839844, -26.741968154907227, -20.49068832397461, -14.23940658569336, -7.988128662109375, -1.736846923828125, 4.51443338394165, 10.765713691711426, 17.01699447631836, 23.268274307250977, 29.519554138183594, 35.770835876464844, 42.02211380004883, 48.27339553833008, 54.52467727661133, 60.77595520019531, 67.02723693847656, 73.27851867675781, 79.52980041503906, 85.78108215332031, 92.03235626220703, 98.28363800048828, 104.53491973876953, 110.78620147705078, 117.0374755859375, 123.28875732421875, 129.5400390625, 135.79132080078125, 142.0426025390625, 148.29388427734375, 154.545166015625, 160.79644775390625, 167.0477294921875, 173.29901123046875, 179.55029296875, 185.80157470703125, 192.05284118652344, 198.3041229248047]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 8.0, 12.0, 11.0, 20.0, 34.0, 41.0, 77.0, 116.0, 178.0, 297.0, 564.0, 993.0, 2302.0, 5913.0, 20776.0, 162451.0, 3920404.0, 60440.0, 12126.0, 4065.0, 1609.0, 817.0, 401.0, 227.0, 134.0, 87.0, 68.0, 37.0, 23.0, 16.0, 11.0, 10.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-101.5, -98.541015625, -95.58203125, -92.623046875, -89.6640625, -86.705078125, -83.74609375, -80.787109375, -77.828125, -74.869140625, -71.91015625, -68.951171875, -65.9921875, -63.033203125, -60.07421875, -57.115234375, -54.15625, -51.197265625, -48.23828125, -45.279296875, -42.3203125, -39.361328125, -36.40234375, -33.443359375, -30.484375, -27.525390625, -24.56640625, -21.607421875, -18.6484375, -15.689453125, -12.73046875, -9.771484375, -6.8125, -3.853515625, -0.89453125, 2.064453125, 5.0234375, 7.982421875, 10.94140625, 13.900390625, 16.859375, 19.818359375, 22.77734375, 25.736328125, 28.6953125, 31.654296875, 34.61328125, 37.572265625, 40.53125, 43.490234375, 46.44921875, 49.408203125, 52.3671875, 55.326171875, 58.28515625, 61.244140625, 64.203125, 67.162109375, 70.12109375, 73.080078125, 76.0390625, 78.998046875, 81.95703125, 84.916015625, 87.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 18.0, 22.0, 22.0, 23.0, 20.0, 36.0, 39.0, 44.0, 51.0, 55.0, 63.0, 52.0, 55.0, 67.0, 43.0, 58.0, 51.0, 39.0, 36.0, 42.0, 28.0, 20.0, 18.0, 16.0, 12.0, 18.0, 14.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.11834716796875, -7.8695068359375, -7.62066650390625, -7.371826171875, -7.12298583984375, -6.8741455078125, -6.62530517578125, -6.37646484375, -6.12762451171875, -5.8787841796875, -5.62994384765625, -5.381103515625, -5.13226318359375, -4.8834228515625, -4.63458251953125, -4.3857421875, -4.13690185546875, -3.8880615234375, -3.63922119140625, -3.390380859375, -3.14154052734375, -2.8927001953125, -2.64385986328125, -2.39501953125, -2.14617919921875, -1.8973388671875, -1.64849853515625, -1.399658203125, -1.15081787109375, -0.9019775390625, -0.65313720703125, -0.404296875, -0.15545654296875, 0.0933837890625, 0.34222412109375, 0.591064453125, 0.83990478515625, 1.0887451171875, 1.33758544921875, 1.58642578125, 1.83526611328125, 2.0841064453125, 2.33294677734375, 2.581787109375, 2.83062744140625, 3.0794677734375, 3.32830810546875, 3.5771484375, 3.82598876953125, 4.0748291015625, 4.32366943359375, 4.572509765625, 4.82135009765625, 5.0701904296875, 5.31903076171875, 5.56787109375, 5.81671142578125, 6.0655517578125, 6.31439208984375, 6.563232421875, 6.81207275390625, 7.0609130859375, 7.30975341796875, 7.55859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 11.0, 12.0, 15.0, 18.0, 32.0, 50.0, 65.0, 104.0, 143.0, 264.0, 345.0, 683.0, 1351.0, 2935.0, 8085.0, 30215.0, 251723.0, 3780167.0, 91730.0, 17007.0, 5146.0, 2133.0, 929.0, 459.0, 270.0, 153.0, 93.0, 45.0, 31.0, 18.0, 18.0, 9.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-112.625, -109.60546875, -106.5859375, -103.56640625, -100.546875, -97.52734375, -94.5078125, -91.48828125, -88.46875, -85.44921875, -82.4296875, -79.41015625, -76.390625, -73.37109375, -70.3515625, -67.33203125, -64.3125, -61.29296875, -58.2734375, -55.25390625, -52.234375, -49.21484375, -46.1953125, -43.17578125, -40.15625, -37.13671875, -34.1171875, -31.09765625, -28.078125, -25.05859375, -22.0390625, -19.01953125, -16.0, -12.98046875, -9.9609375, -6.94140625, -3.921875, -0.90234375, 2.1171875, 5.13671875, 8.15625, 11.17578125, 14.1953125, 17.21484375, 20.234375, 23.25390625, 26.2734375, 29.29296875, 32.3125, 35.33203125, 38.3515625, 41.37109375, 44.390625, 47.41015625, 50.4296875, 53.44921875, 56.46875, 59.48828125, 62.5078125, 65.52734375, 68.546875, 71.56640625, 74.5859375, 77.60546875, 80.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 9.0, 3.0, 15.0, 12.0, 24.0, 37.0, 64.0, 91.0, 179.0, 726.0, 2322.0, 237.0, 125.0, 63.0, 54.0, 37.0, 12.0, 13.0, 4.0, 5.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.625, -26.953369140625, -26.28173828125, -25.610107421875, -24.9384765625, -24.266845703125, -23.59521484375, -22.923583984375, -22.251953125, -21.580322265625, -20.90869140625, -20.237060546875, -19.5654296875, -18.893798828125, -18.22216796875, -17.550537109375, -16.87890625, -16.207275390625, -15.53564453125, -14.864013671875, -14.1923828125, -13.520751953125, -12.84912109375, -12.177490234375, -11.505859375, -10.834228515625, -10.16259765625, -9.490966796875, -8.8193359375, -8.147705078125, -7.47607421875, -6.804443359375, -6.1328125, -5.461181640625, -4.78955078125, -4.117919921875, -3.4462890625, -2.774658203125, -2.10302734375, -1.431396484375, -0.759765625, -0.088134765625, 0.58349609375, 1.255126953125, 1.9267578125, 2.598388671875, 3.27001953125, 3.941650390625, 4.61328125, 5.284912109375, 5.95654296875, 6.628173828125, 7.2998046875, 7.971435546875, 8.64306640625, 9.314697265625, 9.986328125, 10.657958984375, 11.32958984375, 12.001220703125, 12.6728515625, 13.344482421875, 14.01611328125, 14.687744140625, 15.359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 11.0, 16.0, 43.0, 60.0, 77.0, 106.0, 162.0, 174.0, 128.0, 89.0, 52.0, 29.0, 14.0, 16.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.265480041503906, -59.545352935791016, -55.82522201538086, -52.10509490966797, -48.38496398925781, -44.66483688354492, -40.94470977783203, -37.224578857421875, -33.504451751708984, -29.78432273864746, -26.064193725585938, -22.344066619873047, -18.623937606811523, -14.90380859375, -11.18368148803711, -7.463552474975586, -3.7434234619140625, -0.023294925689697266, 3.696833610534668, 7.416961669921875, 11.137090682983398, 14.857219696044922, 18.577346801757812, 22.297475814819336, 26.01760482788086, 29.737733840942383, 33.457862854003906, 37.1779899597168, 40.89811706542969, 44.618247985839844, 48.338375091552734, 52.058502197265625, 55.77862548828125, 59.49875259399414, 63.2188835144043, 66.93901062011719, 70.65914154052734, 74.3792724609375, 78.09939575195312, 81.81952667236328, 85.53965759277344, 89.2597885131836, 92.97991180419922, 96.70004272460938, 100.42017364501953, 104.14030456542969, 107.86042785644531, 111.58055877685547, 115.3006820678711, 119.02081298828125, 122.74093627929688, 126.46106719970703, 130.1811981201172, 133.9013214111328, 137.6214599609375, 141.34158325195312, 145.06170654296875, 148.78182983398438, 152.50196838378906, 156.2220916748047, 159.9422149658203, 163.662353515625, 167.38247680664062, 171.10260009765625, 174.82273864746094]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 12.0, 5.0, 11.0, 13.0, 15.0, 14.0, 19.0, 18.0, 28.0, 28.0, 32.0, 31.0, 28.0, 39.0, 42.0, 38.0, 35.0, 39.0, 41.0, 37.0, 30.0, 43.0, 41.0, 24.0, 44.0, 34.0, 28.0, 33.0, 23.0, 28.0, 26.0, 16.0, 15.0, 9.0, 13.0, 9.0, 14.0, 9.0, 4.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.437034606933594, -45.999656677246094, -44.562278747558594, -43.124900817871094, -41.687522888183594, -40.250144958496094, -38.812767028808594, -37.375389099121094, -35.938011169433594, -34.500633239746094, -33.063255310058594, -31.625877380371094, -30.188499450683594, -28.751121520996094, -27.313745498657227, -25.876367568969727, -24.43899154663086, -23.00161361694336, -21.56423568725586, -20.12685775756836, -18.68947982788086, -17.25210189819336, -15.814725875854492, -14.377347946166992, -12.939970016479492, -11.502592086791992, -10.065214157104492, -8.627837181091309, -7.190459251403809, -5.753081321716309, -4.315704345703125, -2.878326416015625, -1.440948486328125, -0.0035707950592041016, 1.4338068962097168, 2.8711843490600586, 4.308562278747559, 5.745940208435059, 7.183317184448242, 8.620695114135742, 10.058073043823242, 11.495450973510742, 12.932828903198242, 14.370205879211426, 15.807583808898926, 17.24496078491211, 18.68233871459961, 20.11971664428711, 21.55709457397461, 22.99447250366211, 24.43185043334961, 25.86922836303711, 27.30660629272461, 28.74398422241211, 30.181360244750977, 31.618738174438477, 33.056114196777344, 34.493492126464844, 35.930870056152344, 37.368247985839844, 38.805625915527344, 40.243003845214844, 41.680381774902344, 43.117759704589844, 44.555137634277344]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 15.0, 9.0, 17.0, 20.0, 31.0, 42.0, 60.0, 102.0, 126.0, 185.0, 319.0, 436.0, 694.0, 1026.0, 1598.0, 2609.0, 4432.0, 7734.0, 13947.0, 26872.0, 55572.0, 121814.0, 269241.0, 287012.0, 131082.0, 59679.0, 28649.0, 14827.0, 8101.0, 4649.0, 2795.0, 1693.0, 1090.0, 689.0, 401.0, 327.0, 204.0, 125.0, 104.0, 64.0, 51.0, 29.0, 24.0, 21.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.3125, -32.304443359375, -31.29638671875, -30.288330078125, -29.2802734375, -28.272216796875, -27.26416015625, -26.256103515625, -25.248046875, -24.239990234375, -23.23193359375, -22.223876953125, -21.2158203125, -20.207763671875, -19.19970703125, -18.191650390625, -17.18359375, -16.175537109375, -15.16748046875, -14.159423828125, -13.1513671875, -12.143310546875, -11.13525390625, -10.127197265625, -9.119140625, -8.111083984375, -7.10302734375, -6.094970703125, -5.0869140625, -4.078857421875, -3.07080078125, -2.062744140625, -1.0546875, -0.046630859375, 0.96142578125, 1.969482421875, 2.9775390625, 3.985595703125, 4.99365234375, 6.001708984375, 7.009765625, 8.017822265625, 9.02587890625, 10.033935546875, 11.0419921875, 12.050048828125, 13.05810546875, 14.066162109375, 15.07421875, 16.082275390625, 17.09033203125, 18.098388671875, 19.1064453125, 20.114501953125, 21.12255859375, 22.130615234375, 23.138671875, 24.146728515625, 25.15478515625, 26.162841796875, 27.1708984375, 28.178955078125, 29.18701171875, 30.195068359375, 31.203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 6.0, 5.0, 7.0, 4.0, 12.0, 17.0, 14.0, 25.0, 22.0, 21.0, 28.0, 31.0, 39.0, 38.0, 37.0, 47.0, 38.0, 45.0, 43.0, 51.0, 42.0, 47.0, 41.0, 43.0, 33.0, 27.0, 23.0, 41.0, 37.0, 23.0, 27.0, 12.0, 9.0, 16.0, 3.0, 12.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.828125, -6.62347412109375, -6.4188232421875, -6.21417236328125, -6.009521484375, -5.80487060546875, -5.6002197265625, -5.39556884765625, -5.19091796875, -4.98626708984375, -4.7816162109375, -4.57696533203125, -4.372314453125, -4.16766357421875, -3.9630126953125, -3.75836181640625, -3.5537109375, -3.34906005859375, -3.1444091796875, -2.93975830078125, -2.735107421875, -2.53045654296875, -2.3258056640625, -2.12115478515625, -1.91650390625, -1.71185302734375, -1.5072021484375, -1.30255126953125, -1.097900390625, -0.89324951171875, -0.6885986328125, -0.48394775390625, -0.279296875, -0.07464599609375, 0.1300048828125, 0.33465576171875, 0.539306640625, 0.74395751953125, 0.9486083984375, 1.15325927734375, 1.35791015625, 1.56256103515625, 1.7672119140625, 1.97186279296875, 2.176513671875, 2.38116455078125, 2.5858154296875, 2.79046630859375, 2.9951171875, 3.19976806640625, 3.4044189453125, 3.60906982421875, 3.813720703125, 4.01837158203125, 4.2230224609375, 4.42767333984375, 4.63232421875, 4.83697509765625, 5.0416259765625, 5.24627685546875, 5.450927734375, 5.65557861328125, 5.8602294921875, 6.06488037109375, 6.26953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 12.0, 13.0, 25.0, 19.0, 57.0, 71.0, 121.0, 206.0, 325.0, 723.0, 1420.0, 3420.0, 9279.0, 30119.0, 123839.0, 523893.0, 270807.0, 58135.0, 16382.0, 5491.0, 2176.0, 914.0, 496.0, 260.0, 127.0, 70.0, 58.0, 33.0, 22.0, 11.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.625, -49.94580078125, -48.2666015625, -46.58740234375, -44.908203125, -43.22900390625, -41.5498046875, -39.87060546875, -38.19140625, -36.51220703125, -34.8330078125, -33.15380859375, -31.474609375, -29.79541015625, -28.1162109375, -26.43701171875, -24.7578125, -23.07861328125, -21.3994140625, -19.72021484375, -18.041015625, -16.36181640625, -14.6826171875, -13.00341796875, -11.32421875, -9.64501953125, -7.9658203125, -6.28662109375, -4.607421875, -2.92822265625, -1.2490234375, 0.43017578125, 2.109375, 3.78857421875, 5.4677734375, 7.14697265625, 8.826171875, 10.50537109375, 12.1845703125, 13.86376953125, 15.54296875, 17.22216796875, 18.9013671875, 20.58056640625, 22.259765625, 23.93896484375, 25.6181640625, 27.29736328125, 28.9765625, 30.65576171875, 32.3349609375, 34.01416015625, 35.693359375, 37.37255859375, 39.0517578125, 40.73095703125, 42.41015625, 44.08935546875, 45.7685546875, 47.44775390625, 49.126953125, 50.80615234375, 52.4853515625, 54.16455078125, 55.84375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 9.0, 12.0, 13.0, 19.0, 36.0, 20.0, 31.0, 43.0, 44.0, 53.0, 47.0, 58.0, 51.0, 72.0, 66.0, 63.0, 59.0, 54.0, 45.0, 45.0, 46.0, 23.0, 15.0, 10.0, 14.0, 12.0, 17.0, 8.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.6875, -41.357421875, -40.02734375, -38.697265625, -37.3671875, -36.037109375, -34.70703125, -33.376953125, -32.046875, -30.716796875, -29.38671875, -28.056640625, -26.7265625, -25.396484375, -24.06640625, -22.736328125, -21.40625, -20.076171875, -18.74609375, -17.416015625, -16.0859375, -14.755859375, -13.42578125, -12.095703125, -10.765625, -9.435546875, -8.10546875, -6.775390625, -5.4453125, -4.115234375, -2.78515625, -1.455078125, -0.125, 1.205078125, 2.53515625, 3.865234375, 5.1953125, 6.525390625, 7.85546875, 9.185546875, 10.515625, 11.845703125, 13.17578125, 14.505859375, 15.8359375, 17.166015625, 18.49609375, 19.826171875, 21.15625, 22.486328125, 23.81640625, 25.146484375, 26.4765625, 27.806640625, 29.13671875, 30.466796875, 31.796875, 33.126953125, 34.45703125, 35.787109375, 37.1171875, 38.447265625, 39.77734375, 41.107421875, 42.4375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 16.0, 18.0, 23.0, 35.0, 53.0, 87.0, 119.0, 149.0, 222.0, 337.0, 545.0, 746.0, 1187.0, 1968.0, 3286.0, 5846.0, 12178.0, 29283.0, 95436.0, 437259.0, 338813.0, 73265.0, 24144.0, 10299.0, 5104.0, 2941.0, 1706.0, 1115.0, 711.0, 493.0, 329.0, 235.0, 180.0, 120.0, 63.0, 75.0, 40.0, 29.0, 23.0, 23.0, 18.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.109375, -20.42626953125, -19.7431640625, -19.06005859375, -18.376953125, -17.69384765625, -17.0107421875, -16.32763671875, -15.64453125, -14.96142578125, -14.2783203125, -13.59521484375, -12.912109375, -12.22900390625, -11.5458984375, -10.86279296875, -10.1796875, -9.49658203125, -8.8134765625, -8.13037109375, -7.447265625, -6.76416015625, -6.0810546875, -5.39794921875, -4.71484375, -4.03173828125, -3.3486328125, -2.66552734375, -1.982421875, -1.29931640625, -0.6162109375, 0.06689453125, 0.75, 1.43310546875, 2.1162109375, 2.79931640625, 3.482421875, 4.16552734375, 4.8486328125, 5.53173828125, 6.21484375, 6.89794921875, 7.5810546875, 8.26416015625, 8.947265625, 9.63037109375, 10.3134765625, 10.99658203125, 11.6796875, 12.36279296875, 13.0458984375, 13.72900390625, 14.412109375, 15.09521484375, 15.7783203125, 16.46142578125, 17.14453125, 17.82763671875, 18.5107421875, 19.19384765625, 19.876953125, 20.56005859375, 21.2431640625, 21.92626953125, 22.609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 8.0, 11.0, 30.0, 41.0, 52.0, 98.0, 204.0, 197.0, 132.0, 94.0, 38.0, 25.0, 18.0, 12.0, 11.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0107421875, -0.010418534278869629, -0.010094881057739258, -0.009771227836608887, -0.009447574615478516, -0.009123921394348145, -0.008800268173217773, -0.008476614952087402, -0.008152961730957031, -0.00782930850982666, -0.007505655288696289, -0.007182002067565918, -0.006858348846435547, -0.006534695625305176, -0.006211042404174805, -0.005887389183044434, -0.0055637359619140625, -0.005240082740783691, -0.00491642951965332, -0.004592776298522949, -0.004269123077392578, -0.003945469856262207, -0.003621816635131836, -0.003298163414001465, -0.0029745101928710938, -0.0026508569717407227, -0.0023272037506103516, -0.0020035505294799805, -0.0016798973083496094, -0.0013562440872192383, -0.0010325908660888672, -0.0007089376449584961, -0.000385284423828125, -6.16312026977539e-05, 0.0002620220184326172, 0.0005856752395629883, 0.0009093284606933594, 0.0012329816818237305, 0.0015566349029541016, 0.0018802881240844727, 0.0022039413452148438, 0.002527594566345215, 0.002851247787475586, 0.003174901008605957, 0.003498554229736328, 0.0038222074508666992, 0.00414586067199707, 0.004469513893127441, 0.0047931671142578125, 0.005116820335388184, 0.005440473556518555, 0.005764126777648926, 0.006087779998779297, 0.006411433219909668, 0.006735086441040039, 0.00705873966217041, 0.007382392883300781, 0.007706046104431152, 0.008029699325561523, 0.008353352546691895, 0.008677005767822266, 0.009000658988952637, 0.009324312210083008, 0.009647965431213379, 0.00997161865234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 9.0, 11.0, 23.0, 27.0, 36.0, 73.0, 110.0, 139.0, 259.0, 445.0, 693.0, 1299.0, 2448.0, 5251.0, 13152.0, 43899.0, 331098.0, 551898.0, 67068.0, 17310.0, 6610.0, 3000.0, 1525.0, 867.0, 476.0, 301.0, 176.0, 103.0, 91.0, 47.0, 22.0, 26.0, 12.0, 13.0, 5.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.0625, -36.007568359375, -34.95263671875, -33.897705078125, -32.8427734375, -31.787841796875, -30.73291015625, -29.677978515625, -28.623046875, -27.568115234375, -26.51318359375, -25.458251953125, -24.4033203125, -23.348388671875, -22.29345703125, -21.238525390625, -20.18359375, -19.128662109375, -18.07373046875, -17.018798828125, -15.9638671875, -14.908935546875, -13.85400390625, -12.799072265625, -11.744140625, -10.689208984375, -9.63427734375, -8.579345703125, -7.5244140625, -6.469482421875, -5.41455078125, -4.359619140625, -3.3046875, -2.249755859375, -1.19482421875, -0.139892578125, 0.9150390625, 1.969970703125, 3.02490234375, 4.079833984375, 5.134765625, 6.189697265625, 7.24462890625, 8.299560546875, 9.3544921875, 10.409423828125, 11.46435546875, 12.519287109375, 13.57421875, 14.629150390625, 15.68408203125, 16.739013671875, 17.7939453125, 18.848876953125, 19.90380859375, 20.958740234375, 22.013671875, 23.068603515625, 24.12353515625, 25.178466796875, 26.2333984375, 27.288330078125, 28.34326171875, 29.398193359375, 30.453125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 6.0, 9.0, 16.0, 19.0, 22.0, 39.0, 66.0, 85.0, 111.0, 126.0, 142.0, 109.0, 79.0, 46.0, 31.0, 24.0, 18.0, 12.0, 6.0, 5.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.96875, -28.182373046875, -27.39599609375, -26.609619140625, -25.8232421875, -25.036865234375, -24.25048828125, -23.464111328125, -22.677734375, -21.891357421875, -21.10498046875, -20.318603515625, -19.5322265625, -18.745849609375, -17.95947265625, -17.173095703125, -16.38671875, -15.600341796875, -14.81396484375, -14.027587890625, -13.2412109375, -12.454833984375, -11.66845703125, -10.882080078125, -10.095703125, -9.309326171875, -8.52294921875, -7.736572265625, -6.9501953125, -6.163818359375, -5.37744140625, -4.591064453125, -3.8046875, -3.018310546875, -2.23193359375, -1.445556640625, -0.6591796875, 0.127197265625, 0.91357421875, 1.699951171875, 2.486328125, 3.272705078125, 4.05908203125, 4.845458984375, 5.6318359375, 6.418212890625, 7.20458984375, 7.990966796875, 8.77734375, 9.563720703125, 10.35009765625, 11.136474609375, 11.9228515625, 12.709228515625, 13.49560546875, 14.281982421875, 15.068359375, 15.854736328125, 16.64111328125, 17.427490234375, 18.2138671875, 19.000244140625, 19.78662109375, 20.572998046875, 21.359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 10.0, 30.0, 55.0, 90.0, 123.0, 173.0, 175.0, 151.0, 92.0, 44.0, 31.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.60833740234375, -406.0770568847656, -392.5458068847656, -379.0145263671875, -365.4832458496094, -351.95196533203125, -338.42071533203125, -324.8894348144531, -311.358154296875, -297.8268737792969, -284.2956237792969, -270.76434326171875, -257.2330627441406, -243.70179748535156, -230.1705322265625, -216.63925170898438, -203.10800170898438, -189.5767364501953, -176.0454559326172, -162.51419067382812, -148.98291015625, -135.45164489746094, -121.92037963867188, -108.38910675048828, -94.85783386230469, -81.3265609741211, -67.7952880859375, -54.26402282714844, -40.732749938964844, -27.20147705078125, -13.670211791992188, -0.13893890380859375, 13.392333984375, 26.92360496520996, 40.45487594604492, 53.98614501953125, 67.51741790771484, 81.04869079589844, 94.5799560546875, 108.1112289428711, 121.64250183105469, 135.17376708984375, 148.70504760742188, 162.23631286621094, 175.767578125, 189.29885864257812, 202.8301239013672, 216.36138916015625, 229.89266967773438, 243.42393493652344, 256.9552001953125, 270.4864807128906, 284.01776123046875, 297.54901123046875, 311.0802917480469, 324.611572265625, 338.142822265625, 351.6741027832031, 365.2053527832031, 378.73663330078125, 392.2679138183594, 405.7991943359375, 419.3304443359375, 432.8617248535156, 446.39300537109375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 8.0, 9.0, 7.0, 17.0, 17.0, 18.0, 25.0, 28.0, 38.0, 36.0, 32.0, 36.0, 46.0, 38.0, 39.0, 51.0, 29.0, 50.0, 39.0, 48.0, 40.0, 36.0, 36.0, 27.0, 31.0, 27.0, 19.0, 17.0, 27.0, 15.0, 18.0, 10.0, 15.0, 8.0, 8.0, 9.0, 3.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-155.17877197265625, -149.85716247558594, -144.5355682373047, -139.21395874023438, -133.89234924316406, -128.57073974609375, -123.2491455078125, -117.92753601074219, -112.6059341430664, -107.28433227539062, -101.96272277832031, -96.64112091064453, -91.31951904296875, -85.99790954589844, -80.67630767822266, -75.35470581054688, -70.03309631347656, -64.71149444580078, -59.38988494873047, -54.06828308105469, -48.74667739868164, -43.425071716308594, -38.10346984863281, -32.781864166259766, -27.46025848388672, -22.138652801513672, -16.817049026489258, -11.495444297790527, -6.173839569091797, -0.85223388671875, 4.469369888305664, 9.790973663330078, 15.112564086914062, 20.43416976928711, 25.755773544311523, 31.077377319335938, 36.398983001708984, 41.72058868408203, 47.04219055175781, 52.36379623413086, 57.685401916503906, 63.00700759887695, 68.32861328125, 73.65021514892578, 78.97181701660156, 84.29342651367188, 89.61502838134766, 94.93663024902344, 100.25823974609375, 105.57984161376953, 110.90145111083984, 116.22305297851562, 121.54466247558594, 126.86626434326172, 132.1878662109375, 137.5094757080078, 142.83108520507812, 148.15269470214844, 153.4742889404297, 158.7958984375, 164.1175079345703, 169.43911743164062, 174.76071166992188, 180.0823211669922, 185.40391540527344]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 10.0, 13.0, 11.0, 19.0, 28.0, 43.0, 45.0, 79.0, 109.0, 132.0, 177.0, 315.0, 436.0, 661.0, 1042.0, 1773.0, 2896.0, 5403.0, 11295.0, 26660.0, 84689.0, 2448620.0, 1475847.0, 84464.0, 26111.0, 10902.0, 5448.0, 2827.0, 1657.0, 932.0, 539.0, 364.0, 236.0, 130.0, 117.0, 78.0, 44.0, 29.0, 20.0, 23.0, 10.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-52.96875, -51.36328125, -49.7578125, -48.15234375, -46.546875, -44.94140625, -43.3359375, -41.73046875, -40.125, -38.51953125, -36.9140625, -35.30859375, -33.703125, -32.09765625, -30.4921875, -28.88671875, -27.28125, -25.67578125, -24.0703125, -22.46484375, -20.859375, -19.25390625, -17.6484375, -16.04296875, -14.4375, -12.83203125, -11.2265625, -9.62109375, -8.015625, -6.41015625, -4.8046875, -3.19921875, -1.59375, 0.01171875, 1.6171875, 3.22265625, 4.828125, 6.43359375, 8.0390625, 9.64453125, 11.25, 12.85546875, 14.4609375, 16.06640625, 17.671875, 19.27734375, 20.8828125, 22.48828125, 24.09375, 25.69921875, 27.3046875, 28.91015625, 30.515625, 32.12109375, 33.7265625, 35.33203125, 36.9375, 38.54296875, 40.1484375, 41.75390625, 43.359375, 44.96484375, 46.5703125, 48.17578125, 49.78125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 8.0, 9.0, 18.0, 20.0, 11.0, 15.0, 25.0, 25.0, 30.0, 55.0, 44.0, 40.0, 52.0, 40.0, 57.0, 60.0, 44.0, 59.0, 48.0, 36.0, 43.0, 39.0, 35.0, 29.0, 26.0, 22.0, 18.0, 12.0, 19.0, 9.0, 10.0, 9.0, 7.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.6875, -7.45819091796875, -7.2288818359375, -6.99957275390625, -6.770263671875, -6.54095458984375, -6.3116455078125, -6.08233642578125, -5.85302734375, -5.62371826171875, -5.3944091796875, -5.16510009765625, -4.935791015625, -4.70648193359375, -4.4771728515625, -4.24786376953125, -4.0185546875, -3.78924560546875, -3.5599365234375, -3.33062744140625, -3.101318359375, -2.87200927734375, -2.6427001953125, -2.41339111328125, -2.18408203125, -1.95477294921875, -1.7254638671875, -1.49615478515625, -1.266845703125, -1.03753662109375, -0.8082275390625, -0.57891845703125, -0.349609375, -0.12030029296875, 0.1090087890625, 0.33831787109375, 0.567626953125, 0.79693603515625, 1.0262451171875, 1.25555419921875, 1.48486328125, 1.71417236328125, 1.9434814453125, 2.17279052734375, 2.402099609375, 2.63140869140625, 2.8607177734375, 3.09002685546875, 3.3193359375, 3.54864501953125, 3.7779541015625, 4.00726318359375, 4.236572265625, 4.46588134765625, 4.6951904296875, 4.92449951171875, 5.15380859375, 5.38311767578125, 5.6124267578125, 5.84173583984375, 6.071044921875, 6.30035400390625, 6.5296630859375, 6.75897216796875, 6.98828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 11.0, 13.0, 23.0, 34.0, 72.0, 122.0, 188.0, 373.0, 634.0, 1372.0, 2958.0, 7501.0, 22356.0, 100530.0, 3363580.0, 607953.0, 60733.0, 15602.0, 5560.0, 2393.0, 1086.0, 535.0, 272.0, 146.0, 90.0, 71.0, 31.0, 17.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.125, -69.708984375, -67.29296875, -64.876953125, -62.4609375, -60.044921875, -57.62890625, -55.212890625, -52.796875, -50.380859375, -47.96484375, -45.548828125, -43.1328125, -40.716796875, -38.30078125, -35.884765625, -33.46875, -31.052734375, -28.63671875, -26.220703125, -23.8046875, -21.388671875, -18.97265625, -16.556640625, -14.140625, -11.724609375, -9.30859375, -6.892578125, -4.4765625, -2.060546875, 0.35546875, 2.771484375, 5.1875, 7.603515625, 10.01953125, 12.435546875, 14.8515625, 17.267578125, 19.68359375, 22.099609375, 24.515625, 26.931640625, 29.34765625, 31.763671875, 34.1796875, 36.595703125, 39.01171875, 41.427734375, 43.84375, 46.259765625, 48.67578125, 51.091796875, 53.5078125, 55.923828125, 58.33984375, 60.755859375, 63.171875, 65.587890625, 68.00390625, 70.419921875, 72.8359375, 75.251953125, 77.66796875, 80.083984375, 82.5]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 13.0, 14.0, 17.0, 26.0, 52.0, 58.0, 91.0, 122.0, 237.0, 716.0, 1842.0, 324.0, 168.0, 111.0, 66.0, 52.0, 21.0, 25.0, 13.0, 12.0, 14.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -19.9384765625, -19.205078125, -18.4716796875, -17.73828125, -17.0048828125, -16.271484375, -15.5380859375, -14.8046875, -14.0712890625, -13.337890625, -12.6044921875, -11.87109375, -11.1376953125, -10.404296875, -9.6708984375, -8.9375, -8.2041015625, -7.470703125, -6.7373046875, -6.00390625, -5.2705078125, -4.537109375, -3.8037109375, -3.0703125, -2.3369140625, -1.603515625, -0.8701171875, -0.13671875, 0.5966796875, 1.330078125, 2.0634765625, 2.796875, 3.5302734375, 4.263671875, 4.9970703125, 5.73046875, 6.4638671875, 7.197265625, 7.9306640625, 8.6640625, 9.3974609375, 10.130859375, 10.8642578125, 11.59765625, 12.3310546875, 13.064453125, 13.7978515625, 14.53125, 15.2646484375, 15.998046875, 16.7314453125, 17.46484375, 18.1982421875, 18.931640625, 19.6650390625, 20.3984375, 21.1318359375, 21.865234375, 22.5986328125, 23.33203125, 24.0654296875, 24.798828125, 25.5322265625, 26.265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 4.0, 5.0, 15.0, 33.0, 62.0, 107.0, 171.0, 176.0, 144.0, 115.0, 74.0, 41.0, 22.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.1884002685547, -245.286865234375, -238.38534545898438, -231.4838104248047, -224.582275390625, -217.68075561523438, -210.7792205810547, -203.877685546875, -196.9761505126953, -190.07461547851562, -183.173095703125, -176.2715606689453, -169.37002563476562, -162.468505859375, -155.5669708251953, -148.66543579101562, -141.763916015625, -134.8623809814453, -127.96085357666016, -121.059326171875, -114.15779113769531, -107.25626373291016, -100.354736328125, -93.45320129394531, -86.55166625976562, -79.65013885498047, -72.74860382080078, -65.84707641601562, -58.94554138183594, -52.04401397705078, -45.14248275756836, -38.24095153808594, -31.33941650390625, -24.437885284423828, -17.536354064941406, -10.634824752807617, -3.7332935333251953, 3.1682357788085938, 10.069766998291016, 16.971298217773438, 23.87282943725586, 30.77436065673828, 37.6758918762207, 44.577423095703125, 51.47895050048828, 58.3804817199707, 65.28201293945312, 72.18354797363281, 79.08507537841797, 85.98660278320312, 92.88813781738281, 99.78966522216797, 106.69120025634766, 113.59272766113281, 120.4942626953125, 127.39579010009766, 134.2973175048828, 141.1988525390625, 148.10037231445312, 155.0019073486328, 161.9034423828125, 168.80496215820312, 175.7064971923828, 182.6080322265625, 189.5095672607422]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 6.0, 10.0, 7.0, 14.0, 20.0, 18.0, 19.0, 34.0, 25.0, 30.0, 30.0, 33.0, 37.0, 41.0, 39.0, 40.0, 38.0, 37.0, 45.0, 51.0, 39.0, 36.0, 32.0, 31.0, 37.0, 33.0, 29.0, 23.0, 23.0, 18.0, 14.0, 22.0, 11.0, 10.0, 15.0, 20.0, 4.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-81.61823272705078, -79.24981689453125, -76.88140106201172, -74.51298522949219, -72.14456939697266, -69.77615356445312, -67.4077377319336, -65.03932189941406, -62.670902252197266, -60.302486419677734, -57.9340705871582, -55.56565475463867, -53.197235107421875, -50.828819274902344, -48.46040344238281, -46.09198760986328, -43.72357177734375, -41.35515594482422, -38.98674011230469, -36.618324279785156, -34.249908447265625, -31.88149070739746, -29.513072967529297, -27.144657135009766, -24.776241302490234, -22.407825469970703, -20.039409637451172, -17.670991897583008, -15.302576065063477, -12.934160232543945, -10.565743446350098, -8.19732666015625, -5.828910827636719, -3.4604945182800293, -1.0920782089233398, 1.2763381004333496, 3.644754409790039, 6.01317024230957, 8.381587028503418, 10.750003814697266, 13.118419647216797, 15.486835479736328, 17.85525131225586, 20.223669052124023, 22.592084884643555, 24.960500717163086, 27.32891845703125, 29.69733428955078, 32.06575012207031, 34.434165954589844, 36.802581787109375, 39.170997619628906, 41.53941345214844, 43.90782928466797, 46.276248931884766, 48.6446647644043, 51.01308059692383, 53.38149642944336, 55.74991226196289, 58.11832809448242, 60.48674774169922, 62.85516357421875, 65.22357940673828, 67.59199523925781, 69.96041107177734]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 11.0, 7.0, 7.0, 12.0, 17.0, 23.0, 25.0, 42.0, 59.0, 96.0, 158.0, 247.0, 390.0, 645.0, 1117.0, 2008.0, 3880.0, 7998.0, 18202.0, 47043.0, 135850.0, 436516.0, 259539.0, 80161.0, 30071.0, 12284.0, 5538.0, 2828.0, 1557.0, 821.0, 526.0, 303.0, 192.0, 109.0, 87.0, 67.0, 31.0, 30.0, 19.0, 14.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.59375, -50.93798828125, -49.2822265625, -47.62646484375, -45.970703125, -44.31494140625, -42.6591796875, -41.00341796875, -39.34765625, -37.69189453125, -36.0361328125, -34.38037109375, -32.724609375, -31.06884765625, -29.4130859375, -27.75732421875, -26.1015625, -24.44580078125, -22.7900390625, -21.13427734375, -19.478515625, -17.82275390625, -16.1669921875, -14.51123046875, -12.85546875, -11.19970703125, -9.5439453125, -7.88818359375, -6.232421875, -4.57666015625, -2.9208984375, -1.26513671875, 0.390625, 2.04638671875, 3.7021484375, 5.35791015625, 7.013671875, 8.66943359375, 10.3251953125, 11.98095703125, 13.63671875, 15.29248046875, 16.9482421875, 18.60400390625, 20.259765625, 21.91552734375, 23.5712890625, 25.22705078125, 26.8828125, 28.53857421875, 30.1943359375, 31.85009765625, 33.505859375, 35.16162109375, 36.8173828125, 38.47314453125, 40.12890625, 41.78466796875, 43.4404296875, 45.09619140625, 46.751953125, 48.40771484375, 50.0634765625, 51.71923828125, 53.375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 7.0, 8.0, 11.0, 12.0, 25.0, 21.0, 20.0, 28.0, 16.0, 34.0, 36.0, 33.0, 43.0, 55.0, 49.0, 55.0, 51.0, 51.0, 40.0, 57.0, 51.0, 31.0, 40.0, 33.0, 26.0, 25.0, 33.0, 21.0, 20.0, 19.0, 12.0, 5.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.56640625, -7.34234619140625, -7.1182861328125, -6.89422607421875, -6.670166015625, -6.44610595703125, -6.2220458984375, -5.99798583984375, -5.77392578125, -5.54986572265625, -5.3258056640625, -5.10174560546875, -4.877685546875, -4.65362548828125, -4.4295654296875, -4.20550537109375, -3.9814453125, -3.75738525390625, -3.5333251953125, -3.30926513671875, -3.085205078125, -2.86114501953125, -2.6370849609375, -2.41302490234375, -2.18896484375, -1.96490478515625, -1.7408447265625, -1.51678466796875, -1.292724609375, -1.06866455078125, -0.8446044921875, -0.62054443359375, -0.396484375, -0.17242431640625, 0.0516357421875, 0.27569580078125, 0.499755859375, 0.72381591796875, 0.9478759765625, 1.17193603515625, 1.39599609375, 1.62005615234375, 1.8441162109375, 2.06817626953125, 2.292236328125, 2.51629638671875, 2.7403564453125, 2.96441650390625, 3.1884765625, 3.41253662109375, 3.6365966796875, 3.86065673828125, 4.084716796875, 4.30877685546875, 4.5328369140625, 4.75689697265625, 4.98095703125, 5.20501708984375, 5.4290771484375, 5.65313720703125, 5.877197265625, 6.10125732421875, 6.3253173828125, 6.54937744140625, 6.7734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 20.0, 19.0, 35.0, 44.0, 71.0, 108.0, 139.0, 238.0, 331.0, 560.0, 848.0, 1543.0, 2566.0, 4732.0, 9431.0, 22068.0, 58255.0, 184229.0, 462945.0, 194652.0, 61392.0, 22691.0, 9966.0, 4910.0, 2682.0, 1481.0, 912.0, 563.0, 364.0, 250.0, 157.0, 108.0, 59.0, 51.0, 30.0, 20.0, 15.0, 13.0, 6.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.34375, -39.943359375, -38.54296875, -37.142578125, -35.7421875, -34.341796875, -32.94140625, -31.541015625, -30.140625, -28.740234375, -27.33984375, -25.939453125, -24.5390625, -23.138671875, -21.73828125, -20.337890625, -18.9375, -17.537109375, -16.13671875, -14.736328125, -13.3359375, -11.935546875, -10.53515625, -9.134765625, -7.734375, -6.333984375, -4.93359375, -3.533203125, -2.1328125, -0.732421875, 0.66796875, 2.068359375, 3.46875, 4.869140625, 6.26953125, 7.669921875, 9.0703125, 10.470703125, 11.87109375, 13.271484375, 14.671875, 16.072265625, 17.47265625, 18.873046875, 20.2734375, 21.673828125, 23.07421875, 24.474609375, 25.875, 27.275390625, 28.67578125, 30.076171875, 31.4765625, 32.876953125, 34.27734375, 35.677734375, 37.078125, 38.478515625, 39.87890625, 41.279296875, 42.6796875, 44.080078125, 45.48046875, 46.880859375, 48.28125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 12.0, 8.0, 12.0, 8.0, 18.0, 10.0, 20.0, 26.0, 17.0, 25.0, 27.0, 35.0, 39.0, 44.0, 59.0, 44.0, 55.0, 52.0, 49.0, 44.0, 45.0, 45.0, 48.0, 34.0, 36.0, 27.0, 26.0, 28.0, 26.0, 15.0, 15.0, 10.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.25, -34.06298828125, -32.8759765625, -31.68896484375, -30.501953125, -29.31494140625, -28.1279296875, -26.94091796875, -25.75390625, -24.56689453125, -23.3798828125, -22.19287109375, -21.005859375, -19.81884765625, -18.6318359375, -17.44482421875, -16.2578125, -15.07080078125, -13.8837890625, -12.69677734375, -11.509765625, -10.32275390625, -9.1357421875, -7.94873046875, -6.76171875, -5.57470703125, -4.3876953125, -3.20068359375, -2.013671875, -0.82666015625, 0.3603515625, 1.54736328125, 2.734375, 3.92138671875, 5.1083984375, 6.29541015625, 7.482421875, 8.66943359375, 9.8564453125, 11.04345703125, 12.23046875, 13.41748046875, 14.6044921875, 15.79150390625, 16.978515625, 18.16552734375, 19.3525390625, 20.53955078125, 21.7265625, 22.91357421875, 24.1005859375, 25.28759765625, 26.474609375, 27.66162109375, 28.8486328125, 30.03564453125, 31.22265625, 32.40966796875, 33.5966796875, 34.78369140625, 35.970703125, 37.15771484375, 38.3447265625, 39.53173828125, 40.71875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 14.0, 21.0, 48.0, 68.0, 111.0, 210.0, 346.0, 650.0, 1109.0, 2253.0, 4577.0, 10473.0, 31340.0, 263216.0, 651300.0, 55709.0, 14897.0, 6100.0, 2768.0, 1522.0, 786.0, 461.0, 219.0, 133.0, 90.0, 39.0, 41.0, 17.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.3125, -50.634765625, -48.95703125, -47.279296875, -45.6015625, -43.923828125, -42.24609375, -40.568359375, -38.890625, -37.212890625, -35.53515625, -33.857421875, -32.1796875, -30.501953125, -28.82421875, -27.146484375, -25.46875, -23.791015625, -22.11328125, -20.435546875, -18.7578125, -17.080078125, -15.40234375, -13.724609375, -12.046875, -10.369140625, -8.69140625, -7.013671875, -5.3359375, -3.658203125, -1.98046875, -0.302734375, 1.375, 3.052734375, 4.73046875, 6.408203125, 8.0859375, 9.763671875, 11.44140625, 13.119140625, 14.796875, 16.474609375, 18.15234375, 19.830078125, 21.5078125, 23.185546875, 24.86328125, 26.541015625, 28.21875, 29.896484375, 31.57421875, 33.251953125, 34.9296875, 36.607421875, 38.28515625, 39.962890625, 41.640625, 43.318359375, 44.99609375, 46.673828125, 48.3515625, 50.029296875, 51.70703125, 53.384765625, 55.0625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 2.0, 5.0, 11.0, 11.0, 25.0, 34.0, 80.0, 194.0, 326.0, 142.0, 60.0, 26.0, 21.0, 17.0, 8.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.01534271240234375, -0.014820694923400879, -0.014298677444458008, -0.013776659965515137, -0.013254642486572266, -0.012732625007629395, -0.012210607528686523, -0.011688590049743652, -0.011166572570800781, -0.01064455509185791, -0.010122537612915039, -0.009600520133972168, -0.009078502655029297, -0.008556485176086426, -0.008034467697143555, -0.007512450218200684, -0.0069904327392578125, -0.006468415260314941, -0.00594639778137207, -0.005424380302429199, -0.004902362823486328, -0.004380345344543457, -0.003858327865600586, -0.003336310386657715, -0.0028142929077148438, -0.0022922754287719727, -0.0017702579498291016, -0.0012482404708862305, -0.0007262229919433594, -0.00020420551300048828, 0.0003178119659423828, 0.0008398294448852539, 0.001361846923828125, 0.001883864402770996, 0.002405881881713867, 0.0029278993606567383, 0.0034499168395996094, 0.0039719343185424805, 0.0044939517974853516, 0.005015969276428223, 0.005537986755371094, 0.006060004234313965, 0.006582021713256836, 0.007104039192199707, 0.007626056671142578, 0.00814807415008545, 0.00867009162902832, 0.009192109107971191, 0.009714126586914062, 0.010236144065856934, 0.010758161544799805, 0.011280179023742676, 0.011802196502685547, 0.012324213981628418, 0.012846231460571289, 0.01336824893951416, 0.013890266418457031, 0.014412283897399902, 0.014934301376342773, 0.015456318855285645, 0.015978336334228516, 0.016500353813171387, 0.017022371292114258, 0.01754438877105713, 0.01806640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 14.0, 24.0, 21.0, 42.0, 50.0, 80.0, 119.0, 184.0, 301.0, 432.0, 809.0, 1331.0, 2286.0, 4218.0, 8859.0, 21641.0, 76130.0, 531628.0, 316489.0, 51570.0, 16608.0, 7057.0, 3613.0, 2005.0, 1133.0, 674.0, 421.0, 246.0, 175.0, 114.0, 86.0, 52.0, 36.0, 33.0, 14.0, 9.0, 12.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-41.90625, -40.73779296875, -39.5693359375, -38.40087890625, -37.232421875, -36.06396484375, -34.8955078125, -33.72705078125, -32.55859375, -31.39013671875, -30.2216796875, -29.05322265625, -27.884765625, -26.71630859375, -25.5478515625, -24.37939453125, -23.2109375, -22.04248046875, -20.8740234375, -19.70556640625, -18.537109375, -17.36865234375, -16.2001953125, -15.03173828125, -13.86328125, -12.69482421875, -11.5263671875, -10.35791015625, -9.189453125, -8.02099609375, -6.8525390625, -5.68408203125, -4.515625, -3.34716796875, -2.1787109375, -1.01025390625, 0.158203125, 1.32666015625, 2.4951171875, 3.66357421875, 4.83203125, 6.00048828125, 7.1689453125, 8.33740234375, 9.505859375, 10.67431640625, 11.8427734375, 13.01123046875, 14.1796875, 15.34814453125, 16.5166015625, 17.68505859375, 18.853515625, 20.02197265625, 21.1904296875, 22.35888671875, 23.52734375, 24.69580078125, 25.8642578125, 27.03271484375, 28.201171875, 29.36962890625, 30.5380859375, 31.70654296875, 32.875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 9.0, 19.0, 18.0, 21.0, 38.0, 43.0, 59.0, 84.0, 116.0, 125.0, 116.0, 95.0, 57.0, 39.0, 24.0, 32.0, 10.0, 13.0, 10.0, 13.0, 3.0, 7.0, 2.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-32.71875, -31.846435546875, -30.97412109375, -30.101806640625, -29.2294921875, -28.357177734375, -27.48486328125, -26.612548828125, -25.740234375, -24.867919921875, -23.99560546875, -23.123291015625, -22.2509765625, -21.378662109375, -20.50634765625, -19.634033203125, -18.76171875, -17.889404296875, -17.01708984375, -16.144775390625, -15.2724609375, -14.400146484375, -13.52783203125, -12.655517578125, -11.783203125, -10.910888671875, -10.03857421875, -9.166259765625, -8.2939453125, -7.421630859375, -6.54931640625, -5.677001953125, -4.8046875, -3.932373046875, -3.06005859375, -2.187744140625, -1.3154296875, -0.443115234375, 0.42919921875, 1.301513671875, 2.173828125, 3.046142578125, 3.91845703125, 4.790771484375, 5.6630859375, 6.535400390625, 7.40771484375, 8.280029296875, 9.15234375, 10.024658203125, 10.89697265625, 11.769287109375, 12.6416015625, 13.513916015625, 14.38623046875, 15.258544921875, 16.130859375, 17.003173828125, 17.87548828125, 18.747802734375, 19.6201171875, 20.492431640625, 21.36474609375, 22.237060546875, 23.109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 14.0, 30.0, 78.0, 168.0, 327.0, 228.0, 100.0, 47.0, 14.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1513.858642578125, -1484.44580078125, -1455.032958984375, -1425.6202392578125, -1396.2073974609375, -1366.7945556640625, -1337.3817138671875, -1307.968994140625, -1278.55615234375, -1249.143310546875, -1219.73046875, -1190.3177490234375, -1160.9049072265625, -1131.4920654296875, -1102.0792236328125, -1072.66650390625, -1043.253662109375, -1013.8408203125, -984.4280395507812, -955.0151977539062, -925.6024169921875, -896.1895751953125, -866.7767944335938, -837.3639526367188, -807.9511108398438, -778.5382690429688, -749.12548828125, -719.712646484375, -690.2998657226562, -660.8870239257812, -631.4742431640625, -602.0614013671875, -572.6485595703125, -543.2357177734375, -513.8229370117188, -484.4101257324219, -454.997314453125, -425.58447265625, -396.17169189453125, -366.75885009765625, -337.3460693359375, -307.9332580566406, -278.52044677734375, -249.10763549804688, -219.69482421875, -190.28199768066406, -160.8691864013672, -131.4563751220703, -102.0435791015625, -72.63076782226562, -43.217952728271484, -13.805137634277344, 15.607673645019531, 45.02049255371094, 74.43330383300781, 103.84611511230469, 133.25892639160156, 162.67173767089844, 192.0845489501953, 221.49737548828125, 250.91018676757812, 280.322998046875, 309.7358093261719, 339.14862060546875, 368.5614318847656]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 14.0, 7.0, 12.0, 15.0, 18.0, 29.0, 30.0, 36.0, 26.0, 42.0, 46.0, 38.0, 38.0, 56.0, 50.0, 54.0, 51.0, 46.0, 37.0, 52.0, 44.0, 36.0, 39.0, 29.0, 26.0, 25.0, 21.0, 24.0, 13.0, 12.0, 7.0, 6.0, 5.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-302.77764892578125, -294.8313293457031, -286.8850402832031, -278.938720703125, -270.9924011230469, -263.0461120605469, -255.09979248046875, -247.1534881591797, -239.20718383789062, -231.26087951660156, -223.31455993652344, -215.36825561523438, -207.4219512939453, -199.47564697265625, -191.52932739257812, -183.58302307128906, -175.63671875, -167.69041442871094, -159.7440948486328, -151.79779052734375, -143.8514862060547, -135.90518188476562, -127.9588623046875, -120.01255798339844, -112.06623840332031, -104.11992645263672, -96.17362213134766, -88.22731018066406, -80.281005859375, -72.3346939086914, -64.38838195800781, -56.44207763671875, -48.49577331542969, -40.54946517944336, -32.60315704345703, -24.65684700012207, -16.710538864135742, -8.764228820800781, -0.8179206848144531, 7.128387451171875, 15.074695587158203, 23.02100372314453, 30.96731185913086, 38.91361999511719, 46.85993194580078, 54.80624008178711, 62.75254821777344, 70.6988525390625, 78.6451644897461, 86.59147644042969, 94.53778076171875, 102.48409271240234, 110.4303970336914, 118.376708984375, 126.32301330566406, 134.26931762695312, 142.21563720703125, 150.1619415283203, 158.10826110839844, 166.0545654296875, 174.00086975097656, 181.94717407226562, 189.89349365234375, 197.8397979736328, 205.78610229492188]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 21.0, 14.0, 16.0, 20.0, 43.0, 62.0, 85.0, 101.0, 199.0, 295.0, 482.0, 726.0, 1374.0, 2404.0, 5073.0, 12297.0, 41160.0, 669584.0, 3389823.0, 47142.0, 12729.0, 4977.0, 2478.0, 1304.0, 727.0, 409.0, 254.0, 155.0, 102.0, 76.0, 56.0, 26.0, 22.0, 19.0, 5.0, 5.0, 4.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.125, -74.5576171875, -71.990234375, -69.4228515625, -66.85546875, -64.2880859375, -61.720703125, -59.1533203125, -56.5859375, -54.0185546875, -51.451171875, -48.8837890625, -46.31640625, -43.7490234375, -41.181640625, -38.6142578125, -36.046875, -33.4794921875, -30.912109375, -28.3447265625, -25.77734375, -23.2099609375, -20.642578125, -18.0751953125, -15.5078125, -12.9404296875, -10.373046875, -7.8056640625, -5.23828125, -2.6708984375, -0.103515625, 2.4638671875, 5.03125, 7.5986328125, 10.166015625, 12.7333984375, 15.30078125, 17.8681640625, 20.435546875, 23.0029296875, 25.5703125, 28.1376953125, 30.705078125, 33.2724609375, 35.83984375, 38.4072265625, 40.974609375, 43.5419921875, 46.109375, 48.6767578125, 51.244140625, 53.8115234375, 56.37890625, 58.9462890625, 61.513671875, 64.0810546875, 66.6484375, 69.2158203125, 71.783203125, 74.3505859375, 76.91796875, 79.4853515625, 82.052734375, 84.6201171875, 87.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 10.0, 12.0, 16.0, 14.0, 22.0, 27.0, 22.0, 40.0, 33.0, 29.0, 35.0, 46.0, 45.0, 36.0, 37.0, 41.0, 46.0, 52.0, 48.0, 41.0, 35.0, 39.0, 23.0, 16.0, 20.0, 29.0, 19.0, 27.0, 20.0, 22.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.59765625, -7.376708984375, -7.15576171875, -6.934814453125, -6.7138671875, -6.492919921875, -6.27197265625, -6.051025390625, -5.830078125, -5.609130859375, -5.38818359375, -5.167236328125, -4.9462890625, -4.725341796875, -4.50439453125, -4.283447265625, -4.0625, -3.841552734375, -3.62060546875, -3.399658203125, -3.1787109375, -2.957763671875, -2.73681640625, -2.515869140625, -2.294921875, -2.073974609375, -1.85302734375, -1.632080078125, -1.4111328125, -1.190185546875, -0.96923828125, -0.748291015625, -0.52734375, -0.306396484375, -0.08544921875, 0.135498046875, 0.3564453125, 0.577392578125, 0.79833984375, 1.019287109375, 1.240234375, 1.461181640625, 1.68212890625, 1.903076171875, 2.1240234375, 2.344970703125, 2.56591796875, 2.786865234375, 3.0078125, 3.228759765625, 3.44970703125, 3.670654296875, 3.8916015625, 4.112548828125, 4.33349609375, 4.554443359375, 4.775390625, 4.996337890625, 5.21728515625, 5.438232421875, 5.6591796875, 5.880126953125, 6.10107421875, 6.322021484375, 6.54296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 2.0, 14.0, 15.0, 19.0, 32.0, 42.0, 54.0, 83.0, 130.0, 172.0, 257.0, 414.0, 664.0, 1109.0, 1867.0, 3218.0, 6208.0, 13354.0, 35289.0, 145323.0, 3687889.0, 222128.0, 43772.0, 15862.0, 7145.0, 3708.0, 2063.0, 1255.0, 785.0, 485.0, 299.0, 173.0, 141.0, 74.0, 69.0, 40.0, 28.0, 16.0, 24.0, 13.0, 6.0, 10.0, 5.0, 4.0, 3.0, 4.0, 0.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-73.125, -70.654296875, -68.18359375, -65.712890625, -63.2421875, -60.771484375, -58.30078125, -55.830078125, -53.359375, -50.888671875, -48.41796875, -45.947265625, -43.4765625, -41.005859375, -38.53515625, -36.064453125, -33.59375, -31.123046875, -28.65234375, -26.181640625, -23.7109375, -21.240234375, -18.76953125, -16.298828125, -13.828125, -11.357421875, -8.88671875, -6.416015625, -3.9453125, -1.474609375, 0.99609375, 3.466796875, 5.9375, 8.408203125, 10.87890625, 13.349609375, 15.8203125, 18.291015625, 20.76171875, 23.232421875, 25.703125, 28.173828125, 30.64453125, 33.115234375, 35.5859375, 38.056640625, 40.52734375, 42.998046875, 45.46875, 47.939453125, 50.41015625, 52.880859375, 55.3515625, 57.822265625, 60.29296875, 62.763671875, 65.234375, 67.705078125, 70.17578125, 72.646484375, 75.1171875, 77.587890625, 80.05859375, 82.529296875, 85.0]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 22.0, 18.0, 50.0, 67.0, 141.0, 446.0, 2714.0, 274.0, 123.0, 51.0, 41.0, 26.0, 19.0, 16.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.296875, -28.092041015625, -26.88720703125, -25.682373046875, -24.4775390625, -23.272705078125, -22.06787109375, -20.863037109375, -19.658203125, -18.453369140625, -17.24853515625, -16.043701171875, -14.8388671875, -13.634033203125, -12.42919921875, -11.224365234375, -10.01953125, -8.814697265625, -7.60986328125, -6.405029296875, -5.2001953125, -3.995361328125, -2.79052734375, -1.585693359375, -0.380859375, 0.823974609375, 2.02880859375, 3.233642578125, 4.4384765625, 5.643310546875, 6.84814453125, 8.052978515625, 9.2578125, 10.462646484375, 11.66748046875, 12.872314453125, 14.0771484375, 15.281982421875, 16.48681640625, 17.691650390625, 18.896484375, 20.101318359375, 21.30615234375, 22.510986328125, 23.7158203125, 24.920654296875, 26.12548828125, 27.330322265625, 28.53515625, 29.739990234375, 30.94482421875, 32.149658203125, 33.3544921875, 34.559326171875, 35.76416015625, 36.968994140625, 38.173828125, 39.378662109375, 40.58349609375, 41.788330078125, 42.9931640625, 44.197998046875, 45.40283203125, 46.607666015625, 47.8125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 8.0, 25.0, 47.0, 102.0, 209.0, 278.0, 186.0, 82.0, 32.0, 23.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.7943572998047, -192.905517578125, -181.0166778564453, -169.12783813476562, -157.23899841308594, -145.35015869140625, -133.46133422851562, -121.5724868774414, -109.68364715576172, -97.79480743408203, -85.90596771240234, -74.01713562011719, -62.128292083740234, -50.23945236206055, -38.350616455078125, -26.461776733398438, -14.57293701171875, -2.684098243713379, 9.204740524291992, 21.093578338623047, 32.982418060302734, 44.87125778198242, 56.760093688964844, 68.64893341064453, 80.53777313232422, 92.4266128540039, 104.3154525756836, 116.20428466796875, 128.09312438964844, 139.98196411132812, 151.8708038330078, 163.7596435546875, 175.64846801757812, 187.5373077392578, 199.4261474609375, 211.3149871826172, 223.20382690429688, 235.09266662597656, 246.98150634765625, 258.8703308105469, 270.7591857910156, 282.64801025390625, 294.536865234375, 306.4256896972656, 318.3145446777344, 330.203369140625, 342.09222412109375, 353.9810485839844, 365.869873046875, 377.7586975097656, 389.6475524902344, 401.536376953125, 413.42523193359375, 425.3140563964844, 437.2029113769531, 449.09173583984375, 460.9805908203125, 472.8694152832031, 484.7582702636719, 496.6470947265625, 508.53594970703125, 520.4248046875, 532.3135986328125, 544.2024536132812, 556.09130859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 12.0, 3.0, 6.0, 10.0, 15.0, 20.0, 15.0, 11.0, 25.0, 24.0, 35.0, 34.0, 31.0, 33.0, 37.0, 47.0, 46.0, 43.0, 45.0, 50.0, 42.0, 35.0, 50.0, 35.0, 38.0, 24.0, 31.0, 36.0, 20.0, 33.0, 12.0, 20.0, 13.0, 10.0, 13.0, 6.0, 7.0, 5.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.41522216796875, -79.52839660644531, -76.64156341552734, -73.7547378540039, -70.86790466308594, -67.9810791015625, -65.09425354003906, -62.207420349121094, -59.32059097290039, -56.43376159667969, -53.546932220458984, -50.66010284423828, -47.773277282714844, -44.886444091796875, -41.99961853027344, -39.112789154052734, -36.22595977783203, -33.33913040161133, -30.452301025390625, -27.565473556518555, -24.67864418029785, -21.79181480407715, -18.904987335205078, -16.018157958984375, -13.131328582763672, -10.244499206542969, -7.357670783996582, -4.470842361450195, -1.5840129852294922, 1.302816390991211, 4.189643859863281, 7.076473236083984, 9.963294982910156, 12.85012435913086, 15.736952781677246, 18.623781204223633, 21.510610580444336, 24.39743995666504, 27.28426742553711, 30.171096801757812, 33.057926177978516, 35.94475555419922, 38.83158493041992, 41.718414306640625, 44.60523986816406, 47.49207305908203, 50.37889862060547, 53.26572799682617, 56.152557373046875, 59.03938674926758, 61.92621612548828, 64.81304168701172, 67.69987487792969, 70.58670043945312, 73.47352600097656, 76.36035919189453, 79.2471923828125, 82.13401794433594, 85.0208511352539, 87.90767669677734, 90.79450988769531, 93.68133544921875, 96.56816101074219, 99.45499420166016, 102.3418197631836]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 4.0, 12.0, 27.0, 19.0, 33.0, 60.0, 71.0, 123.0, 155.0, 236.0, 341.0, 536.0, 793.0, 1213.0, 2009.0, 3267.0, 5289.0, 9001.0, 15877.0, 30032.0, 62521.0, 148231.0, 350947.0, 233010.0, 92307.0, 41932.0, 20894.0, 11551.0, 6700.0, 4075.0, 2484.0, 1638.0, 1054.0, 662.0, 447.0, 313.0, 230.0, 139.0, 94.0, 65.0, 29.0, 38.0, 16.0, 23.0, 14.0, 11.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 5.0], "bins": [-47.96875, -46.546875, -45.125, -43.703125, -42.28125, -40.859375, -39.4375, -38.015625, -36.59375, -35.171875, -33.75, -32.328125, -30.90625, -29.484375, -28.0625, -26.640625, -25.21875, -23.796875, -22.375, -20.953125, -19.53125, -18.109375, -16.6875, -15.265625, -13.84375, -12.421875, -11.0, -9.578125, -8.15625, -6.734375, -5.3125, -3.890625, -2.46875, -1.046875, 0.375, 1.796875, 3.21875, 4.640625, 6.0625, 7.484375, 8.90625, 10.328125, 11.75, 13.171875, 14.59375, 16.015625, 17.4375, 18.859375, 20.28125, 21.703125, 23.125, 24.546875, 25.96875, 27.390625, 28.8125, 30.234375, 31.65625, 33.078125, 34.5, 35.921875, 37.34375, 38.765625, 40.1875, 41.609375, 43.03125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 10.0, 6.0, 5.0, 6.0, 11.0, 14.0, 15.0, 13.0, 10.0, 14.0, 26.0, 17.0, 19.0, 29.0, 37.0, 19.0, 40.0, 41.0, 46.0, 43.0, 40.0, 49.0, 47.0, 36.0, 40.0, 25.0, 56.0, 38.0, 39.0, 28.0, 22.0, 31.0, 24.0, 18.0, 18.0, 17.0, 9.0, 9.0, 11.0, 8.0, 6.0, 2.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.40625, -8.1561279296875, -7.906005859375, -7.6558837890625, -7.40576171875, -7.1556396484375, -6.905517578125, -6.6553955078125, -6.4052734375, -6.1551513671875, -5.905029296875, -5.6549072265625, -5.40478515625, -5.1546630859375, -4.904541015625, -4.6544189453125, -4.404296875, -4.1541748046875, -3.904052734375, -3.6539306640625, -3.40380859375, -3.1536865234375, -2.903564453125, -2.6534423828125, -2.4033203125, -2.1531982421875, -1.903076171875, -1.6529541015625, -1.40283203125, -1.1527099609375, -0.902587890625, -0.6524658203125, -0.40234375, -0.1522216796875, 0.097900390625, 0.3480224609375, 0.59814453125, 0.8482666015625, 1.098388671875, 1.3485107421875, 1.5986328125, 1.8487548828125, 2.098876953125, 2.3489990234375, 2.59912109375, 2.8492431640625, 3.099365234375, 3.3494873046875, 3.599609375, 3.8497314453125, 4.099853515625, 4.3499755859375, 4.60009765625, 4.8502197265625, 5.100341796875, 5.3504638671875, 5.6005859375, 5.8507080078125, 6.100830078125, 6.3509521484375, 6.60107421875, 6.8511962890625, 7.101318359375, 7.3514404296875, 7.6015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 15.0, 17.0, 8.0, 7.0, 12.0, 19.0, 35.0, 53.0, 71.0, 124.0, 210.0, 349.0, 593.0, 1046.0, 1867.0, 3754.0, 7898.0, 18215.0, 47131.0, 152896.0, 489353.0, 219346.0, 62822.0, 23228.0, 9805.0, 4536.0, 2270.0, 1175.0, 649.0, 365.0, 238.0, 125.0, 94.0, 65.0, 39.0, 22.0, 24.0, 10.0, 13.0, 10.0, 16.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-59.59375, -57.873046875, -56.15234375, -54.431640625, -52.7109375, -50.990234375, -49.26953125, -47.548828125, -45.828125, -44.107421875, -42.38671875, -40.666015625, -38.9453125, -37.224609375, -35.50390625, -33.783203125, -32.0625, -30.341796875, -28.62109375, -26.900390625, -25.1796875, -23.458984375, -21.73828125, -20.017578125, -18.296875, -16.576171875, -14.85546875, -13.134765625, -11.4140625, -9.693359375, -7.97265625, -6.251953125, -4.53125, -2.810546875, -1.08984375, 0.630859375, 2.3515625, 4.072265625, 5.79296875, 7.513671875, 9.234375, 10.955078125, 12.67578125, 14.396484375, 16.1171875, 17.837890625, 19.55859375, 21.279296875, 23.0, 24.720703125, 26.44140625, 28.162109375, 29.8828125, 31.603515625, 33.32421875, 35.044921875, 36.765625, 38.486328125, 40.20703125, 41.927734375, 43.6484375, 45.369140625, 47.08984375, 48.810546875, 50.53125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 13.0, 8.0, 15.0, 14.0, 12.0, 13.0, 19.0, 34.0, 38.0, 34.0, 33.0, 28.0, 41.0, 44.0, 42.0, 45.0, 50.0, 47.0, 37.0, 48.0, 47.0, 40.0, 42.0, 38.0, 31.0, 25.0, 23.0, 19.0, 15.0, 17.0, 12.0, 10.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-49.28125, -47.8896484375, -46.498046875, -45.1064453125, -43.71484375, -42.3232421875, -40.931640625, -39.5400390625, -38.1484375, -36.7568359375, -35.365234375, -33.9736328125, -32.58203125, -31.1904296875, -29.798828125, -28.4072265625, -27.015625, -25.6240234375, -24.232421875, -22.8408203125, -21.44921875, -20.0576171875, -18.666015625, -17.2744140625, -15.8828125, -14.4912109375, -13.099609375, -11.7080078125, -10.31640625, -8.9248046875, -7.533203125, -6.1416015625, -4.75, -3.3583984375, -1.966796875, -0.5751953125, 0.81640625, 2.2080078125, 3.599609375, 4.9912109375, 6.3828125, 7.7744140625, 9.166015625, 10.5576171875, 11.94921875, 13.3408203125, 14.732421875, 16.1240234375, 17.515625, 18.9072265625, 20.298828125, 21.6904296875, 23.08203125, 24.4736328125, 25.865234375, 27.2568359375, 28.6484375, 30.0400390625, 31.431640625, 32.8232421875, 34.21484375, 35.6064453125, 36.998046875, 38.3896484375, 39.78125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 10.0, 16.0, 25.0, 39.0, 47.0, 65.0, 97.0, 135.0, 187.0, 362.0, 587.0, 1115.0, 2112.0, 5004.0, 15196.0, 73578.0, 705039.0, 203583.0, 27125.0, 7722.0, 3077.0, 1431.0, 720.0, 411.0, 273.0, 203.0, 107.0, 73.0, 56.0, 29.0, 39.0, 23.0, 14.0, 10.0, 6.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.5, -58.5302734375, -56.560546875, -54.5908203125, -52.62109375, -50.6513671875, -48.681640625, -46.7119140625, -44.7421875, -42.7724609375, -40.802734375, -38.8330078125, -36.86328125, -34.8935546875, -32.923828125, -30.9541015625, -28.984375, -27.0146484375, -25.044921875, -23.0751953125, -21.10546875, -19.1357421875, -17.166015625, -15.1962890625, -13.2265625, -11.2568359375, -9.287109375, -7.3173828125, -5.34765625, -3.3779296875, -1.408203125, 0.5615234375, 2.53125, 4.5009765625, 6.470703125, 8.4404296875, 10.41015625, 12.3798828125, 14.349609375, 16.3193359375, 18.2890625, 20.2587890625, 22.228515625, 24.1982421875, 26.16796875, 28.1376953125, 30.107421875, 32.0771484375, 34.046875, 36.0166015625, 37.986328125, 39.9560546875, 41.92578125, 43.8955078125, 45.865234375, 47.8349609375, 49.8046875, 51.7744140625, 53.744140625, 55.7138671875, 57.68359375, 59.6533203125, 61.623046875, 63.5927734375, 65.5625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 4.0, 9.0, 15.0, 18.0, 30.0, 42.0, 73.0, 103.0, 220.0, 175.0, 96.0, 65.0, 33.0, 27.0, 21.0, 11.0, 7.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0171966552734375, -0.016753792762756348, -0.016310930252075195, -0.015868067741394043, -0.01542520523071289, -0.014982342720031738, -0.014539480209350586, -0.014096617698669434, -0.013653755187988281, -0.013210892677307129, -0.012768030166625977, -0.012325167655944824, -0.011882305145263672, -0.01143944263458252, -0.010996580123901367, -0.010553717613220215, -0.010110855102539062, -0.00966799259185791, -0.009225130081176758, -0.008782267570495605, -0.008339405059814453, -0.0078965425491333, -0.0074536800384521484, -0.007010817527770996, -0.006567955017089844, -0.006125092506408691, -0.005682229995727539, -0.005239367485046387, -0.004796504974365234, -0.004353642463684082, -0.00391077995300293, -0.0034679174423217773, -0.003025054931640625, -0.0025821924209594727, -0.0021393299102783203, -0.001696467399597168, -0.0012536048889160156, -0.0008107423782348633, -0.00036787986755371094, 7.49826431274414e-05, 0.0005178451538085938, 0.0009607076644897461, 0.0014035701751708984, 0.0018464326858520508, 0.002289295196533203, 0.0027321577072143555, 0.003175020217895508, 0.00361788272857666, 0.0040607452392578125, 0.004503607749938965, 0.004946470260620117, 0.0053893327713012695, 0.005832195281982422, 0.006275057792663574, 0.0067179203033447266, 0.007160782814025879, 0.007603645324707031, 0.008046507835388184, 0.008489370346069336, 0.008932232856750488, 0.00937509536743164, 0.009817957878112793, 0.010260820388793945, 0.010703682899475098, 0.01114654541015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 10.0, 8.0, 17.0, 27.0, 25.0, 45.0, 60.0, 101.0, 126.0, 209.0, 365.0, 695.0, 1272.0, 3044.0, 9331.0, 47280.0, 604757.0, 337984.0, 31165.0, 6946.0, 2413.0, 1144.0, 591.0, 325.0, 194.0, 125.0, 83.0, 51.0, 40.0, 26.0, 17.0, 13.0, 7.0, 11.0, 7.0, 8.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-77.875, -75.705078125, -73.53515625, -71.365234375, -69.1953125, -67.025390625, -64.85546875, -62.685546875, -60.515625, -58.345703125, -56.17578125, -54.005859375, -51.8359375, -49.666015625, -47.49609375, -45.326171875, -43.15625, -40.986328125, -38.81640625, -36.646484375, -34.4765625, -32.306640625, -30.13671875, -27.966796875, -25.796875, -23.626953125, -21.45703125, -19.287109375, -17.1171875, -14.947265625, -12.77734375, -10.607421875, -8.4375, -6.267578125, -4.09765625, -1.927734375, 0.2421875, 2.412109375, 4.58203125, 6.751953125, 8.921875, 11.091796875, 13.26171875, 15.431640625, 17.6015625, 19.771484375, 21.94140625, 24.111328125, 26.28125, 28.451171875, 30.62109375, 32.791015625, 34.9609375, 37.130859375, 39.30078125, 41.470703125, 43.640625, 45.810546875, 47.98046875, 50.150390625, 52.3203125, 54.490234375, 56.66015625, 58.830078125, 61.0]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 9.0, 4.0, 10.0, 12.0, 15.0, 22.0, 39.0, 49.0, 66.0, 96.0, 137.0, 147.0, 116.0, 75.0, 56.0, 52.0, 19.0, 21.0, 15.0, 15.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.46875, -38.11572265625, -36.7626953125, -35.40966796875, -34.056640625, -32.70361328125, -31.3505859375, -29.99755859375, -28.64453125, -27.29150390625, -25.9384765625, -24.58544921875, -23.232421875, -21.87939453125, -20.5263671875, -19.17333984375, -17.8203125, -16.46728515625, -15.1142578125, -13.76123046875, -12.408203125, -11.05517578125, -9.7021484375, -8.34912109375, -6.99609375, -5.64306640625, -4.2900390625, -2.93701171875, -1.583984375, -0.23095703125, 1.1220703125, 2.47509765625, 3.828125, 5.18115234375, 6.5341796875, 7.88720703125, 9.240234375, 10.59326171875, 11.9462890625, 13.29931640625, 14.65234375, 16.00537109375, 17.3583984375, 18.71142578125, 20.064453125, 21.41748046875, 22.7705078125, 24.12353515625, 25.4765625, 26.82958984375, 28.1826171875, 29.53564453125, 30.888671875, 32.24169921875, 33.5947265625, 34.94775390625, 36.30078125, 37.65380859375, 39.0068359375, 40.35986328125, 41.712890625, 43.06591796875, 44.4189453125, 45.77197265625, 47.125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 15.0, 30.0, 42.0, 97.0, 125.0, 186.0, 166.0, 152.0, 83.0, 42.0, 33.0, 17.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-615.23486328125, -594.6429443359375, -574.051025390625, -553.4590454101562, -532.8671264648438, -512.2752075195312, -491.6832580566406, -471.09130859375, -450.4993896484375, -429.907470703125, -409.3155212402344, -388.72357177734375, -368.13165283203125, -347.53973388671875, -326.9477844238281, -306.3558349609375, -285.763916015625, -265.1719970703125, -244.58004760742188, -223.9881134033203, -203.39617919921875, -182.8042449951172, -162.21231079101562, -141.62037658691406, -121.0284423828125, -100.43650817871094, -79.84457397460938, -59.25263977050781, -38.66070556640625, -18.068771362304688, 2.523162841796875, 23.115097045898438, 43.70703125, 64.29896545410156, 84.89089965820312, 105.48283386230469, 126.07476806640625, 146.6667022705078, 167.25863647460938, 187.85057067871094, 208.4425048828125, 229.03443908691406, 249.62637329101562, 270.21832275390625, 290.81024169921875, 311.40216064453125, 331.9941101074219, 352.5860595703125, 373.177978515625, 393.7698974609375, 414.3618469238281, 434.95379638671875, 455.54571533203125, 476.13763427734375, 496.7295837402344, 517.321533203125, 537.9134521484375, 558.50537109375, 579.0972900390625, 599.6892700195312, 620.2811889648438, 640.8731079101562, 661.465087890625, 682.0570068359375, 702.64892578125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 7.0, 7.0, 14.0, 19.0, 14.0, 21.0, 26.0, 39.0, 39.0, 48.0, 42.0, 55.0, 46.0, 58.0, 47.0, 37.0, 53.0, 54.0, 49.0, 53.0, 37.0, 28.0, 36.0, 22.0, 22.0, 24.0, 17.0, 26.0, 19.0, 5.0, 8.0, 6.0, 4.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-262.41778564453125, -253.11940002441406, -243.82102966308594, -234.52264404296875, -225.22427368164062, -215.92588806152344, -206.62750244140625, -197.32913208007812, -188.03076171875, -178.7323760986328, -169.4340057373047, -160.1356201171875, -150.83724975585938, -141.5388641357422, -132.240478515625, -122.94210815429688, -113.64372253417969, -104.34534454345703, -95.04696655273438, -85.74858093261719, -76.45021057128906, -67.15182495117188, -57.85344696044922, -48.55506896972656, -39.256690979003906, -29.95831298828125, -20.65993309020996, -11.361553192138672, -2.0631752014160156, 7.235202789306641, 16.533584594726562, 25.83196258544922, 35.130340576171875, 44.42871856689453, 53.72709655761719, 63.02547836303711, 72.3238525390625, 81.62223815917969, 90.92061614990234, 100.218994140625, 109.51737213134766, 118.81575012207031, 128.1141357421875, 137.41250610351562, 146.7108917236328, 156.00926208496094, 165.30764770507812, 174.60601806640625, 183.90440368652344, 193.20278930664062, 202.50115966796875, 211.79954528808594, 221.09791564941406, 230.39630126953125, 239.69467163085938, 248.99305725097656, 258.29144287109375, 267.5898132324219, 276.8882141113281, 286.18658447265625, 295.4849548339844, 304.7833251953125, 314.08172607421875, 323.3800964355469, 332.678466796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 8.0, 15.0, 26.0, 25.0, 29.0, 38.0, 76.0, 109.0, 138.0, 208.0, 289.0, 383.0, 662.0, 1040.0, 1643.0, 2888.0, 5753.0, 12699.0, 35250.0, 168500.0, 3749113.0, 155736.0, 34505.0, 12215.0, 5537.0, 3012.0, 1606.0, 968.0, 589.0, 393.0, 243.0, 183.0, 102.0, 80.0, 56.0, 42.0, 29.0, 22.0, 15.0, 7.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-84.0, -81.697265625, -79.39453125, -77.091796875, -74.7890625, -72.486328125, -70.18359375, -67.880859375, -65.578125, -63.275390625, -60.97265625, -58.669921875, -56.3671875, -54.064453125, -51.76171875, -49.458984375, -47.15625, -44.853515625, -42.55078125, -40.248046875, -37.9453125, -35.642578125, -33.33984375, -31.037109375, -28.734375, -26.431640625, -24.12890625, -21.826171875, -19.5234375, -17.220703125, -14.91796875, -12.615234375, -10.3125, -8.009765625, -5.70703125, -3.404296875, -1.1015625, 1.201171875, 3.50390625, 5.806640625, 8.109375, 10.412109375, 12.71484375, 15.017578125, 17.3203125, 19.623046875, 21.92578125, 24.228515625, 26.53125, 28.833984375, 31.13671875, 33.439453125, 35.7421875, 38.044921875, 40.34765625, 42.650390625, 44.953125, 47.255859375, 49.55859375, 51.861328125, 54.1640625, 56.466796875, 58.76953125, 61.072265625, 63.375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 12.0, 9.0, 17.0, 17.0, 19.0, 27.0, 38.0, 45.0, 52.0, 40.0, 61.0, 67.0, 55.0, 56.0, 49.0, 73.0, 53.0, 49.0, 42.0, 52.0, 38.0, 26.0, 26.0, 22.0, 14.0, 5.0, 12.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.3515625, -10.9781494140625, -10.604736328125, -10.2313232421875, -9.85791015625, -9.4844970703125, -9.111083984375, -8.7376708984375, -8.3642578125, -7.9908447265625, -7.617431640625, -7.2440185546875, -6.87060546875, -6.4971923828125, -6.123779296875, -5.7503662109375, -5.376953125, -5.0035400390625, -4.630126953125, -4.2567138671875, -3.88330078125, -3.5098876953125, -3.136474609375, -2.7630615234375, -2.3896484375, -2.0162353515625, -1.642822265625, -1.2694091796875, -0.89599609375, -0.5225830078125, -0.149169921875, 0.2242431640625, 0.59765625, 0.9710693359375, 1.344482421875, 1.7178955078125, 2.09130859375, 2.4647216796875, 2.838134765625, 3.2115478515625, 3.5849609375, 3.9583740234375, 4.331787109375, 4.7052001953125, 5.07861328125, 5.4520263671875, 5.825439453125, 6.1988525390625, 6.572265625, 6.9456787109375, 7.319091796875, 7.6925048828125, 8.06591796875, 8.4393310546875, 8.812744140625, 9.1861572265625, 9.5595703125, 9.9329833984375, 10.306396484375, 10.6798095703125, 11.05322265625, 11.4266357421875, 11.800048828125, 12.1734619140625, 12.546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 12.0, 13.0, 21.0, 12.0, 41.0, 47.0, 69.0, 95.0, 151.0, 259.0, 436.0, 778.0, 1341.0, 2937.0, 7484.0, 25647.0, 138519.0, 3726715.0, 237815.0, 34971.0, 9546.0, 3561.0, 1601.0, 862.0, 483.0, 287.0, 173.0, 122.0, 91.0, 55.0, 42.0, 24.0, 20.0, 13.0, 5.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.1875, -111.6552734375, -108.123046875, -104.5908203125, -101.05859375, -97.5263671875, -93.994140625, -90.4619140625, -86.9296875, -83.3974609375, -79.865234375, -76.3330078125, -72.80078125, -69.2685546875, -65.736328125, -62.2041015625, -58.671875, -55.1396484375, -51.607421875, -48.0751953125, -44.54296875, -41.0107421875, -37.478515625, -33.9462890625, -30.4140625, -26.8818359375, -23.349609375, -19.8173828125, -16.28515625, -12.7529296875, -9.220703125, -5.6884765625, -2.15625, 1.3759765625, 4.908203125, 8.4404296875, 11.97265625, 15.5048828125, 19.037109375, 22.5693359375, 26.1015625, 29.6337890625, 33.166015625, 36.6982421875, 40.23046875, 43.7626953125, 47.294921875, 50.8271484375, 54.359375, 57.8916015625, 61.423828125, 64.9560546875, 68.48828125, 72.0205078125, 75.552734375, 79.0849609375, 82.6171875, 86.1494140625, 89.681640625, 93.2138671875, 96.74609375, 100.2783203125, 103.810546875, 107.3427734375, 110.875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 11.0, 18.0, 28.0, 36.0, 72.0, 137.0, 374.0, 2595.0, 454.0, 139.0, 84.0, 50.0, 24.0, 8.0, 11.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.46875, -36.59814453125, -34.7275390625, -32.85693359375, -30.986328125, -29.11572265625, -27.2451171875, -25.37451171875, -23.50390625, -21.63330078125, -19.7626953125, -17.89208984375, -16.021484375, -14.15087890625, -12.2802734375, -10.40966796875, -8.5390625, -6.66845703125, -4.7978515625, -2.92724609375, -1.056640625, 0.81396484375, 2.6845703125, 4.55517578125, 6.42578125, 8.29638671875, 10.1669921875, 12.03759765625, 13.908203125, 15.77880859375, 17.6494140625, 19.52001953125, 21.390625, 23.26123046875, 25.1318359375, 27.00244140625, 28.873046875, 30.74365234375, 32.6142578125, 34.48486328125, 36.35546875, 38.22607421875, 40.0966796875, 41.96728515625, 43.837890625, 45.70849609375, 47.5791015625, 49.44970703125, 51.3203125, 53.19091796875, 55.0615234375, 56.93212890625, 58.802734375, 60.67333984375, 62.5439453125, 64.41455078125, 66.28515625, 68.15576171875, 70.0263671875, 71.89697265625, 73.767578125, 75.63818359375, 77.5087890625, 79.37939453125, 81.25]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 27.0, 181.0, 367.0, 298.0, 99.0, 24.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-877.7890625, -853.2758178710938, -828.7625122070312, -804.249267578125, -779.7360229492188, -755.2227172851562, -730.70947265625, -706.1961669921875, -681.6829223632812, -657.169677734375, -632.6563720703125, -608.1431274414062, -583.6298828125, -559.1165771484375, -534.6033325195312, -510.0900573730469, -485.5768127441406, -461.06353759765625, -436.55029296875, -412.0370178222656, -387.52374267578125, -363.010498046875, -338.4972229003906, -313.98394775390625, -289.470703125, -264.9574279785156, -240.4441680908203, -215.930908203125, -191.41763305664062, -166.9043731689453, -142.39111328125, -117.87783813476562, -93.36456298828125, -68.8512954711914, -44.33803176879883, -19.82476806640625, 4.688499450683594, 29.201766967773438, 53.71502685546875, 78.22830200195312, 102.74156188964844, 127.25482940673828, 151.76809692382812, 176.28135681152344, 200.79461669921875, 225.30789184570312, 249.82115173339844, 274.33441162109375, 298.8476867675781, 323.3609619140625, 347.87420654296875, 372.3874816894531, 396.9007568359375, 421.41400146484375, 445.9272766113281, 470.4405517578125, 494.95379638671875, 519.467041015625, 543.9803466796875, 568.4935913085938, 593.0068359375, 617.5201416015625, 642.0333862304688, 666.546630859375, 691.0599365234375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 6.0, 7.0, 11.0, 14.0, 10.0, 18.0, 25.0, 19.0, 26.0, 32.0, 38.0, 34.0, 44.0, 61.0, 40.0, 51.0, 37.0, 54.0, 61.0, 56.0, 41.0, 47.0, 32.0, 41.0, 28.0, 23.0, 27.0, 27.0, 22.0, 17.0, 9.0, 10.0, 5.0, 6.0, 12.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0], "bins": [-179.501708984375, -175.03573608398438, -170.56976318359375, -166.1038055419922, -161.63783264160156, -157.17185974121094, -152.7058868408203, -148.2399139404297, -143.77395629882812, -139.3079833984375, -134.84201049804688, -130.3760528564453, -125.91007995605469, -121.44410705566406, -116.97813415527344, -112.51216125488281, -108.04618835449219, -103.58021545410156, -99.11425018310547, -94.64827728271484, -90.18231201171875, -85.71633911132812, -81.2503662109375, -76.78439331054688, -72.31842803955078, -67.85245513916016, -63.38648986816406, -58.92051696777344, -54.45454788208008, -49.98857879638672, -45.522605895996094, -41.056636810302734, -36.590660095214844, -32.124691009521484, -27.658720016479492, -23.1927490234375, -18.72677993774414, -14.260810852050781, -9.794839859008789, -5.328868865966797, -0.8628997802734375, 3.6030702590942383, 8.069040298461914, 12.53501033782959, 17.000980377197266, 21.466949462890625, 25.932920455932617, 30.39889144897461, 34.86486053466797, 39.33082962036133, 43.79679870605469, 48.26277160644531, 52.72874069213867, 57.19470977783203, 61.660682678222656, 66.12664794921875, 70.59262084960938, 75.05859375, 79.5245590209961, 83.99053192138672, 88.45649719238281, 92.92247009277344, 97.38844299316406, 101.85441589355469, 106.32038116455078]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 5.0, 6.0, 18.0, 24.0, 19.0, 38.0, 43.0, 64.0, 99.0, 121.0, 191.0, 268.0, 429.0, 580.0, 833.0, 1305.0, 1930.0, 3130.0, 5075.0, 8766.0, 16071.0, 32696.0, 73764.0, 210944.0, 438712.0, 139970.0, 55173.0, 25586.0, 13107.0, 7473.0, 4335.0, 2622.0, 1697.0, 1111.0, 750.0, 514.0, 339.0, 210.0, 152.0, 119.0, 79.0, 59.0, 37.0, 26.0, 20.0, 12.0, 18.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-51.8125, -50.30322265625, -48.7939453125, -47.28466796875, -45.775390625, -44.26611328125, -42.7568359375, -41.24755859375, -39.73828125, -38.22900390625, -36.7197265625, -35.21044921875, -33.701171875, -32.19189453125, -30.6826171875, -29.17333984375, -27.6640625, -26.15478515625, -24.6455078125, -23.13623046875, -21.626953125, -20.11767578125, -18.6083984375, -17.09912109375, -15.58984375, -14.08056640625, -12.5712890625, -11.06201171875, -9.552734375, -8.04345703125, -6.5341796875, -5.02490234375, -3.515625, -2.00634765625, -0.4970703125, 1.01220703125, 2.521484375, 4.03076171875, 5.5400390625, 7.04931640625, 8.55859375, 10.06787109375, 11.5771484375, 13.08642578125, 14.595703125, 16.10498046875, 17.6142578125, 19.12353515625, 20.6328125, 22.14208984375, 23.6513671875, 25.16064453125, 26.669921875, 28.17919921875, 29.6884765625, 31.19775390625, 32.70703125, 34.21630859375, 35.7255859375, 37.23486328125, 38.744140625, 40.25341796875, 41.7626953125, 43.27197265625, 44.78125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 5.0, 4.0, 8.0, 15.0, 7.0, 13.0, 13.0, 12.0, 19.0, 18.0, 23.0, 32.0, 34.0, 22.0, 24.0, 46.0, 46.0, 35.0, 39.0, 37.0, 51.0, 47.0, 43.0, 38.0, 42.0, 42.0, 37.0, 29.0, 24.0, 37.0, 22.0, 19.0, 18.0, 16.0, 9.0, 9.0, 11.0, 15.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.859375, -9.57177734375, -9.2841796875, -8.99658203125, -8.708984375, -8.42138671875, -8.1337890625, -7.84619140625, -7.55859375, -7.27099609375, -6.9833984375, -6.69580078125, -6.408203125, -6.12060546875, -5.8330078125, -5.54541015625, -5.2578125, -4.97021484375, -4.6826171875, -4.39501953125, -4.107421875, -3.81982421875, -3.5322265625, -3.24462890625, -2.95703125, -2.66943359375, -2.3818359375, -2.09423828125, -1.806640625, -1.51904296875, -1.2314453125, -0.94384765625, -0.65625, -0.36865234375, -0.0810546875, 0.20654296875, 0.494140625, 0.78173828125, 1.0693359375, 1.35693359375, 1.64453125, 1.93212890625, 2.2197265625, 2.50732421875, 2.794921875, 3.08251953125, 3.3701171875, 3.65771484375, 3.9453125, 4.23291015625, 4.5205078125, 4.80810546875, 5.095703125, 5.38330078125, 5.6708984375, 5.95849609375, 6.24609375, 6.53369140625, 6.8212890625, 7.10888671875, 7.396484375, 7.68408203125, 7.9716796875, 8.25927734375, 8.546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 3.0, 8.0, 6.0, 6.0, 9.0, 16.0, 18.0, 26.0, 27.0, 45.0, 73.0, 107.0, 146.0, 252.0, 330.0, 654.0, 1102.0, 2111.0, 4371.0, 10326.0, 30793.0, 137655.0, 655767.0, 151399.0, 32849.0, 10712.0, 4624.0, 2209.0, 1148.0, 643.0, 374.0, 246.0, 161.0, 97.0, 50.0, 43.0, 38.0, 32.0, 18.0, 21.0, 12.0, 5.0, 4.0, 10.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-76.875, -74.58203125, -72.2890625, -69.99609375, -67.703125, -65.41015625, -63.1171875, -60.82421875, -58.53125, -56.23828125, -53.9453125, -51.65234375, -49.359375, -47.06640625, -44.7734375, -42.48046875, -40.1875, -37.89453125, -35.6015625, -33.30859375, -31.015625, -28.72265625, -26.4296875, -24.13671875, -21.84375, -19.55078125, -17.2578125, -14.96484375, -12.671875, -10.37890625, -8.0859375, -5.79296875, -3.5, -1.20703125, 1.0859375, 3.37890625, 5.671875, 7.96484375, 10.2578125, 12.55078125, 14.84375, 17.13671875, 19.4296875, 21.72265625, 24.015625, 26.30859375, 28.6015625, 30.89453125, 33.1875, 35.48046875, 37.7734375, 40.06640625, 42.359375, 44.65234375, 46.9453125, 49.23828125, 51.53125, 53.82421875, 56.1171875, 58.41015625, 60.703125, 62.99609375, 65.2890625, 67.58203125, 69.875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 6.0, 9.0, 12.0, 14.0, 26.0, 34.0, 27.0, 35.0, 41.0, 60.0, 45.0, 71.0, 60.0, 71.0, 50.0, 69.0, 58.0, 57.0, 42.0, 45.0, 40.0, 22.0, 18.0, 18.0, 12.0, 6.0, 10.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.4375, -70.33984375, -68.2421875, -66.14453125, -64.046875, -61.94921875, -59.8515625, -57.75390625, -55.65625, -53.55859375, -51.4609375, -49.36328125, -47.265625, -45.16796875, -43.0703125, -40.97265625, -38.875, -36.77734375, -34.6796875, -32.58203125, -30.484375, -28.38671875, -26.2890625, -24.19140625, -22.09375, -19.99609375, -17.8984375, -15.80078125, -13.703125, -11.60546875, -9.5078125, -7.41015625, -5.3125, -3.21484375, -1.1171875, 0.98046875, 3.078125, 5.17578125, 7.2734375, 9.37109375, 11.46875, 13.56640625, 15.6640625, 17.76171875, 19.859375, 21.95703125, 24.0546875, 26.15234375, 28.25, 30.34765625, 32.4453125, 34.54296875, 36.640625, 38.73828125, 40.8359375, 42.93359375, 45.03125, 47.12890625, 49.2265625, 51.32421875, 53.421875, 55.51953125, 57.6171875, 59.71484375, 61.8125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 24.0, 27.0, 35.0, 50.0, 63.0, 106.0, 162.0, 251.0, 449.0, 836.0, 1766.0, 4758.0, 17489.0, 175248.0, 797914.0, 36437.0, 7731.0, 2564.0, 1144.0, 572.0, 328.0, 194.0, 111.0, 73.0, 61.0, 46.0, 24.0, 14.0, 14.0, 14.0, 10.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.0625, -79.2529296875, -76.443359375, -73.6337890625, -70.82421875, -68.0146484375, -65.205078125, -62.3955078125, -59.5859375, -56.7763671875, -53.966796875, -51.1572265625, -48.34765625, -45.5380859375, -42.728515625, -39.9189453125, -37.109375, -34.2998046875, -31.490234375, -28.6806640625, -25.87109375, -23.0615234375, -20.251953125, -17.4423828125, -14.6328125, -11.8232421875, -9.013671875, -6.2041015625, -3.39453125, -0.5849609375, 2.224609375, 5.0341796875, 7.84375, 10.6533203125, 13.462890625, 16.2724609375, 19.08203125, 21.8916015625, 24.701171875, 27.5107421875, 30.3203125, 33.1298828125, 35.939453125, 38.7490234375, 41.55859375, 44.3681640625, 47.177734375, 49.9873046875, 52.796875, 55.6064453125, 58.416015625, 61.2255859375, 64.03515625, 66.8447265625, 69.654296875, 72.4638671875, 75.2734375, 78.0830078125, 80.892578125, 83.7021484375, 86.51171875, 89.3212890625, 92.130859375, 94.9404296875, 97.75]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 38.0, 42.0, 120.0, 472.0, 175.0, 55.0, 27.0, 20.0, 12.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.018901824951171875, -0.01793670654296875, -0.016971588134765625, -0.0160064697265625, -0.015041351318359375, -0.01407623291015625, -0.013111114501953125, -0.01214599609375, -0.011180877685546875, -0.01021575927734375, -0.009250640869140625, -0.0082855224609375, -0.007320404052734375, -0.00635528564453125, -0.005390167236328125, -0.004425048828125, -0.003459930419921875, -0.00249481201171875, -0.001529693603515625, -0.0005645751953125, 0.000400543212890625, 0.00136566162109375, 0.002330780029296875, 0.0032958984375, 0.004261016845703125, 0.00522613525390625, 0.006191253662109375, 0.0071563720703125, 0.008121490478515625, 0.00908660888671875, 0.010051727294921875, 0.011016845703125, 0.011981964111328125, 0.01294708251953125, 0.013912200927734375, 0.0148773193359375, 0.015842437744140625, 0.01680755615234375, 0.017772674560546875, 0.01873779296875, 0.019702911376953125, 0.02066802978515625, 0.021633148193359375, 0.0225982666015625, 0.023563385009765625, 0.02452850341796875, 0.025493621826171875, 0.026458740234375, 0.027423858642578125, 0.02838897705078125, 0.029354095458984375, 0.0303192138671875, 0.031284332275390625, 0.03224945068359375, 0.033214569091796875, 0.0341796875, 0.035144805908203125, 0.03610992431640625, 0.037075042724609375, 0.0380401611328125, 0.039005279541015625, 0.03997039794921875, 0.040935516357421875, 0.041900634765625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 2.0, 8.0, 6.0, 9.0, 9.0, 13.0, 13.0, 27.0, 41.0, 67.0, 120.0, 168.0, 331.0, 676.0, 1490.0, 3596.0, 13201.0, 117970.0, 852035.0, 46419.0, 7606.0, 2488.0, 1106.0, 515.0, 232.0, 159.0, 92.0, 62.0, 26.0, 21.0, 14.0, 6.0, 5.0, 4.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.0625, -78.2978515625, -75.533203125, -72.7685546875, -70.00390625, -67.2392578125, -64.474609375, -61.7099609375, -58.9453125, -56.1806640625, -53.416015625, -50.6513671875, -47.88671875, -45.1220703125, -42.357421875, -39.5927734375, -36.828125, -34.0634765625, -31.298828125, -28.5341796875, -25.76953125, -23.0048828125, -20.240234375, -17.4755859375, -14.7109375, -11.9462890625, -9.181640625, -6.4169921875, -3.65234375, -0.8876953125, 1.876953125, 4.6416015625, 7.40625, 10.1708984375, 12.935546875, 15.7001953125, 18.46484375, 21.2294921875, 23.994140625, 26.7587890625, 29.5234375, 32.2880859375, 35.052734375, 37.8173828125, 40.58203125, 43.3466796875, 46.111328125, 48.8759765625, 51.640625, 54.4052734375, 57.169921875, 59.9345703125, 62.69921875, 65.4638671875, 68.228515625, 70.9931640625, 73.7578125, 76.5224609375, 79.287109375, 82.0517578125, 84.81640625, 87.5810546875, 90.345703125, 93.1103515625, 95.875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 10.0, 16.0, 25.0, 33.0, 52.0, 67.0, 181.0, 288.0, 135.0, 59.0, 36.0, 28.0, 23.0, 11.0, 9.0, 4.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.96875, -49.99560546875, -48.0224609375, -46.04931640625, -44.076171875, -42.10302734375, -40.1298828125, -38.15673828125, -36.18359375, -34.21044921875, -32.2373046875, -30.26416015625, -28.291015625, -26.31787109375, -24.3447265625, -22.37158203125, -20.3984375, -18.42529296875, -16.4521484375, -14.47900390625, -12.505859375, -10.53271484375, -8.5595703125, -6.58642578125, -4.61328125, -2.64013671875, -0.6669921875, 1.30615234375, 3.279296875, 5.25244140625, 7.2255859375, 9.19873046875, 11.171875, 13.14501953125, 15.1181640625, 17.09130859375, 19.064453125, 21.03759765625, 23.0107421875, 24.98388671875, 26.95703125, 28.93017578125, 30.9033203125, 32.87646484375, 34.849609375, 36.82275390625, 38.7958984375, 40.76904296875, 42.7421875, 44.71533203125, 46.6884765625, 48.66162109375, 50.634765625, 52.60791015625, 54.5810546875, 56.55419921875, 58.52734375, 60.50048828125, 62.4736328125, 64.44677734375, 66.419921875, 68.39306640625, 70.3662109375, 72.33935546875, 74.3125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 12.0, 25.0, 64.0, 100.0, 156.0, 216.0, 180.0, 101.0, 71.0, 33.0, 20.0, 13.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-337.5392150878906, -312.78826904296875, -288.03729248046875, -263.2863464355469, -238.53538513183594, -213.784423828125, -189.03347778320312, -164.2825164794922, -139.53155517578125, -114.78059387207031, -90.0296401977539, -65.2786865234375, -40.52772521972656, -15.776763916015625, 8.97418212890625, 33.72514343261719, 58.476104736328125, 83.22706604003906, 107.97801971435547, 132.72897338867188, 157.4799346923828, 182.23089599609375, 206.98184204101562, 231.73280334472656, 256.4837646484375, 281.2347106933594, 305.9856872558594, 330.73663330078125, 355.48760986328125, 380.2385559082031, 404.989501953125, 429.740478515625, 454.491455078125, 479.2424011230469, 503.9933776855469, 528.7443237304688, 553.4953002929688, 578.2462158203125, 602.9971923828125, 627.7481689453125, 652.4991455078125, 677.2501220703125, 702.0010375976562, 726.7520141601562, 751.5029907226562, 776.25390625, 801.0048828125, 825.755859375, 850.5067749023438, 875.2577514648438, 900.0086669921875, 924.7596435546875, 949.5106201171875, 974.2615966796875, 999.0125122070312, 1023.7634887695312, 1048.514404296875, 1073.265380859375, 1098.016357421875, 1122.767333984375, 1147.5181884765625, 1172.2691650390625, 1197.0201416015625, 1221.7711181640625, 1246.5220947265625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 4.0, 8.0, 20.0, 10.0, 12.0, 19.0, 24.0, 30.0, 21.0, 35.0, 39.0, 39.0, 36.0, 49.0, 41.0, 36.0, 38.0, 31.0, 48.0, 48.0, 41.0, 34.0, 29.0, 41.0, 21.0, 33.0, 26.0, 27.0, 23.0, 13.0, 21.0, 22.0, 13.0, 16.0, 9.0, 4.0, 9.0, 3.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-248.39794921875, -240.1319122314453, -231.86585998535156, -223.59982299804688, -215.33377075195312, -207.06773376464844, -198.80169677734375, -190.53564453125, -182.2696075439453, -174.00357055664062, -165.73751831054688, -157.4714813232422, -149.2054443359375, -140.93939208984375, -132.67335510253906, -124.40731048583984, -116.14126586914062, -107.8752212524414, -99.60917663574219, -91.3431396484375, -83.07709503173828, -74.81105041503906, -66.54501342773438, -58.278968811035156, -50.01292419433594, -41.74687957763672, -33.480838775634766, -25.21479606628418, -16.948753356933594, -8.682708740234375, -0.4166679382324219, 7.849372863769531, 16.11541748046875, 24.381460189819336, 32.64750289916992, 40.913543701171875, 49.179588317871094, 57.44563293457031, 65.711669921875, 73.97771453857422, 82.24375915527344, 90.50980377197266, 98.77584838867188, 107.04188537597656, 115.30792999267578, 123.573974609375, 131.8400115966797, 140.10604858398438, 148.37210083007812, 156.6381378173828, 164.90419006347656, 173.17022705078125, 181.436279296875, 189.7023162841797, 197.96835327148438, 206.23440551757812, 214.5004425048828, 222.7664794921875, 231.03253173828125, 239.29856872558594, 247.56460571289062, 255.83065795898438, 264.0967102050781, 272.36273193359375, 280.6287841796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 11.0, 12.0, 9.0, 25.0, 31.0, 32.0, 46.0, 66.0, 93.0, 145.0, 214.0, 310.0, 427.0, 722.0, 1266.0, 2296.0, 4295.0, 9354.0, 24143.0, 93548.0, 3796123.0, 198910.0, 36788.0, 12879.0, 5696.0, 2759.0, 1511.0, 880.0, 566.0, 363.0, 228.0, 152.0, 96.0, 80.0, 45.0, 40.0, 35.0, 27.0, 11.0, 15.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.5625, -76.08203125, -73.6015625, -71.12109375, -68.640625, -66.16015625, -63.6796875, -61.19921875, -58.71875, -56.23828125, -53.7578125, -51.27734375, -48.796875, -46.31640625, -43.8359375, -41.35546875, -38.875, -36.39453125, -33.9140625, -31.43359375, -28.953125, -26.47265625, -23.9921875, -21.51171875, -19.03125, -16.55078125, -14.0703125, -11.58984375, -9.109375, -6.62890625, -4.1484375, -1.66796875, 0.8125, 3.29296875, 5.7734375, 8.25390625, 10.734375, 13.21484375, 15.6953125, 18.17578125, 20.65625, 23.13671875, 25.6171875, 28.09765625, 30.578125, 33.05859375, 35.5390625, 38.01953125, 40.5, 42.98046875, 45.4609375, 47.94140625, 50.421875, 52.90234375, 55.3828125, 57.86328125, 60.34375, 62.82421875, 65.3046875, 67.78515625, 70.265625, 72.74609375, 75.2265625, 77.70703125, 80.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 8.0, 3.0, 11.0, 6.0, 11.0, 9.0, 19.0, 15.0, 17.0, 28.0, 30.0, 31.0, 41.0, 27.0, 32.0, 35.0, 50.0, 49.0, 53.0, 56.0, 53.0, 49.0, 48.0, 50.0, 38.0, 36.0, 28.0, 30.0, 37.0, 17.0, 21.0, 11.0, 13.0, 11.0, 8.0, 9.0, 6.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.875, -12.4864501953125, -12.097900390625, -11.7093505859375, -11.32080078125, -10.9322509765625, -10.543701171875, -10.1551513671875, -9.7666015625, -9.3780517578125, -8.989501953125, -8.6009521484375, -8.21240234375, -7.8238525390625, -7.435302734375, -7.0467529296875, -6.658203125, -6.2696533203125, -5.881103515625, -5.4925537109375, -5.10400390625, -4.7154541015625, -4.326904296875, -3.9383544921875, -3.5498046875, -3.1612548828125, -2.772705078125, -2.3841552734375, -1.99560546875, -1.6070556640625, -1.218505859375, -0.8299560546875, -0.44140625, -0.0528564453125, 0.335693359375, 0.7242431640625, 1.11279296875, 1.5013427734375, 1.889892578125, 2.2784423828125, 2.6669921875, 3.0555419921875, 3.444091796875, 3.8326416015625, 4.22119140625, 4.6097412109375, 4.998291015625, 5.3868408203125, 5.775390625, 6.1639404296875, 6.552490234375, 6.9410400390625, 7.32958984375, 7.7181396484375, 8.106689453125, 8.4952392578125, 8.8837890625, 9.2723388671875, 9.660888671875, 10.0494384765625, 10.43798828125, 10.8265380859375, 11.215087890625, 11.6036376953125, 11.9921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 12.0, 8.0, 11.0, 8.0, 8.0, 16.0, 26.0, 23.0, 32.0, 50.0, 64.0, 98.0, 177.0, 289.0, 524.0, 1182.0, 2705.0, 7353.0, 25661.0, 168876.0, 3843375.0, 112526.0, 20486.0, 6191.0, 2341.0, 1077.0, 416.0, 292.0, 150.0, 94.0, 61.0, 34.0, 34.0, 18.0, 10.0, 8.0, 10.0, 7.0, 7.0, 3.0, 6.0, 4.0, 8.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-135.5, -131.4453125, -127.390625, -123.3359375, -119.28125, -115.2265625, -111.171875, -107.1171875, -103.0625, -99.0078125, -94.953125, -90.8984375, -86.84375, -82.7890625, -78.734375, -74.6796875, -70.625, -66.5703125, -62.515625, -58.4609375, -54.40625, -50.3515625, -46.296875, -42.2421875, -38.1875, -34.1328125, -30.078125, -26.0234375, -21.96875, -17.9140625, -13.859375, -9.8046875, -5.75, -1.6953125, 2.359375, 6.4140625, 10.46875, 14.5234375, 18.578125, 22.6328125, 26.6875, 30.7421875, 34.796875, 38.8515625, 42.90625, 46.9609375, 51.015625, 55.0703125, 59.125, 63.1796875, 67.234375, 71.2890625, 75.34375, 79.3984375, 83.453125, 87.5078125, 91.5625, 95.6171875, 99.671875, 103.7265625, 107.78125, 111.8359375, 115.890625, 119.9453125, 124.0]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 13.0, 10.0, 21.0, 25.0, 44.0, 102.0, 271.0, 2695.0, 558.0, 156.0, 64.0, 40.0, 21.0, 17.0, 12.0, 5.0, 7.0, 0.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.0, -83.1015625, -81.203125, -79.3046875, -77.40625, -75.5078125, -73.609375, -71.7109375, -69.8125, -67.9140625, -66.015625, -64.1171875, -62.21875, -60.3203125, -58.421875, -56.5234375, -54.625, -52.7265625, -50.828125, -48.9296875, -47.03125, -45.1328125, -43.234375, -41.3359375, -39.4375, -37.5390625, -35.640625, -33.7421875, -31.84375, -29.9453125, -28.046875, -26.1484375, -24.25, -22.3515625, -20.453125, -18.5546875, -16.65625, -14.7578125, -12.859375, -10.9609375, -9.0625, -7.1640625, -5.265625, -3.3671875, -1.46875, 0.4296875, 2.328125, 4.2265625, 6.125, 8.0234375, 9.921875, 11.8203125, 13.71875, 15.6171875, 17.515625, 19.4140625, 21.3125, 23.2109375, 25.109375, 27.0078125, 28.90625, 30.8046875, 32.703125, 34.6015625, 36.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 7.0, 7.0, 14.0, 15.0, 18.0, 39.0, 50.0, 93.0, 113.0, 135.0, 146.0, 125.0, 78.0, 67.0, 40.0, 21.0, 13.0, 10.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-305.647216796875, -298.75439453125, -291.8615417480469, -284.9687194824219, -278.07586669921875, -271.18304443359375, -264.29022216796875, -257.3973693847656, -250.50453186035156, -243.6116943359375, -236.71885681152344, -229.82601928710938, -222.93319702148438, -216.0403594970703, -209.14752197265625, -202.2546844482422, -195.36184692382812, -188.46900939941406, -181.576171875, -174.683349609375, -167.79051208496094, -160.89767456054688, -154.0048370361328, -147.11199951171875, -140.21917724609375, -133.3263397216797, -126.43350982666016, -119.5406723022461, -112.64783477783203, -105.7550048828125, -98.86216735839844, -91.96932983398438, -85.07649230957031, -78.18365478515625, -71.29082489013672, -64.39798736572266, -57.505149841308594, -50.6123161315918, -43.719482421875, -36.82664489746094, -29.93381118774414, -23.04097557067871, -16.14813995361328, -9.255306243896484, -2.3624706268310547, 4.530364990234375, 11.423198699951172, 18.316036224365234, 25.20886993408203, 32.10170364379883, 38.99454116821289, 45.88737487792969, 52.78021240234375, 59.67304611206055, 66.56587982177734, 73.4587173461914, 80.35154724121094, 87.244384765625, 94.13721466064453, 101.0300521850586, 107.92288970947266, 114.81571960449219, 121.70855712890625, 128.6013946533203, 135.49423217773438]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 11.0, 11.0, 8.0, 7.0, 23.0, 27.0, 17.0, 35.0, 24.0, 34.0, 32.0, 42.0, 37.0, 51.0, 39.0, 46.0, 44.0, 43.0, 58.0, 38.0, 47.0, 31.0, 41.0, 34.0, 31.0, 33.0, 26.0, 20.0, 22.0, 19.0, 13.0, 12.0, 7.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.66360473632812, -123.73861694335938, -119.81362915039062, -115.88864135742188, -111.96365356445312, -108.03866577148438, -104.11367797851562, -100.18869018554688, -96.26370239257812, -92.33871459960938, -88.41372680664062, -84.48873901367188, -80.56375122070312, -76.63876342773438, -72.71377563476562, -68.78878784179688, -64.86380767822266, -60.938819885253906, -57.013832092285156, -53.088844299316406, -49.163856506347656, -45.238868713378906, -41.31388473510742, -37.38889694213867, -33.46390914916992, -29.538921356201172, -25.613933563232422, -21.688947677612305, -17.763959884643555, -13.838972091674805, -9.913986206054688, -5.9889984130859375, -2.0640106201171875, 1.8609766960144043, 5.785964012145996, 9.71095085144043, 13.63593864440918, 17.56092643737793, 21.485912322998047, 25.410900115966797, 29.335887908935547, 33.2608757019043, 37.18586349487305, 41.11084747314453, 45.03583526611328, 48.96082305908203, 52.88581085205078, 56.81079864501953, 60.73578643798828, 64.66077423095703, 68.58576202392578, 72.51074981689453, 76.43573760986328, 80.36072540283203, 84.28570556640625, 88.210693359375, 92.13568115234375, 96.0606689453125, 99.98565673828125, 103.91064453125, 107.83563232421875, 111.7606201171875, 115.68560791015625, 119.610595703125, 123.53558349609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 8.0, 11.0, 14.0, 17.0, 24.0, 40.0, 55.0, 73.0, 92.0, 181.0, 281.0, 466.0, 743.0, 1386.0, 2496.0, 4436.0, 8255.0, 16363.0, 34279.0, 78570.0, 248041.0, 430775.0, 125094.0, 49333.0, 22821.0, 11211.0, 5899.0, 3245.0, 1731.0, 1022.0, 604.0, 348.0, 201.0, 119.0, 83.0, 63.0, 45.0, 36.0, 24.0, 13.0, 16.0, 15.0, 11.0, 3.0, 4.0, 6.0, 0.0, 1.0, 3.0], "bins": [-50.1875, -48.80224609375, -47.4169921875, -46.03173828125, -44.646484375, -43.26123046875, -41.8759765625, -40.49072265625, -39.10546875, -37.72021484375, -36.3349609375, -34.94970703125, -33.564453125, -32.17919921875, -30.7939453125, -29.40869140625, -28.0234375, -26.63818359375, -25.2529296875, -23.86767578125, -22.482421875, -21.09716796875, -19.7119140625, -18.32666015625, -16.94140625, -15.55615234375, -14.1708984375, -12.78564453125, -11.400390625, -10.01513671875, -8.6298828125, -7.24462890625, -5.859375, -4.47412109375, -3.0888671875, -1.70361328125, -0.318359375, 1.06689453125, 2.4521484375, 3.83740234375, 5.22265625, 6.60791015625, 7.9931640625, 9.37841796875, 10.763671875, 12.14892578125, 13.5341796875, 14.91943359375, 16.3046875, 17.68994140625, 19.0751953125, 20.46044921875, 21.845703125, 23.23095703125, 24.6162109375, 26.00146484375, 27.38671875, 28.77197265625, 30.1572265625, 31.54248046875, 32.927734375, 34.31298828125, 35.6982421875, 37.08349609375, 38.46875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 4.0, 12.0, 12.0, 12.0, 12.0, 10.0, 15.0, 16.0, 19.0, 17.0, 22.0, 29.0, 30.0, 29.0, 41.0, 33.0, 37.0, 40.0, 52.0, 40.0, 34.0, 28.0, 40.0, 40.0, 38.0, 35.0, 41.0, 20.0, 29.0, 23.0, 26.0, 20.0, 26.0, 16.0, 17.0, 13.0, 13.0, 7.0, 8.0, 7.0, 8.0, 4.0, 3.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.894287109375, -10.54638671875, -10.198486328125, -9.8505859375, -9.502685546875, -9.15478515625, -8.806884765625, -8.458984375, -8.111083984375, -7.76318359375, -7.415283203125, -7.0673828125, -6.719482421875, -6.37158203125, -6.023681640625, -5.67578125, -5.327880859375, -4.97998046875, -4.632080078125, -4.2841796875, -3.936279296875, -3.58837890625, -3.240478515625, -2.892578125, -2.544677734375, -2.19677734375, -1.848876953125, -1.5009765625, -1.153076171875, -0.80517578125, -0.457275390625, -0.109375, 0.238525390625, 0.58642578125, 0.934326171875, 1.2822265625, 1.630126953125, 1.97802734375, 2.325927734375, 2.673828125, 3.021728515625, 3.36962890625, 3.717529296875, 4.0654296875, 4.413330078125, 4.76123046875, 5.109130859375, 5.45703125, 5.804931640625, 6.15283203125, 6.500732421875, 6.8486328125, 7.196533203125, 7.54443359375, 7.892333984375, 8.240234375, 8.588134765625, 8.93603515625, 9.283935546875, 9.6318359375, 9.979736328125, 10.32763671875, 10.675537109375, 11.0234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 7.0, 11.0, 25.0, 24.0, 32.0, 43.0, 62.0, 68.0, 119.0, 171.0, 249.0, 472.0, 744.0, 1391.0, 2567.0, 5490.0, 14168.0, 52247.0, 541378.0, 363523.0, 42848.0, 12414.0, 4881.0, 2323.0, 1256.0, 708.0, 434.0, 292.0, 170.0, 115.0, 78.0, 56.0, 39.0, 26.0, 21.0, 14.0, 20.0, 16.0, 9.0, 7.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.1875, -78.3818359375, -75.576171875, -72.7705078125, -69.96484375, -67.1591796875, -64.353515625, -61.5478515625, -58.7421875, -55.9365234375, -53.130859375, -50.3251953125, -47.51953125, -44.7138671875, -41.908203125, -39.1025390625, -36.296875, -33.4912109375, -30.685546875, -27.8798828125, -25.07421875, -22.2685546875, -19.462890625, -16.6572265625, -13.8515625, -11.0458984375, -8.240234375, -5.4345703125, -2.62890625, 0.1767578125, 2.982421875, 5.7880859375, 8.59375, 11.3994140625, 14.205078125, 17.0107421875, 19.81640625, 22.6220703125, 25.427734375, 28.2333984375, 31.0390625, 33.8447265625, 36.650390625, 39.4560546875, 42.26171875, 45.0673828125, 47.873046875, 50.6787109375, 53.484375, 56.2900390625, 59.095703125, 61.9013671875, 64.70703125, 67.5126953125, 70.318359375, 73.1240234375, 75.9296875, 78.7353515625, 81.541015625, 84.3466796875, 87.15234375, 89.9580078125, 92.763671875, 95.5693359375, 98.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 8.0, 14.0, 13.0, 16.0, 24.0, 36.0, 38.0, 51.0, 67.0, 78.0, 75.0, 92.0, 57.0, 79.0, 73.0, 58.0, 49.0, 34.0, 26.0, 23.0, 16.0, 6.0, 11.0, 7.0, 2.0, 4.0, 2.0, 5.0, 0.0, 6.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.6875, -88.693359375, -85.69921875, -82.705078125, -79.7109375, -76.716796875, -73.72265625, -70.728515625, -67.734375, -64.740234375, -61.74609375, -58.751953125, -55.7578125, -52.763671875, -49.76953125, -46.775390625, -43.78125, -40.787109375, -37.79296875, -34.798828125, -31.8046875, -28.810546875, -25.81640625, -22.822265625, -19.828125, -16.833984375, -13.83984375, -10.845703125, -7.8515625, -4.857421875, -1.86328125, 1.130859375, 4.125, 7.119140625, 10.11328125, 13.107421875, 16.1015625, 19.095703125, 22.08984375, 25.083984375, 28.078125, 31.072265625, 34.06640625, 37.060546875, 40.0546875, 43.048828125, 46.04296875, 49.037109375, 52.03125, 55.025390625, 58.01953125, 61.013671875, 64.0078125, 67.001953125, 69.99609375, 72.990234375, 75.984375, 78.978515625, 81.97265625, 84.966796875, 87.9609375, 90.955078125, 93.94921875, 96.943359375, 99.9375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 7.0, 10.0, 14.0, 18.0, 18.0, 32.0, 43.0, 65.0, 87.0, 126.0, 151.0, 253.0, 379.0, 516.0, 755.0, 1186.0, 2105.0, 4223.0, 11101.0, 54593.0, 860864.0, 86535.0, 14253.0, 4869.0, 2285.0, 1333.0, 882.0, 608.0, 370.0, 240.0, 156.0, 141.0, 93.0, 64.0, 49.0, 40.0, 21.0, 19.0, 12.0, 10.0, 11.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.25, -64.9775390625, -62.705078125, -60.4326171875, -58.16015625, -55.8876953125, -53.615234375, -51.3427734375, -49.0703125, -46.7978515625, -44.525390625, -42.2529296875, -39.98046875, -37.7080078125, -35.435546875, -33.1630859375, -30.890625, -28.6181640625, -26.345703125, -24.0732421875, -21.80078125, -19.5283203125, -17.255859375, -14.9833984375, -12.7109375, -10.4384765625, -8.166015625, -5.8935546875, -3.62109375, -1.3486328125, 0.923828125, 3.1962890625, 5.46875, 7.7412109375, 10.013671875, 12.2861328125, 14.55859375, 16.8310546875, 19.103515625, 21.3759765625, 23.6484375, 25.9208984375, 28.193359375, 30.4658203125, 32.73828125, 35.0107421875, 37.283203125, 39.5556640625, 41.828125, 44.1005859375, 46.373046875, 48.6455078125, 50.91796875, 53.1904296875, 55.462890625, 57.7353515625, 60.0078125, 62.2802734375, 64.552734375, 66.8251953125, 69.09765625, 71.3701171875, 73.642578125, 75.9150390625, 78.1875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 11.0, 16.0, 23.0, 37.0, 90.0, 365.0, 283.0, 71.0, 26.0, 20.0, 14.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0207672119140625, -0.020022153854370117, -0.019277095794677734, -0.01853203773498535, -0.01778697967529297, -0.017041921615600586, -0.016296863555908203, -0.01555180549621582, -0.014806747436523438, -0.014061689376831055, -0.013316631317138672, -0.012571573257446289, -0.011826515197753906, -0.011081457138061523, -0.01033639907836914, -0.009591341018676758, -0.008846282958984375, -0.008101224899291992, -0.007356166839599609, -0.0066111087799072266, -0.005866050720214844, -0.005120992660522461, -0.004375934600830078, -0.0036308765411376953, -0.0028858184814453125, -0.0021407604217529297, -0.0013957023620605469, -0.0006506443023681641, 9.441375732421875e-05, 0.0008394718170166016, 0.0015845298767089844, 0.002329587936401367, 0.00307464599609375, 0.003819704055786133, 0.004564762115478516, 0.0053098201751708984, 0.006054878234863281, 0.006799936294555664, 0.007544994354248047, 0.00829005241394043, 0.009035110473632812, 0.009780168533325195, 0.010525226593017578, 0.011270284652709961, 0.012015342712402344, 0.012760400772094727, 0.01350545883178711, 0.014250516891479492, 0.014995574951171875, 0.015740633010864258, 0.01648569107055664, 0.017230749130249023, 0.017975807189941406, 0.01872086524963379, 0.019465923309326172, 0.020210981369018555, 0.020956039428710938, 0.02170109748840332, 0.022446155548095703, 0.023191213607788086, 0.02393627166748047, 0.02468132972717285, 0.025426387786865234, 0.026171445846557617, 0.02691650390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 10.0, 14.0, 14.0, 21.0, 36.0, 48.0, 88.0, 110.0, 179.0, 301.0, 593.0, 1039.0, 2298.0, 6538.0, 26083.0, 586647.0, 391077.0, 22932.0, 5878.0, 2262.0, 1022.0, 544.0, 307.0, 174.0, 115.0, 66.0, 42.0, 33.0, 25.0, 16.0, 5.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.3125, -73.84765625, -71.3828125, -68.91796875, -66.453125, -63.98828125, -61.5234375, -59.05859375, -56.59375, -54.12890625, -51.6640625, -49.19921875, -46.734375, -44.26953125, -41.8046875, -39.33984375, -36.875, -34.41015625, -31.9453125, -29.48046875, -27.015625, -24.55078125, -22.0859375, -19.62109375, -17.15625, -14.69140625, -12.2265625, -9.76171875, -7.296875, -4.83203125, -2.3671875, 0.09765625, 2.5625, 5.02734375, 7.4921875, 9.95703125, 12.421875, 14.88671875, 17.3515625, 19.81640625, 22.28125, 24.74609375, 27.2109375, 29.67578125, 32.140625, 34.60546875, 37.0703125, 39.53515625, 42.0, 44.46484375, 46.9296875, 49.39453125, 51.859375, 54.32421875, 56.7890625, 59.25390625, 61.71875, 64.18359375, 66.6484375, 69.11328125, 71.578125, 74.04296875, 76.5078125, 78.97265625, 81.4375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 7.0, 14.0, 19.0, 43.0, 98.0, 325.0, 257.0, 107.0, 31.0, 20.0, 17.0, 9.0, 7.0, 6.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.125, -69.7880859375, -67.451171875, -65.1142578125, -62.77734375, -60.4404296875, -58.103515625, -55.7666015625, -53.4296875, -51.0927734375, -48.755859375, -46.4189453125, -44.08203125, -41.7451171875, -39.408203125, -37.0712890625, -34.734375, -32.3974609375, -30.060546875, -27.7236328125, -25.38671875, -23.0498046875, -20.712890625, -18.3759765625, -16.0390625, -13.7021484375, -11.365234375, -9.0283203125, -6.69140625, -4.3544921875, -2.017578125, 0.3193359375, 2.65625, 4.9931640625, 7.330078125, 9.6669921875, 12.00390625, 14.3408203125, 16.677734375, 19.0146484375, 21.3515625, 23.6884765625, 26.025390625, 28.3623046875, 30.69921875, 33.0361328125, 35.373046875, 37.7099609375, 40.046875, 42.3837890625, 44.720703125, 47.0576171875, 49.39453125, 51.7314453125, 54.068359375, 56.4052734375, 58.7421875, 61.0791015625, 63.416015625, 65.7529296875, 68.08984375, 70.4267578125, 72.763671875, 75.1005859375, 77.4375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 10.0, 28.0, 60.0, 105.0, 190.0, 198.0, 182.0, 102.0, 47.0, 36.0, 21.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-445.5379943847656, -416.69622802734375, -387.8544921875, -359.0127258300781, -330.1709899902344, -301.3292236328125, -272.48748779296875, -243.64572143554688, -214.80397033691406, -185.96221923828125, -157.12046813964844, -128.27871704101562, -99.43695831298828, -70.59519958496094, -41.753448486328125, -12.911697387695312, 15.9300537109375, 44.77180480957031, 73.61355590820312, 102.45531463623047, 131.29705810546875, 160.13882446289062, 188.98057556152344, 217.82232666015625, 246.66407775878906, 275.5058288574219, 304.34759521484375, 333.1893310546875, 362.0310974121094, 390.87286376953125, 419.714599609375, 448.55633544921875, 477.39813232421875, 506.2398986816406, 535.0816650390625, 563.9234008789062, 592.76513671875, 621.60693359375, 650.4486694335938, 679.2904052734375, 708.1321411132812, 736.973876953125, 765.815673828125, 794.6574096679688, 823.4991455078125, 852.3409423828125, 881.1826782226562, 910.0244140625, 938.8662109375, 967.7079467773438, 996.5497436523438, 1025.3914794921875, 1054.2332763671875, 1083.074951171875, 1111.916748046875, 1140.758544921875, 1169.6002197265625, 1198.4420166015625, 1227.28369140625, 1256.12548828125, 1284.96728515625, 1313.8089599609375, 1342.6507568359375, 1371.492431640625, 1400.334228515625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 2.0, 4.0, 10.0, 3.0, 11.0, 9.0, 9.0, 15.0, 14.0, 10.0, 23.0, 21.0, 22.0, 25.0, 15.0, 35.0, 37.0, 27.0, 30.0, 30.0, 39.0, 44.0, 41.0, 39.0, 43.0, 45.0, 47.0, 41.0, 37.0, 26.0, 31.0, 33.0, 17.0, 21.0, 21.0, 19.0, 24.0, 17.0, 10.0, 7.0, 10.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-278.5648193359375, -269.580322265625, -260.5958251953125, -251.611328125, -242.62681579589844, -233.64231872558594, -224.65782165527344, -215.67332458496094, -206.68881225585938, -197.70431518554688, -188.71981811523438, -179.73532104492188, -170.7508087158203, -161.7663116455078, -152.7818145751953, -143.7973175048828, -134.8128204345703, -125.82832336425781, -116.84381866455078, -107.85932159423828, -98.87481689453125, -89.89031982421875, -80.90582275390625, -71.92132568359375, -62.93682098388672, -53.95232009887695, -44.96781921386719, -35.98332214355469, -26.998821258544922, -18.014320373535156, -9.029823303222656, -0.045322418212890625, 8.939178466796875, 17.92367935180664, 26.908178329467773, 35.892677307128906, 44.87717819213867, 53.86167907714844, 62.84617614746094, 71.83067321777344, 80.81517791748047, 89.79967498779297, 98.7841796875, 107.7686767578125, 116.753173828125, 125.73767852783203, 134.72216796875, 143.70668029785156, 152.69117736816406, 161.67567443847656, 170.66017150878906, 179.64468383789062, 188.62918090820312, 197.61367797851562, 206.59817504882812, 215.58267211914062, 224.56716918945312, 233.55166625976562, 242.53616333007812, 251.52066040039062, 260.5051574707031, 269.48968505859375, 278.47418212890625, 287.45867919921875, 296.44317626953125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 4.0, 5.0, 10.0, 12.0, 16.0, 13.0, 23.0, 28.0, 41.0, 75.0, 98.0, 153.0, 235.0, 346.0, 561.0, 951.0, 1585.0, 2881.0, 5353.0, 10922.0, 27774.0, 124063.0, 3846040.0, 120945.0, 28392.0, 11319.0, 5446.0, 2889.0, 1616.0, 958.0, 551.0, 338.0, 204.0, 134.0, 94.0, 63.0, 39.0, 19.0, 17.0, 13.0, 14.0, 12.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-125.0, -121.267578125, -117.53515625, -113.802734375, -110.0703125, -106.337890625, -102.60546875, -98.873046875, -95.140625, -91.408203125, -87.67578125, -83.943359375, -80.2109375, -76.478515625, -72.74609375, -69.013671875, -65.28125, -61.548828125, -57.81640625, -54.083984375, -50.3515625, -46.619140625, -42.88671875, -39.154296875, -35.421875, -31.689453125, -27.95703125, -24.224609375, -20.4921875, -16.759765625, -13.02734375, -9.294921875, -5.5625, -1.830078125, 1.90234375, 5.634765625, 9.3671875, 13.099609375, 16.83203125, 20.564453125, 24.296875, 28.029296875, 31.76171875, 35.494140625, 39.2265625, 42.958984375, 46.69140625, 50.423828125, 54.15625, 57.888671875, 61.62109375, 65.353515625, 69.0859375, 72.818359375, 76.55078125, 80.283203125, 84.015625, 87.748046875, 91.48046875, 95.212890625, 98.9453125, 102.677734375, 106.41015625, 110.142578125, 113.875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 8.0, 4.0, 4.0, 7.0, 17.0, 8.0, 19.0, 21.0, 29.0, 27.0, 37.0, 49.0, 28.0, 41.0, 52.0, 35.0, 50.0, 57.0, 54.0, 58.0, 46.0, 55.0, 34.0, 37.0, 38.0, 26.0, 26.0, 29.0, 30.0, 18.0, 16.0, 8.0, 9.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8973388671875, -13.396240234375, -12.8951416015625, -12.39404296875, -11.8929443359375, -11.391845703125, -10.8907470703125, -10.3896484375, -9.8885498046875, -9.387451171875, -8.8863525390625, -8.38525390625, -7.8841552734375, -7.383056640625, -6.8819580078125, -6.380859375, -5.8797607421875, -5.378662109375, -4.8775634765625, -4.37646484375, -3.8753662109375, -3.374267578125, -2.8731689453125, -2.3720703125, -1.8709716796875, -1.369873046875, -0.8687744140625, -0.36767578125, 0.1334228515625, 0.634521484375, 1.1356201171875, 1.63671875, 2.1378173828125, 2.638916015625, 3.1400146484375, 3.64111328125, 4.1422119140625, 4.643310546875, 5.1444091796875, 5.6455078125, 6.1466064453125, 6.647705078125, 7.1488037109375, 7.64990234375, 8.1510009765625, 8.652099609375, 9.1531982421875, 9.654296875, 10.1553955078125, 10.656494140625, 11.1575927734375, 11.65869140625, 12.1597900390625, 12.660888671875, 13.1619873046875, 13.6630859375, 14.1641845703125, 14.665283203125, 15.1663818359375, 15.66748046875, 16.1685791015625, 16.669677734375, 17.1707763671875, 17.671875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 6.0, 19.0, 11.0, 13.0, 30.0, 42.0, 57.0, 50.0, 95.0, 144.0, 252.0, 469.0, 1164.0, 3313.0, 11148.0, 56985.0, 3969535.0, 126579.0, 16778.0, 4539.0, 1569.0, 615.0, 311.0, 173.0, 104.0, 68.0, 46.0, 30.0, 18.0, 18.0, 18.0, 16.0, 2.0, 11.0, 11.0, 9.0, 6.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-309.0, -300.08203125, -291.1640625, -282.24609375, -273.328125, -264.41015625, -255.4921875, -246.57421875, -237.65625, -228.73828125, -219.8203125, -210.90234375, -201.984375, -193.06640625, -184.1484375, -175.23046875, -166.3125, -157.39453125, -148.4765625, -139.55859375, -130.640625, -121.72265625, -112.8046875, -103.88671875, -94.96875, -86.05078125, -77.1328125, -68.21484375, -59.296875, -50.37890625, -41.4609375, -32.54296875, -23.625, -14.70703125, -5.7890625, 3.12890625, 12.046875, 20.96484375, 29.8828125, 38.80078125, 47.71875, 56.63671875, 65.5546875, 74.47265625, 83.390625, 92.30859375, 101.2265625, 110.14453125, 119.0625, 127.98046875, 136.8984375, 145.81640625, 154.734375, 163.65234375, 172.5703125, 181.48828125, 190.40625, 199.32421875, 208.2421875, 217.16015625, 226.078125, 234.99609375, 243.9140625, 252.83203125, 261.75]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 6.0, 9.0, 14.0, 31.0, 66.0, 222.0, 3269.0, 296.0, 63.0, 35.0, 18.0, 21.0, 10.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.875, -174.669921875, -170.46484375, -166.259765625, -162.0546875, -157.849609375, -153.64453125, -149.439453125, -145.234375, -141.029296875, -136.82421875, -132.619140625, -128.4140625, -124.208984375, -120.00390625, -115.798828125, -111.59375, -107.388671875, -103.18359375, -98.978515625, -94.7734375, -90.568359375, -86.36328125, -82.158203125, -77.953125, -73.748046875, -69.54296875, -65.337890625, -61.1328125, -56.927734375, -52.72265625, -48.517578125, -44.3125, -40.107421875, -35.90234375, -31.697265625, -27.4921875, -23.287109375, -19.08203125, -14.876953125, -10.671875, -6.466796875, -2.26171875, 1.943359375, 6.1484375, 10.353515625, 14.55859375, 18.763671875, 22.96875, 27.173828125, 31.37890625, 35.583984375, 39.7890625, 43.994140625, 48.19921875, 52.404296875, 56.609375, 60.814453125, 65.01953125, 69.224609375, 73.4296875, 77.634765625, 81.83984375, 86.044921875, 90.25]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 15.0, 19.0, 32.0, 66.0, 149.0, 245.0, 243.0, 116.0, 72.0, 27.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-434.6964111328125, -414.8282470703125, -394.9600830078125, -375.0919189453125, -355.2237548828125, -335.3555908203125, -315.4874267578125, -295.6192626953125, -275.7510986328125, -255.8829345703125, -236.0147705078125, -216.1466064453125, -196.2784423828125, -176.4102783203125, -156.5421142578125, -136.6739501953125, -116.8057861328125, -96.9376220703125, -77.0694580078125, -57.2012939453125, -37.3331298828125, -17.4649658203125, 2.4031982421875, 22.2713623046875, 42.1395263671875, 62.0076904296875, 81.8758544921875, 101.7440185546875, 121.6121826171875, 141.4803466796875, 161.3485107421875, 181.2166748046875, 201.08489990234375, 220.95306396484375, 240.82122802734375, 260.68939208984375, 280.55755615234375, 300.42572021484375, 320.29388427734375, 340.16204833984375, 360.03021240234375, 379.89837646484375, 399.76654052734375, 419.63470458984375, 439.50286865234375, 459.37103271484375, 479.23919677734375, 499.10736083984375, 518.9755249023438, 538.8436889648438, 558.7118530273438, 578.5800170898438, 598.4481811523438, 618.3163452148438, 638.1845092773438, 658.0526733398438, 677.9208374023438, 697.7890014648438, 717.6571655273438, 737.5253295898438, 757.3934936523438, 777.2616577148438, 797.1298217773438, 816.9979858398438, 836.8661499023438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 5.0, 7.0, 5.0, 10.0, 15.0, 19.0, 31.0, 23.0, 17.0, 25.0, 38.0, 33.0, 28.0, 34.0, 40.0, 40.0, 39.0, 36.0, 47.0, 48.0, 41.0, 49.0, 33.0, 45.0, 24.0, 31.0, 36.0, 27.0, 21.0, 13.0, 24.0, 16.0, 7.0, 13.0, 9.0, 16.0, 13.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-171.8367919921875, -166.40737915039062, -160.9779510498047, -155.5485382080078, -150.11912536621094, -144.689697265625, -139.26028442382812, -133.83087158203125, -128.40145874023438, -122.97203826904297, -117.5426254272461, -112.11320495605469, -106.68379211425781, -101.2543716430664, -95.824951171875, -90.39553833007812, -84.96611022949219, -79.53668975830078, -74.1072769165039, -68.6778564453125, -63.24843978881836, -57.81902313232422, -52.38960266113281, -46.96018600463867, -41.53076934814453, -36.10135269165039, -30.671934127807617, -25.242515563964844, -19.813098907470703, -14.383682250976562, -8.954261779785156, -3.5248451232910156, 1.904571533203125, 7.333989143371582, 12.763406753540039, 18.192825317382812, 23.622241973876953, 29.051658630371094, 34.4810791015625, 39.91049575805664, 45.33991241455078, 50.76932907104492, 56.19874572753906, 61.62816619873047, 67.05758666992188, 72.48699951171875, 77.91641998291016, 83.34584045410156, 88.77525329589844, 94.20467376708984, 99.63408660888672, 105.06350708007812, 110.492919921875, 115.9223403930664, 121.35176086425781, 126.78117370605469, 132.21060180664062, 137.6400146484375, 143.06944274902344, 148.4988555908203, 153.9282684326172, 159.35769653320312, 164.787109375, 170.21652221679688, 175.64593505859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 8.0, 15.0, 18.0, 37.0, 46.0, 66.0, 98.0, 127.0, 210.0, 275.0, 465.0, 730.0, 1109.0, 1716.0, 2797.0, 4905.0, 8768.0, 16878.0, 34589.0, 77865.0, 204060.0, 402828.0, 162832.0, 64729.0, 29602.0, 14679.0, 7768.0, 4411.0, 2613.0, 1569.0, 976.0, 560.0, 409.0, 254.0, 159.0, 126.0, 74.0, 52.0, 35.0, 24.0, 16.0, 15.0, 9.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.35986328125, -50.3759765625, -48.39208984375, -46.408203125, -44.42431640625, -42.4404296875, -40.45654296875, -38.47265625, -36.48876953125, -34.5048828125, -32.52099609375, -30.537109375, -28.55322265625, -26.5693359375, -24.58544921875, -22.6015625, -20.61767578125, -18.6337890625, -16.64990234375, -14.666015625, -12.68212890625, -10.6982421875, -8.71435546875, -6.73046875, -4.74658203125, -2.7626953125, -0.77880859375, 1.205078125, 3.18896484375, 5.1728515625, 7.15673828125, 9.140625, 11.12451171875, 13.1083984375, 15.09228515625, 17.076171875, 19.06005859375, 21.0439453125, 23.02783203125, 25.01171875, 26.99560546875, 28.9794921875, 30.96337890625, 32.947265625, 34.93115234375, 36.9150390625, 38.89892578125, 40.8828125, 42.86669921875, 44.8505859375, 46.83447265625, 48.818359375, 50.80224609375, 52.7861328125, 54.77001953125, 56.75390625, 58.73779296875, 60.7216796875, 62.70556640625, 64.689453125, 66.67333984375, 68.6572265625, 70.64111328125, 72.625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 5.0, 11.0, 7.0, 9.0, 20.0, 20.0, 23.0, 20.0, 25.0, 22.0, 38.0, 29.0, 27.0, 43.0, 46.0, 49.0, 44.0, 44.0, 36.0, 40.0, 46.0, 41.0, 29.0, 27.0, 27.0, 38.0, 24.0, 26.0, 29.0, 20.0, 20.0, 20.0, 18.0, 15.0, 9.0, 10.0, 6.0, 7.0, 2.0, 3.0, 0.0, 5.0, 1.0, 2.0, 3.0], "bins": [-19.515625, -18.988037109375, -18.46044921875, -17.932861328125, -17.4052734375, -16.877685546875, -16.35009765625, -15.822509765625, -15.294921875, -14.767333984375, -14.23974609375, -13.712158203125, -13.1845703125, -12.656982421875, -12.12939453125, -11.601806640625, -11.07421875, -10.546630859375, -10.01904296875, -9.491455078125, -8.9638671875, -8.436279296875, -7.90869140625, -7.381103515625, -6.853515625, -6.325927734375, -5.79833984375, -5.270751953125, -4.7431640625, -4.215576171875, -3.68798828125, -3.160400390625, -2.6328125, -2.105224609375, -1.57763671875, -1.050048828125, -0.5224609375, 0.005126953125, 0.53271484375, 1.060302734375, 1.587890625, 2.115478515625, 2.64306640625, 3.170654296875, 3.6982421875, 4.225830078125, 4.75341796875, 5.281005859375, 5.80859375, 6.336181640625, 6.86376953125, 7.391357421875, 7.9189453125, 8.446533203125, 8.97412109375, 9.501708984375, 10.029296875, 10.556884765625, 11.08447265625, 11.612060546875, 12.1396484375, 12.667236328125, 13.19482421875, 13.722412109375, 14.25]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 6.0, 2.0, 13.0, 9.0, 11.0, 8.0, 18.0, 26.0, 33.0, 43.0, 57.0, 86.0, 116.0, 194.0, 294.0, 421.0, 805.0, 1466.0, 2733.0, 5793.0, 14011.0, 40264.0, 163782.0, 613386.0, 143840.0, 36502.0, 13107.0, 5488.0, 2628.0, 1303.0, 781.0, 456.0, 259.0, 187.0, 114.0, 92.0, 49.0, 43.0, 22.0, 22.0, 24.0, 17.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-83.9375, -80.880859375, -77.82421875, -74.767578125, -71.7109375, -68.654296875, -65.59765625, -62.541015625, -59.484375, -56.427734375, -53.37109375, -50.314453125, -47.2578125, -44.201171875, -41.14453125, -38.087890625, -35.03125, -31.974609375, -28.91796875, -25.861328125, -22.8046875, -19.748046875, -16.69140625, -13.634765625, -10.578125, -7.521484375, -4.46484375, -1.408203125, 1.6484375, 4.705078125, 7.76171875, 10.818359375, 13.875, 16.931640625, 19.98828125, 23.044921875, 26.1015625, 29.158203125, 32.21484375, 35.271484375, 38.328125, 41.384765625, 44.44140625, 47.498046875, 50.5546875, 53.611328125, 56.66796875, 59.724609375, 62.78125, 65.837890625, 68.89453125, 71.951171875, 75.0078125, 78.064453125, 81.12109375, 84.177734375, 87.234375, 90.291015625, 93.34765625, 96.404296875, 99.4609375, 102.517578125, 105.57421875, 108.630859375, 111.6875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 7.0, 2.0, 5.0, 11.0, 9.0, 12.0, 19.0, 13.0, 20.0, 15.0, 20.0, 28.0, 28.0, 38.0, 36.0, 33.0, 33.0, 32.0, 39.0, 43.0, 59.0, 55.0, 44.0, 56.0, 41.0, 38.0, 34.0, 37.0, 38.0, 26.0, 12.0, 14.0, 16.0, 15.0, 16.0, 6.0, 9.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.6162109375, -67.919921875, -65.2236328125, -62.52734375, -59.8310546875, -57.134765625, -54.4384765625, -51.7421875, -49.0458984375, -46.349609375, -43.6533203125, -40.95703125, -38.2607421875, -35.564453125, -32.8681640625, -30.171875, -27.4755859375, -24.779296875, -22.0830078125, -19.38671875, -16.6904296875, -13.994140625, -11.2978515625, -8.6015625, -5.9052734375, -3.208984375, -0.5126953125, 2.18359375, 4.8798828125, 7.576171875, 10.2724609375, 12.96875, 15.6650390625, 18.361328125, 21.0576171875, 23.75390625, 26.4501953125, 29.146484375, 31.8427734375, 34.5390625, 37.2353515625, 39.931640625, 42.6279296875, 45.32421875, 48.0205078125, 50.716796875, 53.4130859375, 56.109375, 58.8056640625, 61.501953125, 64.1982421875, 66.89453125, 69.5908203125, 72.287109375, 74.9833984375, 77.6796875, 80.3759765625, 83.072265625, 85.7685546875, 88.46484375, 91.1611328125, 93.857421875, 96.5537109375, 99.25]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 11.0, 7.0, 25.0, 19.0, 24.0, 45.0, 69.0, 118.0, 201.0, 313.0, 609.0, 1175.0, 2437.0, 5216.0, 14411.0, 51789.0, 415748.0, 474016.0, 56296.0, 15223.0, 5737.0, 2416.0, 1180.0, 588.0, 336.0, 228.0, 110.0, 56.0, 39.0, 30.0, 28.0, 17.0, 13.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.0625, -46.2841796875, -44.505859375, -42.7275390625, -40.94921875, -39.1708984375, -37.392578125, -35.6142578125, -33.8359375, -32.0576171875, -30.279296875, -28.5009765625, -26.72265625, -24.9443359375, -23.166015625, -21.3876953125, -19.609375, -17.8310546875, -16.052734375, -14.2744140625, -12.49609375, -10.7177734375, -8.939453125, -7.1611328125, -5.3828125, -3.6044921875, -1.826171875, -0.0478515625, 1.73046875, 3.5087890625, 5.287109375, 7.0654296875, 8.84375, 10.6220703125, 12.400390625, 14.1787109375, 15.95703125, 17.7353515625, 19.513671875, 21.2919921875, 23.0703125, 24.8486328125, 26.626953125, 28.4052734375, 30.18359375, 31.9619140625, 33.740234375, 35.5185546875, 37.296875, 39.0751953125, 40.853515625, 42.6318359375, 44.41015625, 46.1884765625, 47.966796875, 49.7451171875, 51.5234375, 53.3017578125, 55.080078125, 56.8583984375, 58.63671875, 60.4150390625, 62.193359375, 63.9716796875, 65.75]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 7.0, 7.0, 9.0, 10.0, 9.0, 20.0, 20.0, 36.0, 48.0, 86.0, 141.0, 201.0, 141.0, 77.0, 55.0, 29.0, 27.0, 21.0, 9.0, 10.0, 13.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.01594412326812744, -0.015454530715942383, -0.014964938163757324, -0.014475345611572266, -0.013985753059387207, -0.013496160507202148, -0.01300656795501709, -0.012516975402832031, -0.012027382850646973, -0.011537790298461914, -0.011048197746276855, -0.010558605194091797, -0.010069012641906738, -0.00957942008972168, -0.009089827537536621, -0.008600234985351562, -0.008110642433166504, -0.007621049880981445, -0.007131457328796387, -0.006641864776611328, -0.0061522722244262695, -0.005662679672241211, -0.005173087120056152, -0.004683494567871094, -0.004193902015686035, -0.0037043094635009766, -0.003214716911315918, -0.0027251243591308594, -0.0022355318069458008, -0.0017459392547607422, -0.0012563467025756836, -0.000766754150390625, -0.0002771615982055664, 0.0002124309539794922, 0.0007020235061645508, 0.0011916160583496094, 0.001681208610534668, 0.0021708011627197266, 0.002660393714904785, 0.0031499862670898438, 0.0036395788192749023, 0.004129171371459961, 0.0046187639236450195, 0.005108356475830078, 0.005597949028015137, 0.006087541580200195, 0.006577134132385254, 0.0070667266845703125, 0.007556319236755371, 0.00804591178894043, 0.008535504341125488, 0.009025096893310547, 0.009514689445495605, 0.010004281997680664, 0.010493874549865723, 0.010983467102050781, 0.01147305965423584, 0.011962652206420898, 0.012452244758605957, 0.012941837310791016, 0.013431429862976074, 0.013921022415161133, 0.014410614967346191, 0.01490020751953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 1.0, 5.0, 8.0, 11.0, 20.0, 25.0, 33.0, 47.0, 74.0, 101.0, 196.0, 315.0, 607.0, 1253.0, 2730.0, 7874.0, 28155.0, 176411.0, 680226.0, 117810.0, 21686.0, 6143.0, 2440.0, 1091.0, 542.0, 263.0, 176.0, 100.0, 67.0, 32.0, 32.0, 23.0, 8.0, 15.0, 7.0, 2.0, 10.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.3125, -51.3671875, -49.421875, -47.4765625, -45.53125, -43.5859375, -41.640625, -39.6953125, -37.75, -35.8046875, -33.859375, -31.9140625, -29.96875, -28.0234375, -26.078125, -24.1328125, -22.1875, -20.2421875, -18.296875, -16.3515625, -14.40625, -12.4609375, -10.515625, -8.5703125, -6.625, -4.6796875, -2.734375, -0.7890625, 1.15625, 3.1015625, 5.046875, 6.9921875, 8.9375, 10.8828125, 12.828125, 14.7734375, 16.71875, 18.6640625, 20.609375, 22.5546875, 24.5, 26.4453125, 28.390625, 30.3359375, 32.28125, 34.2265625, 36.171875, 38.1171875, 40.0625, 42.0078125, 43.953125, 45.8984375, 47.84375, 49.7890625, 51.734375, 53.6796875, 55.625, 57.5703125, 59.515625, 61.4609375, 63.40625, 65.3515625, 67.296875, 69.2421875, 71.1875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 14.0, 8.0, 12.0, 11.0, 12.0, 29.0, 33.0, 46.0, 52.0, 76.0, 127.0, 130.0, 133.0, 93.0, 59.0, 34.0, 36.0, 22.0, 20.0, 12.0, 7.0, 5.0, 9.0, 5.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.375, -39.61328125, -37.8515625, -36.08984375, -34.328125, -32.56640625, -30.8046875, -29.04296875, -27.28125, -25.51953125, -23.7578125, -21.99609375, -20.234375, -18.47265625, -16.7109375, -14.94921875, -13.1875, -11.42578125, -9.6640625, -7.90234375, -6.140625, -4.37890625, -2.6171875, -0.85546875, 0.90625, 2.66796875, 4.4296875, 6.19140625, 7.953125, 9.71484375, 11.4765625, 13.23828125, 15.0, 16.76171875, 18.5234375, 20.28515625, 22.046875, 23.80859375, 25.5703125, 27.33203125, 29.09375, 30.85546875, 32.6171875, 34.37890625, 36.140625, 37.90234375, 39.6640625, 41.42578125, 43.1875, 44.94921875, 46.7109375, 48.47265625, 50.234375, 51.99609375, 53.7578125, 55.51953125, 57.28125, 59.04296875, 60.8046875, 62.56640625, 64.328125, 66.08984375, 67.8515625, 69.61328125, 71.375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 23.0, 49.0, 78.0, 149.0, 193.0, 220.0, 136.0, 74.0, 35.0, 24.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1474.6683349609375, -1435.7587890625, -1396.84912109375, -1357.9395751953125, -1319.030029296875, -1280.120361328125, -1241.2108154296875, -1202.30126953125, -1163.3916015625, -1124.4820556640625, -1085.5723876953125, -1046.662841796875, -1007.7532348632812, -968.8436279296875, -929.93408203125, -891.0244750976562, -852.1148681640625, -813.2052612304688, -774.295654296875, -735.3861083984375, -696.4765014648438, -657.56689453125, -618.6573486328125, -579.7477416992188, -540.838134765625, -501.92852783203125, -463.0189514160156, -424.109375, -385.19976806640625, -346.2901611328125, -307.3805847167969, -268.47100830078125, -229.56134033203125, -190.65174865722656, -151.74215698242188, -112.83256530761719, -73.9229736328125, -35.01338195800781, 3.896209716796875, 42.8057861328125, 81.71539306640625, 120.62498474121094, 159.53457641601562, 198.4441680908203, 237.353759765625, 276.26336669921875, 315.1729431152344, 354.08251953125, 392.99212646484375, 431.9017333984375, 470.8113098144531, 509.72088623046875, 548.6304931640625, 587.5401000976562, 626.44970703125, 665.3592529296875, 704.2688598632812, 743.178466796875, 782.0880126953125, 820.9976196289062, 859.9072265625, 898.8168334960938, 937.7264404296875, 976.635986328125, 1015.5455932617188]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 9.0, 10.0, 9.0, 6.0, 9.0, 6.0, 15.0, 18.0, 21.0, 32.0, 26.0, 19.0, 25.0, 29.0, 32.0, 40.0, 44.0, 39.0, 35.0, 39.0, 34.0, 31.0, 39.0, 33.0, 43.0, 35.0, 24.0, 39.0, 35.0, 34.0, 19.0, 19.0, 23.0, 16.0, 15.0, 9.0, 11.0, 13.0, 6.0, 5.0, 11.0, 8.0, 10.0, 2.0, 1.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-383.0623474121094, -371.3676452636719, -359.6729431152344, -347.9782409667969, -336.28350830078125, -324.58880615234375, -312.89410400390625, -301.19940185546875, -289.50469970703125, -277.80999755859375, -266.11529541015625, -254.4205780029297, -242.7258758544922, -231.0311737060547, -219.33645629882812, -207.64175415039062, -195.94705200195312, -184.25234985351562, -172.55764770507812, -160.86293029785156, -149.16822814941406, -137.47352600097656, -125.77881622314453, -114.0841064453125, -102.389404296875, -90.6947021484375, -78.99999237060547, -67.30528259277344, -55.61058044433594, -43.91587448120117, -32.221168518066406, -20.526458740234375, -8.831787109375, 2.8629188537597656, 14.557624816894531, 26.252330780029297, 37.94703674316406, 49.64174270629883, 61.336448669433594, 73.03115844726562, 84.72586059570312, 96.42056274414062, 108.11527252197266, 119.80998229980469, 131.5046844482422, 143.1993865966797, 154.89410400390625, 166.58880615234375, 178.28350830078125, 189.97821044921875, 201.67291259765625, 213.3676300048828, 225.0623321533203, 236.7570343017578, 248.45175170898438, 260.1464538574219, 271.8411560058594, 283.5358581542969, 295.2305603027344, 306.9252624511719, 318.6199951171875, 330.314697265625, 342.0093994140625, 353.7041015625, 365.3988037109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 5.0, 11.0, 10.0, 16.0, 12.0, 22.0, 32.0, 37.0, 72.0, 91.0, 98.0, 174.0, 218.0, 345.0, 484.0, 718.0, 1109.0, 1585.0, 2468.0, 4165.0, 7472.0, 15608.0, 37174.0, 127705.0, 3694992.0, 209546.0, 48352.0, 18838.0, 9207.0, 5053.0, 2972.0, 1926.0, 1229.0, 808.0, 543.0, 382.0, 260.0, 180.0, 123.0, 70.0, 56.0, 37.0, 26.0, 22.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-96.0625, -93.3662109375, -90.669921875, -87.9736328125, -85.27734375, -82.5810546875, -79.884765625, -77.1884765625, -74.4921875, -71.7958984375, -69.099609375, -66.4033203125, -63.70703125, -61.0107421875, -58.314453125, -55.6181640625, -52.921875, -50.2255859375, -47.529296875, -44.8330078125, -42.13671875, -39.4404296875, -36.744140625, -34.0478515625, -31.3515625, -28.6552734375, -25.958984375, -23.2626953125, -20.56640625, -17.8701171875, -15.173828125, -12.4775390625, -9.78125, -7.0849609375, -4.388671875, -1.6923828125, 1.00390625, 3.7001953125, 6.396484375, 9.0927734375, 11.7890625, 14.4853515625, 17.181640625, 19.8779296875, 22.57421875, 25.2705078125, 27.966796875, 30.6630859375, 33.359375, 36.0556640625, 38.751953125, 41.4482421875, 44.14453125, 46.8408203125, 49.537109375, 52.2333984375, 54.9296875, 57.6259765625, 60.322265625, 63.0185546875, 65.71484375, 68.4111328125, 71.107421875, 73.8037109375, 76.5]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 6.0, 11.0, 16.0, 17.0, 22.0, 26.0, 19.0, 27.0, 28.0, 34.0, 36.0, 41.0, 42.0, 52.0, 49.0, 46.0, 37.0, 59.0, 37.0, 46.0, 38.0, 37.0, 33.0, 33.0, 33.0, 26.0, 20.0, 18.0, 16.0, 16.0, 17.0, 11.0, 10.0, 5.0, 3.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.171875, -19.6126708984375, -19.053466796875, -18.4942626953125, -17.93505859375, -17.3758544921875, -16.816650390625, -16.2574462890625, -15.6982421875, -15.1390380859375, -14.579833984375, -14.0206298828125, -13.46142578125, -12.9022216796875, -12.343017578125, -11.7838134765625, -11.224609375, -10.6654052734375, -10.106201171875, -9.5469970703125, -8.98779296875, -8.4285888671875, -7.869384765625, -7.3101806640625, -6.7509765625, -6.1917724609375, -5.632568359375, -5.0733642578125, -4.51416015625, -3.9549560546875, -3.395751953125, -2.8365478515625, -2.27734375, -1.7181396484375, -1.158935546875, -0.5997314453125, -0.04052734375, 0.5186767578125, 1.077880859375, 1.6370849609375, 2.1962890625, 2.7554931640625, 3.314697265625, 3.8739013671875, 4.43310546875, 4.9923095703125, 5.551513671875, 6.1107177734375, 6.669921875, 7.2291259765625, 7.788330078125, 8.3475341796875, 8.90673828125, 9.4659423828125, 10.025146484375, 10.5843505859375, 11.1435546875, 11.7027587890625, 12.261962890625, 12.8211669921875, 13.38037109375, 13.9395751953125, 14.498779296875, 15.0579833984375, 15.6171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 13.0, 13.0, 14.0, 26.0, 30.0, 30.0, 50.0, 55.0, 100.0, 157.0, 218.0, 441.0, 840.0, 1720.0, 3879.0, 10436.0, 35914.0, 285796.0, 3744019.0, 80746.0, 18296.0, 6266.0, 2525.0, 1163.0, 557.0, 310.0, 183.0, 134.0, 75.0, 57.0, 46.0, 33.0, 16.0, 22.0, 24.0, 11.0, 7.0, 11.0, 5.0, 4.0, 8.0, 3.0, 5.0, 2.0, 2.0], "bins": [-253.0, -246.20703125, -239.4140625, -232.62109375, -225.828125, -219.03515625, -212.2421875, -205.44921875, -198.65625, -191.86328125, -185.0703125, -178.27734375, -171.484375, -164.69140625, -157.8984375, -151.10546875, -144.3125, -137.51953125, -130.7265625, -123.93359375, -117.140625, -110.34765625, -103.5546875, -96.76171875, -89.96875, -83.17578125, -76.3828125, -69.58984375, -62.796875, -56.00390625, -49.2109375, -42.41796875, -35.625, -28.83203125, -22.0390625, -15.24609375, -8.453125, -1.66015625, 5.1328125, 11.92578125, 18.71875, 25.51171875, 32.3046875, 39.09765625, 45.890625, 52.68359375, 59.4765625, 66.26953125, 73.0625, 79.85546875, 86.6484375, 93.44140625, 100.234375, 107.02734375, 113.8203125, 120.61328125, 127.40625, 134.19921875, 140.9921875, 147.78515625, 154.578125, 161.37109375, 168.1640625, 174.95703125, 181.75]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 11.0, 9.0, 9.0, 21.0, 28.0, 28.0, 56.0, 131.0, 518.0, 2784.0, 233.0, 104.0, 46.0, 32.0, 20.0, 17.0, 7.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-166.25, -162.576171875, -158.90234375, -155.228515625, -151.5546875, -147.880859375, -144.20703125, -140.533203125, -136.859375, -133.185546875, -129.51171875, -125.837890625, -122.1640625, -118.490234375, -114.81640625, -111.142578125, -107.46875, -103.794921875, -100.12109375, -96.447265625, -92.7734375, -89.099609375, -85.42578125, -81.751953125, -78.078125, -74.404296875, -70.73046875, -67.056640625, -63.3828125, -59.708984375, -56.03515625, -52.361328125, -48.6875, -45.013671875, -41.33984375, -37.666015625, -33.9921875, -30.318359375, -26.64453125, -22.970703125, -19.296875, -15.623046875, -11.94921875, -8.275390625, -4.6015625, -0.927734375, 2.74609375, 6.419921875, 10.09375, 13.767578125, 17.44140625, 21.115234375, 24.7890625, 28.462890625, 32.13671875, 35.810546875, 39.484375, 43.158203125, 46.83203125, 50.505859375, 54.1796875, 57.853515625, 61.52734375, 65.201171875, 68.875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 16.0, 41.0, 82.0, 202.0, 246.0, 243.0, 99.0, 41.0, 12.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-880.707275390625, -847.4222412109375, -814.13720703125, -780.8521118164062, -747.5670776367188, -714.2820434570312, -680.9969482421875, -647.7119140625, -614.4268798828125, -581.141845703125, -547.8568115234375, -514.5717163085938, -481.28668212890625, -448.00164794921875, -414.7165832519531, -381.4315185546875, -348.146484375, -314.8614501953125, -281.5763854980469, -248.2913360595703, -215.00628662109375, -181.7212371826172, -148.43618774414062, -115.15113830566406, -81.8660888671875, -48.58103942871094, -15.295989990234375, 17.989059448242188, 51.27410888671875, 84.55915832519531, 117.84420776367188, 151.12925720214844, 184.414306640625, 217.69935607910156, 250.98440551757812, 284.26947021484375, 317.55450439453125, 350.83953857421875, 384.1246032714844, 417.40966796875, 450.6947021484375, 483.979736328125, 517.2647705078125, 550.5498657226562, 583.8348999023438, 617.1199340820312, 650.405029296875, 683.6900634765625, 716.97509765625, 750.2601318359375, 783.545166015625, 816.8302612304688, 850.1152954101562, 883.4003295898438, 916.6854248046875, 949.970458984375, 983.2554931640625, 1016.54052734375, 1049.8255615234375, 1083.110595703125, 1116.395751953125, 1149.6807861328125, 1182.9658203125, 1216.2508544921875, 1249.535888671875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 12.0, 5.0, 12.0, 16.0, 15.0, 21.0, 15.0, 19.0, 29.0, 24.0, 22.0, 38.0, 42.0, 43.0, 39.0, 37.0, 44.0, 43.0, 41.0, 40.0, 49.0, 40.0, 50.0, 42.0, 35.0, 37.0, 20.0, 30.0, 25.0, 18.0, 14.0, 18.0, 8.0, 13.0, 6.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-230.9420623779297, -223.25466918945312, -215.56727600097656, -207.8798828125, -200.19248962402344, -192.50509643554688, -184.81771850585938, -177.13031005859375, -169.44293212890625, -161.7555389404297, -154.06814575195312, -146.38075256347656, -138.693359375, -131.00596618652344, -123.3185806274414, -115.63118743896484, -107.94378662109375, -100.25639343261719, -92.56900024414062, -84.88160705566406, -77.1942138671875, -69.50682067871094, -61.819435119628906, -54.132041931152344, -46.44464874267578, -38.75725555419922, -31.06986427307129, -23.38247299194336, -15.695079803466797, -8.007686614990234, -0.3202972412109375, 7.367095947265625, 15.05450439453125, 22.741897583007812, 30.429288864135742, 38.11668014526367, 45.804073333740234, 53.4914665222168, 61.178855895996094, 68.86624908447266, 76.55364227294922, 84.24103546142578, 91.92842864990234, 99.61581420898438, 107.30320739746094, 114.9906005859375, 122.67799377441406, 130.36538696289062, 138.0527801513672, 145.74017333984375, 153.4275665283203, 161.11495971679688, 168.80235290527344, 176.48974609375, 184.1771240234375, 191.86453247070312, 199.55191040039062, 207.2393035888672, 214.92669677734375, 222.6140899658203, 230.30148315429688, 237.98887634277344, 245.67626953125, 253.3636474609375, 261.0510559082031]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 1.0, 5.0, 11.0, 15.0, 21.0, 17.0, 31.0, 51.0, 62.0, 105.0, 127.0, 185.0, 280.0, 430.0, 670.0, 1106.0, 2085.0, 4254.0, 9491.0, 24525.0, 78861.0, 345640.0, 431039.0, 98292.0, 29675.0, 10991.0, 4834.0, 2421.0, 1212.0, 700.0, 429.0, 301.0, 224.0, 115.0, 81.0, 73.0, 52.0, 32.0, 28.0, 22.0, 24.0, 12.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-115.4375, -112.23828125, -109.0390625, -105.83984375, -102.640625, -99.44140625, -96.2421875, -93.04296875, -89.84375, -86.64453125, -83.4453125, -80.24609375, -77.046875, -73.84765625, -70.6484375, -67.44921875, -64.25, -61.05078125, -57.8515625, -54.65234375, -51.453125, -48.25390625, -45.0546875, -41.85546875, -38.65625, -35.45703125, -32.2578125, -29.05859375, -25.859375, -22.66015625, -19.4609375, -16.26171875, -13.0625, -9.86328125, -6.6640625, -3.46484375, -0.265625, 2.93359375, 6.1328125, 9.33203125, 12.53125, 15.73046875, 18.9296875, 22.12890625, 25.328125, 28.52734375, 31.7265625, 34.92578125, 38.125, 41.32421875, 44.5234375, 47.72265625, 50.921875, 54.12109375, 57.3203125, 60.51953125, 63.71875, 66.91796875, 70.1171875, 73.31640625, 76.515625, 79.71484375, 82.9140625, 86.11328125, 89.3125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 11.0, 6.0, 8.0, 15.0, 13.0, 9.0, 14.0, 22.0, 28.0, 24.0, 33.0, 38.0, 46.0, 40.0, 50.0, 49.0, 50.0, 38.0, 57.0, 54.0, 46.0, 39.0, 40.0, 50.0, 32.0, 25.0, 31.0, 28.0, 22.0, 9.0, 20.0, 14.0, 8.0, 7.0, 5.0, 9.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.140625, -24.349853515625, -23.55908203125, -22.768310546875, -21.9775390625, -21.186767578125, -20.39599609375, -19.605224609375, -18.814453125, -18.023681640625, -17.23291015625, -16.442138671875, -15.6513671875, -14.860595703125, -14.06982421875, -13.279052734375, -12.48828125, -11.697509765625, -10.90673828125, -10.115966796875, -9.3251953125, -8.534423828125, -7.74365234375, -6.952880859375, -6.162109375, -5.371337890625, -4.58056640625, -3.789794921875, -2.9990234375, -2.208251953125, -1.41748046875, -0.626708984375, 0.1640625, 0.954833984375, 1.74560546875, 2.536376953125, 3.3271484375, 4.117919921875, 4.90869140625, 5.699462890625, 6.490234375, 7.281005859375, 8.07177734375, 8.862548828125, 9.6533203125, 10.444091796875, 11.23486328125, 12.025634765625, 12.81640625, 13.607177734375, 14.39794921875, 15.188720703125, 15.9794921875, 16.770263671875, 17.56103515625, 18.351806640625, 19.142578125, 19.933349609375, 20.72412109375, 21.514892578125, 22.3056640625, 23.096435546875, 23.88720703125, 24.677978515625, 25.46875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 3.0, 12.0, 27.0, 32.0, 45.0, 86.0, 124.0, 199.0, 329.0, 594.0, 1040.0, 1925.0, 4242.0, 12956.0, 72892.0, 746505.0, 174035.0, 21908.0, 6038.0, 2467.0, 1304.0, 706.0, 418.0, 247.0, 170.0, 88.0, 60.0, 30.0, 23.0, 12.0, 9.0, 11.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.125, -172.87890625, -166.6328125, -160.38671875, -154.140625, -147.89453125, -141.6484375, -135.40234375, -129.15625, -122.91015625, -116.6640625, -110.41796875, -104.171875, -97.92578125, -91.6796875, -85.43359375, -79.1875, -72.94140625, -66.6953125, -60.44921875, -54.203125, -47.95703125, -41.7109375, -35.46484375, -29.21875, -22.97265625, -16.7265625, -10.48046875, -4.234375, 2.01171875, 8.2578125, 14.50390625, 20.75, 26.99609375, 33.2421875, 39.48828125, 45.734375, 51.98046875, 58.2265625, 64.47265625, 70.71875, 76.96484375, 83.2109375, 89.45703125, 95.703125, 101.94921875, 108.1953125, 114.44140625, 120.6875, 126.93359375, 133.1796875, 139.42578125, 145.671875, 151.91796875, 158.1640625, 164.41015625, 170.65625, 176.90234375, 183.1484375, 189.39453125, 195.640625, 201.88671875, 208.1328125, 214.37890625, 220.625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 5.0, 6.0, 12.0, 12.0, 14.0, 15.0, 15.0, 25.0, 17.0, 33.0, 43.0, 59.0, 46.0, 59.0, 55.0, 56.0, 41.0, 48.0, 49.0, 47.0, 61.0, 45.0, 28.0, 28.0, 27.0, 23.0, 26.0, 21.0, 19.0, 8.0, 14.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.9375, -120.4228515625, -115.908203125, -111.3935546875, -106.87890625, -102.3642578125, -97.849609375, -93.3349609375, -88.8203125, -84.3056640625, -79.791015625, -75.2763671875, -70.76171875, -66.2470703125, -61.732421875, -57.2177734375, -52.703125, -48.1884765625, -43.673828125, -39.1591796875, -34.64453125, -30.1298828125, -25.615234375, -21.1005859375, -16.5859375, -12.0712890625, -7.556640625, -3.0419921875, 1.47265625, 5.9873046875, 10.501953125, 15.0166015625, 19.53125, 24.0458984375, 28.560546875, 33.0751953125, 37.58984375, 42.1044921875, 46.619140625, 51.1337890625, 55.6484375, 60.1630859375, 64.677734375, 69.1923828125, 73.70703125, 78.2216796875, 82.736328125, 87.2509765625, 91.765625, 96.2802734375, 100.794921875, 105.3095703125, 109.82421875, 114.3388671875, 118.853515625, 123.3681640625, 127.8828125, 132.3974609375, 136.912109375, 141.4267578125, 145.94140625, 150.4560546875, 154.970703125, 159.4853515625, 164.0]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 0.0, 11.0, 10.0, 9.0, 19.0, 15.0, 28.0, 24.0, 47.0, 56.0, 73.0, 108.0, 162.0, 245.0, 274.0, 400.0, 515.0, 751.0, 1032.0, 1562.0, 2398.0, 4408.0, 15316.0, 661375.0, 335975.0, 12283.0, 4126.0, 2248.0, 1456.0, 1012.0, 672.0, 535.0, 373.0, 274.0, 184.0, 159.0, 98.0, 95.0, 53.0, 51.0, 33.0, 24.0, 13.0, 16.0, 10.0, 9.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-213.0, -206.115234375, -199.23046875, -192.345703125, -185.4609375, -178.576171875, -171.69140625, -164.806640625, -157.921875, -151.037109375, -144.15234375, -137.267578125, -130.3828125, -123.498046875, -116.61328125, -109.728515625, -102.84375, -95.958984375, -89.07421875, -82.189453125, -75.3046875, -68.419921875, -61.53515625, -54.650390625, -47.765625, -40.880859375, -33.99609375, -27.111328125, -20.2265625, -13.341796875, -6.45703125, 0.427734375, 7.3125, 14.197265625, 21.08203125, 27.966796875, 34.8515625, 41.736328125, 48.62109375, 55.505859375, 62.390625, 69.275390625, 76.16015625, 83.044921875, 89.9296875, 96.814453125, 103.69921875, 110.583984375, 117.46875, 124.353515625, 131.23828125, 138.123046875, 145.0078125, 151.892578125, 158.77734375, 165.662109375, 172.546875, 179.431640625, 186.31640625, 193.201171875, 200.0859375, 206.970703125, 213.85546875, 220.740234375, 227.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 12.0, 26.0, 113.0, 594.0, 165.0, 43.0, 20.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.09401321411132812, -0.09061431884765625, -0.08721542358398438, -0.0838165283203125, -0.08041763305664062, -0.07701873779296875, -0.07361984252929688, -0.070220947265625, -0.06682205200195312, -0.06342315673828125, -0.060024261474609375, -0.0566253662109375, -0.053226470947265625, -0.04982757568359375, -0.046428680419921875, -0.04302978515625, -0.039630889892578125, -0.03623199462890625, -0.032833099365234375, -0.0294342041015625, -0.026035308837890625, -0.02263641357421875, -0.019237518310546875, -0.015838623046875, -0.012439727783203125, -0.00904083251953125, -0.005641937255859375, -0.0022430419921875, 0.001155853271484375, 0.00455474853515625, 0.007953643798828125, 0.0113525390625, 0.014751434326171875, 0.01815032958984375, 0.021549224853515625, 0.0249481201171875, 0.028347015380859375, 0.03174591064453125, 0.035144805908203125, 0.038543701171875, 0.041942596435546875, 0.04534149169921875, 0.048740386962890625, 0.0521392822265625, 0.055538177490234375, 0.05893707275390625, 0.062335968017578125, 0.06573486328125, 0.06913375854492188, 0.07253265380859375, 0.07593154907226562, 0.0793304443359375, 0.08272933959960938, 0.08612823486328125, 0.08952713012695312, 0.092926025390625, 0.09632492065429688, 0.09972381591796875, 0.10312271118164062, 0.1065216064453125, 0.10992050170898438, 0.11331939697265625, 0.11671829223632812, 0.1201171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 0.0, 0.0, 9.0, 11.0, 10.0, 17.0, 28.0, 49.0, 52.0, 96.0, 148.0, 264.0, 464.0, 916.0, 2024.0, 5040.0, 24008.0, 988400.0, 18538.0, 4589.0, 1902.0, 910.0, 428.0, 256.0, 149.0, 80.0, 44.0, 36.0, 22.0, 14.0, 12.0, 11.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-346.5, -333.87890625, -321.2578125, -308.63671875, -296.015625, -283.39453125, -270.7734375, -258.15234375, -245.53125, -232.91015625, -220.2890625, -207.66796875, -195.046875, -182.42578125, -169.8046875, -157.18359375, -144.5625, -131.94140625, -119.3203125, -106.69921875, -94.078125, -81.45703125, -68.8359375, -56.21484375, -43.59375, -30.97265625, -18.3515625, -5.73046875, 6.890625, 19.51171875, 32.1328125, 44.75390625, 57.375, 69.99609375, 82.6171875, 95.23828125, 107.859375, 120.48046875, 133.1015625, 145.72265625, 158.34375, 170.96484375, 183.5859375, 196.20703125, 208.828125, 221.44921875, 234.0703125, 246.69140625, 259.3125, 271.93359375, 284.5546875, 297.17578125, 309.796875, 322.41796875, 335.0390625, 347.66015625, 360.28125, 372.90234375, 385.5234375, 398.14453125, 410.765625, 423.38671875, 436.0078125, 448.62890625, 461.25]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 45.0, 295.0, 474.0, 101.0, 21.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-298.5, -287.93359375, -277.3671875, -266.80078125, -256.234375, -245.66796875, -235.1015625, -224.53515625, -213.96875, -203.40234375, -192.8359375, -182.26953125, -171.703125, -161.13671875, -150.5703125, -140.00390625, -129.4375, -118.87109375, -108.3046875, -97.73828125, -87.171875, -76.60546875, -66.0390625, -55.47265625, -44.90625, -34.33984375, -23.7734375, -13.20703125, -2.640625, 7.92578125, 18.4921875, 29.05859375, 39.625, 50.19140625, 60.7578125, 71.32421875, 81.890625, 92.45703125, 103.0234375, 113.58984375, 124.15625, 134.72265625, 145.2890625, 155.85546875, 166.421875, 176.98828125, 187.5546875, 198.12109375, 208.6875, 219.25390625, 229.8203125, 240.38671875, 250.953125, 261.51953125, 272.0859375, 282.65234375, 293.21875, 303.78515625, 314.3515625, 324.91796875, 335.484375, 346.05078125, 356.6171875, 367.18359375, 377.75]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 13.0, 18.0, 16.0, 31.0, 25.0, 51.0, 54.0, 77.0, 86.0, 120.0, 106.0, 104.0, 82.0, 57.0, 48.0, 40.0, 19.0, 9.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1795.10498046875, -1750.699462890625, -1706.2939453125, -1661.888427734375, -1617.48291015625, -1573.077392578125, -1528.671875, -1484.2662353515625, -1439.8607177734375, -1395.4552001953125, -1351.0496826171875, -1306.6441650390625, -1262.2386474609375, -1217.8330078125, -1173.427490234375, -1129.02197265625, -1084.616455078125, -1040.2109375, -995.805419921875, -951.39990234375, -906.9943237304688, -862.5888061523438, -818.1832885742188, -773.7777099609375, -729.372314453125, -684.966796875, -640.561279296875, -596.15576171875, -551.7501831054688, -507.34466552734375, -462.93914794921875, -418.5335998535156, -374.1280517578125, -329.7225341796875, -285.3169860839844, -240.91146850585938, -196.5059356689453, -152.10040283203125, -107.69488525390625, -63.289337158203125, -18.883819580078125, 25.521709442138672, 69.92723846435547, 114.332763671875, 158.73829650878906, 203.14382934570312, 247.54934692382812, 291.95489501953125, 336.36041259765625, 380.76593017578125, 425.1714782714844, 469.5769958496094, 513.9825439453125, 558.3880615234375, 602.7935791015625, 647.1990966796875, 691.6046142578125, 736.0101318359375, 780.4156494140625, 824.8211669921875, 869.2267456054688, 913.6322631835938, 958.0377807617188, 1002.443359375, 1046.848876953125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 11.0, 11.0, 9.0, 7.0, 13.0, 14.0, 27.0, 23.0, 33.0, 25.0, 23.0, 29.0, 31.0, 46.0, 35.0, 45.0, 54.0, 43.0, 39.0, 38.0, 49.0, 38.0, 44.0, 44.0, 34.0, 26.0, 32.0, 28.0, 33.0, 18.0, 20.0, 19.0, 9.0, 13.0, 11.0, 5.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-966.2689208984375, -938.384521484375, -910.5001831054688, -882.6157836914062, -854.7314453125, -826.8470458984375, -798.9627075195312, -771.0783081054688, -743.1939697265625, -715.3095703125, -687.4252319335938, -659.5408325195312, -631.656494140625, -603.7720947265625, -575.8877563476562, -548.0033569335938, -520.1190185546875, -492.2346496582031, -464.35028076171875, -436.4659118652344, -408.58154296875, -380.6971435546875, -352.81280517578125, -324.92840576171875, -297.04400634765625, -269.1596374511719, -241.2752685546875, -213.39089965820312, -185.50653076171875, -157.6221466064453, -129.73777770996094, -101.85340881347656, -73.96905517578125, -46.084686279296875, -18.200313568115234, 9.684059143066406, 37.56842803955078, 65.45280456542969, 93.33717346191406, 121.22154235839844, 149.1059112548828, 176.9902801513672, 204.87464904785156, 232.759033203125, 260.6434020996094, 288.52777099609375, 316.4121398925781, 344.2965087890625, 372.1808776855469, 400.06524658203125, 427.9496154785156, 455.833984375, 483.7183532714844, 511.60272216796875, 539.4871215820312, 567.3714599609375, 595.255859375, 623.1402587890625, 651.0245971679688, 678.9089965820312, 706.7933349609375, 734.677734375, 762.5620727539062, 790.4464721679688, 818.330810546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 2.0, 4.0, 7.0, 8.0, 7.0, 20.0, 19.0, 33.0, 49.0, 42.0, 77.0, 115.0, 160.0, 261.0, 450.0, 707.0, 1330.0, 3114.0, 11585.0, 4154649.0, 14592.0, 3471.0, 1425.0, 743.0, 455.0, 319.0, 186.0, 130.0, 85.0, 51.0, 42.0, 36.0, 23.0, 20.0, 14.0, 13.0, 7.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-318.0, -307.59375, -297.1875, -286.78125, -276.375, -265.96875, -255.5625, -245.15625, -234.75, -224.34375, -213.9375, -203.53125, -193.125, -182.71875, -172.3125, -161.90625, -151.5, -141.09375, -130.6875, -120.28125, -109.875, -99.46875, -89.0625, -78.65625, -68.25, -57.84375, -47.4375, -37.03125, -26.625, -16.21875, -5.8125, 4.59375, 15.0, 25.40625, 35.8125, 46.21875, 56.625, 67.03125, 77.4375, 87.84375, 98.25, 108.65625, 119.0625, 129.46875, 139.875, 150.28125, 160.6875, 171.09375, 181.5, 191.90625, 202.3125, 212.71875, 223.125, 233.53125, 243.9375, 254.34375, 264.75, 275.15625, 285.5625, 295.96875, 306.375, 316.78125, 327.1875, 337.59375, 348.0]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 6.0, 19.0, 14.0, 18.0, 24.0, 20.0, 31.0, 21.0, 37.0, 42.0, 43.0, 44.0, 54.0, 64.0, 52.0, 54.0, 46.0, 48.0, 35.0, 48.0, 33.0, 40.0, 29.0, 24.0, 23.0, 14.0, 12.0, 18.0, 17.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.015625, -29.906982421875, -28.79833984375, -27.689697265625, -26.5810546875, -25.472412109375, -24.36376953125, -23.255126953125, -22.146484375, -21.037841796875, -19.92919921875, -18.820556640625, -17.7119140625, -16.603271484375, -15.49462890625, -14.385986328125, -13.27734375, -12.168701171875, -11.06005859375, -9.951416015625, -8.8427734375, -7.734130859375, -6.62548828125, -5.516845703125, -4.408203125, -3.299560546875, -2.19091796875, -1.082275390625, 0.0263671875, 1.135009765625, 2.24365234375, 3.352294921875, 4.4609375, 5.569580078125, 6.67822265625, 7.786865234375, 8.8955078125, 10.004150390625, 11.11279296875, 12.221435546875, 13.330078125, 14.438720703125, 15.54736328125, 16.656005859375, 17.7646484375, 18.873291015625, 19.98193359375, 21.090576171875, 22.19921875, 23.307861328125, 24.41650390625, 25.525146484375, 26.6337890625, 27.742431640625, 28.85107421875, 29.959716796875, 31.068359375, 32.177001953125, 33.28564453125, 34.394287109375, 35.5029296875, 36.611572265625, 37.72021484375, 38.828857421875, 39.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 8.0, 4.0, 15.0, 19.0, 25.0, 39.0, 49.0, 79.0, 151.0, 205.0, 297.0, 481.0, 712.0, 1169.0, 1825.0, 3136.0, 6654.0, 38889.0, 4116437.0, 12889.0, 4443.0, 2423.0, 1473.0, 957.0, 645.0, 438.0, 271.0, 185.0, 115.0, 85.0, 54.0, 49.0, 15.0, 21.0, 9.0, 10.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.375, -216.681640625, -205.98828125, -195.294921875, -184.6015625, -173.908203125, -163.21484375, -152.521484375, -141.828125, -131.134765625, -120.44140625, -109.748046875, -99.0546875, -88.361328125, -77.66796875, -66.974609375, -56.28125, -45.587890625, -34.89453125, -24.201171875, -13.5078125, -2.814453125, 7.87890625, 18.572265625, 29.265625, 39.958984375, 50.65234375, 61.345703125, 72.0390625, 82.732421875, 93.42578125, 104.119140625, 114.8125, 125.505859375, 136.19921875, 146.892578125, 157.5859375, 168.279296875, 178.97265625, 189.666015625, 200.359375, 211.052734375, 221.74609375, 232.439453125, 243.1328125, 253.826171875, 264.51953125, 275.212890625, 285.90625, 296.599609375, 307.29296875, 317.986328125, 328.6796875, 339.373046875, 350.06640625, 360.759765625, 371.453125, 382.146484375, 392.83984375, 403.533203125, 414.2265625, 424.919921875, 435.61328125, 446.306640625, 457.0]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 9.0, 29.0, 69.0, 3852.0, 41.0, 20.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34375, -43.62939453125, -41.9150390625, -40.20068359375, -38.486328125, -36.77197265625, -35.0576171875, -33.34326171875, -31.62890625, -29.91455078125, -28.2001953125, -26.48583984375, -24.771484375, -23.05712890625, -21.3427734375, -19.62841796875, -17.9140625, -16.19970703125, -14.4853515625, -12.77099609375, -11.056640625, -9.34228515625, -7.6279296875, -5.91357421875, -4.19921875, -2.48486328125, -0.7705078125, 0.94384765625, 2.658203125, 4.37255859375, 6.0869140625, 7.80126953125, 9.515625, 11.22998046875, 12.9443359375, 14.65869140625, 16.373046875, 18.08740234375, 19.8017578125, 21.51611328125, 23.23046875, 24.94482421875, 26.6591796875, 28.37353515625, 30.087890625, 31.80224609375, 33.5166015625, 35.23095703125, 36.9453125, 38.65966796875, 40.3740234375, 42.08837890625, 43.802734375, 45.51708984375, 47.2314453125, 48.94580078125, 50.66015625, 52.37451171875, 54.0888671875, 55.80322265625, 57.517578125, 59.23193359375, 60.9462890625, 62.66064453125, 64.375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 10.0, 15.0, 26.0, 44.0, 65.0, 67.0, 116.0, 117.0, 108.0, 108.0, 87.0, 52.0, 45.0, 23.0, 31.0, 24.0, 12.0, 10.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.50454711914062, -144.19775390625, -137.89096069335938, -131.5841827392578, -125.27738952636719, -118.97059631347656, -112.66381072998047, -106.35702514648438, -100.05023193359375, -93.74343872070312, -87.43665313720703, -81.12986755371094, -74.82307434082031, -68.51628112792969, -62.209495544433594, -55.902706146240234, -49.595916748046875, -43.289127349853516, -36.982337951660156, -30.675548553466797, -24.368759155273438, -18.061969757080078, -11.755180358886719, -5.448390960693359, 0.8583984375, 7.165187835693359, 13.471977233886719, 19.778766632080078, 26.085556030273438, 32.3923454284668, 38.699134826660156, 45.005924224853516, 51.31272888183594, 57.6195182800293, 63.926307678222656, 70.23309326171875, 76.53988647460938, 82.8466796875, 89.1534652709961, 95.46025085449219, 101.76704406738281, 108.07383728027344, 114.38062286376953, 120.68740844726562, 126.99420166015625, 133.30099487304688, 139.6077880859375, 145.91456604003906, 152.2213592529297, 158.5281524658203, 164.83493041992188, 171.1417236328125, 177.44851684570312, 183.75531005859375, 190.06210327148438, 196.36888122558594, 202.67567443847656, 208.9824676513672, 215.28924560546875, 221.59603881835938, 227.90283203125, 234.20962524414062, 240.51641845703125, 246.8231964111328, 253.12998962402344]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 11.0, 16.0, 24.0, 20.0, 26.0, 27.0, 20.0, 25.0, 28.0, 28.0, 40.0, 38.0, 40.0, 51.0, 34.0, 40.0, 49.0, 42.0, 38.0, 27.0, 33.0, 34.0, 41.0, 40.0, 26.0, 20.0, 25.0, 20.0, 23.0, 13.0, 11.0, 14.0, 9.0, 9.0, 11.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-100.87227630615234, -97.64218139648438, -94.41209411621094, -91.18199920654297, -87.951904296875, -84.72180938720703, -81.49171447753906, -78.26162719726562, -75.03153228759766, -71.80143737792969, -68.57135009765625, -65.34125518798828, -62.11116027832031, -58.881065368652344, -55.65097427368164, -52.42088317871094, -49.19078826904297, -45.960693359375, -42.7306022644043, -39.500511169433594, -36.270416259765625, -33.040321350097656, -29.810230255126953, -26.580137252807617, -23.35004425048828, -20.119951248168945, -16.88985824584961, -13.659765243530273, -10.429672241210938, -7.199579238891602, -3.9694862365722656, -0.7393932342529297, 2.490692138671875, 5.720785140991211, 8.950878143310547, 12.180971145629883, 15.411064147949219, 18.641157150268555, 21.87125015258789, 25.101343154907227, 28.331436157226562, 31.5615291595459, 34.791622161865234, 38.02171325683594, 41.251808166503906, 44.481903076171875, 47.71199417114258, 50.94208526611328, 54.17218017578125, 57.40227508544922, 60.63236618041992, 63.862457275390625, 67.0925521850586, 70.32264709472656, 73.552734375, 76.78282928466797, 80.01292419433594, 83.2430191040039, 86.47311401367188, 89.70320129394531, 92.93329620361328, 96.16339111328125, 99.39347839355469, 102.62357330322266, 105.85366821289062]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 9.0, 10.0, 11.0, 23.0, 37.0, 53.0, 78.0, 116.0, 186.0, 275.0, 435.0, 647.0, 1011.0, 1502.0, 2555.0, 4066.0, 7461.0, 12906.0, 24162.0, 49217.0, 111254.0, 278614.0, 309605.0, 128408.0, 55104.0, 26688.0, 13985.0, 7844.0, 4664.0, 2861.0, 1760.0, 1121.0, 652.0, 399.0, 284.0, 172.0, 147.0, 71.0, 50.0, 35.0, 26.0, 16.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.125, -77.4609375, -74.796875, -72.1328125, -69.46875, -66.8046875, -64.140625, -61.4765625, -58.8125, -56.1484375, -53.484375, -50.8203125, -48.15625, -45.4921875, -42.828125, -40.1640625, -37.5, -34.8359375, -32.171875, -29.5078125, -26.84375, -24.1796875, -21.515625, -18.8515625, -16.1875, -13.5234375, -10.859375, -8.1953125, -5.53125, -2.8671875, -0.203125, 2.4609375, 5.125, 7.7890625, 10.453125, 13.1171875, 15.78125, 18.4453125, 21.109375, 23.7734375, 26.4375, 29.1015625, 31.765625, 34.4296875, 37.09375, 39.7578125, 42.421875, 45.0859375, 47.75, 50.4140625, 53.078125, 55.7421875, 58.40625, 61.0703125, 63.734375, 66.3984375, 69.0625, 71.7265625, 74.390625, 77.0546875, 79.71875, 82.3828125, 85.046875, 87.7109375, 90.375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 12.0, 25.0, 15.0, 22.0, 23.0, 20.0, 29.0, 30.0, 35.0, 24.0, 39.0, 47.0, 54.0, 53.0, 39.0, 37.0, 41.0, 26.0, 40.0, 39.0, 54.0, 36.0, 22.0, 26.0, 17.0, 28.0, 17.0, 13.0, 17.0, 17.0, 8.0, 13.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.25, -30.19287109375, -29.1357421875, -28.07861328125, -27.021484375, -25.96435546875, -24.9072265625, -23.85009765625, -22.79296875, -21.73583984375, -20.6787109375, -19.62158203125, -18.564453125, -17.50732421875, -16.4501953125, -15.39306640625, -14.3359375, -13.27880859375, -12.2216796875, -11.16455078125, -10.107421875, -9.05029296875, -7.9931640625, -6.93603515625, -5.87890625, -4.82177734375, -3.7646484375, -2.70751953125, -1.650390625, -0.59326171875, 0.4638671875, 1.52099609375, 2.578125, 3.63525390625, 4.6923828125, 5.74951171875, 6.806640625, 7.86376953125, 8.9208984375, 9.97802734375, 11.03515625, 12.09228515625, 13.1494140625, 14.20654296875, 15.263671875, 16.32080078125, 17.3779296875, 18.43505859375, 19.4921875, 20.54931640625, 21.6064453125, 22.66357421875, 23.720703125, 24.77783203125, 25.8349609375, 26.89208984375, 27.94921875, 29.00634765625, 30.0634765625, 31.12060546875, 32.177734375, 33.23486328125, 34.2919921875, 35.34912109375, 36.40625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 21.0, 20.0, 23.0, 30.0, 40.0, 59.0, 104.0, 140.0, 239.0, 429.0, 780.0, 1531.0, 3426.0, 8090.0, 22827.0, 79323.0, 453133.0, 374092.0, 69664.0, 20596.0, 7511.0, 3178.0, 1457.0, 775.0, 407.0, 228.0, 139.0, 85.0, 58.0, 38.0, 26.0, 18.0, 12.0, 15.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-168.625, -163.34765625, -158.0703125, -152.79296875, -147.515625, -142.23828125, -136.9609375, -131.68359375, -126.40625, -121.12890625, -115.8515625, -110.57421875, -105.296875, -100.01953125, -94.7421875, -89.46484375, -84.1875, -78.91015625, -73.6328125, -68.35546875, -63.078125, -57.80078125, -52.5234375, -47.24609375, -41.96875, -36.69140625, -31.4140625, -26.13671875, -20.859375, -15.58203125, -10.3046875, -5.02734375, 0.25, 5.52734375, 10.8046875, 16.08203125, 21.359375, 26.63671875, 31.9140625, 37.19140625, 42.46875, 47.74609375, 53.0234375, 58.30078125, 63.578125, 68.85546875, 74.1328125, 79.41015625, 84.6875, 89.96484375, 95.2421875, 100.51953125, 105.796875, 111.07421875, 116.3515625, 121.62890625, 126.90625, 132.18359375, 137.4609375, 142.73828125, 148.015625, 153.29296875, 158.5703125, 163.84765625, 169.125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 9.0, 14.0, 13.0, 22.0, 15.0, 19.0, 19.0, 27.0, 36.0, 32.0, 50.0, 33.0, 39.0, 50.0, 41.0, 48.0, 50.0, 50.0, 61.0, 53.0, 31.0, 51.0, 31.0, 33.0, 23.0, 27.0, 30.0, 14.0, 11.0, 9.0, 12.0, 11.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-213.375, -206.7890625, -200.203125, -193.6171875, -187.03125, -180.4453125, -173.859375, -167.2734375, -160.6875, -154.1015625, -147.515625, -140.9296875, -134.34375, -127.7578125, -121.171875, -114.5859375, -108.0, -101.4140625, -94.828125, -88.2421875, -81.65625, -75.0703125, -68.484375, -61.8984375, -55.3125, -48.7265625, -42.140625, -35.5546875, -28.96875, -22.3828125, -15.796875, -9.2109375, -2.625, 3.9609375, 10.546875, 17.1328125, 23.71875, 30.3046875, 36.890625, 43.4765625, 50.0625, 56.6484375, 63.234375, 69.8203125, 76.40625, 82.9921875, 89.578125, 96.1640625, 102.75, 109.3359375, 115.921875, 122.5078125, 129.09375, 135.6796875, 142.265625, 148.8515625, 155.4375, 162.0234375, 168.609375, 175.1953125, 181.78125, 188.3671875, 194.953125, 201.5390625, 208.125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 1.0, 7.0, 10.0, 10.0, 15.0, 25.0, 25.0, 37.0, 55.0, 78.0, 99.0, 173.0, 223.0, 310.0, 531.0, 836.0, 1504.0, 2930.0, 6198.0, 16139.0, 54503.0, 285710.0, 538866.0, 97652.0, 24944.0, 8820.0, 3886.0, 1900.0, 1141.0, 631.0, 396.0, 258.0, 195.0, 136.0, 75.0, 65.0, 50.0, 30.0, 26.0, 18.0, 10.0, 4.0, 3.0, 9.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-68.9375, -66.86083984375, -64.7841796875, -62.70751953125, -60.630859375, -58.55419921875, -56.4775390625, -54.40087890625, -52.32421875, -50.24755859375, -48.1708984375, -46.09423828125, -44.017578125, -41.94091796875, -39.8642578125, -37.78759765625, -35.7109375, -33.63427734375, -31.5576171875, -29.48095703125, -27.404296875, -25.32763671875, -23.2509765625, -21.17431640625, -19.09765625, -17.02099609375, -14.9443359375, -12.86767578125, -10.791015625, -8.71435546875, -6.6376953125, -4.56103515625, -2.484375, -0.40771484375, 1.6689453125, 3.74560546875, 5.822265625, 7.89892578125, 9.9755859375, 12.05224609375, 14.12890625, 16.20556640625, 18.2822265625, 20.35888671875, 22.435546875, 24.51220703125, 26.5888671875, 28.66552734375, 30.7421875, 32.81884765625, 34.8955078125, 36.97216796875, 39.048828125, 41.12548828125, 43.2021484375, 45.27880859375, 47.35546875, 49.43212890625, 51.5087890625, 53.58544921875, 55.662109375, 57.73876953125, 59.8154296875, 61.89208984375, 63.96875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 6.0, 4.0, 11.0, 15.0, 16.0, 21.0, 37.0, 64.0, 106.0, 148.0, 155.0, 133.0, 84.0, 61.0, 43.0, 29.0, 21.0, 12.0, 9.0, 5.0, 8.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0347900390625, -0.0339512825012207, -0.033112525939941406, -0.03227376937866211, -0.03143501281738281, -0.030596256256103516, -0.02975749969482422, -0.028918743133544922, -0.028079986572265625, -0.027241230010986328, -0.02640247344970703, -0.025563716888427734, -0.024724960327148438, -0.02388620376586914, -0.023047447204589844, -0.022208690643310547, -0.02136993408203125, -0.020531177520751953, -0.019692420959472656, -0.01885366439819336, -0.018014907836914062, -0.017176151275634766, -0.01633739471435547, -0.015498638153076172, -0.014659881591796875, -0.013821125030517578, -0.012982368469238281, -0.012143611907958984, -0.011304855346679688, -0.01046609878540039, -0.009627342224121094, -0.008788585662841797, -0.0079498291015625, -0.007111072540283203, -0.006272315979003906, -0.005433559417724609, -0.0045948028564453125, -0.0037560462951660156, -0.0029172897338867188, -0.002078533172607422, -0.001239776611328125, -0.0004010200500488281, 0.00043773651123046875, 0.0012764930725097656, 0.0021152496337890625, 0.0029540061950683594, 0.0037927627563476562, 0.004631519317626953, 0.00547027587890625, 0.006309032440185547, 0.007147789001464844, 0.00798654556274414, 0.008825302124023438, 0.009664058685302734, 0.010502815246582031, 0.011341571807861328, 0.012180328369140625, 0.013019084930419922, 0.013857841491699219, 0.014696598052978516, 0.015535354614257812, 0.01637411117553711, 0.017212867736816406, 0.018051624298095703, 0.018890380859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 22.0, 15.0, 18.0, 39.0, 72.0, 87.0, 138.0, 234.0, 365.0, 758.0, 1400.0, 3233.0, 8347.0, 27587.0, 129008.0, 588806.0, 225319.0, 43034.0, 11940.0, 4170.0, 1848.0, 875.0, 486.0, 260.0, 157.0, 115.0, 65.0, 37.0, 22.0, 28.0, 13.0, 8.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.5, -65.14453125, -62.7890625, -60.43359375, -58.078125, -55.72265625, -53.3671875, -51.01171875, -48.65625, -46.30078125, -43.9453125, -41.58984375, -39.234375, -36.87890625, -34.5234375, -32.16796875, -29.8125, -27.45703125, -25.1015625, -22.74609375, -20.390625, -18.03515625, -15.6796875, -13.32421875, -10.96875, -8.61328125, -6.2578125, -3.90234375, -1.546875, 0.80859375, 3.1640625, 5.51953125, 7.875, 10.23046875, 12.5859375, 14.94140625, 17.296875, 19.65234375, 22.0078125, 24.36328125, 26.71875, 29.07421875, 31.4296875, 33.78515625, 36.140625, 38.49609375, 40.8515625, 43.20703125, 45.5625, 47.91796875, 50.2734375, 52.62890625, 54.984375, 57.33984375, 59.6953125, 62.05078125, 64.40625, 66.76171875, 69.1171875, 71.47265625, 73.828125, 76.18359375, 78.5390625, 80.89453125, 83.25]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 5.0, 11.0, 12.0, 25.0, 40.0, 46.0, 49.0, 66.0, 77.0, 89.0, 114.0, 111.0, 78.0, 61.0, 48.0, 49.0, 24.0, 20.0, 18.0, 13.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.96875, -60.56494140625, -58.1611328125, -55.75732421875, -53.353515625, -50.94970703125, -48.5458984375, -46.14208984375, -43.73828125, -41.33447265625, -38.9306640625, -36.52685546875, -34.123046875, -31.71923828125, -29.3154296875, -26.91162109375, -24.5078125, -22.10400390625, -19.7001953125, -17.29638671875, -14.892578125, -12.48876953125, -10.0849609375, -7.68115234375, -5.27734375, -2.87353515625, -0.4697265625, 1.93408203125, 4.337890625, 6.74169921875, 9.1455078125, 11.54931640625, 13.953125, 16.35693359375, 18.7607421875, 21.16455078125, 23.568359375, 25.97216796875, 28.3759765625, 30.77978515625, 33.18359375, 35.58740234375, 37.9912109375, 40.39501953125, 42.798828125, 45.20263671875, 47.6064453125, 50.01025390625, 52.4140625, 54.81787109375, 57.2216796875, 59.62548828125, 62.029296875, 64.43310546875, 66.8369140625, 69.24072265625, 71.64453125, 74.04833984375, 76.4521484375, 78.85595703125, 81.259765625, 83.66357421875, 86.0673828125, 88.47119140625, 90.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 11.0, 12.0, 18.0, 56.0, 53.0, 90.0, 149.0, 169.0, 139.0, 112.0, 79.0, 42.0, 17.0, 18.0, 11.0, 12.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-801.0159912109375, -749.6306762695312, -698.245361328125, -646.8599853515625, -595.4747314453125, -544.08935546875, -492.70404052734375, -441.3187255859375, -389.93341064453125, -338.548095703125, -287.16278076171875, -235.77743530273438, -184.39212036132812, -133.00680541992188, -81.6214599609375, -30.23614501953125, 21.149169921875, 72.53449249267578, 123.91981506347656, 175.30514526367188, 226.69046020507812, 278.0757751464844, 329.46112060546875, 380.846435546875, 432.23175048828125, 483.6170654296875, 535.0023803710938, 586.3876953125, 637.7730712890625, 689.1583251953125, 740.543701171875, 791.9290161132812, 843.314453125, 894.6997680664062, 946.0850830078125, 997.470458984375, 1048.855712890625, 1100.2410888671875, 1151.62646484375, 1203.01171875, 1254.39697265625, 1305.7823486328125, 1357.1676025390625, 1408.552978515625, 1459.938232421875, 1511.3236083984375, 1562.708984375, 1614.09423828125, 1665.4796142578125, 1716.864990234375, 1768.250244140625, 1819.6356201171875, 1871.0208740234375, 1922.40625, 1973.79150390625, 2025.1768798828125, 2076.562255859375, 2127.947509765625, 2179.3330078125, 2230.71826171875, 2282.103515625, 2333.48876953125, 2384.874267578125, 2436.259521484375, 2487.644775390625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 7.0, 4.0, 8.0, 12.0, 9.0, 6.0, 16.0, 26.0, 27.0, 23.0, 24.0, 31.0, 39.0, 52.0, 50.0, 50.0, 50.0, 59.0, 55.0, 63.0, 57.0, 58.0, 38.0, 33.0, 29.0, 30.0, 25.0, 23.0, 16.0, 12.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1346.954345703125, -1311.202880859375, -1275.451416015625, -1239.699951171875, -1203.948486328125, -1168.197021484375, -1132.445556640625, -1096.694091796875, -1060.942626953125, -1025.191162109375, -989.439697265625, -953.688232421875, -917.936767578125, -882.185302734375, -846.433837890625, -810.682373046875, -774.930908203125, -739.179443359375, -703.427978515625, -667.676513671875, -631.925048828125, -596.173583984375, -560.422119140625, -524.670654296875, -488.919189453125, -453.167724609375, -417.416259765625, -381.664794921875, -345.913330078125, -310.161865234375, -274.410400390625, -238.658935546875, -202.9073486328125, -167.1558837890625, -131.4044189453125, -95.6529541015625, -59.9014892578125, -24.1500244140625, 11.6014404296875, 47.3529052734375, 83.1043701171875, 118.8558349609375, 154.6072998046875, 190.3587646484375, 226.1102294921875, 261.8616943359375, 297.6131591796875, 333.3646240234375, 369.1160888671875, 404.8675537109375, 440.6190185546875, 476.3704833984375, 512.1219482421875, 547.8734130859375, 583.6248779296875, 619.3763427734375, 655.1278076171875, 690.8792724609375, 726.6307373046875, 762.3822021484375, 798.1336669921875, 833.8851318359375, 869.6365966796875, 905.3880615234375, 941.1395263671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 4.0, 10.0, 8.0, 19.0, 22.0, 29.0, 45.0, 70.0, 98.0, 118.0, 191.0, 231.0, 328.0, 516.0, 757.0, 1114.0, 2186.0, 5519.0, 4043915.0, 128159.0, 5259.0, 2094.0, 1212.0, 698.0, 473.0, 317.0, 239.0, 192.0, 108.0, 96.0, 57.0, 49.0, 42.0, 26.0, 16.0, 14.0, 10.0, 7.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-348.75, -338.17578125, -327.6015625, -317.02734375, -306.453125, -295.87890625, -285.3046875, -274.73046875, -264.15625, -253.58203125, -243.0078125, -232.43359375, -221.859375, -211.28515625, -200.7109375, -190.13671875, -179.5625, -168.98828125, -158.4140625, -147.83984375, -137.265625, -126.69140625, -116.1171875, -105.54296875, -94.96875, -84.39453125, -73.8203125, -63.24609375, -52.671875, -42.09765625, -31.5234375, -20.94921875, -10.375, 0.19921875, 10.7734375, 21.34765625, 31.921875, 42.49609375, 53.0703125, 63.64453125, 74.21875, 84.79296875, 95.3671875, 105.94140625, 116.515625, 127.08984375, 137.6640625, 148.23828125, 158.8125, 169.38671875, 179.9609375, 190.53515625, 201.109375, 211.68359375, 222.2578125, 232.83203125, 243.40625, 253.98046875, 264.5546875, 275.12890625, 285.703125, 296.27734375, 306.8515625, 317.42578125, 328.0]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 2.0, 3.0, 9.0, 4.0, 7.0, 12.0, 9.0, 12.0, 9.0, 15.0, 22.0, 21.0, 22.0, 30.0, 33.0, 22.0, 38.0, 28.0, 45.0, 41.0, 51.0, 47.0, 51.0, 54.0, 42.0, 36.0, 32.0, 39.0, 28.0, 25.0, 29.0, 28.0, 20.0, 26.0, 14.0, 15.0, 12.0, 7.0, 9.0, 9.0, 10.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-31.421875, -30.412841796875, -29.40380859375, -28.394775390625, -27.3857421875, -26.376708984375, -25.36767578125, -24.358642578125, -23.349609375, -22.340576171875, -21.33154296875, -20.322509765625, -19.3134765625, -18.304443359375, -17.29541015625, -16.286376953125, -15.27734375, -14.268310546875, -13.25927734375, -12.250244140625, -11.2412109375, -10.232177734375, -9.22314453125, -8.214111328125, -7.205078125, -6.196044921875, -5.18701171875, -4.177978515625, -3.1689453125, -2.159912109375, -1.15087890625, -0.141845703125, 0.8671875, 1.876220703125, 2.88525390625, 3.894287109375, 4.9033203125, 5.912353515625, 6.92138671875, 7.930419921875, 8.939453125, 9.948486328125, 10.95751953125, 11.966552734375, 12.9755859375, 13.984619140625, 14.99365234375, 16.002685546875, 17.01171875, 18.020751953125, 19.02978515625, 20.038818359375, 21.0478515625, 22.056884765625, 23.06591796875, 24.074951171875, 25.083984375, 26.093017578125, 27.10205078125, 28.111083984375, 29.1201171875, 30.129150390625, 31.13818359375, 32.147216796875, 33.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 1.0, 4.0, 9.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 13.0, 29.0, 31.0, 55.0, 86.0, 97.0, 165.0, 234.0, 398.0, 669.0, 1087.0, 2170.0, 8104.0, 4139805.0, 33759.0, 3664.0, 1510.0, 891.0, 527.0, 308.0, 172.0, 135.0, 87.0, 47.0, 50.0, 24.0, 23.0, 21.0, 24.0, 11.0, 9.0, 9.0, 4.0, 6.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-519.0, -502.125, -485.25, -468.375, -451.5, -434.625, -417.75, -400.875, -384.0, -367.125, -350.25, -333.375, -316.5, -299.625, -282.75, -265.875, -249.0, -232.125, -215.25, -198.375, -181.5, -164.625, -147.75, -130.875, -114.0, -97.125, -80.25, -63.375, -46.5, -29.625, -12.75, 4.125, 21.0, 37.875, 54.75, 71.625, 88.5, 105.375, 122.25, 139.125, 156.0, 172.875, 189.75, 206.625, 223.5, 240.375, 257.25, 274.125, 291.0, 307.875, 324.75, 341.625, 358.5, 375.375, 392.25, 409.125, 426.0, 442.875, 459.75, 476.625, 493.5, 510.375, 527.25, 544.125, 561.0]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 21.0, 49.0, 3905.0, 70.0, 18.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.75, -167.5263671875, -163.302734375, -159.0791015625, -154.85546875, -150.6318359375, -146.408203125, -142.1845703125, -137.9609375, -133.7373046875, -129.513671875, -125.2900390625, -121.06640625, -116.8427734375, -112.619140625, -108.3955078125, -104.171875, -99.9482421875, -95.724609375, -91.5009765625, -87.27734375, -83.0537109375, -78.830078125, -74.6064453125, -70.3828125, -66.1591796875, -61.935546875, -57.7119140625, -53.48828125, -49.2646484375, -45.041015625, -40.8173828125, -36.59375, -32.3701171875, -28.146484375, -23.9228515625, -19.69921875, -15.4755859375, -11.251953125, -7.0283203125, -2.8046875, 1.4189453125, 5.642578125, 9.8662109375, 14.08984375, 18.3134765625, 22.537109375, 26.7607421875, 30.984375, 35.2080078125, 39.431640625, 43.6552734375, 47.87890625, 52.1025390625, 56.326171875, 60.5498046875, 64.7734375, 68.9970703125, 73.220703125, 77.4443359375, 81.66796875, 85.8916015625, 90.115234375, 94.3388671875, 98.5625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 11.0, 20.0, 18.0, 27.0, 35.0, 41.0, 45.0, 73.0, 87.0, 84.0, 80.0, 92.0, 73.0, 67.0, 44.0, 40.0, 30.0, 15.0, 10.0, 14.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.32638549804688, -237.09654235839844, -230.86669921875, -224.63685607910156, -218.40701293945312, -212.1771697998047, -205.94732666015625, -199.71746826171875, -193.48764038085938, -187.25779724121094, -181.0279541015625, -174.79811096191406, -168.56826782226562, -162.3384246826172, -156.10858154296875, -149.87872314453125, -143.6488800048828, -137.41903686523438, -131.18919372558594, -124.9593505859375, -118.72950744628906, -112.49966430664062, -106.26981353759766, -100.03997039794922, -93.81012725830078, -87.58028411865234, -81.3504409790039, -75.12059020996094, -68.8907470703125, -62.66090774536133, -56.431060791015625, -50.20121765136719, -43.97135925292969, -37.74151611328125, -31.51167106628418, -25.28182601928711, -19.051982879638672, -12.822139739990234, -6.592292785644531, -0.36244964599609375, 5.867393493652344, 12.097237586975098, 18.32708168029785, 24.556926727294922, 30.78676986694336, 37.0166130065918, 43.2464599609375, 49.47630310058594, 55.706146240234375, 61.93598937988281, 68.16583251953125, 74.39567565917969, 80.62551879882812, 86.85536193847656, 93.08521270751953, 99.31505584716797, 105.5448989868164, 111.77474212646484, 118.00458526611328, 124.23443603515625, 130.4642791748047, 136.69412231445312, 142.92396545410156, 149.15380859375, 155.38365173339844]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 8.0, 7.0, 13.0, 17.0, 17.0, 12.0, 25.0, 31.0, 31.0, 31.0, 30.0, 40.0, 30.0, 33.0, 52.0, 44.0, 50.0, 55.0, 34.0, 44.0, 48.0, 41.0, 35.0, 35.0, 31.0, 30.0, 25.0, 18.0, 19.0, 16.0, 14.0, 15.0, 4.0, 8.0, 6.0, 11.0, 7.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.7794952392578, -164.78338623046875, -159.78729248046875, -154.7911834716797, -149.79507446289062, -144.79896545410156, -139.8028564453125, -134.8067626953125, -129.81065368652344, -124.81454467773438, -119.81844329833984, -114.82234191894531, -109.82623291015625, -104.83012390136719, -99.83402252197266, -94.83792114257812, -89.84181213378906, -84.845703125, -79.84960174560547, -74.85350036621094, -69.85739135742188, -64.86128234863281, -59.86518096923828, -54.869075775146484, -49.87297058105469, -44.87686538696289, -39.880760192871094, -34.8846549987793, -29.8885498046875, -24.892444610595703, -19.896339416503906, -14.90023422241211, -9.904144287109375, -4.908039093017578, 0.08806610107421875, 5.084171295166016, 10.080276489257812, 15.07638168334961, 20.072486877441406, 25.068592071533203, 30.064697265625, 35.0608024597168, 40.056907653808594, 45.05301284790039, 50.04911804199219, 55.045223236083984, 60.04132843017578, 65.03742980957031, 70.03353881835938, 75.02964782714844, 80.02574920654297, 85.0218505859375, 90.01795959472656, 95.01406860351562, 100.01016998291016, 105.00627136230469, 110.00238037109375, 114.99848937988281, 119.99459075927734, 124.99069213867188, 129.98680114746094, 134.98291015625, 139.97900390625, 144.97511291503906, 149.97122192382812]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 0.0, 5.0, 9.0, 19.0, 17.0, 36.0, 58.0, 64.0, 86.0, 152.0, 272.0, 437.0, 699.0, 1219.0, 2161.0, 3951.0, 7097.0, 14550.0, 30791.0, 70494.0, 181620.0, 378698.0, 207841.0, 79922.0, 34469.0, 15934.0, 8056.0, 4348.0, 2294.0, 1323.0, 763.0, 451.0, 267.0, 172.0, 80.0, 54.0, 44.0, 39.0, 24.0, 18.0, 12.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-106.0, -102.93359375, -99.8671875, -96.80078125, -93.734375, -90.66796875, -87.6015625, -84.53515625, -81.46875, -78.40234375, -75.3359375, -72.26953125, -69.203125, -66.13671875, -63.0703125, -60.00390625, -56.9375, -53.87109375, -50.8046875, -47.73828125, -44.671875, -41.60546875, -38.5390625, -35.47265625, -32.40625, -29.33984375, -26.2734375, -23.20703125, -20.140625, -17.07421875, -14.0078125, -10.94140625, -7.875, -4.80859375, -1.7421875, 1.32421875, 4.390625, 7.45703125, 10.5234375, 13.58984375, 16.65625, 19.72265625, 22.7890625, 25.85546875, 28.921875, 31.98828125, 35.0546875, 38.12109375, 41.1875, 44.25390625, 47.3203125, 50.38671875, 53.453125, 56.51953125, 59.5859375, 62.65234375, 65.71875, 68.78515625, 71.8515625, 74.91796875, 77.984375, 81.05078125, 84.1171875, 87.18359375, 90.25]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 5.0, 5.0, 8.0, 10.0, 13.0, 14.0, 16.0, 17.0, 18.0, 28.0, 22.0, 24.0, 31.0, 34.0, 28.0, 29.0, 37.0, 43.0, 44.0, 40.0, 47.0, 48.0, 36.0, 47.0, 35.0, 33.0, 25.0, 30.0, 28.0, 25.0, 28.0, 21.0, 17.0, 16.0, 16.0, 14.0, 11.0, 5.0, 14.0, 9.0, 5.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0], "bins": [-41.9375, -40.8017578125, -39.666015625, -38.5302734375, -37.39453125, -36.2587890625, -35.123046875, -33.9873046875, -32.8515625, -31.7158203125, -30.580078125, -29.4443359375, -28.30859375, -27.1728515625, -26.037109375, -24.9013671875, -23.765625, -22.6298828125, -21.494140625, -20.3583984375, -19.22265625, -18.0869140625, -16.951171875, -15.8154296875, -14.6796875, -13.5439453125, -12.408203125, -11.2724609375, -10.13671875, -9.0009765625, -7.865234375, -6.7294921875, -5.59375, -4.4580078125, -3.322265625, -2.1865234375, -1.05078125, 0.0849609375, 1.220703125, 2.3564453125, 3.4921875, 4.6279296875, 5.763671875, 6.8994140625, 8.03515625, 9.1708984375, 10.306640625, 11.4423828125, 12.578125, 13.7138671875, 14.849609375, 15.9853515625, 17.12109375, 18.2568359375, 19.392578125, 20.5283203125, 21.6640625, 22.7998046875, 23.935546875, 25.0712890625, 26.20703125, 27.3427734375, 28.478515625, 29.6142578125, 30.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 10.0, 18.0, 20.0, 45.0, 74.0, 86.0, 166.0, 278.0, 526.0, 1009.0, 2288.0, 6385.0, 21885.0, 124794.0, 718002.0, 137959.0, 23607.0, 6683.0, 2404.0, 1086.0, 496.0, 274.0, 151.0, 102.0, 55.0, 40.0, 23.0, 15.0, 13.0, 9.0, 12.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.75, -175.146484375, -168.54296875, -161.939453125, -155.3359375, -148.732421875, -142.12890625, -135.525390625, -128.921875, -122.318359375, -115.71484375, -109.111328125, -102.5078125, -95.904296875, -89.30078125, -82.697265625, -76.09375, -69.490234375, -62.88671875, -56.283203125, -49.6796875, -43.076171875, -36.47265625, -29.869140625, -23.265625, -16.662109375, -10.05859375, -3.455078125, 3.1484375, 9.751953125, 16.35546875, 22.958984375, 29.5625, 36.166015625, 42.76953125, 49.373046875, 55.9765625, 62.580078125, 69.18359375, 75.787109375, 82.390625, 88.994140625, 95.59765625, 102.201171875, 108.8046875, 115.408203125, 122.01171875, 128.615234375, 135.21875, 141.822265625, 148.42578125, 155.029296875, 161.6328125, 168.236328125, 174.83984375, 181.443359375, 188.046875, 194.650390625, 201.25390625, 207.857421875, 214.4609375, 221.064453125, 227.66796875, 234.271484375, 240.875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 11.0, 8.0, 12.0, 18.0, 27.0, 17.0, 24.0, 26.0, 32.0, 40.0, 36.0, 34.0, 52.0, 43.0, 46.0, 41.0, 50.0, 54.0, 45.0, 38.0, 50.0, 33.0, 29.0, 36.0, 28.0, 27.0, 19.0, 18.0, 13.0, 6.0, 15.0, 13.0, 3.0, 5.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-195.875, -190.046875, -184.21875, -178.390625, -172.5625, -166.734375, -160.90625, -155.078125, -149.25, -143.421875, -137.59375, -131.765625, -125.9375, -120.109375, -114.28125, -108.453125, -102.625, -96.796875, -90.96875, -85.140625, -79.3125, -73.484375, -67.65625, -61.828125, -56.0, -50.171875, -44.34375, -38.515625, -32.6875, -26.859375, -21.03125, -15.203125, -9.375, -3.546875, 2.28125, 8.109375, 13.9375, 19.765625, 25.59375, 31.421875, 37.25, 43.078125, 48.90625, 54.734375, 60.5625, 66.390625, 72.21875, 78.046875, 83.875, 89.703125, 95.53125, 101.359375, 107.1875, 113.015625, 118.84375, 124.671875, 130.5, 136.328125, 142.15625, 147.984375, 153.8125, 159.640625, 165.46875, 171.296875, 177.125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 24.0, 28.0, 39.0, 72.0, 89.0, 189.0, 335.0, 675.0, 1368.0, 3252.0, 8967.0, 36706.0, 463821.0, 480612.0, 37553.0, 8658.0, 3123.0, 1340.0, 702.0, 389.0, 246.0, 126.0, 71.0, 56.0, 23.0, 18.0, 16.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-103.625, -100.4853515625, -97.345703125, -94.2060546875, -91.06640625, -87.9267578125, -84.787109375, -81.6474609375, -78.5078125, -75.3681640625, -72.228515625, -69.0888671875, -65.94921875, -62.8095703125, -59.669921875, -56.5302734375, -53.390625, -50.2509765625, -47.111328125, -43.9716796875, -40.83203125, -37.6923828125, -34.552734375, -31.4130859375, -28.2734375, -25.1337890625, -21.994140625, -18.8544921875, -15.71484375, -12.5751953125, -9.435546875, -6.2958984375, -3.15625, -0.0166015625, 3.123046875, 6.2626953125, 9.40234375, 12.5419921875, 15.681640625, 18.8212890625, 21.9609375, 25.1005859375, 28.240234375, 31.3798828125, 34.51953125, 37.6591796875, 40.798828125, 43.9384765625, 47.078125, 50.2177734375, 53.357421875, 56.4970703125, 59.63671875, 62.7763671875, 65.916015625, 69.0556640625, 72.1953125, 75.3349609375, 78.474609375, 81.6142578125, 84.75390625, 87.8935546875, 91.033203125, 94.1728515625, 97.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 13.0, 21.0, 28.0, 48.0, 82.0, 156.0, 228.0, 182.0, 114.0, 60.0, 30.0, 9.0, 7.0, 9.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022216796875, -0.020956993103027344, -0.019697189331054688, -0.01843738555908203, -0.017177581787109375, -0.01591777801513672, -0.014657974243164062, -0.013398170471191406, -0.01213836669921875, -0.010878562927246094, -0.009618759155273438, -0.008358955383300781, -0.007099151611328125, -0.005839347839355469, -0.0045795440673828125, -0.0033197402954101562, -0.0020599365234375, -0.0008001327514648438, 0.0004596710205078125, 0.0017194747924804688, 0.002979278564453125, 0.004239082336425781, 0.0054988861083984375, 0.006758689880371094, 0.00801849365234375, 0.009278297424316406, 0.010538101196289062, 0.011797904968261719, 0.013057708740234375, 0.014317512512207031, 0.015577316284179688, 0.016837120056152344, 0.018096923828125, 0.019356727600097656, 0.020616531372070312, 0.02187633514404297, 0.023136138916015625, 0.02439594268798828, 0.025655746459960938, 0.026915550231933594, 0.02817535400390625, 0.029435157775878906, 0.030694961547851562, 0.03195476531982422, 0.033214569091796875, 0.03447437286376953, 0.03573417663574219, 0.036993980407714844, 0.0382537841796875, 0.039513587951660156, 0.04077339172363281, 0.04203319549560547, 0.043292999267578125, 0.04455280303955078, 0.04581260681152344, 0.047072410583496094, 0.04833221435546875, 0.049592018127441406, 0.05085182189941406, 0.05211162567138672, 0.053371429443359375, 0.05463123321533203, 0.05589103698730469, 0.057150840759277344, 0.05841064453125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 13.0, 17.0, 27.0, 34.0, 70.0, 109.0, 154.0, 361.0, 752.0, 1953.0, 6387.0, 41782.0, 778075.0, 198024.0, 15166.0, 3355.0, 1092.0, 503.0, 295.0, 127.0, 87.0, 47.0, 24.0, 20.0, 14.0, 19.0, 6.0, 10.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-134.5, -129.98046875, -125.4609375, -120.94140625, -116.421875, -111.90234375, -107.3828125, -102.86328125, -98.34375, -93.82421875, -89.3046875, -84.78515625, -80.265625, -75.74609375, -71.2265625, -66.70703125, -62.1875, -57.66796875, -53.1484375, -48.62890625, -44.109375, -39.58984375, -35.0703125, -30.55078125, -26.03125, -21.51171875, -16.9921875, -12.47265625, -7.953125, -3.43359375, 1.0859375, 5.60546875, 10.125, 14.64453125, 19.1640625, 23.68359375, 28.203125, 32.72265625, 37.2421875, 41.76171875, 46.28125, 50.80078125, 55.3203125, 59.83984375, 64.359375, 68.87890625, 73.3984375, 77.91796875, 82.4375, 86.95703125, 91.4765625, 95.99609375, 100.515625, 105.03515625, 109.5546875, 114.07421875, 118.59375, 123.11328125, 127.6328125, 132.15234375, 136.671875, 141.19140625, 145.7109375, 150.23046875, 154.75]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 5.0, 8.0, 15.0, 8.0, 23.0, 34.0, 60.0, 63.0, 120.0, 118.0, 128.0, 135.0, 92.0, 63.0, 33.0, 33.0, 16.0, 11.0, 8.0, 9.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.28125, -52.42529296875, -49.5693359375, -46.71337890625, -43.857421875, -41.00146484375, -38.1455078125, -35.28955078125, -32.43359375, -29.57763671875, -26.7216796875, -23.86572265625, -21.009765625, -18.15380859375, -15.2978515625, -12.44189453125, -9.5859375, -6.72998046875, -3.8740234375, -1.01806640625, 1.837890625, 4.69384765625, 7.5498046875, 10.40576171875, 13.26171875, 16.11767578125, 18.9736328125, 21.82958984375, 24.685546875, 27.54150390625, 30.3974609375, 33.25341796875, 36.109375, 38.96533203125, 41.8212890625, 44.67724609375, 47.533203125, 50.38916015625, 53.2451171875, 56.10107421875, 58.95703125, 61.81298828125, 64.6689453125, 67.52490234375, 70.380859375, 73.23681640625, 76.0927734375, 78.94873046875, 81.8046875, 84.66064453125, 87.5166015625, 90.37255859375, 93.228515625, 96.08447265625, 98.9404296875, 101.79638671875, 104.65234375, 107.50830078125, 110.3642578125, 113.22021484375, 116.076171875, 118.93212890625, 121.7880859375, 124.64404296875, 127.5]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 12.0, 22.0, 59.0, 108.0, 207.0, 242.0, 176.0, 78.0, 47.0, 23.0, 17.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3731.10546875, -3645.3759765625, -3559.646484375, -3473.9169921875, -3388.1875, -3302.458251953125, -3216.728759765625, -3130.999267578125, -3045.269775390625, -2959.540283203125, -2873.810791015625, -2788.081298828125, -2702.35205078125, -2616.62255859375, -2530.89306640625, -2445.16357421875, -2359.43408203125, -2273.70458984375, -2187.97509765625, -2102.24560546875, -2016.5162353515625, -1930.7867431640625, -1845.057373046875, -1759.327880859375, -1673.598388671875, -1587.868896484375, -1502.139404296875, -1416.4100341796875, -1330.6805419921875, -1244.9510498046875, -1159.2216796875, -1073.4921875, -987.7628173828125, -902.0333251953125, -816.3038940429688, -730.574462890625, -644.844970703125, -559.115478515625, -473.38604736328125, -387.6566162109375, -301.9271240234375, -216.19766235351562, -130.46820068359375, -44.738739013671875, 40.99072265625, 126.72018432617188, 212.44964599609375, 298.1790771484375, 383.9085693359375, 469.6380310058594, 555.3674926757812, 641.096923828125, 726.826416015625, 812.555908203125, 898.2853393554688, 984.0147705078125, 1069.7442626953125, 1155.4737548828125, 1241.203125, 1326.9326171875, 1412.662109375, 1498.3916015625, 1584.12109375, 1669.8504638671875, 1755.5799560546875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 10.0, 8.0, 13.0, 19.0, 17.0, 21.0, 15.0, 19.0, 31.0, 37.0, 38.0, 46.0, 54.0, 69.0, 54.0, 58.0, 59.0, 47.0, 50.0, 59.0, 37.0, 42.0, 35.0, 34.0, 34.0, 18.0, 20.0, 13.0, 13.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1028.7578125, -993.9733276367188, -959.1888427734375, -924.4044189453125, -889.6199340820312, -854.83544921875, -820.051025390625, -785.2665405273438, -750.4820556640625, -715.6975708007812, -680.9130859375, -646.128662109375, -611.3441772460938, -576.5596923828125, -541.7752685546875, -506.99078369140625, -472.206298828125, -437.42181396484375, -402.6373596191406, -367.8529052734375, -333.06842041015625, -298.283935546875, -263.4994812011719, -228.7150115966797, -193.9305419921875, -159.1460723876953, -124.36160278320312, -89.57713317871094, -54.79266357421875, -20.008193969726562, 14.776275634765625, 49.56074523925781, 84.3453369140625, 119.12980651855469, 153.91427612304688, 188.69874572753906, 223.48321533203125, 258.2677001953125, 293.0521545410156, 327.83660888671875, 362.62109375, 397.40557861328125, 432.1900329589844, 466.9744873046875, 501.75897216796875, 536.54345703125, 571.327880859375, 606.1123657226562, 640.8968505859375, 675.6813354492188, 710.4658203125, 745.250244140625, 780.0347290039062, 814.8192138671875, 849.6036376953125, 884.3881225585938, 919.172607421875, 953.9570922851562, 988.7415771484375, 1023.5260009765625, 1058.310546875, 1093.094970703125, 1127.87939453125, 1162.6639404296875, 1197.4483642578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 9.0, 5.0, 12.0, 19.0, 16.0, 27.0, 24.0, 35.0, 42.0, 76.0, 64.0, 112.0, 128.0, 181.0, 209.0, 283.0, 393.0, 600.0, 915.0, 1767.0, 5137.0, 4165384.0, 12410.0, 2703.0, 1206.0, 662.0, 416.0, 348.0, 249.0, 173.0, 161.0, 112.0, 91.0, 65.0, 64.0, 41.0, 26.0, 27.0, 18.0, 18.0, 15.0, 7.0, 3.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-291.5, -282.58984375, -273.6796875, -264.76953125, -255.859375, -246.94921875, -238.0390625, -229.12890625, -220.21875, -211.30859375, -202.3984375, -193.48828125, -184.578125, -175.66796875, -166.7578125, -157.84765625, -148.9375, -140.02734375, -131.1171875, -122.20703125, -113.296875, -104.38671875, -95.4765625, -86.56640625, -77.65625, -68.74609375, -59.8359375, -50.92578125, -42.015625, -33.10546875, -24.1953125, -15.28515625, -6.375, 2.53515625, 11.4453125, 20.35546875, 29.265625, 38.17578125, 47.0859375, 55.99609375, 64.90625, 73.81640625, 82.7265625, 91.63671875, 100.546875, 109.45703125, 118.3671875, 127.27734375, 136.1875, 145.09765625, 154.0078125, 162.91796875, 171.828125, 180.73828125, 189.6484375, 198.55859375, 207.46875, 216.37890625, 225.2890625, 234.19921875, 243.109375, 252.01953125, 260.9296875, 269.83984375, 278.75]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 12.0, 9.0, 17.0, 12.0, 13.0, 27.0, 19.0, 28.0, 35.0, 38.0, 39.0, 46.0, 36.0, 52.0, 54.0, 57.0, 53.0, 46.0, 51.0, 54.0, 42.0, 48.0, 37.0, 32.0, 18.0, 15.0, 14.0, 18.0, 18.0, 11.0, 11.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.75, -44.26318359375, -42.7763671875, -41.28955078125, -39.802734375, -38.31591796875, -36.8291015625, -35.34228515625, -33.85546875, -32.36865234375, -30.8818359375, -29.39501953125, -27.908203125, -26.42138671875, -24.9345703125, -23.44775390625, -21.9609375, -20.47412109375, -18.9873046875, -17.50048828125, -16.013671875, -14.52685546875, -13.0400390625, -11.55322265625, -10.06640625, -8.57958984375, -7.0927734375, -5.60595703125, -4.119140625, -2.63232421875, -1.1455078125, 0.34130859375, 1.828125, 3.31494140625, 4.8017578125, 6.28857421875, 7.775390625, 9.26220703125, 10.7490234375, 12.23583984375, 13.72265625, 15.20947265625, 16.6962890625, 18.18310546875, 19.669921875, 21.15673828125, 22.6435546875, 24.13037109375, 25.6171875, 27.10400390625, 28.5908203125, 30.07763671875, 31.564453125, 33.05126953125, 34.5380859375, 36.02490234375, 37.51171875, 38.99853515625, 40.4853515625, 41.97216796875, 43.458984375, 44.94580078125, 46.4326171875, 47.91943359375, 49.40625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 4.0, 14.0, 20.0, 17.0, 26.0, 38.0, 40.0, 51.0, 72.0, 103.0, 120.0, 204.0, 260.0, 427.0, 655.0, 1186.0, 2632.0, 10167.0, 4155381.0, 15990.0, 3249.0, 1374.0, 731.0, 435.0, 306.0, 217.0, 144.0, 107.0, 92.0, 50.0, 39.0, 20.0, 24.0, 18.0, 22.0, 9.0, 12.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-380.75, -368.69921875, -356.6484375, -344.59765625, -332.546875, -320.49609375, -308.4453125, -296.39453125, -284.34375, -272.29296875, -260.2421875, -248.19140625, -236.140625, -224.08984375, -212.0390625, -199.98828125, -187.9375, -175.88671875, -163.8359375, -151.78515625, -139.734375, -127.68359375, -115.6328125, -103.58203125, -91.53125, -79.48046875, -67.4296875, -55.37890625, -43.328125, -31.27734375, -19.2265625, -7.17578125, 4.875, 16.92578125, 28.9765625, 41.02734375, 53.078125, 65.12890625, 77.1796875, 89.23046875, 101.28125, 113.33203125, 125.3828125, 137.43359375, 149.484375, 161.53515625, 173.5859375, 185.63671875, 197.6875, 209.73828125, 221.7890625, 233.83984375, 245.890625, 257.94140625, 269.9921875, 282.04296875, 294.09375, 306.14453125, 318.1953125, 330.24609375, 342.296875, 354.34765625, 366.3984375, 378.44921875, 390.5]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 16.0, 3904.0, 102.0, 19.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -79.7314453125, -77.150390625, -74.5693359375, -71.98828125, -69.4072265625, -66.826171875, -64.2451171875, -61.6640625, -59.0830078125, -56.501953125, -53.9208984375, -51.33984375, -48.7587890625, -46.177734375, -43.5966796875, -41.015625, -38.4345703125, -35.853515625, -33.2724609375, -30.69140625, -28.1103515625, -25.529296875, -22.9482421875, -20.3671875, -17.7861328125, -15.205078125, -12.6240234375, -10.04296875, -7.4619140625, -4.880859375, -2.2998046875, 0.28125, 2.8623046875, 5.443359375, 8.0244140625, 10.60546875, 13.1865234375, 15.767578125, 18.3486328125, 20.9296875, 23.5107421875, 26.091796875, 28.6728515625, 31.25390625, 33.8349609375, 36.416015625, 38.9970703125, 41.578125, 44.1591796875, 46.740234375, 49.3212890625, 51.90234375, 54.4833984375, 57.064453125, 59.6455078125, 62.2265625, 64.8076171875, 67.388671875, 69.9697265625, 72.55078125, 75.1318359375, 77.712890625, 80.2939453125, 82.875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 10.0, 19.0, 11.0, 22.0, 41.0, 63.0, 76.0, 78.0, 85.0, 115.0, 94.0, 100.0, 76.0, 47.0, 43.0, 26.0, 21.0, 15.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.56581115722656, -161.5968017578125, -156.6278076171875, -151.6588134765625, -146.68980407714844, -141.72079467773438, -136.75180053710938, -131.78280639648438, -126.81379699707031, -121.84479522705078, -116.87579345703125, -111.90679168701172, -106.93778991699219, -101.96878814697266, -96.99978637695312, -92.0307846069336, -87.06178283691406, -82.09278106689453, -77.123779296875, -72.15477752685547, -67.18577575683594, -62.216773986816406, -57.247772216796875, -52.278770446777344, -47.30976867675781, -42.34076690673828, -37.37176513671875, -32.40276336669922, -27.433761596679688, -22.464759826660156, -17.495758056640625, -12.526756286621094, -7.5577392578125, -2.5887374877929688, 2.3802642822265625, 7.349266052246094, 12.318267822265625, 17.287269592285156, 22.256271362304688, 27.22527313232422, 32.19427490234375, 37.16327667236328, 42.13227844238281, 47.101280212402344, 52.070281982421875, 57.039283752441406, 62.00828552246094, 66.97728729248047, 71.9462890625, 76.91529083251953, 81.88429260253906, 86.8532943725586, 91.82229614257812, 96.79129791259766, 101.76029968261719, 106.72930145263672, 111.69830322265625, 116.66730499267578, 121.63630676269531, 126.60530853271484, 131.57431030273438, 136.54330444335938, 141.51231384277344, 146.4813232421875, 151.4503173828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 11.0, 17.0, 9.0, 16.0, 13.0, 22.0, 16.0, 22.0, 28.0, 37.0, 25.0, 40.0, 29.0, 35.0, 49.0, 44.0, 47.0, 40.0, 47.0, 31.0, 34.0, 42.0, 37.0, 29.0, 37.0, 20.0, 33.0, 25.0, 26.0, 23.0, 13.0, 14.0, 19.0, 7.0, 9.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.51296997070312, -74.08256530761719, -71.65216064453125, -69.22174835205078, -66.79134368896484, -64.3609390258789, -61.93053436279297, -59.500125885009766, -57.06971740722656, -54.639312744140625, -52.20890426635742, -49.778499603271484, -47.34809112548828, -44.917686462402344, -42.487281799316406, -40.0568733215332, -37.626468658447266, -35.19606399536133, -32.765655517578125, -30.335250854492188, -27.904842376708984, -25.474437713623047, -23.044031143188477, -20.613624572753906, -18.183218002319336, -15.752811431884766, -13.322404861450195, -10.891999244689941, -8.461592674255371, -6.031186103820801, -3.600780487060547, -1.1703739166259766, 1.2600326538085938, 3.690438985824585, 6.120845317840576, 8.551251411437988, 10.981657981872559, 13.412064552307129, 15.842470169067383, 18.272876739501953, 20.703283309936523, 23.133689880371094, 25.564096450805664, 27.994503021240234, 30.424907684326172, 32.855316162109375, 35.28572082519531, 37.71612548828125, 40.14653396606445, 42.57693862915039, 45.007347106933594, 47.43775177001953, 49.868160247802734, 52.29856491088867, 54.728973388671875, 57.15937805175781, 59.58978271484375, 62.02018737792969, 64.45059204101562, 66.8810043334961, 69.31140899658203, 71.74181365966797, 74.1722183227539, 76.60263061523438, 79.03303527832031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 9.0, 13.0, 17.0, 18.0, 28.0, 50.0, 63.0, 93.0, 145.0, 226.0, 292.0, 510.0, 727.0, 1228.0, 2205.0, 4259.0, 9036.0, 22181.0, 63455.0, 233213.0, 496910.0, 140574.0, 42745.0, 15744.0, 6734.0, 3303.0, 1810.0, 1061.0, 655.0, 411.0, 250.0, 203.0, 113.0, 83.0, 50.0, 46.0, 22.0, 19.0, 18.0, 13.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-132.5, -128.400390625, -124.30078125, -120.201171875, -116.1015625, -112.001953125, -107.90234375, -103.802734375, -99.703125, -95.603515625, -91.50390625, -87.404296875, -83.3046875, -79.205078125, -75.10546875, -71.005859375, -66.90625, -62.806640625, -58.70703125, -54.607421875, -50.5078125, -46.408203125, -42.30859375, -38.208984375, -34.109375, -30.009765625, -25.91015625, -21.810546875, -17.7109375, -13.611328125, -9.51171875, -5.412109375, -1.3125, 2.787109375, 6.88671875, 10.986328125, 15.0859375, 19.185546875, 23.28515625, 27.384765625, 31.484375, 35.583984375, 39.68359375, 43.783203125, 47.8828125, 51.982421875, 56.08203125, 60.181640625, 64.28125, 68.380859375, 72.48046875, 76.580078125, 80.6796875, 84.779296875, 88.87890625, 92.978515625, 97.078125, 101.177734375, 105.27734375, 109.376953125, 113.4765625, 117.576171875, 121.67578125, 125.775390625, 129.875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 10.0, 7.0, 6.0, 19.0, 8.0, 15.0, 22.0, 16.0, 32.0, 36.0, 38.0, 43.0, 36.0, 49.0, 53.0, 53.0, 51.0, 39.0, 54.0, 42.0, 47.0, 31.0, 48.0, 51.0, 34.0, 25.0, 23.0, 18.0, 17.0, 14.0, 10.0, 11.0, 6.0, 7.0, 1.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.78125, -48.2314453125, -46.681640625, -45.1318359375, -43.58203125, -42.0322265625, -40.482421875, -38.9326171875, -37.3828125, -35.8330078125, -34.283203125, -32.7333984375, -31.18359375, -29.6337890625, -28.083984375, -26.5341796875, -24.984375, -23.4345703125, -21.884765625, -20.3349609375, -18.78515625, -17.2353515625, -15.685546875, -14.1357421875, -12.5859375, -11.0361328125, -9.486328125, -7.9365234375, -6.38671875, -4.8369140625, -3.287109375, -1.7373046875, -0.1875, 1.3623046875, 2.912109375, 4.4619140625, 6.01171875, 7.5615234375, 9.111328125, 10.6611328125, 12.2109375, 13.7607421875, 15.310546875, 16.8603515625, 18.41015625, 19.9599609375, 21.509765625, 23.0595703125, 24.609375, 26.1591796875, 27.708984375, 29.2587890625, 30.80859375, 32.3583984375, 33.908203125, 35.4580078125, 37.0078125, 38.5576171875, 40.107421875, 41.6572265625, 43.20703125, 44.7568359375, 46.306640625, 47.8564453125, 49.40625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 15.0, 22.0, 23.0, 43.0, 61.0, 77.0, 145.0, 219.0, 350.0, 622.0, 1250.0, 2873.0, 7816.0, 27196.0, 148564.0, 689299.0, 132217.0, 25100.0, 7295.0, 2611.0, 1165.0, 610.0, 336.0, 199.0, 125.0, 90.0, 41.0, 41.0, 26.0, 22.0, 19.0, 19.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-176.125, -171.015625, -165.90625, -160.796875, -155.6875, -150.578125, -145.46875, -140.359375, -135.25, -130.140625, -125.03125, -119.921875, -114.8125, -109.703125, -104.59375, -99.484375, -94.375, -89.265625, -84.15625, -79.046875, -73.9375, -68.828125, -63.71875, -58.609375, -53.5, -48.390625, -43.28125, -38.171875, -33.0625, -27.953125, -22.84375, -17.734375, -12.625, -7.515625, -2.40625, 2.703125, 7.8125, 12.921875, 18.03125, 23.140625, 28.25, 33.359375, 38.46875, 43.578125, 48.6875, 53.796875, 58.90625, 64.015625, 69.125, 74.234375, 79.34375, 84.453125, 89.5625, 94.671875, 99.78125, 104.890625, 110.0, 115.109375, 120.21875, 125.328125, 130.4375, 135.546875, 140.65625, 145.765625, 150.875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 5.0, 17.0, 13.0, 21.0, 17.0, 34.0, 29.0, 29.0, 33.0, 43.0, 39.0, 35.0, 50.0, 62.0, 52.0, 56.0, 57.0, 55.0, 54.0, 46.0, 30.0, 32.0, 34.0, 28.0, 27.0, 16.0, 15.0, 12.0, 10.0, 13.0, 7.0, 4.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.375, -183.169921875, -175.96484375, -168.759765625, -161.5546875, -154.349609375, -147.14453125, -139.939453125, -132.734375, -125.529296875, -118.32421875, -111.119140625, -103.9140625, -96.708984375, -89.50390625, -82.298828125, -75.09375, -67.888671875, -60.68359375, -53.478515625, -46.2734375, -39.068359375, -31.86328125, -24.658203125, -17.453125, -10.248046875, -3.04296875, 4.162109375, 11.3671875, 18.572265625, 25.77734375, 32.982421875, 40.1875, 47.392578125, 54.59765625, 61.802734375, 69.0078125, 76.212890625, 83.41796875, 90.623046875, 97.828125, 105.033203125, 112.23828125, 119.443359375, 126.6484375, 133.853515625, 141.05859375, 148.263671875, 155.46875, 162.673828125, 169.87890625, 177.083984375, 184.2890625, 191.494140625, 198.69921875, 205.904296875, 213.109375, 220.314453125, 227.51953125, 234.724609375, 241.9296875, 249.134765625, 256.33984375, 263.544921875, 270.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 14.0, 16.0, 36.0, 64.0, 163.0, 449.0, 1240.0, 4621.0, 36494.0, 915505.0, 80618.0, 6809.0, 1616.0, 525.0, 184.0, 84.0, 41.0, 24.0, 15.0, 4.0, 9.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-209.25, -203.83203125, -198.4140625, -192.99609375, -187.578125, -182.16015625, -176.7421875, -171.32421875, -165.90625, -160.48828125, -155.0703125, -149.65234375, -144.234375, -138.81640625, -133.3984375, -127.98046875, -122.5625, -117.14453125, -111.7265625, -106.30859375, -100.890625, -95.47265625, -90.0546875, -84.63671875, -79.21875, -73.80078125, -68.3828125, -62.96484375, -57.546875, -52.12890625, -46.7109375, -41.29296875, -35.875, -30.45703125, -25.0390625, -19.62109375, -14.203125, -8.78515625, -3.3671875, 2.05078125, 7.46875, 12.88671875, 18.3046875, 23.72265625, 29.140625, 34.55859375, 39.9765625, 45.39453125, 50.8125, 56.23046875, 61.6484375, 67.06640625, 72.484375, 77.90234375, 83.3203125, 88.73828125, 94.15625, 99.57421875, 104.9921875, 110.41015625, 115.828125, 121.24609375, 126.6640625, 132.08203125, 137.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 3.0, 11.0, 8.0, 9.0, 18.0, 26.0, 24.0, 36.0, 52.0, 81.0, 153.0, 151.0, 126.0, 83.0, 60.0, 39.0, 28.0, 21.0, 18.0, 10.0, 10.0, 9.0, 8.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01995849609375, -0.019141197204589844, -0.018323898315429688, -0.01750659942626953, -0.016689300537109375, -0.01587200164794922, -0.015054702758789062, -0.014237403869628906, -0.01342010498046875, -0.012602806091308594, -0.011785507202148438, -0.010968208312988281, -0.010150909423828125, -0.009333610534667969, -0.008516311645507812, -0.007699012756347656, -0.0068817138671875, -0.006064414978027344, -0.0052471160888671875, -0.004429817199707031, -0.003612518310546875, -0.0027952194213867188, -0.0019779205322265625, -0.0011606216430664062, -0.00034332275390625, 0.00047397613525390625, 0.0012912750244140625, 0.0021085739135742188, 0.002925872802734375, 0.0037431716918945312, 0.0045604705810546875, 0.005377769470214844, 0.006195068359375, 0.007012367248535156, 0.007829666137695312, 0.008646965026855469, 0.009464263916015625, 0.010281562805175781, 0.011098861694335938, 0.011916160583496094, 0.01273345947265625, 0.013550758361816406, 0.014368057250976562, 0.015185356140136719, 0.016002655029296875, 0.01681995391845703, 0.017637252807617188, 0.018454551696777344, 0.0192718505859375, 0.020089149475097656, 0.020906448364257812, 0.02172374725341797, 0.022541046142578125, 0.02335834503173828, 0.024175643920898438, 0.024992942810058594, 0.02581024169921875, 0.026627540588378906, 0.027444839477539062, 0.02826213836669922, 0.029079437255859375, 0.02989673614501953, 0.030714035034179688, 0.031531333923339844, 0.0323486328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 15.0, 7.0, 10.0, 23.0, 40.0, 87.0, 106.0, 255.0, 658.0, 3243.0, 46045.0, 951014.0, 42775.0, 3096.0, 648.0, 248.0, 111.0, 62.0, 38.0, 26.0, 15.0, 12.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-178.375, -171.376953125, -164.37890625, -157.380859375, -150.3828125, -143.384765625, -136.38671875, -129.388671875, -122.390625, -115.392578125, -108.39453125, -101.396484375, -94.3984375, -87.400390625, -80.40234375, -73.404296875, -66.40625, -59.408203125, -52.41015625, -45.412109375, -38.4140625, -31.416015625, -24.41796875, -17.419921875, -10.421875, -3.423828125, 3.57421875, 10.572265625, 17.5703125, 24.568359375, 31.56640625, 38.564453125, 45.5625, 52.560546875, 59.55859375, 66.556640625, 73.5546875, 80.552734375, 87.55078125, 94.548828125, 101.546875, 108.544921875, 115.54296875, 122.541015625, 129.5390625, 136.537109375, 143.53515625, 150.533203125, 157.53125, 164.529296875, 171.52734375, 178.525390625, 185.5234375, 192.521484375, 199.51953125, 206.517578125, 213.515625, 220.513671875, 227.51171875, 234.509765625, 241.5078125, 248.505859375, 255.50390625, 262.501953125, 269.5]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 9.0, 9.0, 25.0, 43.0, 110.0, 216.0, 314.0, 154.0, 59.0, 33.0, 21.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.25, -102.11328125, -94.9765625, -87.83984375, -80.703125, -73.56640625, -66.4296875, -59.29296875, -52.15625, -45.01953125, -37.8828125, -30.74609375, -23.609375, -16.47265625, -9.3359375, -2.19921875, 4.9375, 12.07421875, 19.2109375, 26.34765625, 33.484375, 40.62109375, 47.7578125, 54.89453125, 62.03125, 69.16796875, 76.3046875, 83.44140625, 90.578125, 97.71484375, 104.8515625, 111.98828125, 119.125, 126.26171875, 133.3984375, 140.53515625, 147.671875, 154.80859375, 161.9453125, 169.08203125, 176.21875, 183.35546875, 190.4921875, 197.62890625, 204.765625, 211.90234375, 219.0390625, 226.17578125, 233.3125, 240.44921875, 247.5859375, 254.72265625, 261.859375, 268.99609375, 276.1328125, 283.26953125, 290.40625, 297.54296875, 304.6796875, 311.81640625, 318.953125, 326.08984375, 333.2265625, 340.36328125, 347.5]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 26.0, 77.0, 188.0, 304.0, 244.0, 104.0, 35.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2995.394287109375, -2897.577392578125, -2799.760498046875, -2701.943359375, -2604.12646484375, -2506.3095703125, -2408.49267578125, -2310.67578125, -2212.85888671875, -2115.0419921875, -2017.2249755859375, -1919.4080810546875, -1821.591064453125, -1723.774169921875, -1625.957275390625, -1528.140380859375, -1430.3232421875, -1332.50634765625, -1234.6893310546875, -1136.8724365234375, -1039.055419921875, -941.238525390625, -843.421630859375, -745.6046752929688, -647.7877197265625, -549.9707641601562, -452.1538391113281, -354.3369140625, -256.51995849609375, -158.7030029296875, -60.8861083984375, 36.93084716796875, 134.747802734375, 232.5647430419922, 330.3816833496094, 428.1986083984375, 526.0155639648438, 623.83251953125, 721.6494140625, 819.4663696289062, 917.2833251953125, 1015.1002807617188, 1112.917236328125, 1210.734130859375, 1308.551025390625, 1406.3680419921875, 1504.1849365234375, 1602.001953125, 1699.81884765625, 1797.6357421875, 1895.4527587890625, 1993.2696533203125, 2091.086669921875, 2188.903564453125, 2286.720458984375, 2384.537353515625, 2482.3544921875, 2580.17138671875, 2677.98828125, 2775.80517578125, 2873.622314453125, 2971.439208984375, 3069.256103515625, 3167.072998046875, 3264.889892578125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 8.0, 7.0, 7.0, 12.0, 9.0, 12.0, 14.0, 14.0, 15.0, 17.0, 19.0, 23.0, 26.0, 29.0, 33.0, 30.0, 39.0, 45.0, 50.0, 50.0, 39.0, 47.0, 56.0, 50.0, 47.0, 37.0, 25.0, 32.0, 25.0, 23.0, 23.0, 21.0, 14.0, 19.0, 10.0, 16.0, 9.0, 7.0, 4.0, 3.0, 1.0, 8.0, 5.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-890.6057739257812, -863.0966796875, -835.587646484375, -808.0785522460938, -780.5695190429688, -753.0604248046875, -725.5513916015625, -698.0422973632812, -670.533203125, -643.0241088867188, -615.5150756835938, -588.0059814453125, -560.4969482421875, -532.9878540039062, -505.4787902832031, -477.9697265625, -450.460693359375, -422.9516296386719, -395.44256591796875, -367.9334716796875, -340.4244384765625, -312.91534423828125, -285.4062805175781, -257.897216796875, -230.38815307617188, -202.87908935546875, -175.37002563476562, -147.86094665527344, -120.35188293457031, -92.84281921386719, -65.333740234375, -37.824676513671875, -10.3155517578125, 17.19351577758789, 44.70258331298828, 72.21165466308594, 99.72071838378906, 127.22978210449219, 154.73886108398438, 182.2479248046875, 209.75698852539062, 237.26605224609375, 264.7751159667969, 292.2841796875, 319.79327392578125, 347.30230712890625, 374.8114013671875, 402.3204650878906, 429.82952880859375, 457.3385925292969, 484.84765625, 512.3567504882812, 539.8657836914062, 567.3748779296875, 594.8839111328125, 622.3930053710938, 649.902099609375, 677.4111938476562, 704.9202270507812, 732.4293212890625, 759.9383544921875, 787.4474487304688, 814.95654296875, 842.465576171875, 869.974609375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 17.0, 15.0, 15.0, 36.0, 36.0, 46.0, 55.0, 74.0, 95.0, 116.0, 218.0, 281.0, 435.0, 709.0, 1223.0, 2188.0, 4830.0, 15213.0, 4094330.0, 58181.0, 8412.0, 3318.0, 1690.0, 883.0, 569.0, 378.0, 229.0, 170.0, 115.0, 89.0, 52.0, 61.0, 43.0, 32.0, 25.0, 17.0, 15.0, 13.0, 14.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-258.5, -250.3671875, -242.234375, -234.1015625, -225.96875, -217.8359375, -209.703125, -201.5703125, -193.4375, -185.3046875, -177.171875, -169.0390625, -160.90625, -152.7734375, -144.640625, -136.5078125, -128.375, -120.2421875, -112.109375, -103.9765625, -95.84375, -87.7109375, -79.578125, -71.4453125, -63.3125, -55.1796875, -47.046875, -38.9140625, -30.78125, -22.6484375, -14.515625, -6.3828125, 1.75, 9.8828125, 18.015625, 26.1484375, 34.28125, 42.4140625, 50.546875, 58.6796875, 66.8125, 74.9453125, 83.078125, 91.2109375, 99.34375, 107.4765625, 115.609375, 123.7421875, 131.875, 140.0078125, 148.140625, 156.2734375, 164.40625, 172.5390625, 180.671875, 188.8046875, 196.9375, 205.0703125, 213.203125, 221.3359375, 229.46875, 237.6015625, 245.734375, 253.8671875, 262.0]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 5.0, 11.0, 6.0, 12.0, 14.0, 18.0, 24.0, 23.0, 37.0, 33.0, 33.0, 36.0, 44.0, 56.0, 43.0, 46.0, 50.0, 57.0, 49.0, 43.0, 32.0, 51.0, 39.0, 33.0, 43.0, 17.0, 19.0, 15.0, 18.0, 12.0, 7.0, 13.0, 9.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.0, -45.47607421875, -43.9521484375, -42.42822265625, -40.904296875, -39.38037109375, -37.8564453125, -36.33251953125, -34.80859375, -33.28466796875, -31.7607421875, -30.23681640625, -28.712890625, -27.18896484375, -25.6650390625, -24.14111328125, -22.6171875, -21.09326171875, -19.5693359375, -18.04541015625, -16.521484375, -14.99755859375, -13.4736328125, -11.94970703125, -10.42578125, -8.90185546875, -7.3779296875, -5.85400390625, -4.330078125, -2.80615234375, -1.2822265625, 0.24169921875, 1.765625, 3.28955078125, 4.8134765625, 6.33740234375, 7.861328125, 9.38525390625, 10.9091796875, 12.43310546875, 13.95703125, 15.48095703125, 17.0048828125, 18.52880859375, 20.052734375, 21.57666015625, 23.1005859375, 24.62451171875, 26.1484375, 27.67236328125, 29.1962890625, 30.72021484375, 32.244140625, 33.76806640625, 35.2919921875, 36.81591796875, 38.33984375, 39.86376953125, 41.3876953125, 42.91162109375, 44.435546875, 45.95947265625, 47.4833984375, 49.00732421875, 50.53125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 11.0, 20.0, 22.0, 48.0, 49.0, 85.0, 159.0, 222.0, 423.0, 696.0, 1305.0, 2630.0, 5881.0, 19027.0, 3952864.0, 185909.0, 14756.0, 5080.0, 2264.0, 1215.0, 626.0, 370.0, 202.0, 151.0, 86.0, 62.0, 29.0, 21.0, 17.0, 10.0, 15.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-318.75, -308.76171875, -298.7734375, -288.78515625, -278.796875, -268.80859375, -258.8203125, -248.83203125, -238.84375, -228.85546875, -218.8671875, -208.87890625, -198.890625, -188.90234375, -178.9140625, -168.92578125, -158.9375, -148.94921875, -138.9609375, -128.97265625, -118.984375, -108.99609375, -99.0078125, -89.01953125, -79.03125, -69.04296875, -59.0546875, -49.06640625, -39.078125, -29.08984375, -19.1015625, -9.11328125, 0.875, 10.86328125, 20.8515625, 30.83984375, 40.828125, 50.81640625, 60.8046875, 70.79296875, 80.78125, 90.76953125, 100.7578125, 110.74609375, 120.734375, 130.72265625, 140.7109375, 150.69921875, 160.6875, 170.67578125, 180.6640625, 190.65234375, 200.640625, 210.62890625, 220.6171875, 230.60546875, 240.59375, 250.58203125, 260.5703125, 270.55859375, 280.546875, 290.53515625, 300.5234375, 310.51171875, 320.5]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 7.0, 7.0, 13.0, 23.0, 43.0, 125.0, 3644.0, 98.0, 46.0, 12.0, 12.0, 12.0, 6.0, 7.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.25, -106.37890625, -102.5078125, -98.63671875, -94.765625, -90.89453125, -87.0234375, -83.15234375, -79.28125, -75.41015625, -71.5390625, -67.66796875, -63.796875, -59.92578125, -56.0546875, -52.18359375, -48.3125, -44.44140625, -40.5703125, -36.69921875, -32.828125, -28.95703125, -25.0859375, -21.21484375, -17.34375, -13.47265625, -9.6015625, -5.73046875, -1.859375, 2.01171875, 5.8828125, 9.75390625, 13.625, 17.49609375, 21.3671875, 25.23828125, 29.109375, 32.98046875, 36.8515625, 40.72265625, 44.59375, 48.46484375, 52.3359375, 56.20703125, 60.078125, 63.94921875, 67.8203125, 71.69140625, 75.5625, 79.43359375, 83.3046875, 87.17578125, 91.046875, 94.91796875, 98.7890625, 102.66015625, 106.53125, 110.40234375, 114.2734375, 118.14453125, 122.015625, 125.88671875, 129.7578125, 133.62890625, 137.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 8.0, 4.0, 10.0, 15.0, 30.0, 42.0, 58.0, 86.0, 117.0, 136.0, 144.0, 104.0, 76.0, 46.0, 43.0, 28.0, 18.0, 5.0, 6.0, 4.0, 12.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-458.49542236328125, -444.99444580078125, -431.4934387207031, -417.9924621582031, -404.491455078125, -390.990478515625, -377.489501953125, -363.988525390625, -350.4875183105469, -336.9865417480469, -323.48553466796875, -309.98455810546875, -296.48358154296875, -282.9825744628906, -269.4815979003906, -255.98060607910156, -242.4796142578125, -228.97862243652344, -215.47763061523438, -201.97665405273438, -188.4756622314453, -174.97467041015625, -161.47369384765625, -147.9727020263672, -134.47171020507812, -120.97071838378906, -107.46973419189453, -93.96875, -80.46775817871094, -66.96676635742188, -53.465782165527344, -39.96479797363281, -26.463775634765625, -12.962787628173828, 0.5382003784179688, 14.039188385009766, 27.540176391601562, 41.041168212890625, 54.542152404785156, 68.04313659667969, 81.54412841796875, 95.04512023925781, 108.54610443115234, 122.04708862304688, 135.54808044433594, 149.049072265625, 162.550048828125, 176.05104064941406, 189.55203247070312, 203.0530242919922, 216.55401611328125, 230.05499267578125, 243.5559844970703, 257.0569763183594, 270.5579528808594, 284.0589599609375, 297.5599365234375, 311.0609130859375, 324.5619201660156, 338.0628967285156, 351.56390380859375, 365.06488037109375, 378.56585693359375, 392.06683349609375, 405.5678405761719]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 9.0, 22.0, 10.0, 17.0, 20.0, 20.0, 30.0, 32.0, 28.0, 41.0, 42.0, 43.0, 47.0, 51.0, 45.0, 60.0, 55.0, 38.0, 44.0, 39.0, 33.0, 29.0, 36.0, 20.0, 22.0, 19.0, 23.0, 16.0, 16.0, 16.0, 10.0, 6.0, 6.0, 4.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-227.385498046875, -220.46206665039062, -213.5386505126953, -206.61521911621094, -199.69180297851562, -192.76837158203125, -185.84494018554688, -178.9215087890625, -171.9980926513672, -165.0746612548828, -158.1512451171875, -151.22781372070312, -144.30438232421875, -137.38096618652344, -130.45753479003906, -123.53411102294922, -116.61068725585938, -109.68726348876953, -102.76383972167969, -95.84040832519531, -88.91698455810547, -81.99356079101562, -75.07012939453125, -68.1467056274414, -61.22328186035156, -54.29985809326172, -47.37643051147461, -40.4530029296875, -33.529579162597656, -26.606155395507812, -19.682727813720703, -12.759300231933594, -5.8358917236328125, 1.087533950805664, 8.01095962524414, 14.934385299682617, 21.857810974121094, 28.781234741210938, 35.70466232299805, 42.628089904785156, 49.551513671875, 56.474937438964844, 63.39836502075195, 70.32179260253906, 77.2452163696289, 84.16864013671875, 91.09207153320312, 98.01549530029297, 104.93891906738281, 111.86234283447266, 118.7857666015625, 125.70919799804688, 132.63262939453125, 139.55604553222656, 146.47947692871094, 153.40289306640625, 160.32632446289062, 167.249755859375, 174.1731719970703, 181.0966033935547, 188.02001953125, 194.94345092773438, 201.86688232421875, 208.79031372070312, 215.71372985839844]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 10.0, 11.0, 21.0, 43.0, 41.0, 73.0, 112.0, 165.0, 319.0, 468.0, 897.0, 1678.0, 3198.0, 6688.0, 14824.0, 36220.0, 98647.0, 334594.0, 372618.0, 108152.0, 39625.0, 15820.0, 7106.0, 3462.0, 1634.0, 810.0, 512.0, 275.0, 177.0, 104.0, 59.0, 52.0, 43.0, 35.0, 16.0, 13.0, 5.0, 2.0, 4.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.125, -128.541015625, -123.95703125, -119.373046875, -114.7890625, -110.205078125, -105.62109375, -101.037109375, -96.453125, -91.869140625, -87.28515625, -82.701171875, -78.1171875, -73.533203125, -68.94921875, -64.365234375, -59.78125, -55.197265625, -50.61328125, -46.029296875, -41.4453125, -36.861328125, -32.27734375, -27.693359375, -23.109375, -18.525390625, -13.94140625, -9.357421875, -4.7734375, -0.189453125, 4.39453125, 8.978515625, 13.5625, 18.146484375, 22.73046875, 27.314453125, 31.8984375, 36.482421875, 41.06640625, 45.650390625, 50.234375, 54.818359375, 59.40234375, 63.986328125, 68.5703125, 73.154296875, 77.73828125, 82.322265625, 86.90625, 91.490234375, 96.07421875, 100.658203125, 105.2421875, 109.826171875, 114.41015625, 118.994140625, 123.578125, 128.162109375, 132.74609375, 137.330078125, 141.9140625, 146.498046875, 151.08203125, 155.666015625, 160.25]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 10.0, 12.0, 10.0, 14.0, 22.0, 21.0, 36.0, 31.0, 44.0, 45.0, 48.0, 47.0, 67.0, 75.0, 65.0, 55.0, 48.0, 47.0, 55.0, 38.0, 41.0, 32.0, 28.0, 14.0, 11.0, 20.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.27880859375, -61.3076171875, -59.33642578125, -57.365234375, -55.39404296875, -53.4228515625, -51.45166015625, -49.48046875, -47.50927734375, -45.5380859375, -43.56689453125, -41.595703125, -39.62451171875, -37.6533203125, -35.68212890625, -33.7109375, -31.73974609375, -29.7685546875, -27.79736328125, -25.826171875, -23.85498046875, -21.8837890625, -19.91259765625, -17.94140625, -15.97021484375, -13.9990234375, -12.02783203125, -10.056640625, -8.08544921875, -6.1142578125, -4.14306640625, -2.171875, -0.20068359375, 1.7705078125, 3.74169921875, 5.712890625, 7.68408203125, 9.6552734375, 11.62646484375, 13.59765625, 15.56884765625, 17.5400390625, 19.51123046875, 21.482421875, 23.45361328125, 25.4248046875, 27.39599609375, 29.3671875, 31.33837890625, 33.3095703125, 35.28076171875, 37.251953125, 39.22314453125, 41.1943359375, 43.16552734375, 45.13671875, 47.10791015625, 49.0791015625, 51.05029296875, 53.021484375, 54.99267578125, 56.9638671875, 58.93505859375, 60.90625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 4.0, 3.0, 11.0, 20.0, 21.0, 40.0, 41.0, 59.0, 99.0, 110.0, 173.0, 264.0, 390.0, 590.0, 1028.0, 1847.0, 3608.0, 8797.0, 25701.0, 101468.0, 577890.0, 249482.0, 50221.0, 14922.0, 5637.0, 2519.0, 1347.0, 813.0, 460.0, 270.0, 200.0, 152.0, 92.0, 71.0, 55.0, 35.0, 30.0, 14.0, 12.0, 15.0, 11.0, 6.0, 5.0, 0.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-160.875, -155.46875, -150.0625, -144.65625, -139.25, -133.84375, -128.4375, -123.03125, -117.625, -112.21875, -106.8125, -101.40625, -96.0, -90.59375, -85.1875, -79.78125, -74.375, -68.96875, -63.5625, -58.15625, -52.75, -47.34375, -41.9375, -36.53125, -31.125, -25.71875, -20.3125, -14.90625, -9.5, -4.09375, 1.3125, 6.71875, 12.125, 17.53125, 22.9375, 28.34375, 33.75, 39.15625, 44.5625, 49.96875, 55.375, 60.78125, 66.1875, 71.59375, 77.0, 82.40625, 87.8125, 93.21875, 98.625, 104.03125, 109.4375, 114.84375, 120.25, 125.65625, 131.0625, 136.46875, 141.875, 147.28125, 152.6875, 158.09375, 163.5, 168.90625, 174.3125, 179.71875, 185.125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 10.0, 13.0, 13.0, 22.0, 27.0, 28.0, 29.0, 39.0, 40.0, 48.0, 50.0, 52.0, 40.0, 45.0, 58.0, 64.0, 45.0, 52.0, 39.0, 41.0, 40.0, 38.0, 29.0, 22.0, 25.0, 16.0, 13.0, 11.0, 7.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-198.625, -191.095703125, -183.56640625, -176.037109375, -168.5078125, -160.978515625, -153.44921875, -145.919921875, -138.390625, -130.861328125, -123.33203125, -115.802734375, -108.2734375, -100.744140625, -93.21484375, -85.685546875, -78.15625, -70.626953125, -63.09765625, -55.568359375, -48.0390625, -40.509765625, -32.98046875, -25.451171875, -17.921875, -10.392578125, -2.86328125, 4.666015625, 12.1953125, 19.724609375, 27.25390625, 34.783203125, 42.3125, 49.841796875, 57.37109375, 64.900390625, 72.4296875, 79.958984375, 87.48828125, 95.017578125, 102.546875, 110.076171875, 117.60546875, 125.134765625, 132.6640625, 140.193359375, 147.72265625, 155.251953125, 162.78125, 170.310546875, 177.83984375, 185.369140625, 192.8984375, 200.427734375, 207.95703125, 215.486328125, 223.015625, 230.544921875, 238.07421875, 245.603515625, 253.1328125, 260.662109375, 268.19140625, 275.720703125, 283.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 17.0, 14.0, 23.0, 39.0, 79.0, 150.0, 380.0, 953.0, 2970.0, 11800.0, 88416.0, 769582.0, 151107.0, 17012.0, 3863.0, 1206.0, 468.0, 230.0, 91.0, 52.0, 30.0, 21.0, 11.0, 9.0, 10.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.125, -95.369140625, -92.61328125, -89.857421875, -87.1015625, -84.345703125, -81.58984375, -78.833984375, -76.078125, -73.322265625, -70.56640625, -67.810546875, -65.0546875, -62.298828125, -59.54296875, -56.787109375, -54.03125, -51.275390625, -48.51953125, -45.763671875, -43.0078125, -40.251953125, -37.49609375, -34.740234375, -31.984375, -29.228515625, -26.47265625, -23.716796875, -20.9609375, -18.205078125, -15.44921875, -12.693359375, -9.9375, -7.181640625, -4.42578125, -1.669921875, 1.0859375, 3.841796875, 6.59765625, 9.353515625, 12.109375, 14.865234375, 17.62109375, 20.376953125, 23.1328125, 25.888671875, 28.64453125, 31.400390625, 34.15625, 36.912109375, 39.66796875, 42.423828125, 45.1796875, 47.935546875, 50.69140625, 53.447265625, 56.203125, 58.958984375, 61.71484375, 64.470703125, 67.2265625, 69.982421875, 72.73828125, 75.494140625, 78.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 8.0, 13.0, 12.0, 18.0, 19.0, 34.0, 34.0, 36.0, 29.0, 45.0, 54.0, 73.0, 115.0, 81.0, 86.0, 72.0, 44.0, 40.0, 26.0, 27.0, 20.0, 14.0, 14.0, 8.0, 11.0, 14.0, 4.0, 9.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01447296142578125, -0.01399219036102295, -0.013511419296264648, -0.013030648231506348, -0.012549877166748047, -0.012069106101989746, -0.011588335037231445, -0.011107563972473145, -0.010626792907714844, -0.010146021842956543, -0.009665250778198242, -0.009184479713439941, -0.00870370864868164, -0.00822293758392334, -0.007742166519165039, -0.007261395454406738, -0.0067806243896484375, -0.006299853324890137, -0.005819082260131836, -0.005338311195373535, -0.004857540130615234, -0.004376769065856934, -0.003895998001098633, -0.003415226936340332, -0.0029344558715820312, -0.0024536848068237305, -0.0019729137420654297, -0.001492142677307129, -0.0010113716125488281, -0.0005306005477905273, -4.982948303222656e-05, 0.0004309415817260742, 0.000911712646484375, 0.0013924837112426758, 0.0018732547760009766, 0.0023540258407592773, 0.002834796905517578, 0.003315567970275879, 0.0037963390350341797, 0.0042771100997924805, 0.004757881164550781, 0.005238652229309082, 0.005719423294067383, 0.006200194358825684, 0.006680965423583984, 0.007161736488342285, 0.007642507553100586, 0.008123278617858887, 0.008604049682617188, 0.009084820747375488, 0.009565591812133789, 0.01004636287689209, 0.01052713394165039, 0.011007905006408691, 0.011488676071166992, 0.011969447135925293, 0.012450218200683594, 0.012930989265441895, 0.013411760330200195, 0.013892531394958496, 0.014373302459716797, 0.014854073524475098, 0.015334844589233398, 0.0158156156539917, 0.01629638671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 9.0, 9.0, 13.0, 19.0, 24.0, 32.0, 50.0, 77.0, 131.0, 160.0, 314.0, 511.0, 932.0, 1806.0, 4027.0, 10690.0, 39369.0, 221504.0, 606561.0, 122940.0, 25362.0, 7612.0, 2988.0, 1479.0, 755.0, 410.0, 252.0, 159.0, 92.0, 71.0, 57.0, 33.0, 25.0, 20.0, 13.0, 15.0, 5.0, 4.0, 8.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-69.875, -67.84033203125, -65.8056640625, -63.77099609375, -61.736328125, -59.70166015625, -57.6669921875, -55.63232421875, -53.59765625, -51.56298828125, -49.5283203125, -47.49365234375, -45.458984375, -43.42431640625, -41.3896484375, -39.35498046875, -37.3203125, -35.28564453125, -33.2509765625, -31.21630859375, -29.181640625, -27.14697265625, -25.1123046875, -23.07763671875, -21.04296875, -19.00830078125, -16.9736328125, -14.93896484375, -12.904296875, -10.86962890625, -8.8349609375, -6.80029296875, -4.765625, -2.73095703125, -0.6962890625, 1.33837890625, 3.373046875, 5.40771484375, 7.4423828125, 9.47705078125, 11.51171875, 13.54638671875, 15.5810546875, 17.61572265625, 19.650390625, 21.68505859375, 23.7197265625, 25.75439453125, 27.7890625, 29.82373046875, 31.8583984375, 33.89306640625, 35.927734375, 37.96240234375, 39.9970703125, 42.03173828125, 44.06640625, 46.10107421875, 48.1357421875, 50.17041015625, 52.205078125, 54.23974609375, 56.2744140625, 58.30908203125, 60.34375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 9.0, 20.0, 31.0, 42.0, 86.0, 93.0, 129.0, 178.0, 113.0, 103.0, 79.0, 34.0, 24.0, 15.0, 8.0, 3.0, 11.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.75, -114.3232421875, -110.896484375, -107.4697265625, -104.04296875, -100.6162109375, -97.189453125, -93.7626953125, -90.3359375, -86.9091796875, -83.482421875, -80.0556640625, -76.62890625, -73.2021484375, -69.775390625, -66.3486328125, -62.921875, -59.4951171875, -56.068359375, -52.6416015625, -49.21484375, -45.7880859375, -42.361328125, -38.9345703125, -35.5078125, -32.0810546875, -28.654296875, -25.2275390625, -21.80078125, -18.3740234375, -14.947265625, -11.5205078125, -8.09375, -4.6669921875, -1.240234375, 2.1865234375, 5.61328125, 9.0400390625, 12.466796875, 15.8935546875, 19.3203125, 22.7470703125, 26.173828125, 29.6005859375, 33.02734375, 36.4541015625, 39.880859375, 43.3076171875, 46.734375, 50.1611328125, 53.587890625, 57.0146484375, 60.44140625, 63.8681640625, 67.294921875, 70.7216796875, 74.1484375, 77.5751953125, 81.001953125, 84.4287109375, 87.85546875, 91.2822265625, 94.708984375, 98.1357421875, 101.5625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 13.0, 13.0, 29.0, 49.0, 66.0, 113.0, 124.0, 161.0, 136.0, 105.0, 62.0, 37.0, 25.0, 16.0, 14.0, 8.0, 5.0, 3.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1657.6605224609375, -1606.6939697265625, -1555.727294921875, -1504.7607421875, -1453.794189453125, -1402.8275146484375, -1351.8609619140625, -1300.894287109375, -1249.927734375, -1198.961181640625, -1147.9945068359375, -1097.0279541015625, -1046.061279296875, -995.0947265625, -944.128173828125, -893.1615600585938, -842.1949462890625, -791.2283325195312, -740.26171875, -689.295166015625, -638.3285522460938, -587.3619384765625, -536.3953857421875, -485.42877197265625, -434.462158203125, -383.49554443359375, -332.5289611816406, -281.5623779296875, -230.59576416015625, -179.62916564941406, -128.66256713867188, -77.69598388671875, -26.7294921875, 24.237106323242188, 75.20370483398438, 126.17030334472656, 177.13690185546875, 228.10350036621094, 279.0700988769531, 330.03668212890625, 381.0032958984375, 431.96990966796875, 482.9364929199219, 533.903076171875, 584.8696899414062, 635.8363037109375, 686.8028564453125, 737.7694702148438, 788.736083984375, 839.7026977539062, 890.6693115234375, 941.6358642578125, 992.6024780273438, 1043.569091796875, 1094.53564453125, 1145.502197265625, 1196.4688720703125, 1247.4354248046875, 1298.402099609375, 1349.36865234375, 1400.335205078125, 1451.3018798828125, 1502.2684326171875, 1553.235107421875, 1604.20166015625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 9.0, 12.0, 10.0, 16.0, 20.0, 25.0, 28.0, 20.0, 33.0, 34.0, 39.0, 53.0, 41.0, 47.0, 49.0, 41.0, 49.0, 39.0, 38.0, 48.0, 47.0, 28.0, 44.0, 27.0, 37.0, 20.0, 28.0, 20.0, 15.0, 13.0, 13.0, 9.0, 13.0, 9.0, 3.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1066.38671875, -1032.3743896484375, -998.3619995117188, -964.349609375, -930.3372802734375, -896.3248901367188, -862.3125, -828.3001708984375, -794.2877807617188, -760.275390625, -726.2630615234375, -692.2506713867188, -658.23828125, -624.2259521484375, -590.2135620117188, -556.201171875, -522.1888427734375, -488.1764831542969, -454.16412353515625, -420.1517333984375, -386.1393737792969, -352.12701416015625, -318.1146240234375, -284.1022644042969, -250.08990478515625, -216.07754516601562, -182.06517028808594, -148.05279541015625, -114.04043579101562, -80.028076171875, -46.01570129394531, -12.003326416015625, 22.0089111328125, 56.021278381347656, 90.03364562988281, 124.04601287841797, 158.05838012695312, 192.07073974609375, 226.08311462402344, 260.0954895019531, 294.10784912109375, 328.1202087402344, 362.132568359375, 396.14495849609375, 430.1573181152344, 464.169677734375, 498.18206787109375, 532.1944580078125, 566.206787109375, 600.2191772460938, 634.2315063476562, 668.243896484375, 702.2562255859375, 736.2686157226562, 770.281005859375, 804.2933349609375, 838.3057250976562, 872.318115234375, 906.3304443359375, 940.3428344726562, 974.355224609375, 1008.3675537109375, 1042.3798828125, 1076.392333984375, 1110.4046630859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 6.0, 18.0, 14.0, 36.0, 20.0, 38.0, 56.0, 81.0, 112.0, 190.0, 344.0, 505.0, 802.0, 1448.0, 2357.0, 4321.0, 8306.0, 18402.0, 53158.0, 451295.0, 3372747.0, 210470.0, 39314.0, 14818.0, 6843.0, 3548.0, 1950.0, 1148.0, 707.0, 408.0, 256.0, 162.0, 129.0, 72.0, 46.0, 39.0, 25.0, 22.0, 15.0, 11.0, 12.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.0, -120.744140625, -116.48828125, -112.232421875, -107.9765625, -103.720703125, -99.46484375, -95.208984375, -90.953125, -86.697265625, -82.44140625, -78.185546875, -73.9296875, -69.673828125, -65.41796875, -61.162109375, -56.90625, -52.650390625, -48.39453125, -44.138671875, -39.8828125, -35.626953125, -31.37109375, -27.115234375, -22.859375, -18.603515625, -14.34765625, -10.091796875, -5.8359375, -1.580078125, 2.67578125, 6.931640625, 11.1875, 15.443359375, 19.69921875, 23.955078125, 28.2109375, 32.466796875, 36.72265625, 40.978515625, 45.234375, 49.490234375, 53.74609375, 58.001953125, 62.2578125, 66.513671875, 70.76953125, 75.025390625, 79.28125, 83.537109375, 87.79296875, 92.048828125, 96.3046875, 100.560546875, 104.81640625, 109.072265625, 113.328125, 117.583984375, 121.83984375, 126.095703125, 130.3515625, 134.607421875, 138.86328125, 143.119140625, 147.375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 10.0, 9.0, 15.0, 14.0, 16.0, 22.0, 33.0, 24.0, 36.0, 24.0, 27.0, 42.0, 44.0, 54.0, 55.0, 52.0, 50.0, 44.0, 50.0, 32.0, 33.0, 41.0, 50.0, 31.0, 32.0, 24.0, 17.0, 20.0, 13.0, 19.0, 16.0, 4.0, 7.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.68359375, -46.1484375, -44.61328125, -43.078125, -41.54296875, -40.0078125, -38.47265625, -36.9375, -35.40234375, -33.8671875, -32.33203125, -30.796875, -29.26171875, -27.7265625, -26.19140625, -24.65625, -23.12109375, -21.5859375, -20.05078125, -18.515625, -16.98046875, -15.4453125, -13.91015625, -12.375, -10.83984375, -9.3046875, -7.76953125, -6.234375, -4.69921875, -3.1640625, -1.62890625, -0.09375, 1.44140625, 2.9765625, 4.51171875, 6.046875, 7.58203125, 9.1171875, 10.65234375, 12.1875, 13.72265625, 15.2578125, 16.79296875, 18.328125, 19.86328125, 21.3984375, 22.93359375, 24.46875, 26.00390625, 27.5390625, 29.07421875, 30.609375, 32.14453125, 33.6796875, 35.21484375, 36.75, 38.28515625, 39.8203125, 41.35546875, 42.890625, 44.42578125, 45.9609375, 47.49609375, 49.03125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 16.0, 11.0, 21.0, 28.0, 38.0, 55.0, 73.0, 118.0, 206.0, 356.0, 710.0, 1394.0, 3027.0, 6668.0, 16900.0, 52043.0, 277419.0, 3492503.0, 263150.0, 50845.0, 16558.0, 6534.0, 2712.0, 1365.0, 625.0, 348.0, 216.0, 111.0, 65.0, 50.0, 34.0, 21.0, 17.0, 14.0, 9.0, 8.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.375, -169.0078125, -163.640625, -158.2734375, -152.90625, -147.5390625, -142.171875, -136.8046875, -131.4375, -126.0703125, -120.703125, -115.3359375, -109.96875, -104.6015625, -99.234375, -93.8671875, -88.5, -83.1328125, -77.765625, -72.3984375, -67.03125, -61.6640625, -56.296875, -50.9296875, -45.5625, -40.1953125, -34.828125, -29.4609375, -24.09375, -18.7265625, -13.359375, -7.9921875, -2.625, 2.7421875, 8.109375, 13.4765625, 18.84375, 24.2109375, 29.578125, 34.9453125, 40.3125, 45.6796875, 51.046875, 56.4140625, 61.78125, 67.1484375, 72.515625, 77.8828125, 83.25, 88.6171875, 93.984375, 99.3515625, 104.71875, 110.0859375, 115.453125, 120.8203125, 126.1875, 131.5546875, 136.921875, 142.2890625, 147.65625, 153.0234375, 158.390625, 163.7578125, 169.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 4.0, 4.0, 9.0, 11.0, 9.0, 16.0, 18.0, 18.0, 19.0, 30.0, 58.0, 67.0, 83.0, 171.0, 370.0, 953.0, 1060.0, 478.0, 236.0, 134.0, 74.0, 54.0, 48.0, 25.0, 25.0, 25.0, 14.0, 7.0, 5.0, 5.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-194.5, -189.1328125, -183.765625, -178.3984375, -173.03125, -167.6640625, -162.296875, -156.9296875, -151.5625, -146.1953125, -140.828125, -135.4609375, -130.09375, -124.7265625, -119.359375, -113.9921875, -108.625, -103.2578125, -97.890625, -92.5234375, -87.15625, -81.7890625, -76.421875, -71.0546875, -65.6875, -60.3203125, -54.953125, -49.5859375, -44.21875, -38.8515625, -33.484375, -28.1171875, -22.75, -17.3828125, -12.015625, -6.6484375, -1.28125, 4.0859375, 9.453125, 14.8203125, 20.1875, 25.5546875, 30.921875, 36.2890625, 41.65625, 47.0234375, 52.390625, 57.7578125, 63.125, 68.4921875, 73.859375, 79.2265625, 84.59375, 89.9609375, 95.328125, 100.6953125, 106.0625, 111.4296875, 116.796875, 122.1640625, 127.53125, 132.8984375, 138.265625, 143.6328125, 149.0]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 9.0, 14.0, 30.0, 78.0, 190.0, 284.0, 237.0, 84.0, 37.0, 21.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2384.1220703125, -2290.970458984375, -2197.818603515625, -2104.6669921875, -2011.51513671875, -1918.363525390625, -1825.2117919921875, -1732.06005859375, -1638.9083251953125, -1545.756591796875, -1452.6048583984375, -1359.453125, -1266.301513671875, -1173.149658203125, -1079.998046875, -986.8463134765625, -893.694580078125, -800.5428466796875, -707.39111328125, -614.2394409179688, -521.0877075195312, -427.93597412109375, -334.7843017578125, -241.632568359375, -148.4808349609375, -55.32911682128906, 37.822601318359375, 130.97430419921875, 224.12603759765625, 317.27777099609375, 410.429443359375, 503.5811767578125, 596.73291015625, 689.8846435546875, 783.036376953125, 876.1880493164062, 969.3397827148438, 1062.491455078125, 1155.6431884765625, 1248.794921875, 1341.9466552734375, 1435.098388671875, 1528.2501220703125, 1621.40185546875, 1714.553466796875, 1807.705322265625, 1900.85693359375, 1994.0086669921875, 2087.160400390625, 2180.31201171875, 2273.4638671875, 2366.615478515625, 2459.767333984375, 2552.9189453125, 2646.07080078125, 2739.222412109375, 2832.3740234375, 2925.525634765625, 3018.677490234375, 3111.8291015625, 3204.98095703125, 3298.132568359375, 3391.2841796875, 3484.43603515625, 3577.587890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 8.0, 12.0, 13.0, 15.0, 12.0, 16.0, 26.0, 23.0, 28.0, 28.0, 38.0, 30.0, 27.0, 37.0, 43.0, 44.0, 49.0, 31.0, 42.0, 30.0, 36.0, 36.0, 46.0, 35.0, 39.0, 29.0, 23.0, 12.0, 21.0, 17.0, 17.0, 16.0, 17.0, 7.0, 7.0, 11.0, 4.0, 7.0, 5.0, 9.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-557.974853515625, -538.8375854492188, -519.7003784179688, -500.5631103515625, -481.4258728027344, -462.28863525390625, -443.1513671875, -424.0141296386719, -404.87689208984375, -385.7396545410156, -366.6024169921875, -347.46514892578125, -328.3279113769531, -309.190673828125, -290.05340576171875, -270.9161682128906, -251.7789306640625, -232.64169311523438, -213.5044403076172, -194.3671875, -175.22994995117188, -156.09271240234375, -136.95545959472656, -117.81820678710938, -98.68096923828125, -79.5437240600586, -60.40647888183594, -41.26923370361328, -22.131988525390625, -2.9947433471679688, 16.142501831054688, 35.279754638671875, 54.4169921875, 73.55423736572266, 92.69148254394531, 111.82872772216797, 130.96597290039062, 150.10321044921875, 169.24046325683594, 188.37771606445312, 207.51495361328125, 226.65219116210938, 245.78944396972656, 264.92669677734375, 284.0639343261719, 303.201171875, 322.33843994140625, 341.4756774902344, 360.6129150390625, 379.7501525878906, 398.88739013671875, 418.024658203125, 437.1618957519531, 456.29913330078125, 475.4364013671875, 494.5736389160156, 513.7108764648438, 532.84814453125, 551.9853515625, 571.1226196289062, 590.2598876953125, 609.3970947265625, 628.5343627929688, 647.671630859375, 666.808837890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 17.0, 18.0, 30.0, 28.0, 59.0, 84.0, 110.0, 159.0, 221.0, 360.0, 564.0, 839.0, 1230.0, 1988.0, 3156.0, 5460.0, 9110.0, 16596.0, 32566.0, 68115.0, 161287.0, 357832.0, 214596.0, 86745.0, 39651.0, 20294.0, 10987.0, 6175.0, 3746.0, 2263.0, 1456.0, 944.0, 613.0, 405.0, 301.0, 183.0, 132.0, 74.0, 44.0, 39.0, 23.0, 16.0, 11.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.3125, -101.0166015625, -97.720703125, -94.4248046875, -91.12890625, -87.8330078125, -84.537109375, -81.2412109375, -77.9453125, -74.6494140625, -71.353515625, -68.0576171875, -64.76171875, -61.4658203125, -58.169921875, -54.8740234375, -51.578125, -48.2822265625, -44.986328125, -41.6904296875, -38.39453125, -35.0986328125, -31.802734375, -28.5068359375, -25.2109375, -21.9150390625, -18.619140625, -15.3232421875, -12.02734375, -8.7314453125, -5.435546875, -2.1396484375, 1.15625, 4.4521484375, 7.748046875, 11.0439453125, 14.33984375, 17.6357421875, 20.931640625, 24.2275390625, 27.5234375, 30.8193359375, 34.115234375, 37.4111328125, 40.70703125, 44.0029296875, 47.298828125, 50.5947265625, 53.890625, 57.1865234375, 60.482421875, 63.7783203125, 67.07421875, 70.3701171875, 73.666015625, 76.9619140625, 80.2578125, 83.5537109375, 86.849609375, 90.1455078125, 93.44140625, 96.7373046875, 100.033203125, 103.3291015625, 106.625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 4.0, 6.0, 6.0, 6.0, 9.0, 9.0, 11.0, 14.0, 16.0, 12.0, 18.0, 24.0, 25.0, 28.0, 33.0, 27.0, 36.0, 40.0, 45.0, 34.0, 34.0, 53.0, 62.0, 37.0, 43.0, 36.0, 36.0, 44.0, 27.0, 32.0, 28.0, 26.0, 17.0, 20.0, 16.0, 19.0, 10.0, 16.0, 6.0, 7.0, 3.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-42.03125, -40.61279296875, -39.1943359375, -37.77587890625, -36.357421875, -34.93896484375, -33.5205078125, -32.10205078125, -30.68359375, -29.26513671875, -27.8466796875, -26.42822265625, -25.009765625, -23.59130859375, -22.1728515625, -20.75439453125, -19.3359375, -17.91748046875, -16.4990234375, -15.08056640625, -13.662109375, -12.24365234375, -10.8251953125, -9.40673828125, -7.98828125, -6.56982421875, -5.1513671875, -3.73291015625, -2.314453125, -0.89599609375, 0.5224609375, 1.94091796875, 3.359375, 4.77783203125, 6.1962890625, 7.61474609375, 9.033203125, 10.45166015625, 11.8701171875, 13.28857421875, 14.70703125, 16.12548828125, 17.5439453125, 18.96240234375, 20.380859375, 21.79931640625, 23.2177734375, 24.63623046875, 26.0546875, 27.47314453125, 28.8916015625, 30.31005859375, 31.728515625, 33.14697265625, 34.5654296875, 35.98388671875, 37.40234375, 38.82080078125, 40.2392578125, 41.65771484375, 43.076171875, 44.49462890625, 45.9130859375, 47.33154296875, 48.75]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 11.0, 17.0, 24.0, 20.0, 44.0, 56.0, 90.0, 110.0, 219.0, 320.0, 569.0, 1005.0, 2190.0, 5506.0, 19753.0, 132081.0, 765317.0, 96064.0, 16237.0, 4687.0, 1963.0, 915.0, 495.0, 299.0, 171.0, 124.0, 83.0, 56.0, 35.0, 26.0, 19.0, 12.0, 8.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.25, -262.166015625, -254.08203125, -245.998046875, -237.9140625, -229.830078125, -221.74609375, -213.662109375, -205.578125, -197.494140625, -189.41015625, -181.326171875, -173.2421875, -165.158203125, -157.07421875, -148.990234375, -140.90625, -132.822265625, -124.73828125, -116.654296875, -108.5703125, -100.486328125, -92.40234375, -84.318359375, -76.234375, -68.150390625, -60.06640625, -51.982421875, -43.8984375, -35.814453125, -27.73046875, -19.646484375, -11.5625, -3.478515625, 4.60546875, 12.689453125, 20.7734375, 28.857421875, 36.94140625, 45.025390625, 53.109375, 61.193359375, 69.27734375, 77.361328125, 85.4453125, 93.529296875, 101.61328125, 109.697265625, 117.78125, 125.865234375, 133.94921875, 142.033203125, 150.1171875, 158.201171875, 166.28515625, 174.369140625, 182.453125, 190.537109375, 198.62109375, 206.705078125, 214.7890625, 222.873046875, 230.95703125, 239.041015625, 247.125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 13.0, 6.0, 13.0, 14.0, 25.0, 25.0, 34.0, 39.0, 30.0, 46.0, 62.0, 44.0, 46.0, 49.0, 64.0, 69.0, 59.0, 58.0, 49.0, 40.0, 40.0, 23.0, 31.0, 28.0, 20.0, 17.0, 20.0, 5.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.5, -227.9921875, -219.484375, -210.9765625, -202.46875, -193.9609375, -185.453125, -176.9453125, -168.4375, -159.9296875, -151.421875, -142.9140625, -134.40625, -125.8984375, -117.390625, -108.8828125, -100.375, -91.8671875, -83.359375, -74.8515625, -66.34375, -57.8359375, -49.328125, -40.8203125, -32.3125, -23.8046875, -15.296875, -6.7890625, 1.71875, 10.2265625, 18.734375, 27.2421875, 35.75, 44.2578125, 52.765625, 61.2734375, 69.78125, 78.2890625, 86.796875, 95.3046875, 103.8125, 112.3203125, 120.828125, 129.3359375, 137.84375, 146.3515625, 154.859375, 163.3671875, 171.875, 180.3828125, 188.890625, 197.3984375, 205.90625, 214.4140625, 222.921875, 231.4296875, 239.9375, 248.4453125, 256.953125, 265.4609375, 273.96875, 282.4765625, 290.984375, 299.4921875, 308.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 7.0, 10.0, 19.0, 18.0, 31.0, 40.0, 87.0, 141.0, 284.0, 609.0, 1572.0, 4842.0, 23406.0, 442921.0, 541631.0, 24884.0, 5148.0, 1632.0, 605.0, 295.0, 157.0, 76.0, 37.0, 32.0, 23.0, 12.0, 8.0, 9.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.125, -132.556640625, -127.98828125, -123.419921875, -118.8515625, -114.283203125, -109.71484375, -105.146484375, -100.578125, -96.009765625, -91.44140625, -86.873046875, -82.3046875, -77.736328125, -73.16796875, -68.599609375, -64.03125, -59.462890625, -54.89453125, -50.326171875, -45.7578125, -41.189453125, -36.62109375, -32.052734375, -27.484375, -22.916015625, -18.34765625, -13.779296875, -9.2109375, -4.642578125, -0.07421875, 4.494140625, 9.0625, 13.630859375, 18.19921875, 22.767578125, 27.3359375, 31.904296875, 36.47265625, 41.041015625, 45.609375, 50.177734375, 54.74609375, 59.314453125, 63.8828125, 68.451171875, 73.01953125, 77.587890625, 82.15625, 86.724609375, 91.29296875, 95.861328125, 100.4296875, 104.998046875, 109.56640625, 114.134765625, 118.703125, 123.271484375, 127.83984375, 132.408203125, 136.9765625, 141.544921875, 146.11328125, 150.681640625, 155.25]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 6.0, 5.0, 21.0, 25.0, 46.0, 68.0, 105.0, 182.0, 191.0, 132.0, 85.0, 39.0, 30.0, 20.0, 10.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0301513671875, -0.028729915618896484, -0.02730846405029297, -0.025887012481689453, -0.024465560913085938, -0.023044109344482422, -0.021622657775878906, -0.02020120620727539, -0.018779754638671875, -0.01735830307006836, -0.015936851501464844, -0.014515399932861328, -0.013093948364257812, -0.011672496795654297, -0.010251045227050781, -0.008829593658447266, -0.00740814208984375, -0.005986690521240234, -0.004565238952636719, -0.003143787384033203, -0.0017223358154296875, -0.0003008842468261719, 0.0011205673217773438, 0.0025420188903808594, 0.003963470458984375, 0.005384922027587891, 0.006806373596191406, 0.008227825164794922, 0.009649276733398438, 0.011070728302001953, 0.012492179870605469, 0.013913631439208984, 0.0153350830078125, 0.016756534576416016, 0.01817798614501953, 0.019599437713623047, 0.021020889282226562, 0.022442340850830078, 0.023863792419433594, 0.02528524398803711, 0.026706695556640625, 0.02812814712524414, 0.029549598693847656, 0.030971050262451172, 0.03239250183105469, 0.0338139533996582, 0.03523540496826172, 0.036656856536865234, 0.03807830810546875, 0.039499759674072266, 0.04092121124267578, 0.0423426628112793, 0.04376411437988281, 0.04518556594848633, 0.046607017517089844, 0.04802846908569336, 0.049449920654296875, 0.05087137222290039, 0.052292823791503906, 0.05371427536010742, 0.05513572692871094, 0.05655717849731445, 0.05797863006591797, 0.059400081634521484, 0.060821533203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 21.0, 19.0, 29.0, 50.0, 70.0, 109.0, 179.0, 323.0, 643.0, 1464.0, 3709.0, 13035.0, 79852.0, 758144.0, 161857.0, 20291.0, 5145.0, 1840.0, 824.0, 383.0, 208.0, 123.0, 77.0, 47.0, 23.0, 13.0, 16.0, 14.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.8125, -100.4248046875, -97.037109375, -93.6494140625, -90.26171875, -86.8740234375, -83.486328125, -80.0986328125, -76.7109375, -73.3232421875, -69.935546875, -66.5478515625, -63.16015625, -59.7724609375, -56.384765625, -52.9970703125, -49.609375, -46.2216796875, -42.833984375, -39.4462890625, -36.05859375, -32.6708984375, -29.283203125, -25.8955078125, -22.5078125, -19.1201171875, -15.732421875, -12.3447265625, -8.95703125, -5.5693359375, -2.181640625, 1.2060546875, 4.59375, 7.9814453125, 11.369140625, 14.7568359375, 18.14453125, 21.5322265625, 24.919921875, 28.3076171875, 31.6953125, 35.0830078125, 38.470703125, 41.8583984375, 45.24609375, 48.6337890625, 52.021484375, 55.4091796875, 58.796875, 62.1845703125, 65.572265625, 68.9599609375, 72.34765625, 75.7353515625, 79.123046875, 82.5107421875, 85.8984375, 89.2861328125, 92.673828125, 96.0615234375, 99.44921875, 102.8369140625, 106.224609375, 109.6123046875, 113.0]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 11.0, 10.0, 15.0, 18.0, 21.0, 53.0, 54.0, 80.0, 71.0, 128.0, 99.0, 101.0, 82.0, 62.0, 38.0, 35.0, 24.0, 17.0, 10.0, 17.0, 7.0, 7.0, 10.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-105.3125, -102.490234375, -99.66796875, -96.845703125, -94.0234375, -91.201171875, -88.37890625, -85.556640625, -82.734375, -79.912109375, -77.08984375, -74.267578125, -71.4453125, -68.623046875, -65.80078125, -62.978515625, -60.15625, -57.333984375, -54.51171875, -51.689453125, -48.8671875, -46.044921875, -43.22265625, -40.400390625, -37.578125, -34.755859375, -31.93359375, -29.111328125, -26.2890625, -23.466796875, -20.64453125, -17.822265625, -15.0, -12.177734375, -9.35546875, -6.533203125, -3.7109375, -0.888671875, 1.93359375, 4.755859375, 7.578125, 10.400390625, 13.22265625, 16.044921875, 18.8671875, 21.689453125, 24.51171875, 27.333984375, 30.15625, 32.978515625, 35.80078125, 38.623046875, 41.4453125, 44.267578125, 47.08984375, 49.912109375, 52.734375, 55.556640625, 58.37890625, 61.201171875, 64.0234375, 66.845703125, 69.66796875, 72.490234375, 75.3125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 7.0, 11.0, 19.0, 32.0, 52.0, 98.0, 144.0, 179.0, 137.0, 102.0, 73.0, 62.0, 28.0, 15.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-938.35693359375, -884.2062377929688, -830.0555419921875, -775.9049072265625, -721.754150390625, -667.603515625, -613.4528198242188, -559.3021240234375, -505.15142822265625, -451.000732421875, -396.85003662109375, -342.6993713378906, -288.5486755371094, -234.39797973632812, -180.247314453125, -126.09661865234375, -71.9459228515625, -17.79523468017578, 36.35545349121094, 90.50613403320312, 144.65682983398438, 198.80752563476562, 252.95819091796875, 307.10888671875, 361.25958251953125, 415.4102783203125, 469.56097412109375, 523.711669921875, 577.8623046875, 632.0130615234375, 686.1636962890625, 740.3143920898438, 794.465087890625, 848.6157836914062, 902.7664794921875, 956.9171142578125, 1011.06787109375, 1065.218505859375, 1119.369140625, 1173.5198974609375, 1227.670654296875, 1281.8212890625, 1335.9720458984375, 1390.1226806640625, 1444.2734375, 1498.424072265625, 1552.57470703125, 1606.7254638671875, 1660.8760986328125, 1715.0267333984375, 1769.177490234375, 1823.328125, 1877.4788818359375, 1931.6295166015625, 1985.7802734375, 2039.930908203125, 2094.08154296875, 2148.232177734375, 2202.3828125, 2256.53369140625, 2310.684326171875, 2364.8349609375, 2418.985595703125, 2473.13623046875, 2527.287109375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 11.0, 7.0, 14.0, 11.0, 24.0, 27.0, 31.0, 29.0, 32.0, 28.0, 34.0, 44.0, 39.0, 49.0, 55.0, 35.0, 52.0, 41.0, 51.0, 45.0, 56.0, 36.0, 31.0, 20.0, 28.0, 29.0, 21.0, 16.0, 11.0, 9.0, 9.0, 13.0, 1.0, 8.0, 5.0, 7.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-763.8731689453125, -736.0970458984375, -708.3209228515625, -680.5447998046875, -652.7686767578125, -624.9925537109375, -597.2164306640625, -569.4403076171875, -541.6641845703125, -513.8880615234375, -486.1119384765625, -458.3358154296875, -430.5596923828125, -402.7835693359375, -375.0074768066406, -347.2313537597656, -319.45526123046875, -291.67913818359375, -263.90301513671875, -236.1269073486328, -208.3507843017578, -180.5746612548828, -152.79855346679688, -125.02243041992188, -97.24630737304688, -69.47018432617188, -41.694068908691406, -13.917953491210938, 13.858169555664062, 41.63429260253906, 69.410400390625, 97.1865234375, 124.96258544921875, 152.73870849609375, 180.51483154296875, 208.2909393310547, 236.0670623779297, 263.84320068359375, 291.6192932128906, 319.3954162597656, 347.1715393066406, 374.9476623535156, 402.7237854003906, 430.4998779296875, 458.2760009765625, 486.0521240234375, 513.8282470703125, 541.6043701171875, 569.3804931640625, 597.1566162109375, 624.9327392578125, 652.7088623046875, 680.4849853515625, 708.2611083984375, 736.0372314453125, 763.8133544921875, 791.5894775390625, 819.3656005859375, 847.1417236328125, 874.9178466796875, 902.6939697265625, 930.4700927734375, 958.2462158203125, 986.0223388671875, 1013.7984008789062]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 18.0, 21.0, 36.0, 52.0, 88.0, 174.0, 524.0, 3412.0, 61314.0, 4090829.0, 34984.0, 2101.0, 380.0, 133.0, 58.0, 40.0, 22.0, 27.0, 10.0, 13.0, 5.0, 5.0, 11.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.25, -263.67578125, -250.1015625, -236.52734375, -222.953125, -209.37890625, -195.8046875, -182.23046875, -168.65625, -155.08203125, -141.5078125, -127.93359375, -114.359375, -100.78515625, -87.2109375, -73.63671875, -60.0625, -46.48828125, -32.9140625, -19.33984375, -5.765625, 7.80859375, 21.3828125, 34.95703125, 48.53125, 62.10546875, 75.6796875, 89.25390625, 102.828125, 116.40234375, 129.9765625, 143.55078125, 157.125, 170.69921875, 184.2734375, 197.84765625, 211.421875, 224.99609375, 238.5703125, 252.14453125, 265.71875, 279.29296875, 292.8671875, 306.44140625, 320.015625, 333.58984375, 347.1640625, 360.73828125, 374.3125, 387.88671875, 401.4609375, 415.03515625, 428.609375, 442.18359375, 455.7578125, 469.33203125, 482.90625, 496.48046875, 510.0546875, 523.62890625, 537.203125, 550.77734375, 564.3515625, 577.92578125, 591.5]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 6.0, 9.0, 7.0, 6.0, 13.0, 16.0, 9.0, 16.0, 20.0, 26.0, 21.0, 23.0, 32.0, 39.0, 31.0, 25.0, 37.0, 36.0, 39.0, 54.0, 43.0, 40.0, 36.0, 37.0, 53.0, 42.0, 35.0, 33.0, 22.0, 27.0, 26.0, 28.0, 11.0, 21.0, 11.0, 5.0, 10.0, 5.0, 7.0, 4.0, 5.0, 3.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-42.71875, -41.41943359375, -40.1201171875, -38.82080078125, -37.521484375, -36.22216796875, -34.9228515625, -33.62353515625, -32.32421875, -31.02490234375, -29.7255859375, -28.42626953125, -27.126953125, -25.82763671875, -24.5283203125, -23.22900390625, -21.9296875, -20.63037109375, -19.3310546875, -18.03173828125, -16.732421875, -15.43310546875, -14.1337890625, -12.83447265625, -11.53515625, -10.23583984375, -8.9365234375, -7.63720703125, -6.337890625, -5.03857421875, -3.7392578125, -2.43994140625, -1.140625, 0.15869140625, 1.4580078125, 2.75732421875, 4.056640625, 5.35595703125, 6.6552734375, 7.95458984375, 9.25390625, 10.55322265625, 11.8525390625, 13.15185546875, 14.451171875, 15.75048828125, 17.0498046875, 18.34912109375, 19.6484375, 20.94775390625, 22.2470703125, 23.54638671875, 24.845703125, 26.14501953125, 27.4443359375, 28.74365234375, 30.04296875, 31.34228515625, 32.6416015625, 33.94091796875, 35.240234375, 36.53955078125, 37.8388671875, 39.13818359375, 40.4375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 0.0, 6.0, 8.0, 10.0, 27.0, 20.0, 33.0, 39.0, 63.0, 102.0, 147.0, 245.0, 376.0, 665.0, 1166.0, 2217.0, 4285.0, 9233.0, 21702.0, 60860.0, 299699.0, 3234669.0, 438710.0, 74071.0, 25149.0, 10453.0, 4735.0, 2472.0, 1295.0, 699.0, 420.0, 236.0, 160.0, 101.0, 57.0, 52.0, 22.0, 22.0, 19.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-149.375, -144.7890625, -140.203125, -135.6171875, -131.03125, -126.4453125, -121.859375, -117.2734375, -112.6875, -108.1015625, -103.515625, -98.9296875, -94.34375, -89.7578125, -85.171875, -80.5859375, -76.0, -71.4140625, -66.828125, -62.2421875, -57.65625, -53.0703125, -48.484375, -43.8984375, -39.3125, -34.7265625, -30.140625, -25.5546875, -20.96875, -16.3828125, -11.796875, -7.2109375, -2.625, 1.9609375, 6.546875, 11.1328125, 15.71875, 20.3046875, 24.890625, 29.4765625, 34.0625, 38.6484375, 43.234375, 47.8203125, 52.40625, 56.9921875, 61.578125, 66.1640625, 70.75, 75.3359375, 79.921875, 84.5078125, 89.09375, 93.6796875, 98.265625, 102.8515625, 107.4375, 112.0234375, 116.609375, 121.1953125, 125.78125, 130.3671875, 134.953125, 139.5390625, 144.125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 18.0, 22.0, 22.0, 41.0, 32.0, 54.0, 83.0, 167.0, 363.0, 768.0, 1135.0, 614.0, 249.0, 154.0, 80.0, 53.0, 44.0, 32.0, 21.0, 24.0, 11.0, 9.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.0, -202.26953125, -196.5390625, -190.80859375, -185.078125, -179.34765625, -173.6171875, -167.88671875, -162.15625, -156.42578125, -150.6953125, -144.96484375, -139.234375, -133.50390625, -127.7734375, -122.04296875, -116.3125, -110.58203125, -104.8515625, -99.12109375, -93.390625, -87.66015625, -81.9296875, -76.19921875, -70.46875, -64.73828125, -59.0078125, -53.27734375, -47.546875, -41.81640625, -36.0859375, -30.35546875, -24.625, -18.89453125, -13.1640625, -7.43359375, -1.703125, 4.02734375, 9.7578125, 15.48828125, 21.21875, 26.94921875, 32.6796875, 38.41015625, 44.140625, 49.87109375, 55.6015625, 61.33203125, 67.0625, 72.79296875, 78.5234375, 84.25390625, 89.984375, 95.71484375, 101.4453125, 107.17578125, 112.90625, 118.63671875, 124.3671875, 130.09765625, 135.828125, 141.55859375, 147.2890625, 153.01953125, 158.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 9.0, 19.0, 46.0, 82.0, 167.0, 199.0, 205.0, 106.0, 66.0, 28.0, 20.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1288.7979736328125, -1225.997802734375, -1163.1976318359375, -1100.3974609375, -1037.597412109375, -974.7972412109375, -911.9970703125, -849.1968994140625, -786.3967895507812, -723.5966186523438, -660.7965087890625, -597.996337890625, -535.1961669921875, -472.39605712890625, -409.59588623046875, -346.7957458496094, -283.99560546875, -221.19546508789062, -158.3953094482422, -95.59515380859375, -32.795013427734375, 30.005126953125, 92.8052978515625, 155.60543823242188, 218.40557861328125, 281.2057189941406, 344.005859375, 406.8060302734375, 469.6061706542969, 532.4063110351562, 595.2064819335938, 658.006591796875, 720.806640625, 783.6068115234375, 846.4069213867188, 909.2070922851562, 972.0072021484375, 1034.807373046875, 1097.6075439453125, 1160.40771484375, 1223.207763671875, 1286.0079345703125, 1348.80810546875, 1411.608154296875, 1474.4083251953125, 1537.20849609375, 1600.0086669921875, 1662.808837890625, 1725.6090087890625, 1788.4091796875, 1851.2093505859375, 1914.009521484375, 1976.8095703125, 2039.6097412109375, 2102.409912109375, 2165.2099609375, 2228.01025390625, 2290.810302734375, 2353.610595703125, 2416.41064453125, 2479.2109375, 2542.010986328125, 2604.81103515625, 2667.611328125, 2730.411376953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 4.0, 8.0, 15.0, 12.0, 21.0, 17.0, 25.0, 33.0, 25.0, 39.0, 38.0, 41.0, 32.0, 44.0, 51.0, 44.0, 55.0, 60.0, 55.0, 40.0, 46.0, 23.0, 34.0, 34.0, 29.0, 24.0, 34.0, 15.0, 21.0, 18.0, 9.0, 8.0, 7.0, 7.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.8634033203125, -734.7206420898438, -709.577880859375, -684.4351196289062, -659.2923583984375, -634.1495971679688, -609.0068359375, -583.8640747070312, -558.7213134765625, -533.5785522460938, -508.435791015625, -483.29302978515625, -458.1502685546875, -433.00750732421875, -407.86474609375, -382.72198486328125, -357.5792236328125, -332.43646240234375, -307.293701171875, -282.15093994140625, -257.0081787109375, -231.86541748046875, -206.72265625, -181.57989501953125, -156.4371337890625, -131.29437255859375, -106.151611328125, -81.00885009765625, -55.8660888671875, -30.72332763671875, -5.58056640625, 19.56219482421875, 44.7049560546875, 69.84771728515625, 94.990478515625, 120.13323974609375, 145.2760009765625, 170.41876220703125, 195.5615234375, 220.70428466796875, 245.8470458984375, 270.98980712890625, 296.132568359375, 321.27532958984375, 346.4180908203125, 371.56085205078125, 396.70361328125, 421.84637451171875, 446.9891357421875, 472.13189697265625, 497.274658203125, 522.4174194335938, 547.5601806640625, 572.7029418945312, 597.845703125, 622.9884643554688, 648.1312255859375, 673.2739868164062, 698.416748046875, 723.5595092773438, 748.7022705078125, 773.8450317382812, 798.98779296875, 824.1305541992188, 849.2733154296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 5.0, 7.0, 14.0, 19.0, 30.0, 32.0, 44.0, 62.0, 114.0, 158.0, 221.0, 314.0, 475.0, 790.0, 1214.0, 1994.0, 3372.0, 5948.0, 11091.0, 21933.0, 46881.0, 111505.0, 296807.0, 320822.0, 122825.0, 50899.0, 23572.0, 11875.0, 6234.0, 3548.0, 2083.0, 1289.0, 756.0, 532.0, 367.0, 204.0, 142.0, 98.0, 84.0, 62.0, 37.0, 32.0, 22.0, 17.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.0625, -98.775390625, -95.48828125, -92.201171875, -88.9140625, -85.626953125, -82.33984375, -79.052734375, -75.765625, -72.478515625, -69.19140625, -65.904296875, -62.6171875, -59.330078125, -56.04296875, -52.755859375, -49.46875, -46.181640625, -42.89453125, -39.607421875, -36.3203125, -33.033203125, -29.74609375, -26.458984375, -23.171875, -19.884765625, -16.59765625, -13.310546875, -10.0234375, -6.736328125, -3.44921875, -0.162109375, 3.125, 6.412109375, 9.69921875, 12.986328125, 16.2734375, 19.560546875, 22.84765625, 26.134765625, 29.421875, 32.708984375, 35.99609375, 39.283203125, 42.5703125, 45.857421875, 49.14453125, 52.431640625, 55.71875, 59.005859375, 62.29296875, 65.580078125, 68.8671875, 72.154296875, 75.44140625, 78.728515625, 82.015625, 85.302734375, 88.58984375, 91.876953125, 95.1640625, 98.451171875, 101.73828125, 105.025390625, 108.3125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 8.0, 6.0, 9.0, 16.0, 15.0, 24.0, 18.0, 28.0, 21.0, 36.0, 38.0, 49.0, 43.0, 54.0, 61.0, 63.0, 59.0, 64.0, 53.0, 39.0, 52.0, 31.0, 32.0, 25.0, 27.0, 22.0, 27.0, 16.0, 19.0, 12.0, 9.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.6875, -57.646484375, -55.60546875, -53.564453125, -51.5234375, -49.482421875, -47.44140625, -45.400390625, -43.359375, -41.318359375, -39.27734375, -37.236328125, -35.1953125, -33.154296875, -31.11328125, -29.072265625, -27.03125, -24.990234375, -22.94921875, -20.908203125, -18.8671875, -16.826171875, -14.78515625, -12.744140625, -10.703125, -8.662109375, -6.62109375, -4.580078125, -2.5390625, -0.498046875, 1.54296875, 3.583984375, 5.625, 7.666015625, 9.70703125, 11.748046875, 13.7890625, 15.830078125, 17.87109375, 19.912109375, 21.953125, 23.994140625, 26.03515625, 28.076171875, 30.1171875, 32.158203125, 34.19921875, 36.240234375, 38.28125, 40.322265625, 42.36328125, 44.404296875, 46.4453125, 48.486328125, 50.52734375, 52.568359375, 54.609375, 56.650390625, 58.69140625, 60.732421875, 62.7734375, 64.814453125, 66.85546875, 68.896484375, 70.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 10.0, 10.0, 9.0, 9.0, 19.0, 26.0, 53.0, 76.0, 116.0, 227.0, 459.0, 925.0, 2273.0, 7239.0, 36011.0, 421492.0, 528496.0, 38892.0, 7834.0, 2331.0, 983.0, 455.0, 236.0, 141.0, 73.0, 45.0, 31.0, 30.0, 16.0, 9.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-352.0, -341.94921875, -331.8984375, -321.84765625, -311.796875, -301.74609375, -291.6953125, -281.64453125, -271.59375, -261.54296875, -251.4921875, -241.44140625, -231.390625, -221.33984375, -211.2890625, -201.23828125, -191.1875, -181.13671875, -171.0859375, -161.03515625, -150.984375, -140.93359375, -130.8828125, -120.83203125, -110.78125, -100.73046875, -90.6796875, -80.62890625, -70.578125, -60.52734375, -50.4765625, -40.42578125, -30.375, -20.32421875, -10.2734375, -0.22265625, 9.828125, 19.87890625, 29.9296875, 39.98046875, 50.03125, 60.08203125, 70.1328125, 80.18359375, 90.234375, 100.28515625, 110.3359375, 120.38671875, 130.4375, 140.48828125, 150.5390625, 160.58984375, 170.640625, 180.69140625, 190.7421875, 200.79296875, 210.84375, 220.89453125, 230.9453125, 240.99609375, 251.046875, 261.09765625, 271.1484375, 281.19921875, 291.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 13.0, 6.0, 9.0, 26.0, 26.0, 31.0, 40.0, 46.0, 55.0, 67.0, 63.0, 84.0, 65.0, 69.0, 61.0, 64.0, 44.0, 48.0, 35.0, 33.0, 25.0, 23.0, 19.0, 14.0, 9.0, 9.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-371.25, -359.87109375, -348.4921875, -337.11328125, -325.734375, -314.35546875, -302.9765625, -291.59765625, -280.21875, -268.83984375, -257.4609375, -246.08203125, -234.703125, -223.32421875, -211.9453125, -200.56640625, -189.1875, -177.80859375, -166.4296875, -155.05078125, -143.671875, -132.29296875, -120.9140625, -109.53515625, -98.15625, -86.77734375, -75.3984375, -64.01953125, -52.640625, -41.26171875, -29.8828125, -18.50390625, -7.125, 4.25390625, 15.6328125, 27.01171875, 38.390625, 49.76953125, 61.1484375, 72.52734375, 83.90625, 95.28515625, 106.6640625, 118.04296875, 129.421875, 140.80078125, 152.1796875, 163.55859375, 174.9375, 186.31640625, 197.6953125, 209.07421875, 220.453125, 231.83203125, 243.2109375, 254.58984375, 265.96875, 277.34765625, 288.7265625, 300.10546875, 311.484375, 322.86328125, 334.2421875, 345.62109375, 357.0]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 10.0, 17.0, 22.0, 43.0, 86.0, 217.0, 572.0, 1817.0, 9337.0, 98324.0, 860616.0, 67617.0, 7392.0, 1578.0, 503.0, 186.0, 85.0, 41.0, 21.0, 10.0, 14.0, 10.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.375, -202.80859375, -197.2421875, -191.67578125, -186.109375, -180.54296875, -174.9765625, -169.41015625, -163.84375, -158.27734375, -152.7109375, -147.14453125, -141.578125, -136.01171875, -130.4453125, -124.87890625, -119.3125, -113.74609375, -108.1796875, -102.61328125, -97.046875, -91.48046875, -85.9140625, -80.34765625, -74.78125, -69.21484375, -63.6484375, -58.08203125, -52.515625, -46.94921875, -41.3828125, -35.81640625, -30.25, -24.68359375, -19.1171875, -13.55078125, -7.984375, -2.41796875, 3.1484375, 8.71484375, 14.28125, 19.84765625, 25.4140625, 30.98046875, 36.546875, 42.11328125, 47.6796875, 53.24609375, 58.8125, 64.37890625, 69.9453125, 75.51171875, 81.078125, 86.64453125, 92.2109375, 97.77734375, 103.34375, 108.91015625, 114.4765625, 120.04296875, 125.609375, 131.17578125, 136.7421875, 142.30859375, 147.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 5.0, 14.0, 8.0, 20.0, 30.0, 47.0, 75.0, 94.0, 171.0, 184.0, 127.0, 66.0, 48.0, 29.0, 29.0, 16.0, 10.0, 9.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.03133201599121094, -0.029979705810546875, -0.028627395629882812, -0.02727508544921875, -0.025922775268554688, -0.024570465087890625, -0.023218154907226562, -0.0218658447265625, -0.020513534545898438, -0.019161224365234375, -0.017808914184570312, -0.01645660400390625, -0.015104293823242188, -0.013751983642578125, -0.012399673461914062, -0.01104736328125, -0.009695053100585938, -0.008342742919921875, -0.0069904327392578125, -0.00563812255859375, -0.0042858123779296875, -0.002933502197265625, -0.0015811920166015625, -0.0002288818359375, 0.0011234283447265625, 0.002475738525390625, 0.0038280487060546875, 0.00518035888671875, 0.0065326690673828125, 0.007884979248046875, 0.009237289428710938, 0.010589599609375, 0.011941909790039062, 0.013294219970703125, 0.014646530151367188, 0.01599884033203125, 0.017351150512695312, 0.018703460693359375, 0.020055770874023438, 0.0214080810546875, 0.022760391235351562, 0.024112701416015625, 0.025465011596679688, 0.02681732177734375, 0.028169631958007812, 0.029521942138671875, 0.030874252319335938, 0.0322265625, 0.03357887268066406, 0.034931182861328125, 0.03628349304199219, 0.03763580322265625, 0.03898811340332031, 0.040340423583984375, 0.04169273376464844, 0.0430450439453125, 0.04439735412597656, 0.045749664306640625, 0.04710197448730469, 0.04845428466796875, 0.04980659484863281, 0.051158905029296875, 0.05251121520996094, 0.053863525390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 11.0, 14.0, 28.0, 18.0, 46.0, 88.0, 142.0, 279.0, 700.0, 2174.0, 8455.0, 53260.0, 747428.0, 209796.0, 19820.0, 4053.0, 1282.0, 473.0, 213.0, 101.0, 62.0, 42.0, 16.0, 13.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-142.0, -137.529296875, -133.05859375, -128.587890625, -124.1171875, -119.646484375, -115.17578125, -110.705078125, -106.234375, -101.763671875, -97.29296875, -92.822265625, -88.3515625, -83.880859375, -79.41015625, -74.939453125, -70.46875, -65.998046875, -61.52734375, -57.056640625, -52.5859375, -48.115234375, -43.64453125, -39.173828125, -34.703125, -30.232421875, -25.76171875, -21.291015625, -16.8203125, -12.349609375, -7.87890625, -3.408203125, 1.0625, 5.533203125, 10.00390625, 14.474609375, 18.9453125, 23.416015625, 27.88671875, 32.357421875, 36.828125, 41.298828125, 45.76953125, 50.240234375, 54.7109375, 59.181640625, 63.65234375, 68.123046875, 72.59375, 77.064453125, 81.53515625, 86.005859375, 90.4765625, 94.947265625, 99.41796875, 103.888671875, 108.359375, 112.830078125, 117.30078125, 121.771484375, 126.2421875, 130.712890625, 135.18359375, 139.654296875, 144.125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 7.0, 9.0, 17.0, 16.0, 17.0, 22.0, 46.0, 37.0, 59.0, 56.0, 100.0, 105.0, 88.0, 94.0, 61.0, 57.0, 47.0, 25.0, 23.0, 22.0, 23.0, 12.0, 9.0, 7.0, 11.0, 5.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.9375, -84.0390625, -81.140625, -78.2421875, -75.34375, -72.4453125, -69.546875, -66.6484375, -63.75, -60.8515625, -57.953125, -55.0546875, -52.15625, -49.2578125, -46.359375, -43.4609375, -40.5625, -37.6640625, -34.765625, -31.8671875, -28.96875, -26.0703125, -23.171875, -20.2734375, -17.375, -14.4765625, -11.578125, -8.6796875, -5.78125, -2.8828125, 0.015625, 2.9140625, 5.8125, 8.7109375, 11.609375, 14.5078125, 17.40625, 20.3046875, 23.203125, 26.1015625, 29.0, 31.8984375, 34.796875, 37.6953125, 40.59375, 43.4921875, 46.390625, 49.2890625, 52.1875, 55.0859375, 57.984375, 60.8828125, 63.78125, 66.6796875, 69.578125, 72.4765625, 75.375, 78.2734375, 81.171875, 84.0703125, 86.96875, 89.8671875, 92.765625, 95.6640625, 98.5625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 11.0, 10.0, 26.0, 67.0, 134.0, 229.0, 255.0, 145.0, 69.0, 23.0, 16.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1734.6851806640625, -1652.6103515625, -1570.53564453125, -1488.4609375, -1406.3861083984375, -1324.311279296875, -1242.236572265625, -1160.161865234375, -1078.0870361328125, -996.0122680664062, -913.9375, -831.8627319335938, -749.7879638671875, -667.7131958007812, -585.638427734375, -503.56365966796875, -421.4888916015625, -339.41412353515625, -257.33935546875, -175.26458740234375, -93.1898193359375, -11.11505126953125, 70.959716796875, 153.03448486328125, 235.1092529296875, 317.18402099609375, 399.2587890625, 481.33355712890625, 563.4083251953125, 645.4830932617188, 727.557861328125, 809.6326293945312, 891.70751953125, 973.7822875976562, 1055.8570556640625, 1137.931884765625, 1220.006591796875, 1302.081298828125, 1384.1561279296875, 1466.23095703125, 1548.3056640625, 1630.38037109375, 1712.4552001953125, 1794.530029296875, 1876.604736328125, 1958.679443359375, 2040.7542724609375, 2122.8291015625, 2204.90380859375, 2286.978515625, 2369.05322265625, 2451.128173828125, 2533.202880859375, 2615.277587890625, 2697.3525390625, 2779.42724609375, 2861.501953125, 2943.57666015625, 3025.6513671875, 3107.726318359375, 3189.801025390625, 3271.875732421875, 3353.95068359375, 3436.025390625, 3518.10009765625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 8.0, 8.0, 8.0, 11.0, 14.0, 11.0, 15.0, 11.0, 14.0, 16.0, 28.0, 26.0, 34.0, 45.0, 49.0, 50.0, 56.0, 64.0, 66.0, 60.0, 55.0, 43.0, 43.0, 40.0, 35.0, 32.0, 35.0, 18.0, 11.0, 17.0, 16.0, 12.0, 11.0, 11.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1078.020751953125, -1043.714599609375, -1009.4083251953125, -975.1021118164062, -940.7958984375, -906.4896850585938, -872.1834716796875, -837.8772583007812, -803.571044921875, -769.2648315429688, -734.9586181640625, -700.6524047851562, -666.34619140625, -632.0399780273438, -597.7337646484375, -563.4275512695312, -529.121337890625, -494.81512451171875, -460.5089111328125, -426.20269775390625, -391.896484375, -357.59027099609375, -323.2840576171875, -288.97784423828125, -254.671630859375, -220.36541748046875, -186.0592041015625, -151.75299072265625, -117.44677734375, -83.14056396484375, -48.8343505859375, -14.52813720703125, 19.778076171875, 54.08428955078125, 88.3905029296875, 122.69671630859375, 157.0029296875, 191.30914306640625, 225.6153564453125, 259.92156982421875, 294.227783203125, 328.53399658203125, 362.8402099609375, 397.14642333984375, 431.45263671875, 465.75885009765625, 500.0650634765625, 534.3712768554688, 568.677490234375, 602.9837036132812, 637.2899169921875, 671.5961303710938, 705.90234375, 740.2085571289062, 774.5147705078125, 808.8209838867188, 843.127197265625, 877.4334106445312, 911.7396240234375, 946.0458374023438, 980.35205078125, 1014.6582641601562, 1048.9644775390625, 1083.270751953125, 1117.576904296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 9.0, 12.0, 19.0, 21.0, 35.0, 51.0, 65.0, 115.0, 179.0, 219.0, 394.0, 615.0, 951.0, 1672.0, 2748.0, 4701.0, 8298.0, 15384.0, 32885.0, 85752.0, 320626.0, 1339522.0, 1729423.0, 455544.0, 113433.0, 40213.0, 18555.0, 9664.0, 5367.0, 3000.0, 1786.0, 1106.0, 650.0, 420.0, 274.0, 174.0, 118.0, 100.0, 46.0, 33.0, 25.0, 22.0, 13.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-70.9375, -68.7958984375, -66.654296875, -64.5126953125, -62.37109375, -60.2294921875, -58.087890625, -55.9462890625, -53.8046875, -51.6630859375, -49.521484375, -47.3798828125, -45.23828125, -43.0966796875, -40.955078125, -38.8134765625, -36.671875, -34.5302734375, -32.388671875, -30.2470703125, -28.10546875, -25.9638671875, -23.822265625, -21.6806640625, -19.5390625, -17.3974609375, -15.255859375, -13.1142578125, -10.97265625, -8.8310546875, -6.689453125, -4.5478515625, -2.40625, -0.2646484375, 1.876953125, 4.0185546875, 6.16015625, 8.3017578125, 10.443359375, 12.5849609375, 14.7265625, 16.8681640625, 19.009765625, 21.1513671875, 23.29296875, 25.4345703125, 27.576171875, 29.7177734375, 31.859375, 34.0009765625, 36.142578125, 38.2841796875, 40.42578125, 42.5673828125, 44.708984375, 46.8505859375, 48.9921875, 51.1337890625, 53.275390625, 55.4169921875, 57.55859375, 59.7001953125, 61.841796875, 63.9833984375, 66.125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 9.0, 1.0, 6.0, 11.0, 15.0, 10.0, 21.0, 23.0, 32.0, 34.0, 30.0, 33.0, 32.0, 42.0, 47.0, 41.0, 48.0, 45.0, 66.0, 52.0, 43.0, 51.0, 26.0, 36.0, 44.0, 31.0, 29.0, 24.0, 19.0, 18.0, 8.0, 11.0, 8.0, 6.0, 12.0, 9.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.25, -48.56640625, -46.8828125, -45.19921875, -43.515625, -41.83203125, -40.1484375, -38.46484375, -36.78125, -35.09765625, -33.4140625, -31.73046875, -30.046875, -28.36328125, -26.6796875, -24.99609375, -23.3125, -21.62890625, -19.9453125, -18.26171875, -16.578125, -14.89453125, -13.2109375, -11.52734375, -9.84375, -8.16015625, -6.4765625, -4.79296875, -3.109375, -1.42578125, 0.2578125, 1.94140625, 3.625, 5.30859375, 6.9921875, 8.67578125, 10.359375, 12.04296875, 13.7265625, 15.41015625, 17.09375, 18.77734375, 20.4609375, 22.14453125, 23.828125, 25.51171875, 27.1953125, 28.87890625, 30.5625, 32.24609375, 33.9296875, 35.61328125, 37.296875, 38.98046875, 40.6640625, 42.34765625, 44.03125, 45.71484375, 47.3984375, 49.08203125, 50.765625, 52.44921875, 54.1328125, 55.81640625, 57.5]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 11.0, 17.0, 25.0, 32.0, 73.0, 100.0, 204.0, 477.0, 1070.0, 3308.0, 12926.0, 75528.0, 1882966.0, 2122861.0, 76770.0, 12793.0, 3282.0, 1038.0, 459.0, 164.0, 78.0, 40.0, 20.0, 17.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.25, -258.6328125, -250.015625, -241.3984375, -232.78125, -224.1640625, -215.546875, -206.9296875, -198.3125, -189.6953125, -181.078125, -172.4609375, -163.84375, -155.2265625, -146.609375, -137.9921875, -129.375, -120.7578125, -112.140625, -103.5234375, -94.90625, -86.2890625, -77.671875, -69.0546875, -60.4375, -51.8203125, -43.203125, -34.5859375, -25.96875, -17.3515625, -8.734375, -0.1171875, 8.5, 17.1171875, 25.734375, 34.3515625, 42.96875, 51.5859375, 60.203125, 68.8203125, 77.4375, 86.0546875, 94.671875, 103.2890625, 111.90625, 120.5234375, 129.140625, 137.7578125, 146.375, 154.9921875, 163.609375, 172.2265625, 180.84375, 189.4609375, 198.078125, 206.6953125, 215.3125, 223.9296875, 232.546875, 241.1640625, 249.78125, 258.3984375, 267.015625, 275.6328125, 284.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 9.0, 16.0, 24.0, 27.0, 42.0, 77.0, 88.0, 142.0, 218.0, 436.0, 781.0, 920.0, 522.0, 279.0, 143.0, 108.0, 65.0, 50.0, 36.0, 20.0, 9.0, 15.0, 12.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.0, -329.99609375, -321.9921875, -313.98828125, -305.984375, -297.98046875, -289.9765625, -281.97265625, -273.96875, -265.96484375, -257.9609375, -249.95703125, -241.953125, -233.94921875, -225.9453125, -217.94140625, -209.9375, -201.93359375, -193.9296875, -185.92578125, -177.921875, -169.91796875, -161.9140625, -153.91015625, -145.90625, -137.90234375, -129.8984375, -121.89453125, -113.890625, -105.88671875, -97.8828125, -89.87890625, -81.875, -73.87109375, -65.8671875, -57.86328125, -49.859375, -41.85546875, -33.8515625, -25.84765625, -17.84375, -9.83984375, -1.8359375, 6.16796875, 14.171875, 22.17578125, 30.1796875, 38.18359375, 46.1875, 54.19140625, 62.1953125, 70.19921875, 78.203125, 86.20703125, 94.2109375, 102.21484375, 110.21875, 118.22265625, 126.2265625, 134.23046875, 142.234375, 150.23828125, 158.2421875, 166.24609375, 174.25]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 8.0, 17.0, 51.0, 276.0, 473.0, 137.0, 29.0, 8.0, 3.0, 2.0, 3.0], "bins": [-11731.53515625, -11526.765625, -11321.99609375, -11117.2265625, -10912.45703125, -10707.6875, -10502.91796875, -10298.1494140625, -10093.3798828125, -9888.6103515625, -9683.8408203125, -9479.0712890625, -9274.3017578125, -9069.533203125, -8864.763671875, -8659.994140625, -8455.224609375, -8250.455078125, -8045.685546875, -7840.916015625, -7636.14697265625, -7431.37744140625, -7226.60791015625, -7021.83837890625, -6817.068359375, -6612.298828125, -6407.529296875, -6202.759765625, -5997.99072265625, -5793.22119140625, -5588.45166015625, -5383.68212890625, -5178.91259765625, -4974.14306640625, -4769.37353515625, -4564.6044921875, -4359.8349609375, -4155.0654296875, -3950.2958984375, -3745.5263671875, -3540.75732421875, -3335.98779296875, -3131.218505859375, -2926.448974609375, -2721.6796875, -2516.91015625, -2312.140625, -2107.37109375, -1902.6016845703125, -1697.832275390625, -1493.062744140625, -1288.2933349609375, -1083.52392578125, -878.7545166015625, -673.9849853515625, -469.215576171875, -264.4461669921875, -59.676727294921875, 145.09271240234375, 349.8621826171875, 554.631591796875, 759.4010009765625, 964.1705322265625, 1168.93994140625, 1373.7093505859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 7.0, 11.0, 16.0, 21.0, 21.0, 26.0, 22.0, 30.0, 32.0, 43.0, 35.0, 36.0, 33.0, 40.0, 48.0, 53.0, 51.0, 52.0, 58.0, 42.0, 38.0, 38.0, 33.0, 29.0, 32.0, 24.0, 20.0, 21.0, 17.0, 7.0, 12.0, 8.0, 7.0, 7.0, 7.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-930.379638671875, -898.8958740234375, -867.4120483398438, -835.9282836914062, -804.4445190429688, -772.960693359375, -741.4769287109375, -709.9931640625, -678.5093383789062, -647.0255737304688, -615.541748046875, -584.0579833984375, -552.57421875, -521.0903930664062, -489.60662841796875, -458.1228332519531, -426.6390686035156, -395.1552734375, -363.6715087890625, -332.1877136230469, -300.70391845703125, -269.22015380859375, -237.73635864257812, -206.2525634765625, -174.76878356933594, -143.28500366210938, -111.80120849609375, -80.31742858886719, -48.833641052246094, -17.349853515625, 14.133926391601562, 45.61772155761719, 77.10150146484375, 108.58528900146484, 140.06907653808594, 171.5528564453125, 203.03665161132812, 234.5204315185547, 266.00421142578125, 297.4880065917969, 328.9718017578125, 360.4555969238281, 391.9393615722656, 423.42315673828125, 454.9069519042969, 486.3907470703125, 517.87451171875, 549.3582763671875, 580.842041015625, 612.3258056640625, 643.8096313476562, 675.2933959960938, 706.7771606445312, 738.260986328125, 769.7447509765625, 801.228515625, 832.7123413085938, 864.1961059570312, 895.679931640625, 927.1636962890625, 958.6474609375, 990.1312866210938, 1021.6150512695312, 1053.098876953125, 1084.5826416015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 13.0, 9.0, 25.0, 26.0, 49.0, 57.0, 117.0, 156.0, 227.0, 403.0, 634.0, 1181.0, 2114.0, 3798.0, 7205.0, 14470.0, 29633.0, 63901.0, 144496.0, 337707.0, 246964.0, 103539.0, 46764.0, 21883.0, 10621.0, 5540.0, 3043.0, 1624.0, 889.0, 536.0, 330.0, 207.0, 124.0, 92.0, 55.0, 30.0, 32.0, 13.0, 9.0, 10.0, 4.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-131.125, -127.4619140625, -123.798828125, -120.1357421875, -116.47265625, -112.8095703125, -109.146484375, -105.4833984375, -101.8203125, -98.1572265625, -94.494140625, -90.8310546875, -87.16796875, -83.5048828125, -79.841796875, -76.1787109375, -72.515625, -68.8525390625, -65.189453125, -61.5263671875, -57.86328125, -54.2001953125, -50.537109375, -46.8740234375, -43.2109375, -39.5478515625, -35.884765625, -32.2216796875, -28.55859375, -24.8955078125, -21.232421875, -17.5693359375, -13.90625, -10.2431640625, -6.580078125, -2.9169921875, 0.74609375, 4.4091796875, 8.072265625, 11.7353515625, 15.3984375, 19.0615234375, 22.724609375, 26.3876953125, 30.05078125, 33.7138671875, 37.376953125, 41.0400390625, 44.703125, 48.3662109375, 52.029296875, 55.6923828125, 59.35546875, 63.0185546875, 66.681640625, 70.3447265625, 74.0078125, 77.6708984375, 81.333984375, 84.9970703125, 88.66015625, 92.3232421875, 95.986328125, 99.6494140625, 103.3125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 9.0, 3.0, 5.0, 9.0, 5.0, 8.0, 10.0, 16.0, 20.0, 21.0, 17.0, 29.0, 31.0, 33.0, 28.0, 30.0, 50.0, 42.0, 35.0, 43.0, 43.0, 31.0, 51.0, 44.0, 33.0, 36.0, 27.0, 30.0, 33.0, 26.0, 25.0, 21.0, 21.0, 16.0, 17.0, 16.0, 12.0, 10.0, 9.0, 8.0, 9.0, 9.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-48.96875, -47.32470703125, -45.6806640625, -44.03662109375, -42.392578125, -40.74853515625, -39.1044921875, -37.46044921875, -35.81640625, -34.17236328125, -32.5283203125, -30.88427734375, -29.240234375, -27.59619140625, -25.9521484375, -24.30810546875, -22.6640625, -21.02001953125, -19.3759765625, -17.73193359375, -16.087890625, -14.44384765625, -12.7998046875, -11.15576171875, -9.51171875, -7.86767578125, -6.2236328125, -4.57958984375, -2.935546875, -1.29150390625, 0.3525390625, 1.99658203125, 3.640625, 5.28466796875, 6.9287109375, 8.57275390625, 10.216796875, 11.86083984375, 13.5048828125, 15.14892578125, 16.79296875, 18.43701171875, 20.0810546875, 21.72509765625, 23.369140625, 25.01318359375, 26.6572265625, 28.30126953125, 29.9453125, 31.58935546875, 33.2333984375, 34.87744140625, 36.521484375, 38.16552734375, 39.8095703125, 41.45361328125, 43.09765625, 44.74169921875, 46.3857421875, 48.02978515625, 49.673828125, 51.31787109375, 52.9619140625, 54.60595703125, 56.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 10.0, 10.0, 13.0, 9.0, 17.0, 28.0, 38.0, 50.0, 63.0, 103.0, 135.0, 191.0, 245.0, 453.0, 674.0, 1134.0, 2150.0, 4855.0, 14821.0, 71937.0, 674960.0, 227161.0, 33499.0, 8629.0, 3092.0, 1638.0, 897.0, 536.0, 379.0, 241.0, 142.0, 119.0, 86.0, 53.0, 51.0, 31.0, 23.0, 19.0, 19.0, 11.0, 5.0, 7.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0], "bins": [-322.5, -313.486328125, -304.47265625, -295.458984375, -286.4453125, -277.431640625, -268.41796875, -259.404296875, -250.390625, -241.376953125, -232.36328125, -223.349609375, -214.3359375, -205.322265625, -196.30859375, -187.294921875, -178.28125, -169.267578125, -160.25390625, -151.240234375, -142.2265625, -133.212890625, -124.19921875, -115.185546875, -106.171875, -97.158203125, -88.14453125, -79.130859375, -70.1171875, -61.103515625, -52.08984375, -43.076171875, -34.0625, -25.048828125, -16.03515625, -7.021484375, 1.9921875, 11.005859375, 20.01953125, 29.033203125, 38.046875, 47.060546875, 56.07421875, 65.087890625, 74.1015625, 83.115234375, 92.12890625, 101.142578125, 110.15625, 119.169921875, 128.18359375, 137.197265625, 146.2109375, 155.224609375, 164.23828125, 173.251953125, 182.265625, 191.279296875, 200.29296875, 209.306640625, 218.3203125, 227.333984375, 236.34765625, 245.361328125, 254.375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 10.0, 11.0, 13.0, 15.0, 18.0, 19.0, 19.0, 33.0, 33.0, 43.0, 48.0, 54.0, 56.0, 59.0, 72.0, 54.0, 55.0, 81.0, 60.0, 41.0, 31.0, 45.0, 23.0, 29.0, 13.0, 11.0, 17.0, 14.0, 7.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-451.0, -438.36328125, -425.7265625, -413.08984375, -400.453125, -387.81640625, -375.1796875, -362.54296875, -349.90625, -337.26953125, -324.6328125, -311.99609375, -299.359375, -286.72265625, -274.0859375, -261.44921875, -248.8125, -236.17578125, -223.5390625, -210.90234375, -198.265625, -185.62890625, -172.9921875, -160.35546875, -147.71875, -135.08203125, -122.4453125, -109.80859375, -97.171875, -84.53515625, -71.8984375, -59.26171875, -46.625, -33.98828125, -21.3515625, -8.71484375, 3.921875, 16.55859375, 29.1953125, 41.83203125, 54.46875, 67.10546875, 79.7421875, 92.37890625, 105.015625, 117.65234375, 130.2890625, 142.92578125, 155.5625, 168.19921875, 180.8359375, 193.47265625, 206.109375, 218.74609375, 231.3828125, 244.01953125, 256.65625, 269.29296875, 281.9296875, 294.56640625, 307.203125, 319.83984375, 332.4765625, 345.11328125, 357.75]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 15.0, 12.0, 18.0, 27.0, 53.0, 98.0, 202.0, 358.0, 854.0, 2220.0, 8217.0, 50764.0, 676035.0, 274764.0, 26792.0, 5227.0, 1638.0, 633.0, 280.0, 159.0, 74.0, 39.0, 21.0, 20.0, 13.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.4375, -101.0517578125, -97.666015625, -94.2802734375, -90.89453125, -87.5087890625, -84.123046875, -80.7373046875, -77.3515625, -73.9658203125, -70.580078125, -67.1943359375, -63.80859375, -60.4228515625, -57.037109375, -53.6513671875, -50.265625, -46.8798828125, -43.494140625, -40.1083984375, -36.72265625, -33.3369140625, -29.951171875, -26.5654296875, -23.1796875, -19.7939453125, -16.408203125, -13.0224609375, -9.63671875, -6.2509765625, -2.865234375, 0.5205078125, 3.90625, 7.2919921875, 10.677734375, 14.0634765625, 17.44921875, 20.8349609375, 24.220703125, 27.6064453125, 30.9921875, 34.3779296875, 37.763671875, 41.1494140625, 44.53515625, 47.9208984375, 51.306640625, 54.6923828125, 58.078125, 61.4638671875, 64.849609375, 68.2353515625, 71.62109375, 75.0068359375, 78.392578125, 81.7783203125, 85.1640625, 88.5498046875, 91.935546875, 95.3212890625, 98.70703125, 102.0927734375, 105.478515625, 108.8642578125, 112.25]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 14.0, 7.0, 16.0, 17.0, 23.0, 22.0, 29.0, 35.0, 19.0, 39.0, 48.0, 58.0, 80.0, 87.0, 82.0, 65.0, 55.0, 33.0, 34.0, 43.0, 35.0, 22.0, 24.0, 16.0, 14.0, 18.0, 11.0, 5.0, 6.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0222320556640625, -0.021589994430541992, -0.020947933197021484, -0.020305871963500977, -0.01966381072998047, -0.01902174949645996, -0.018379688262939453, -0.017737627029418945, -0.017095565795898438, -0.01645350456237793, -0.015811443328857422, -0.015169382095336914, -0.014527320861816406, -0.013885259628295898, -0.01324319839477539, -0.012601137161254883, -0.011959075927734375, -0.011317014694213867, -0.01067495346069336, -0.010032892227172852, -0.009390830993652344, -0.008748769760131836, -0.008106708526611328, -0.00746464729309082, -0.0068225860595703125, -0.006180524826049805, -0.005538463592529297, -0.004896402359008789, -0.004254341125488281, -0.0036122798919677734, -0.0029702186584472656, -0.002328157424926758, -0.00168609619140625, -0.0010440349578857422, -0.0004019737243652344, 0.00024008750915527344, 0.0008821487426757812, 0.001524209976196289, 0.002166271209716797, 0.0028083324432373047, 0.0034503936767578125, 0.00409245491027832, 0.004734516143798828, 0.005376577377319336, 0.006018638610839844, 0.0066606998443603516, 0.007302761077880859, 0.007944822311401367, 0.008586883544921875, 0.009228944778442383, 0.00987100601196289, 0.010513067245483398, 0.011155128479003906, 0.011797189712524414, 0.012439250946044922, 0.01308131217956543, 0.013723373413085938, 0.014365434646606445, 0.015007495880126953, 0.01564955711364746, 0.01629161834716797, 0.016933679580688477, 0.017575740814208984, 0.018217802047729492, 0.01885986328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 9.0, 8.0, 6.0, 23.0, 26.0, 59.0, 72.0, 164.0, 322.0, 683.0, 1599.0, 5201.0, 28431.0, 427687.0, 545665.0, 30232.0, 5266.0, 1653.0, 681.0, 347.0, 192.0, 90.0, 59.0, 42.0, 20.0, 12.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-161.75, -158.0751953125, -154.400390625, -150.7255859375, -147.05078125, -143.3759765625, -139.701171875, -136.0263671875, -132.3515625, -128.6767578125, -125.001953125, -121.3271484375, -117.65234375, -113.9775390625, -110.302734375, -106.6279296875, -102.953125, -99.2783203125, -95.603515625, -91.9287109375, -88.25390625, -84.5791015625, -80.904296875, -77.2294921875, -73.5546875, -69.8798828125, -66.205078125, -62.5302734375, -58.85546875, -55.1806640625, -51.505859375, -47.8310546875, -44.15625, -40.4814453125, -36.806640625, -33.1318359375, -29.45703125, -25.7822265625, -22.107421875, -18.4326171875, -14.7578125, -11.0830078125, -7.408203125, -3.7333984375, -0.05859375, 3.6162109375, 7.291015625, 10.9658203125, 14.640625, 18.3154296875, 21.990234375, 25.6650390625, 29.33984375, 33.0146484375, 36.689453125, 40.3642578125, 44.0390625, 47.7138671875, 51.388671875, 55.0634765625, 58.73828125, 62.4130859375, 66.087890625, 69.7626953125, 73.4375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 11.0, 7.0, 18.0, 12.0, 11.0, 18.0, 20.0, 25.0, 32.0, 34.0, 36.0, 39.0, 44.0, 43.0, 45.0, 45.0, 50.0, 50.0, 55.0, 56.0, 38.0, 51.0, 33.0, 34.0, 21.0, 24.0, 24.0, 14.0, 20.0, 10.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.875, -52.10791015625, -50.3408203125, -48.57373046875, -46.806640625, -45.03955078125, -43.2724609375, -41.50537109375, -39.73828125, -37.97119140625, -36.2041015625, -34.43701171875, -32.669921875, -30.90283203125, -29.1357421875, -27.36865234375, -25.6015625, -23.83447265625, -22.0673828125, -20.30029296875, -18.533203125, -16.76611328125, -14.9990234375, -13.23193359375, -11.46484375, -9.69775390625, -7.9306640625, -6.16357421875, -4.396484375, -2.62939453125, -0.8623046875, 0.90478515625, 2.671875, 4.43896484375, 6.2060546875, 7.97314453125, 9.740234375, 11.50732421875, 13.2744140625, 15.04150390625, 16.80859375, 18.57568359375, 20.3427734375, 22.10986328125, 23.876953125, 25.64404296875, 27.4111328125, 29.17822265625, 30.9453125, 32.71240234375, 34.4794921875, 36.24658203125, 38.013671875, 39.78076171875, 41.5478515625, 43.31494140625, 45.08203125, 46.84912109375, 48.6162109375, 50.38330078125, 52.150390625, 53.91748046875, 55.6845703125, 57.45166015625, 59.21875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 18.0, 21.0, 77.0, 160.0, 278.0, 203.0, 114.0, 62.0, 26.0, 13.0, 9.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2113.28076171875, -2031.3466796875, -1949.4127197265625, -1867.478759765625, -1785.544677734375, -1703.610595703125, -1621.6766357421875, -1539.74267578125, -1457.80859375, -1375.87451171875, -1293.9405517578125, -1212.006591796875, -1130.072509765625, -1048.138427734375, -966.2044677734375, -884.2704467773438, -802.33642578125, -720.4024047851562, -638.4683837890625, -556.5343627929688, -474.600341796875, -392.66632080078125, -310.7322998046875, -228.79827880859375, -146.8642578125, -64.93023681640625, 17.0037841796875, 98.93780517578125, 180.871826171875, 262.80584716796875, 344.7398681640625, 426.67388916015625, 508.60791015625, 590.5419311523438, 672.4759521484375, 754.4099731445312, 836.343994140625, 918.2780151367188, 1000.2120361328125, 1082.14599609375, 1164.080078125, 1246.01416015625, 1327.9481201171875, 1409.882080078125, 1491.816162109375, 1573.750244140625, 1655.6842041015625, 1737.6181640625, 1819.55224609375, 1901.486328125, 1983.4202880859375, 2065.354248046875, 2147.288330078125, 2229.222412109375, 2311.15625, 2393.09033203125, 2475.0244140625, 2556.95849609375, 2638.892578125, 2720.826416015625, 2802.760498046875, 2884.694580078125, 2966.62841796875, 3048.5625, 3130.49658203125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 4.0, 9.0, 8.0, 11.0, 14.0, 11.0, 22.0, 18.0, 22.0, 24.0, 22.0, 36.0, 30.0, 43.0, 37.0, 55.0, 76.0, 68.0, 76.0, 61.0, 52.0, 36.0, 38.0, 43.0, 33.0, 25.0, 25.0, 13.0, 16.0, 15.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1455.0361328125, -1411.7655029296875, -1368.4949951171875, -1325.224365234375, -1281.953857421875, -1238.6832275390625, -1195.41259765625, -1152.14208984375, -1108.8714599609375, -1065.600830078125, -1022.330322265625, -979.0596923828125, -935.7891235351562, -892.5185546875, -849.2479248046875, -805.9773559570312, -762.706787109375, -719.4362182617188, -676.1656494140625, -632.89501953125, -589.6244506835938, -546.3538818359375, -503.0832824707031, -459.81268310546875, -416.5421142578125, -373.27154541015625, -330.0009460449219, -286.7303466796875, -243.45977783203125, -200.18919372558594, -156.91860961914062, -113.64801025390625, -70.3773193359375, -27.106735229492188, 16.163848876953125, 59.43443298339844, 102.70501708984375, 145.97560119628906, 189.24618530273438, 232.51678466796875, 275.787353515625, 319.05792236328125, 362.3285217285156, 405.59912109375, 448.86968994140625, 492.1402587890625, 535.410888671875, 578.6814575195312, 621.9520263671875, 665.2225952148438, 708.4931640625, 751.7637939453125, 795.0343627929688, 838.304931640625, 881.5755615234375, 924.8461303710938, 968.11669921875, 1011.3872680664062, 1054.6578369140625, 1097.928466796875, 1141.198974609375, 1184.4696044921875, 1227.740234375, 1271.0107421875, 1314.2813720703125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 10.0, 15.0, 34.0, 40.0, 57.0, 86.0, 150.0, 240.0, 436.0, 701.0, 1196.0, 2104.0, 3890.0, 7216.0, 14909.0, 36036.0, 116678.0, 493805.0, 1742292.0, 1326649.0, 319126.0, 77136.0, 26521.0, 11622.0, 5715.0, 3136.0, 1821.0, 991.0, 614.0, 362.0, 243.0, 139.0, 99.0, 57.0, 48.0, 35.0, 21.0, 19.0, 13.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.40625, -52.21728515625, -50.0283203125, -47.83935546875, -45.650390625, -43.46142578125, -41.2724609375, -39.08349609375, -36.89453125, -34.70556640625, -32.5166015625, -30.32763671875, -28.138671875, -25.94970703125, -23.7607421875, -21.57177734375, -19.3828125, -17.19384765625, -15.0048828125, -12.81591796875, -10.626953125, -8.43798828125, -6.2490234375, -4.06005859375, -1.87109375, 0.31787109375, 2.5068359375, 4.69580078125, 6.884765625, 9.07373046875, 11.2626953125, 13.45166015625, 15.640625, 17.82958984375, 20.0185546875, 22.20751953125, 24.396484375, 26.58544921875, 28.7744140625, 30.96337890625, 33.15234375, 35.34130859375, 37.5302734375, 39.71923828125, 41.908203125, 44.09716796875, 46.2861328125, 48.47509765625, 50.6640625, 52.85302734375, 55.0419921875, 57.23095703125, 59.419921875, 61.60888671875, 63.7978515625, 65.98681640625, 68.17578125, 70.36474609375, 72.5537109375, 74.74267578125, 76.931640625, 79.12060546875, 81.3095703125, 83.49853515625, 85.6875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 7.0, 5.0, 14.0, 12.0, 19.0, 26.0, 22.0, 48.0, 42.0, 44.0, 67.0, 51.0, 70.0, 66.0, 60.0, 60.0, 57.0, 51.0, 51.0, 46.0, 34.0, 41.0, 26.0, 17.0, 18.0, 12.0, 14.0, 1.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.8125, -74.1767578125, -71.541015625, -68.9052734375, -66.26953125, -63.6337890625, -60.998046875, -58.3623046875, -55.7265625, -53.0908203125, -50.455078125, -47.8193359375, -45.18359375, -42.5478515625, -39.912109375, -37.2763671875, -34.640625, -32.0048828125, -29.369140625, -26.7333984375, -24.09765625, -21.4619140625, -18.826171875, -16.1904296875, -13.5546875, -10.9189453125, -8.283203125, -5.6474609375, -3.01171875, -0.3759765625, 2.259765625, 4.8955078125, 7.53125, 10.1669921875, 12.802734375, 15.4384765625, 18.07421875, 20.7099609375, 23.345703125, 25.9814453125, 28.6171875, 31.2529296875, 33.888671875, 36.5244140625, 39.16015625, 41.7958984375, 44.431640625, 47.0673828125, 49.703125, 52.3388671875, 54.974609375, 57.6103515625, 60.24609375, 62.8818359375, 65.517578125, 68.1533203125, 70.7890625, 73.4248046875, 76.060546875, 78.6962890625, 81.33203125, 83.9677734375, 86.603515625, 89.2392578125, 91.875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 8.0, 12.0, 12.0, 14.0, 27.0, 27.0, 62.0, 107.0, 144.0, 262.0, 524.0, 1083.0, 2562.0, 6578.0, 19987.0, 73282.0, 457305.0, 3117858.0, 413408.0, 69165.0, 19935.0, 6817.0, 2677.0, 1129.0, 559.0, 269.0, 146.0, 103.0, 59.0, 46.0, 34.0, 16.0, 26.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-136.875, -132.232421875, -127.58984375, -122.947265625, -118.3046875, -113.662109375, -109.01953125, -104.376953125, -99.734375, -95.091796875, -90.44921875, -85.806640625, -81.1640625, -76.521484375, -71.87890625, -67.236328125, -62.59375, -57.951171875, -53.30859375, -48.666015625, -44.0234375, -39.380859375, -34.73828125, -30.095703125, -25.453125, -20.810546875, -16.16796875, -11.525390625, -6.8828125, -2.240234375, 2.40234375, 7.044921875, 11.6875, 16.330078125, 20.97265625, 25.615234375, 30.2578125, 34.900390625, 39.54296875, 44.185546875, 48.828125, 53.470703125, 58.11328125, 62.755859375, 67.3984375, 72.041015625, 76.68359375, 81.326171875, 85.96875, 90.611328125, 95.25390625, 99.896484375, 104.5390625, 109.181640625, 113.82421875, 118.466796875, 123.109375, 127.751953125, 132.39453125, 137.037109375, 141.6796875, 146.322265625, 150.96484375, 155.607421875, 160.25]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 5.0, 8.0, 15.0, 12.0, 15.0, 33.0, 35.0, 35.0, 57.0, 70.0, 87.0, 118.0, 151.0, 226.0, 359.0, 443.0, 531.0, 515.0, 357.0, 261.0, 175.0, 127.0, 83.0, 67.0, 45.0, 42.0, 29.0, 27.0, 19.0, 20.0, 16.0, 10.0, 9.0, 7.0, 10.0, 4.0, 3.0, 9.0, 1.0, 7.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-131.875, -127.5703125, -123.265625, -118.9609375, -114.65625, -110.3515625, -106.046875, -101.7421875, -97.4375, -93.1328125, -88.828125, -84.5234375, -80.21875, -75.9140625, -71.609375, -67.3046875, -63.0, -58.6953125, -54.390625, -50.0859375, -45.78125, -41.4765625, -37.171875, -32.8671875, -28.5625, -24.2578125, -19.953125, -15.6484375, -11.34375, -7.0390625, -2.734375, 1.5703125, 5.875, 10.1796875, 14.484375, 18.7890625, 23.09375, 27.3984375, 31.703125, 36.0078125, 40.3125, 44.6171875, 48.921875, 53.2265625, 57.53125, 61.8359375, 66.140625, 70.4453125, 74.75, 79.0546875, 83.359375, 87.6640625, 91.96875, 96.2734375, 100.578125, 104.8828125, 109.1875, 113.4921875, 117.796875, 122.1015625, 126.40625, 130.7109375, 135.015625, 139.3203125, 143.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 10.0, 56.0, 349.0, 439.0, 113.0, 20.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1325.0260009765625, -1164.0267333984375, -1003.027587890625, -842.0283203125, -681.0291137695312, -520.0299072265625, -359.0306396484375, -198.031494140625, -37.0322265625, 123.96699523925781, 284.9662170410156, 445.9654541015625, 606.9646606445312, 767.9638671875, 928.963134765625, 1089.9622802734375, 1250.9615478515625, 1411.9608154296875, 1572.9599609375, 1733.959228515625, 1894.95849609375, 2055.95751953125, 2216.95703125, 2377.9560546875, 2538.955322265625, 2699.95458984375, 2860.953857421875, 3021.953125, 3182.9521484375, 3343.951416015625, 3504.95068359375, 3665.94970703125, 3826.94873046875, 3987.947998046875, 4148.947265625, 4309.9462890625, 4470.94580078125, 4631.94482421875, 4792.9443359375, 4953.943359375, 5114.9423828125, 5275.94140625, 5436.94091796875, 5597.93994140625, 5758.939453125, 5919.9384765625, 6080.9375, 6241.93701171875, 6402.9365234375, 6563.935546875, 6724.93505859375, 6885.93408203125, 7046.93359375, 7207.9326171875, 7368.931640625, 7529.93115234375, 7690.93017578125, 7851.92919921875, 8012.9287109375, 8173.927734375, 8334.9267578125, 8495.92578125, 8656.92578125, 8817.9248046875, 8978.923828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 4.0, 5.0, 4.0, 7.0, 9.0, 17.0, 8.0, 18.0, 19.0, 19.0, 25.0, 25.0, 32.0, 24.0, 27.0, 34.0, 39.0, 50.0, 34.0, 57.0, 52.0, 50.0, 51.0, 41.0, 44.0, 40.0, 24.0, 38.0, 25.0, 35.0, 23.0, 13.0, 24.0, 16.0, 8.0, 9.0, 7.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-795.8304443359375, -770.4745483398438, -745.1187133789062, -719.7628173828125, -694.406982421875, -669.0510864257812, -643.6952514648438, -618.33935546875, -592.9835205078125, -567.6276245117188, -542.2717895507812, -516.9158935546875, -491.56005859375, -466.2041931152344, -440.84832763671875, -415.492431640625, -390.1365661621094, -364.78070068359375, -339.4248352050781, -314.0689697265625, -288.7131042480469, -263.35723876953125, -238.00135803222656, -212.64549255371094, -187.2896270751953, -161.9337615966797, -136.57789611816406, -111.2220230102539, -85.86615753173828, -60.510292053222656, -35.1544189453125, -9.798553466796875, 15.55731201171875, 40.913177490234375, 66.26904296875, 91.62491607666016, 116.98078155517578, 142.33663940429688, 167.69252014160156, 193.0483856201172, 218.4042510986328, 243.76011657714844, 269.1159973144531, 294.47186279296875, 319.8277282714844, 345.18359375, 370.5394592285156, 395.89532470703125, 421.2511901855469, 446.6070556640625, 471.9629211425781, 497.31878662109375, 522.6746826171875, 548.030517578125, 573.3864135742188, 598.7422485351562, 624.09814453125, 649.4540405273438, 674.8098754882812, 700.165771484375, 725.5216064453125, 750.8775024414062, 776.2333374023438, 801.5892333984375, 826.945068359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 18.0, 19.0, 33.0, 37.0, 61.0, 109.0, 145.0, 217.0, 345.0, 543.0, 887.0, 1516.0, 2699.0, 5034.0, 9780.0, 19612.0, 41800.0, 93534.0, 237262.0, 357681.0, 152782.0, 64383.0, 29486.0, 14233.0, 7151.0, 3899.0, 2121.0, 1202.0, 706.0, 441.0, 258.0, 182.0, 124.0, 77.0, 69.0, 31.0, 19.0, 19.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-104.8125, -101.4609375, -98.109375, -94.7578125, -91.40625, -88.0546875, -84.703125, -81.3515625, -78.0, -74.6484375, -71.296875, -67.9453125, -64.59375, -61.2421875, -57.890625, -54.5390625, -51.1875, -47.8359375, -44.484375, -41.1328125, -37.78125, -34.4296875, -31.078125, -27.7265625, -24.375, -21.0234375, -17.671875, -14.3203125, -10.96875, -7.6171875, -4.265625, -0.9140625, 2.4375, 5.7890625, 9.140625, 12.4921875, 15.84375, 19.1953125, 22.546875, 25.8984375, 29.25, 32.6015625, 35.953125, 39.3046875, 42.65625, 46.0078125, 49.359375, 52.7109375, 56.0625, 59.4140625, 62.765625, 66.1171875, 69.46875, 72.8203125, 76.171875, 79.5234375, 82.875, 86.2265625, 89.578125, 92.9296875, 96.28125, 99.6328125, 102.984375, 106.3359375, 109.6875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 3.0, 15.0, 13.0, 21.0, 20.0, 23.0, 28.0, 46.0, 31.0, 48.0, 50.0, 54.0, 52.0, 57.0, 53.0, 54.0, 49.0, 49.0, 46.0, 47.0, 44.0, 39.0, 24.0, 23.0, 24.0, 17.0, 9.0, 13.0, 10.0, 10.0, 5.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.25, -65.7763671875, -63.302734375, -60.8291015625, -58.35546875, -55.8818359375, -53.408203125, -50.9345703125, -48.4609375, -45.9873046875, -43.513671875, -41.0400390625, -38.56640625, -36.0927734375, -33.619140625, -31.1455078125, -28.671875, -26.1982421875, -23.724609375, -21.2509765625, -18.77734375, -16.3037109375, -13.830078125, -11.3564453125, -8.8828125, -6.4091796875, -3.935546875, -1.4619140625, 1.01171875, 3.4853515625, 5.958984375, 8.4326171875, 10.90625, 13.3798828125, 15.853515625, 18.3271484375, 20.80078125, 23.2744140625, 25.748046875, 28.2216796875, 30.6953125, 33.1689453125, 35.642578125, 38.1162109375, 40.58984375, 43.0634765625, 45.537109375, 48.0107421875, 50.484375, 52.9580078125, 55.431640625, 57.9052734375, 60.37890625, 62.8525390625, 65.326171875, 67.7998046875, 70.2734375, 72.7470703125, 75.220703125, 77.6943359375, 80.16796875, 82.6416015625, 85.115234375, 87.5888671875, 90.0625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 13.0, 11.0, 28.0, 32.0, 40.0, 70.0, 109.0, 185.0, 284.0, 445.0, 871.0, 1825.0, 5308.0, 24887.0, 236698.0, 708712.0, 54884.0, 8888.0, 2598.0, 1095.0, 601.0, 344.0, 208.0, 134.0, 97.0, 64.0, 38.0, 20.0, 18.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-331.0, -321.3203125, -311.640625, -301.9609375, -292.28125, -282.6015625, -272.921875, -263.2421875, -253.5625, -243.8828125, -234.203125, -224.5234375, -214.84375, -205.1640625, -195.484375, -185.8046875, -176.125, -166.4453125, -156.765625, -147.0859375, -137.40625, -127.7265625, -118.046875, -108.3671875, -98.6875, -89.0078125, -79.328125, -69.6484375, -59.96875, -50.2890625, -40.609375, -30.9296875, -21.25, -11.5703125, -1.890625, 7.7890625, 17.46875, 27.1484375, 36.828125, 46.5078125, 56.1875, 65.8671875, 75.546875, 85.2265625, 94.90625, 104.5859375, 114.265625, 123.9453125, 133.625, 143.3046875, 152.984375, 162.6640625, 172.34375, 182.0234375, 191.703125, 201.3828125, 211.0625, 220.7421875, 230.421875, 240.1015625, 249.78125, 259.4609375, 269.140625, 278.8203125, 288.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 9.0, 19.0, 25.0, 21.0, 37.0, 46.0, 45.0, 47.0, 68.0, 48.0, 68.0, 64.0, 60.0, 60.0, 69.0, 55.0, 41.0, 44.0, 39.0, 21.0, 24.0, 28.0, 17.0, 16.0, 10.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.75, -287.78125, -275.8125, -263.84375, -251.875, -239.90625, -227.9375, -215.96875, -204.0, -192.03125, -180.0625, -168.09375, -156.125, -144.15625, -132.1875, -120.21875, -108.25, -96.28125, -84.3125, -72.34375, -60.375, -48.40625, -36.4375, -24.46875, -12.5, -0.53125, 11.4375, 23.40625, 35.375, 47.34375, 59.3125, 71.28125, 83.25, 95.21875, 107.1875, 119.15625, 131.125, 143.09375, 155.0625, 167.03125, 179.0, 190.96875, 202.9375, 214.90625, 226.875, 238.84375, 250.8125, 262.78125, 274.75, 286.71875, 298.6875, 310.65625, 322.625, 334.59375, 346.5625, 358.53125, 370.5, 382.46875, 394.4375, 406.40625, 418.375, 430.34375, 442.3125, 454.28125, 466.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 6.0, 4.0, 8.0, 12.0, 21.0, 19.0, 29.0, 42.0, 73.0, 117.0, 181.0, 307.0, 489.0, 1037.0, 2349.0, 5822.0, 18135.0, 82304.0, 583264.0, 283092.0, 50661.0, 12485.0, 4330.0, 1777.0, 820.0, 444.0, 257.0, 148.0, 96.0, 59.0, 38.0, 23.0, 24.0, 21.0, 10.0, 8.0, 5.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-63.3125, -61.38525390625, -59.4580078125, -57.53076171875, -55.603515625, -53.67626953125, -51.7490234375, -49.82177734375, -47.89453125, -45.96728515625, -44.0400390625, -42.11279296875, -40.185546875, -38.25830078125, -36.3310546875, -34.40380859375, -32.4765625, -30.54931640625, -28.6220703125, -26.69482421875, -24.767578125, -22.84033203125, -20.9130859375, -18.98583984375, -17.05859375, -15.13134765625, -13.2041015625, -11.27685546875, -9.349609375, -7.42236328125, -5.4951171875, -3.56787109375, -1.640625, 0.28662109375, 2.2138671875, 4.14111328125, 6.068359375, 7.99560546875, 9.9228515625, 11.85009765625, 13.77734375, 15.70458984375, 17.6318359375, 19.55908203125, 21.486328125, 23.41357421875, 25.3408203125, 27.26806640625, 29.1953125, 31.12255859375, 33.0498046875, 34.97705078125, 36.904296875, 38.83154296875, 40.7587890625, 42.68603515625, 44.61328125, 46.54052734375, 48.4677734375, 50.39501953125, 52.322265625, 54.24951171875, 56.1767578125, 58.10400390625, 60.03125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 8.0, 8.0, 9.0, 17.0, 34.0, 37.0, 52.0, 74.0, 96.0, 116.0, 142.0, 109.0, 72.0, 66.0, 54.0, 24.0, 19.0, 12.0, 9.0, 5.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0390625, -0.038178443908691406, -0.03729438781738281, -0.03641033172607422, -0.035526275634765625, -0.03464221954345703, -0.03375816345214844, -0.032874107360839844, -0.03199005126953125, -0.031105995178222656, -0.030221939086914062, -0.02933788299560547, -0.028453826904296875, -0.02756977081298828, -0.026685714721679688, -0.025801658630371094, -0.0249176025390625, -0.024033546447753906, -0.023149490356445312, -0.02226543426513672, -0.021381378173828125, -0.02049732208251953, -0.019613265991210938, -0.018729209899902344, -0.01784515380859375, -0.016961097717285156, -0.016077041625976562, -0.015192985534667969, -0.014308929443359375, -0.013424873352050781, -0.012540817260742188, -0.011656761169433594, -0.010772705078125, -0.009888648986816406, -0.009004592895507812, -0.008120536804199219, -0.007236480712890625, -0.006352424621582031, -0.0054683685302734375, -0.004584312438964844, -0.00370025634765625, -0.0028162002563476562, -0.0019321441650390625, -0.0010480880737304688, -0.000164031982421875, 0.0007200241088867188, 0.0016040802001953125, 0.0024881362915039062, 0.0033721923828125, 0.004256248474121094, 0.0051403045654296875, 0.006024360656738281, 0.006908416748046875, 0.007792472839355469, 0.008676528930664062, 0.009560585021972656, 0.01044464111328125, 0.011328697204589844, 0.012212753295898438, 0.013096809387207031, 0.013980865478515625, 0.014864921569824219, 0.015748977661132812, 0.016633033752441406, 0.01751708984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 12.0, 16.0, 16.0, 41.0, 76.0, 188.0, 471.0, 1364.0, 6576.0, 119533.0, 881243.0, 34024.0, 3517.0, 890.0, 294.0, 148.0, 59.0, 26.0, 20.0, 14.0, 14.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.625, -96.48828125, -92.3515625, -88.21484375, -84.078125, -79.94140625, -75.8046875, -71.66796875, -67.53125, -63.39453125, -59.2578125, -55.12109375, -50.984375, -46.84765625, -42.7109375, -38.57421875, -34.4375, -30.30078125, -26.1640625, -22.02734375, -17.890625, -13.75390625, -9.6171875, -5.48046875, -1.34375, 2.79296875, 6.9296875, 11.06640625, 15.203125, 19.33984375, 23.4765625, 27.61328125, 31.75, 35.88671875, 40.0234375, 44.16015625, 48.296875, 52.43359375, 56.5703125, 60.70703125, 64.84375, 68.98046875, 73.1171875, 77.25390625, 81.390625, 85.52734375, 89.6640625, 93.80078125, 97.9375, 102.07421875, 106.2109375, 110.34765625, 114.484375, 118.62109375, 122.7578125, 126.89453125, 131.03125, 135.16796875, 139.3046875, 143.44140625, 147.578125, 151.71484375, 155.8515625, 159.98828125, 164.125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 8.0, 14.0, 17.0, 22.0, 31.0, 27.0, 46.0, 45.0, 52.0, 48.0, 66.0, 77.0, 75.0, 74.0, 64.0, 57.0, 57.0, 40.0, 42.0, 41.0, 28.0, 15.0, 15.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.1875, -58.33935546875, -56.4912109375, -54.64306640625, -52.794921875, -50.94677734375, -49.0986328125, -47.25048828125, -45.40234375, -43.55419921875, -41.7060546875, -39.85791015625, -38.009765625, -36.16162109375, -34.3134765625, -32.46533203125, -30.6171875, -28.76904296875, -26.9208984375, -25.07275390625, -23.224609375, -21.37646484375, -19.5283203125, -17.68017578125, -15.83203125, -13.98388671875, -12.1357421875, -10.28759765625, -8.439453125, -6.59130859375, -4.7431640625, -2.89501953125, -1.046875, 0.80126953125, 2.6494140625, 4.49755859375, 6.345703125, 8.19384765625, 10.0419921875, 11.89013671875, 13.73828125, 15.58642578125, 17.4345703125, 19.28271484375, 21.130859375, 22.97900390625, 24.8271484375, 26.67529296875, 28.5234375, 30.37158203125, 32.2197265625, 34.06787109375, 35.916015625, 37.76416015625, 39.6123046875, 41.46044921875, 43.30859375, 45.15673828125, 47.0048828125, 48.85302734375, 50.701171875, 52.54931640625, 54.3974609375, 56.24560546875, 58.09375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 8.0, 29.0, 58.0, 157.0, 324.0, 244.0, 95.0, 50.0, 14.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2960.052978515625, -2874.81982421875, -2789.586669921875, -2704.353515625, -2619.120361328125, -2533.88720703125, -2448.654052734375, -2363.4208984375, -2278.187744140625, -2192.95458984375, -2107.721435546875, -2022.48828125, -1937.255126953125, -1852.02197265625, -1766.788818359375, -1681.5556640625, -1596.322509765625, -1511.08935546875, -1425.856201171875, -1340.623046875, -1255.389892578125, -1170.15673828125, -1084.923583984375, -999.6904296875, -914.457275390625, -829.22412109375, -743.990966796875, -658.7578125, -573.524658203125, -488.29150390625, -403.058349609375, -317.8251953125, -232.592041015625, -147.35888671875, -62.125732421875, 23.107421875, 108.340576171875, 193.57373046875, 278.806884765625, 364.0400390625, 449.273193359375, 534.50634765625, 619.739501953125, 704.97265625, 790.205810546875, 875.43896484375, 960.672119140625, 1045.9052734375, 1131.138427734375, 1216.37158203125, 1301.604736328125, 1386.837890625, 1472.071044921875, 1557.30419921875, 1642.537353515625, 1727.7705078125, 1813.003662109375, 1898.23681640625, 1983.469970703125, 2068.703125, 2153.936279296875, 2239.16943359375, 2324.402587890625, 2409.6357421875, 2494.868896484375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 9.0, 13.0, 12.0, 14.0, 12.0, 14.0, 14.0, 26.0, 32.0, 32.0, 38.0, 30.0, 33.0, 47.0, 51.0, 57.0, 82.0, 61.0, 47.0, 39.0, 29.0, 30.0, 23.0, 33.0, 22.0, 35.0, 21.0, 21.0, 15.0, 9.0, 13.0, 14.0, 9.0, 7.0, 5.0, 5.0, 7.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1181.378662109375, -1148.8143310546875, -1116.25, -1083.685791015625, -1051.1214599609375, -1018.55712890625, -985.9927978515625, -953.428466796875, -920.8641967773438, -888.2998657226562, -855.735595703125, -823.1712646484375, -790.60693359375, -758.0426635742188, -725.4783325195312, -692.9140625, -660.3497314453125, -627.785400390625, -595.2211303710938, -562.6567993164062, -530.092529296875, -497.5281982421875, -464.9638671875, -432.3995666503906, -399.83526611328125, -367.2709655761719, -334.7066650390625, -302.142333984375, -269.5780334472656, -237.01373291015625, -204.4494171142578, -171.88510131835938, -139.32086181640625, -106.75655364990234, -74.19224548339844, -41.62793731689453, -9.063629150390625, 23.50067138671875, 56.06498718261719, 88.62930297851562, 121.193603515625, 153.75790405273438, 186.3222198486328, 218.88653564453125, 251.45083618164062, 284.01513671875, 316.5794677734375, 349.1437683105469, 381.70806884765625, 414.2723693847656, 446.836669921875, 479.4010009765625, 511.9653015136719, 544.5296020507812, 577.0939331054688, 609.658203125, 642.2225341796875, 674.786865234375, 707.3511352539062, 739.9154663085938, 772.479736328125, 805.0440673828125, 837.6083984375, 870.1727294921875, 902.7369995117188]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 9.0, 22.0, 33.0, 46.0, 60.0, 78.0, 146.0, 228.0, 406.0, 697.0, 1339.0, 2702.0, 6160.0, 16755.0, 69253.0, 536323.0, 2578308.0, 847198.0, 98720.0, 21584.0, 7502.0, 3215.0, 1529.0, 789.0, 438.0, 244.0, 149.0, 83.0, 77.0, 44.0, 32.0, 25.0, 18.0, 15.0, 7.0, 5.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5625, -97.380859375, -94.19921875, -91.017578125, -87.8359375, -84.654296875, -81.47265625, -78.291015625, -75.109375, -71.927734375, -68.74609375, -65.564453125, -62.3828125, -59.201171875, -56.01953125, -52.837890625, -49.65625, -46.474609375, -43.29296875, -40.111328125, -36.9296875, -33.748046875, -30.56640625, -27.384765625, -24.203125, -21.021484375, -17.83984375, -14.658203125, -11.4765625, -8.294921875, -5.11328125, -1.931640625, 1.25, 4.431640625, 7.61328125, 10.794921875, 13.9765625, 17.158203125, 20.33984375, 23.521484375, 26.703125, 29.884765625, 33.06640625, 36.248046875, 39.4296875, 42.611328125, 45.79296875, 48.974609375, 52.15625, 55.337890625, 58.51953125, 61.701171875, 64.8828125, 68.064453125, 71.24609375, 74.427734375, 77.609375, 80.791015625, 83.97265625, 87.154296875, 90.3359375, 93.517578125, 96.69921875, 99.880859375, 103.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 7.0, 6.0, 8.0, 14.0, 16.0, 18.0, 26.0, 29.0, 35.0, 28.0, 30.0, 40.0, 30.0, 35.0, 44.0, 50.0, 42.0, 57.0, 52.0, 36.0, 46.0, 41.0, 35.0, 35.0, 29.0, 32.0, 34.0, 23.0, 21.0, 21.0, 12.0, 16.0, 10.0, 7.0, 4.0, 11.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.90625, -61.87841796875, -59.8505859375, -57.82275390625, -55.794921875, -53.76708984375, -51.7392578125, -49.71142578125, -47.68359375, -45.65576171875, -43.6279296875, -41.60009765625, -39.572265625, -37.54443359375, -35.5166015625, -33.48876953125, -31.4609375, -29.43310546875, -27.4052734375, -25.37744140625, -23.349609375, -21.32177734375, -19.2939453125, -17.26611328125, -15.23828125, -13.21044921875, -11.1826171875, -9.15478515625, -7.126953125, -5.09912109375, -3.0712890625, -1.04345703125, 0.984375, 3.01220703125, 5.0400390625, 7.06787109375, 9.095703125, 11.12353515625, 13.1513671875, 15.17919921875, 17.20703125, 19.23486328125, 21.2626953125, 23.29052734375, 25.318359375, 27.34619140625, 29.3740234375, 31.40185546875, 33.4296875, 35.45751953125, 37.4853515625, 39.51318359375, 41.541015625, 43.56884765625, 45.5966796875, 47.62451171875, 49.65234375, 51.68017578125, 53.7080078125, 55.73583984375, 57.763671875, 59.79150390625, 61.8193359375, 63.84716796875, 65.875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 7.0, 17.0, 24.0, 27.0, 53.0, 78.0, 114.0, 220.0, 532.0, 1393.0, 4674.0, 22882.0, 278022.0, 3724162.0, 140391.0, 16005.0, 3623.0, 1148.0, 460.0, 181.0, 108.0, 47.0, 37.0, 18.0, 13.0, 7.0, 9.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-275.0, -267.23046875, -259.4609375, -251.69140625, -243.921875, -236.15234375, -228.3828125, -220.61328125, -212.84375, -205.07421875, -197.3046875, -189.53515625, -181.765625, -173.99609375, -166.2265625, -158.45703125, -150.6875, -142.91796875, -135.1484375, -127.37890625, -119.609375, -111.83984375, -104.0703125, -96.30078125, -88.53125, -80.76171875, -72.9921875, -65.22265625, -57.453125, -49.68359375, -41.9140625, -34.14453125, -26.375, -18.60546875, -10.8359375, -3.06640625, 4.703125, 12.47265625, 20.2421875, 28.01171875, 35.78125, 43.55078125, 51.3203125, 59.08984375, 66.859375, 74.62890625, 82.3984375, 90.16796875, 97.9375, 105.70703125, 113.4765625, 121.24609375, 129.015625, 136.78515625, 144.5546875, 152.32421875, 160.09375, 167.86328125, 175.6328125, 183.40234375, 191.171875, 198.94140625, 206.7109375, 214.48046875, 222.25]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 13.0, 16.0, 13.0, 17.0, 28.0, 36.0, 49.0, 82.0, 136.0, 217.0, 428.0, 651.0, 800.0, 598.0, 369.0, 189.0, 129.0, 70.0, 60.0, 35.0, 22.0, 22.0, 13.0, 12.0, 11.0, 11.0, 14.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.625, -203.05078125, -197.4765625, -191.90234375, -186.328125, -180.75390625, -175.1796875, -169.60546875, -164.03125, -158.45703125, -152.8828125, -147.30859375, -141.734375, -136.16015625, -130.5859375, -125.01171875, -119.4375, -113.86328125, -108.2890625, -102.71484375, -97.140625, -91.56640625, -85.9921875, -80.41796875, -74.84375, -69.26953125, -63.6953125, -58.12109375, -52.546875, -46.97265625, -41.3984375, -35.82421875, -30.25, -24.67578125, -19.1015625, -13.52734375, -7.953125, -2.37890625, 3.1953125, 8.76953125, 14.34375, 19.91796875, 25.4921875, 31.06640625, 36.640625, 42.21484375, 47.7890625, 53.36328125, 58.9375, 64.51171875, 70.0859375, 75.66015625, 81.234375, 86.80859375, 92.3828125, 97.95703125, 103.53125, 109.10546875, 114.6796875, 120.25390625, 125.828125, 131.40234375, 136.9765625, 142.55078125, 148.125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 5.0, 14.0, 33.0, 62.0, 166.0, 259.0, 198.0, 133.0, 55.0, 26.0, 20.0, 8.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1606.7406005859375, -1539.2440185546875, -1471.74755859375, -1404.2509765625, -1336.75439453125, -1269.2578125, -1201.7613525390625, -1134.2647705078125, -1066.768310546875, -999.2717895507812, -931.7752075195312, -864.2786865234375, -796.7821044921875, -729.2855834960938, -661.7890625, -594.29248046875, -526.7958984375, -459.2993469238281, -391.80279541015625, -324.3062744140625, -256.8097229003906, -189.31317138671875, -121.816650390625, -54.320098876953125, 13.17645263671875, 80.6729965209961, 148.16954040527344, 215.66607666015625, 283.1626281738281, 350.6591796875, 418.15570068359375, 485.6522521972656, 553.148681640625, 620.6452026367188, 688.1417846679688, 755.6383056640625, 823.1348876953125, 890.6314086914062, 958.1279296875, 1025.62451171875, 1093.12109375, 1160.61767578125, 1228.1141357421875, 1295.6107177734375, 1363.1072998046875, 1430.603759765625, 1498.100341796875, 1565.596923828125, 1633.0933837890625, 1700.5899658203125, 1768.08642578125, 1835.5830078125, 1903.07958984375, 1970.576171875, 2038.0726318359375, 2105.569091796875, 2173.065673828125, 2240.562255859375, 2308.058837890625, 2375.55517578125, 2443.0517578125, 2510.54833984375, 2578.044921875, 2645.54150390625, 2713.0380859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 14.0, 10.0, 16.0, 15.0, 18.0, 23.0, 23.0, 26.0, 35.0, 33.0, 29.0, 50.0, 36.0, 50.0, 46.0, 44.0, 55.0, 51.0, 52.0, 47.0, 49.0, 35.0, 39.0, 29.0, 33.0, 21.0, 23.0, 16.0, 18.0, 12.0, 13.0, 11.0, 5.0, 3.0, 8.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-986.668701171875, -959.8295288085938, -932.9903564453125, -906.1511840820312, -879.31201171875, -852.472900390625, -825.6337280273438, -798.7945556640625, -771.9553833007812, -745.1162109375, -718.2770385742188, -691.4378662109375, -664.5987548828125, -637.759521484375, -610.92041015625, -584.0812377929688, -557.2420654296875, -530.4028930664062, -503.563720703125, -476.7245788574219, -449.8854064941406, -423.0462341308594, -396.20709228515625, -369.367919921875, -342.52874755859375, -315.6895751953125, -288.85040283203125, -262.0112609863281, -235.17208862304688, -208.33291625976562, -181.49375915527344, -154.65460205078125, -127.81549072265625, -100.97632598876953, -74.13716125488281, -47.297996520996094, -20.458831787109375, 6.380340576171875, 33.21949768066406, 60.05865478515625, 86.8978271484375, 113.73699188232422, 140.57615661621094, 167.41531372070312, 194.25448608398438, 221.09365844726562, 247.9328155517578, 274.77197265625, 301.61114501953125, 328.4503173828125, 355.28948974609375, 382.1286315917969, 408.9678039550781, 435.8069763183594, 462.6461181640625, 489.48529052734375, 516.324462890625, 543.1636352539062, 570.0028076171875, 596.8419799804688, 623.68115234375, 650.520263671875, 677.3594360351562, 704.1986083984375, 731.0377807617188]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 11.0, 15.0, 23.0, 39.0, 36.0, 92.0, 131.0, 232.0, 414.0, 704.0, 1363.0, 2469.0, 5103.0, 10753.0, 24717.0, 61592.0, 163224.0, 352961.0, 256356.0, 99008.0, 38369.0, 16187.0, 7175.0, 3538.0, 1733.0, 981.0, 539.0, 314.0, 170.0, 112.0, 83.0, 47.0, 23.0, 10.0, 14.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.4375, -65.779296875, -63.12109375, -60.462890625, -57.8046875, -55.146484375, -52.48828125, -49.830078125, -47.171875, -44.513671875, -41.85546875, -39.197265625, -36.5390625, -33.880859375, -31.22265625, -28.564453125, -25.90625, -23.248046875, -20.58984375, -17.931640625, -15.2734375, -12.615234375, -9.95703125, -7.298828125, -4.640625, -1.982421875, 0.67578125, 3.333984375, 5.9921875, 8.650390625, 11.30859375, 13.966796875, 16.625, 19.283203125, 21.94140625, 24.599609375, 27.2578125, 29.916015625, 32.57421875, 35.232421875, 37.890625, 40.548828125, 43.20703125, 45.865234375, 48.5234375, 51.181640625, 53.83984375, 56.498046875, 59.15625, 61.814453125, 64.47265625, 67.130859375, 69.7890625, 72.447265625, 75.10546875, 77.763671875, 80.421875, 83.080078125, 85.73828125, 88.396484375, 91.0546875, 93.712890625, 96.37109375, 99.029296875, 101.6875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 7.0, 10.0, 17.0, 19.0, 27.0, 17.0, 27.0, 31.0, 30.0, 35.0, 35.0, 43.0, 46.0, 53.0, 43.0, 62.0, 47.0, 47.0, 49.0, 44.0, 38.0, 30.0, 38.0, 23.0, 27.0, 19.0, 25.0, 16.0, 14.0, 18.0, 12.0, 11.0, 7.0, 5.0, 6.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.9541015625, -69.783203125, -67.6123046875, -65.44140625, -63.2705078125, -61.099609375, -58.9287109375, -56.7578125, -54.5869140625, -52.416015625, -50.2451171875, -48.07421875, -45.9033203125, -43.732421875, -41.5615234375, -39.390625, -37.2197265625, -35.048828125, -32.8779296875, -30.70703125, -28.5361328125, -26.365234375, -24.1943359375, -22.0234375, -19.8525390625, -17.681640625, -15.5107421875, -13.33984375, -11.1689453125, -8.998046875, -6.8271484375, -4.65625, -2.4853515625, -0.314453125, 1.8564453125, 4.02734375, 6.1982421875, 8.369140625, 10.5400390625, 12.7109375, 14.8818359375, 17.052734375, 19.2236328125, 21.39453125, 23.5654296875, 25.736328125, 27.9072265625, 30.078125, 32.2490234375, 34.419921875, 36.5908203125, 38.76171875, 40.9326171875, 43.103515625, 45.2744140625, 47.4453125, 49.6162109375, 51.787109375, 53.9580078125, 56.12890625, 58.2998046875, 60.470703125, 62.6416015625, 64.8125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 8.0, 12.0, 24.0, 38.0, 65.0, 155.0, 481.0, 1544.0, 9270.0, 166689.0, 834431.0, 31023.0, 3473.0, 835.0, 281.0, 94.0, 64.0, 27.0, 13.0, 14.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.25, -256.2265625, -245.203125, -234.1796875, -223.15625, -212.1328125, -201.109375, -190.0859375, -179.0625, -168.0390625, -157.015625, -145.9921875, -134.96875, -123.9453125, -112.921875, -101.8984375, -90.875, -79.8515625, -68.828125, -57.8046875, -46.78125, -35.7578125, -24.734375, -13.7109375, -2.6875, 8.3359375, 19.359375, 30.3828125, 41.40625, 52.4296875, 63.453125, 74.4765625, 85.5, 96.5234375, 107.546875, 118.5703125, 129.59375, 140.6171875, 151.640625, 162.6640625, 173.6875, 184.7109375, 195.734375, 206.7578125, 217.78125, 228.8046875, 239.828125, 250.8515625, 261.875, 272.8984375, 283.921875, 294.9453125, 305.96875, 316.9921875, 328.015625, 339.0390625, 350.0625, 361.0859375, 372.109375, 383.1328125, 394.15625, 405.1796875, 416.203125, 427.2265625, 438.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 11.0, 9.0, 23.0, 21.0, 44.0, 59.0, 72.0, 73.0, 80.0, 88.0, 80.0, 87.0, 60.0, 60.0, 48.0, 42.0, 40.0, 41.0, 17.0, 14.0, 6.0, 11.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-467.0, -454.046875, -441.09375, -428.140625, -415.1875, -402.234375, -389.28125, -376.328125, -363.375, -350.421875, -337.46875, -324.515625, -311.5625, -298.609375, -285.65625, -272.703125, -259.75, -246.796875, -233.84375, -220.890625, -207.9375, -194.984375, -182.03125, -169.078125, -156.125, -143.171875, -130.21875, -117.265625, -104.3125, -91.359375, -78.40625, -65.453125, -52.5, -39.546875, -26.59375, -13.640625, -0.6875, 12.265625, 25.21875, 38.171875, 51.125, 64.078125, 77.03125, 89.984375, 102.9375, 115.890625, 128.84375, 141.796875, 154.75, 167.703125, 180.65625, 193.609375, 206.5625, 219.515625, 232.46875, 245.421875, 258.375, 271.328125, 284.28125, 297.234375, 310.1875, 323.140625, 336.09375, 349.046875, 362.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 8.0, 17.0, 18.0, 35.0, 70.0, 106.0, 229.0, 414.0, 907.0, 2309.0, 6156.0, 21591.0, 96446.0, 596482.0, 253661.0, 50463.0, 12662.0, 4040.0, 1513.0, 692.0, 326.0, 173.0, 77.0, 54.0, 25.0, 27.0, 18.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.125, -45.5947265625, -44.064453125, -42.5341796875, -41.00390625, -39.4736328125, -37.943359375, -36.4130859375, -34.8828125, -33.3525390625, -31.822265625, -30.2919921875, -28.76171875, -27.2314453125, -25.701171875, -24.1708984375, -22.640625, -21.1103515625, -19.580078125, -18.0498046875, -16.51953125, -14.9892578125, -13.458984375, -11.9287109375, -10.3984375, -8.8681640625, -7.337890625, -5.8076171875, -4.27734375, -2.7470703125, -1.216796875, 0.3134765625, 1.84375, 3.3740234375, 4.904296875, 6.4345703125, 7.96484375, 9.4951171875, 11.025390625, 12.5556640625, 14.0859375, 15.6162109375, 17.146484375, 18.6767578125, 20.20703125, 21.7373046875, 23.267578125, 24.7978515625, 26.328125, 27.8583984375, 29.388671875, 30.9189453125, 32.44921875, 33.9794921875, 35.509765625, 37.0400390625, 38.5703125, 40.1005859375, 41.630859375, 43.1611328125, 44.69140625, 46.2216796875, 47.751953125, 49.2822265625, 50.8125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 11.0, 10.0, 17.0, 36.0, 29.0, 46.0, 67.0, 90.0, 115.0, 109.0, 92.0, 81.0, 75.0, 59.0, 36.0, 30.0, 23.0, 19.0, 12.0, 12.0, 7.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142059326171875, -0.013648748397827148, -0.013091564178466797, -0.012534379959106445, -0.011977195739746094, -0.011420011520385742, -0.01086282730102539, -0.010305643081665039, -0.009748458862304688, -0.009191274642944336, -0.008634090423583984, -0.008076906204223633, -0.007519721984863281, -0.00696253776550293, -0.006405353546142578, -0.0058481693267822266, -0.005290985107421875, -0.0047338008880615234, -0.004176616668701172, -0.0036194324493408203, -0.0030622482299804688, -0.002505064010620117, -0.0019478797912597656, -0.001390695571899414, -0.0008335113525390625, -0.00027632713317871094, 0.0002808570861816406, 0.0008380413055419922, 0.0013952255249023438, 0.0019524097442626953, 0.002509593963623047, 0.0030667781829833984, 0.00362396240234375, 0.0041811466217041016, 0.004738330841064453, 0.005295515060424805, 0.005852699279785156, 0.006409883499145508, 0.006967067718505859, 0.007524251937866211, 0.008081436157226562, 0.008638620376586914, 0.009195804595947266, 0.009752988815307617, 0.010310173034667969, 0.01086735725402832, 0.011424541473388672, 0.011981725692749023, 0.012538909912109375, 0.013096094131469727, 0.013653278350830078, 0.01421046257019043, 0.014767646789550781, 0.015324831008911133, 0.015882015228271484, 0.016439199447631836, 0.016996383666992188, 0.01755356788635254, 0.01811075210571289, 0.018667936325073242, 0.019225120544433594, 0.019782304763793945, 0.020339488983154297, 0.02089667320251465, 0.021453857421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 19.0, 13.0, 25.0, 30.0, 50.0, 96.0, 172.0, 307.0, 710.0, 1808.0, 5350.0, 18402.0, 85722.0, 576002.0, 285429.0, 55109.0, 12882.0, 3807.0, 1420.0, 584.0, 253.0, 117.0, 64.0, 48.0, 39.0, 29.0, 10.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-54.0, -52.4052734375, -50.810546875, -49.2158203125, -47.62109375, -46.0263671875, -44.431640625, -42.8369140625, -41.2421875, -39.6474609375, -38.052734375, -36.4580078125, -34.86328125, -33.2685546875, -31.673828125, -30.0791015625, -28.484375, -26.8896484375, -25.294921875, -23.7001953125, -22.10546875, -20.5107421875, -18.916015625, -17.3212890625, -15.7265625, -14.1318359375, -12.537109375, -10.9423828125, -9.34765625, -7.7529296875, -6.158203125, -4.5634765625, -2.96875, -1.3740234375, 0.220703125, 1.8154296875, 3.41015625, 5.0048828125, 6.599609375, 8.1943359375, 9.7890625, 11.3837890625, 12.978515625, 14.5732421875, 16.16796875, 17.7626953125, 19.357421875, 20.9521484375, 22.546875, 24.1416015625, 25.736328125, 27.3310546875, 28.92578125, 30.5205078125, 32.115234375, 33.7099609375, 35.3046875, 36.8994140625, 38.494140625, 40.0888671875, 41.68359375, 43.2783203125, 44.873046875, 46.4677734375, 48.0625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 9.0, 12.0, 11.0, 19.0, 13.0, 29.0, 33.0, 43.0, 44.0, 43.0, 51.0, 73.0, 89.0, 67.0, 58.0, 67.0, 61.0, 58.0, 42.0, 40.0, 28.0, 29.0, 11.0, 15.0, 11.0, 8.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.625, -46.1416015625, -44.658203125, -43.1748046875, -41.69140625, -40.2080078125, -38.724609375, -37.2412109375, -35.7578125, -34.2744140625, -32.791015625, -31.3076171875, -29.82421875, -28.3408203125, -26.857421875, -25.3740234375, -23.890625, -22.4072265625, -20.923828125, -19.4404296875, -17.95703125, -16.4736328125, -14.990234375, -13.5068359375, -12.0234375, -10.5400390625, -9.056640625, -7.5732421875, -6.08984375, -4.6064453125, -3.123046875, -1.6396484375, -0.15625, 1.3271484375, 2.810546875, 4.2939453125, 5.77734375, 7.2607421875, 8.744140625, 10.2275390625, 11.7109375, 13.1943359375, 14.677734375, 16.1611328125, 17.64453125, 19.1279296875, 20.611328125, 22.0947265625, 23.578125, 25.0615234375, 26.544921875, 28.0283203125, 29.51171875, 30.9951171875, 32.478515625, 33.9619140625, 35.4453125, 36.9287109375, 38.412109375, 39.8955078125, 41.37890625, 42.8623046875, 44.345703125, 45.8291015625, 47.3125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 19.0, 43.0, 70.0, 113.0, 199.0, 238.0, 120.0, 82.0, 40.0, 20.0, 15.0, 11.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1245.5618896484375, -1204.123779296875, -1162.6856689453125, -1121.24755859375, -1079.8094482421875, -1038.371337890625, -996.9331665039062, -955.4950561523438, -914.0569458007812, -872.6188354492188, -831.1807250976562, -789.7426147460938, -748.304443359375, -706.8663330078125, -665.42822265625, -623.9901123046875, -582.552001953125, -541.1138916015625, -499.67578125, -458.2376403808594, -416.7995300292969, -375.3614196777344, -333.92327880859375, -292.48516845703125, -251.04705810546875, -209.60894775390625, -168.1708221435547, -126.73270416259766, -85.29458618164062, -43.856475830078125, -2.4183502197265625, 39.019775390625, 80.457763671875, 121.89588165283203, 163.33399963378906, 204.77212524414062, 246.21023559570312, 287.6483459472656, 329.08648681640625, 370.52459716796875, 411.96270751953125, 453.40081787109375, 494.83892822265625, 536.2770385742188, 577.7152099609375, 619.1533203125, 660.5914306640625, 702.029541015625, 743.4676513671875, 784.90576171875, 826.3438720703125, 867.781982421875, 909.2200927734375, 950.658203125, 992.0963745117188, 1033.534423828125, 1074.97265625, 1116.4107666015625, 1157.848876953125, 1199.2869873046875, 1240.72509765625, 1282.1632080078125, 1323.601318359375, 1365.03955078125, 1406.4775390625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 15.0, 9.0, 8.0, 6.0, 16.0, 22.0, 15.0, 29.0, 27.0, 28.0, 33.0, 32.0, 32.0, 52.0, 66.0, 94.0, 76.0, 69.0, 56.0, 41.0, 35.0, 31.0, 16.0, 26.0, 26.0, 27.0, 23.0, 12.0, 9.0, 19.0, 7.0, 11.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1107.3682861328125, -1075.04150390625, -1042.7147216796875, -1010.3878784179688, -978.0610961914062, -945.7343139648438, -913.407470703125, -881.0806884765625, -848.75390625, -816.4271240234375, -784.100341796875, -751.7734985351562, -719.4467163085938, -687.1199340820312, -654.7930908203125, -622.46630859375, -590.1395263671875, -557.812744140625, -525.4859619140625, -493.15911865234375, -460.83233642578125, -428.50555419921875, -396.1787414550781, -363.8519287109375, -331.525146484375, -299.1983642578125, -266.8715515136719, -234.5447540283203, -202.21795654296875, -169.8911590576172, -137.56436157226562, -105.23756408691406, -72.9107666015625, -40.58396911621094, -8.257171630859375, 24.069625854492188, 56.39642333984375, 88.72322082519531, 121.05001831054688, 153.37681579589844, 185.70361328125, 218.03041076660156, 250.35720825195312, 282.68402099609375, 315.01080322265625, 347.33758544921875, 379.6643981933594, 411.9912109375, 444.3179931640625, 476.644775390625, 508.9715881347656, 541.2984008789062, 573.6251831054688, 605.9519653320312, 638.27880859375, 670.6055908203125, 702.932373046875, 735.2591552734375, 767.5859375, 799.9127807617188, 832.2395629882812, 864.5663452148438, 896.8931884765625, 929.219970703125, 961.5467529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 3.0, 8.0, 16.0, 13.0, 23.0, 24.0, 27.0, 34.0, 51.0, 83.0, 243.0, 818.0, 3523.0, 28514.0, 1314904.0, 2782705.0, 55767.0, 5619.0, 1155.0, 365.0, 123.0, 81.0, 35.0, 35.0, 28.0, 18.0, 16.0, 6.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-243.0, -236.625, -230.25, -223.875, -217.5, -211.125, -204.75, -198.375, -192.0, -185.625, -179.25, -172.875, -166.5, -160.125, -153.75, -147.375, -141.0, -134.625, -128.25, -121.875, -115.5, -109.125, -102.75, -96.375, -90.0, -83.625, -77.25, -70.875, -64.5, -58.125, -51.75, -45.375, -39.0, -32.625, -26.25, -19.875, -13.5, -7.125, -0.75, 5.625, 12.0, 18.375, 24.75, 31.125, 37.5, 43.875, 50.25, 56.625, 63.0, 69.375, 75.75, 82.125, 88.5, 94.875, 101.25, 107.625, 114.0, 120.375, 126.75, 133.125, 139.5, 145.875, 152.25, 158.625, 165.0]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 4.0, 9.0, 12.0, 18.0, 13.0, 25.0, 29.0, 29.0, 29.0, 44.0, 39.0, 44.0, 55.0, 59.0, 61.0, 48.0, 44.0, 61.0, 45.0, 40.0, 47.0, 38.0, 43.0, 37.0, 24.0, 20.0, 19.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-90.875, -88.3798828125, -85.884765625, -83.3896484375, -80.89453125, -78.3994140625, -75.904296875, -73.4091796875, -70.9140625, -68.4189453125, -65.923828125, -63.4287109375, -60.93359375, -58.4384765625, -55.943359375, -53.4482421875, -50.953125, -48.4580078125, -45.962890625, -43.4677734375, -40.97265625, -38.4775390625, -35.982421875, -33.4873046875, -30.9921875, -28.4970703125, -26.001953125, -23.5068359375, -21.01171875, -18.5166015625, -16.021484375, -13.5263671875, -11.03125, -8.5361328125, -6.041015625, -3.5458984375, -1.05078125, 1.4443359375, 3.939453125, 6.4345703125, 8.9296875, 11.4248046875, 13.919921875, 16.4150390625, 18.91015625, 21.4052734375, 23.900390625, 26.3955078125, 28.890625, 31.3857421875, 33.880859375, 36.3759765625, 38.87109375, 41.3662109375, 43.861328125, 46.3564453125, 48.8515625, 51.3466796875, 53.841796875, 56.3369140625, 58.83203125, 61.3271484375, 63.822265625, 66.3173828125, 68.8125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 4.0, 13.0, 16.0, 33.0, 58.0, 111.0, 298.0, 1074.0, 8215.0, 318352.0, 3833625.0, 29207.0, 2361.0, 525.0, 198.0, 84.0, 30.0, 20.0, 20.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.875, -196.470703125, -185.06640625, -173.662109375, -162.2578125, -150.853515625, -139.44921875, -128.044921875, -116.640625, -105.236328125, -93.83203125, -82.427734375, -71.0234375, -59.619140625, -48.21484375, -36.810546875, -25.40625, -14.001953125, -2.59765625, 8.806640625, 20.2109375, 31.615234375, 43.01953125, 54.423828125, 65.828125, 77.232421875, 88.63671875, 100.041015625, 111.4453125, 122.849609375, 134.25390625, 145.658203125, 157.0625, 168.466796875, 179.87109375, 191.275390625, 202.6796875, 214.083984375, 225.48828125, 236.892578125, 248.296875, 259.701171875, 271.10546875, 282.509765625, 293.9140625, 305.318359375, 316.72265625, 328.126953125, 339.53125, 350.935546875, 362.33984375, 373.744140625, 385.1484375, 396.552734375, 407.95703125, 419.361328125, 430.765625, 442.169921875, 453.57421875, 464.978515625, 476.3828125, 487.787109375, 499.19140625, 510.595703125, 522.0]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 3.0, 12.0, 5.0, 11.0, 18.0, 20.0, 32.0, 60.0, 75.0, 152.0, 258.0, 529.0, 867.0, 861.0, 524.0, 273.0, 147.0, 69.0, 56.0, 27.0, 21.0, 16.0, 16.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.5, -155.294921875, -149.08984375, -142.884765625, -136.6796875, -130.474609375, -124.26953125, -118.064453125, -111.859375, -105.654296875, -99.44921875, -93.244140625, -87.0390625, -80.833984375, -74.62890625, -68.423828125, -62.21875, -56.013671875, -49.80859375, -43.603515625, -37.3984375, -31.193359375, -24.98828125, -18.783203125, -12.578125, -6.373046875, -0.16796875, 6.037109375, 12.2421875, 18.447265625, 24.65234375, 30.857421875, 37.0625, 43.267578125, 49.47265625, 55.677734375, 61.8828125, 68.087890625, 74.29296875, 80.498046875, 86.703125, 92.908203125, 99.11328125, 105.318359375, 111.5234375, 117.728515625, 123.93359375, 130.138671875, 136.34375, 142.548828125, 148.75390625, 154.958984375, 161.1640625, 167.369140625, 173.57421875, 179.779296875, 185.984375, 192.189453125, 198.39453125, 204.599609375, 210.8046875, 217.009765625, 223.21484375, 229.419921875, 235.625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 13.0, 62.0, 173.0, 349.0, 258.0, 95.0, 35.0, 12.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4054.216064453125, -3972.801513671875, -3891.38671875, -3809.97216796875, -3728.5576171875, -3647.14306640625, -3565.728271484375, -3484.313720703125, -3402.89892578125, -3321.484375, -3240.069580078125, -3158.655029296875, -3077.240478515625, -2995.82568359375, -2914.4111328125, -2832.99658203125, -2751.58203125, -2670.16748046875, -2588.752685546875, -2507.338134765625, -2425.923583984375, -2344.5087890625, -2263.09423828125, -2181.6796875, -2100.26513671875, -2018.8504638671875, -1937.4359130859375, -1856.021240234375, -1774.606689453125, -1693.1920166015625, -1611.77734375, -1530.36279296875, -1448.947998046875, -1367.5333251953125, -1286.1187744140625, -1204.7041015625, -1123.28955078125, -1041.8748779296875, -960.460205078125, -879.0455932617188, -797.6309814453125, -716.2163696289062, -634.8017578125, -553.3870849609375, -471.97247314453125, -390.557861328125, -309.1432189941406, -227.72857666015625, -146.31396484375, -64.89933776855469, 16.515289306640625, 97.92991638183594, 179.34454345703125, 260.7591552734375, 342.1737976074219, 423.58843994140625, 505.0030517578125, 586.4176635742188, 667.832275390625, 749.2469482421875, 830.6615600585938, 912.076171875, 993.4908447265625, 1074.905517578125, 1156.320068359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 8.0, 7.0, 9.0, 10.0, 16.0, 22.0, 20.0, 17.0, 30.0, 32.0, 37.0, 25.0, 41.0, 35.0, 38.0, 41.0, 34.0, 29.0, 37.0, 40.0, 40.0, 49.0, 32.0, 40.0, 38.0, 30.0, 35.0, 28.0, 22.0, 21.0, 23.0, 17.0, 10.0, 18.0, 13.0, 10.0, 9.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-566.1646118164062, -547.57373046875, -528.9827880859375, -510.39190673828125, -491.8009948730469, -473.2100830078125, -454.61920166015625, -436.0282897949219, -417.4373779296875, -398.8464660644531, -380.25555419921875, -361.6646728515625, -343.0737609863281, -324.48284912109375, -305.8919677734375, -287.3010559082031, -268.71014404296875, -250.11923217773438, -231.52833557128906, -212.93743896484375, -194.34652709960938, -175.755615234375, -157.1647186279297, -138.57382202148438, -119.98291015625, -101.39200592041016, -82.80110168457031, -64.21019744873047, -45.619293212890625, -27.02838897705078, -8.437484741210938, 10.153411865234375, 28.7442626953125, 47.335166931152344, 65.92607116699219, 84.51697540283203, 103.10787963867188, 121.69878387451172, 140.28968811035156, 158.88058471679688, 177.47149658203125, 196.06240844726562, 214.65330505371094, 233.24420166015625, 251.83511352539062, 270.426025390625, 289.01690673828125, 307.6078186035156, 326.19873046875, 344.7896423339844, 363.38055419921875, 381.971435546875, 400.5623474121094, 419.15325927734375, 437.744140625, 456.3350524902344, 474.92596435546875, 493.5168762207031, 512.1077880859375, 530.6986694335938, 549.28955078125, 567.8804931640625, 586.4713745117188, 605.062255859375, 623.6531982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 12.0, 8.0, 23.0, 16.0, 28.0, 67.0, 90.0, 145.0, 194.0, 333.0, 544.0, 928.0, 1480.0, 2787.0, 5027.0, 9733.0, 18793.0, 39736.0, 87738.0, 204591.0, 331554.0, 188855.0, 81194.0, 36934.0, 17896.0, 8915.0, 4702.0, 2480.0, 1436.0, 877.0, 539.0, 341.0, 218.0, 135.0, 67.0, 44.0, 27.0, 26.0, 19.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-79.4375, -77.19677734375, -74.9560546875, -72.71533203125, -70.474609375, -68.23388671875, -65.9931640625, -63.75244140625, -61.51171875, -59.27099609375, -57.0302734375, -54.78955078125, -52.548828125, -50.30810546875, -48.0673828125, -45.82666015625, -43.5859375, -41.34521484375, -39.1044921875, -36.86376953125, -34.623046875, -32.38232421875, -30.1416015625, -27.90087890625, -25.66015625, -23.41943359375, -21.1787109375, -18.93798828125, -16.697265625, -14.45654296875, -12.2158203125, -9.97509765625, -7.734375, -5.49365234375, -3.2529296875, -1.01220703125, 1.228515625, 3.46923828125, 5.7099609375, 7.95068359375, 10.19140625, 12.43212890625, 14.6728515625, 16.91357421875, 19.154296875, 21.39501953125, 23.6357421875, 25.87646484375, 28.1171875, 30.35791015625, 32.5986328125, 34.83935546875, 37.080078125, 39.32080078125, 41.5615234375, 43.80224609375, 46.04296875, 48.28369140625, 50.5244140625, 52.76513671875, 55.005859375, 57.24658203125, 59.4873046875, 61.72802734375, 63.96875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 7.0, 6.0, 10.0, 7.0, 7.0, 11.0, 19.0, 19.0, 24.0, 19.0, 31.0, 38.0, 30.0, 35.0, 42.0, 51.0, 47.0, 42.0, 49.0, 40.0, 50.0, 52.0, 47.0, 43.0, 36.0, 27.0, 35.0, 32.0, 21.0, 17.0, 22.0, 14.0, 13.0, 8.0, 10.0, 5.0, 7.0, 10.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-71.75, -69.5888671875, -67.427734375, -65.2666015625, -63.10546875, -60.9443359375, -58.783203125, -56.6220703125, -54.4609375, -52.2998046875, -50.138671875, -47.9775390625, -45.81640625, -43.6552734375, -41.494140625, -39.3330078125, -37.171875, -35.0107421875, -32.849609375, -30.6884765625, -28.52734375, -26.3662109375, -24.205078125, -22.0439453125, -19.8828125, -17.7216796875, -15.560546875, -13.3994140625, -11.23828125, -9.0771484375, -6.916015625, -4.7548828125, -2.59375, -0.4326171875, 1.728515625, 3.8896484375, 6.05078125, 8.2119140625, 10.373046875, 12.5341796875, 14.6953125, 16.8564453125, 19.017578125, 21.1787109375, 23.33984375, 25.5009765625, 27.662109375, 29.8232421875, 31.984375, 34.1455078125, 36.306640625, 38.4677734375, 40.62890625, 42.7900390625, 44.951171875, 47.1123046875, 49.2734375, 51.4345703125, 53.595703125, 55.7568359375, 57.91796875, 60.0791015625, 62.240234375, 64.4013671875, 66.5625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 2.0, 5.0, 10.0, 13.0, 16.0, 23.0, 25.0, 49.0, 45.0, 90.0, 123.0, 213.0, 363.0, 679.0, 1400.0, 3719.0, 13234.0, 77974.0, 765463.0, 154751.0, 21104.0, 5387.0, 1947.0, 797.0, 423.0, 225.0, 135.0, 94.0, 66.0, 34.0, 22.0, 21.0, 20.0, 15.0, 13.0, 5.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.375, -202.962890625, -196.55078125, -190.138671875, -183.7265625, -177.314453125, -170.90234375, -164.490234375, -158.078125, -151.666015625, -145.25390625, -138.841796875, -132.4296875, -126.017578125, -119.60546875, -113.193359375, -106.78125, -100.369140625, -93.95703125, -87.544921875, -81.1328125, -74.720703125, -68.30859375, -61.896484375, -55.484375, -49.072265625, -42.66015625, -36.248046875, -29.8359375, -23.423828125, -17.01171875, -10.599609375, -4.1875, 2.224609375, 8.63671875, 15.048828125, 21.4609375, 27.873046875, 34.28515625, 40.697265625, 47.109375, 53.521484375, 59.93359375, 66.345703125, 72.7578125, 79.169921875, 85.58203125, 91.994140625, 98.40625, 104.818359375, 111.23046875, 117.642578125, 124.0546875, 130.466796875, 136.87890625, 143.291015625, 149.703125, 156.115234375, 162.52734375, 168.939453125, 175.3515625, 181.763671875, 188.17578125, 194.587890625, 201.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 10.0, 8.0, 11.0, 14.0, 32.0, 40.0, 33.0, 36.0, 47.0, 56.0, 70.0, 84.0, 86.0, 81.0, 71.0, 48.0, 69.0, 44.0, 50.0, 28.0, 18.0, 12.0, 14.0, 7.0, 6.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-435.75, -423.56640625, -411.3828125, -399.19921875, -387.015625, -374.83203125, -362.6484375, -350.46484375, -338.28125, -326.09765625, -313.9140625, -301.73046875, -289.546875, -277.36328125, -265.1796875, -252.99609375, -240.8125, -228.62890625, -216.4453125, -204.26171875, -192.078125, -179.89453125, -167.7109375, -155.52734375, -143.34375, -131.16015625, -118.9765625, -106.79296875, -94.609375, -82.42578125, -70.2421875, -58.05859375, -45.875, -33.69140625, -21.5078125, -9.32421875, 2.859375, 15.04296875, 27.2265625, 39.41015625, 51.59375, 63.77734375, 75.9609375, 88.14453125, 100.328125, 112.51171875, 124.6953125, 136.87890625, 149.0625, 161.24609375, 173.4296875, 185.61328125, 197.796875, 209.98046875, 222.1640625, 234.34765625, 246.53125, 258.71484375, 270.8984375, 283.08203125, 295.265625, 307.44921875, 319.6328125, 331.81640625, 344.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 15.0, 20.0, 20.0, 43.0, 45.0, 78.0, 137.0, 224.0, 326.0, 603.0, 1142.0, 2304.0, 5096.0, 13131.0, 40058.0, 157232.0, 651623.0, 123544.0, 32657.0, 11319.0, 4386.0, 2092.0, 1009.0, 560.0, 350.0, 176.0, 98.0, 74.0, 55.0, 29.0, 25.0, 22.0, 18.0, 7.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.65625, -33.29296875, -31.9296875, -30.56640625, -29.203125, -27.83984375, -26.4765625, -25.11328125, -23.75, -22.38671875, -21.0234375, -19.66015625, -18.296875, -16.93359375, -15.5703125, -14.20703125, -12.84375, -11.48046875, -10.1171875, -8.75390625, -7.390625, -6.02734375, -4.6640625, -3.30078125, -1.9375, -0.57421875, 0.7890625, 2.15234375, 3.515625, 4.87890625, 6.2421875, 7.60546875, 8.96875, 10.33203125, 11.6953125, 13.05859375, 14.421875, 15.78515625, 17.1484375, 18.51171875, 19.875, 21.23828125, 22.6015625, 23.96484375, 25.328125, 26.69140625, 28.0546875, 29.41796875, 30.78125, 32.14453125, 33.5078125, 34.87109375, 36.234375, 37.59765625, 38.9609375, 40.32421875, 41.6875, 43.05078125, 44.4140625, 45.77734375, 47.140625, 48.50390625, 49.8671875, 51.23046875, 52.59375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 13.0, 18.0, 25.0, 23.0, 63.0, 72.0, 76.0, 107.0, 157.0, 113.0, 83.0, 55.0, 46.0, 32.0, 23.0, 23.0, 11.0, 7.0, 3.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0198516845703125, -0.019176006317138672, -0.018500328063964844, -0.017824649810791016, -0.017148971557617188, -0.01647329330444336, -0.01579761505126953, -0.015121936798095703, -0.014446258544921875, -0.013770580291748047, -0.013094902038574219, -0.01241922378540039, -0.011743545532226562, -0.011067867279052734, -0.010392189025878906, -0.009716510772705078, -0.00904083251953125, -0.008365154266357422, -0.007689476013183594, -0.007013797760009766, -0.0063381195068359375, -0.005662441253662109, -0.004986763000488281, -0.004311084747314453, -0.003635406494140625, -0.002959728240966797, -0.0022840499877929688, -0.0016083717346191406, -0.0009326934814453125, -0.0002570152282714844, 0.00041866302490234375, 0.0010943412780761719, 0.00177001953125, 0.002445697784423828, 0.0031213760375976562, 0.0037970542907714844, 0.0044727325439453125, 0.005148410797119141, 0.005824089050292969, 0.006499767303466797, 0.007175445556640625, 0.007851123809814453, 0.008526802062988281, 0.00920248031616211, 0.009878158569335938, 0.010553836822509766, 0.011229515075683594, 0.011905193328857422, 0.01258087158203125, 0.013256549835205078, 0.013932228088378906, 0.014607906341552734, 0.015283584594726562, 0.01595926284790039, 0.01663494110107422, 0.017310619354248047, 0.017986297607421875, 0.018661975860595703, 0.01933765411376953, 0.02001333236694336, 0.020689010620117188, 0.021364688873291016, 0.022040367126464844, 0.022716045379638672, 0.0233917236328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 4.0, 12.0, 10.0, 13.0, 21.0, 43.0, 53.0, 63.0, 136.0, 236.0, 371.0, 868.0, 1953.0, 5273.0, 18780.0, 97322.0, 742570.0, 144898.0, 24830.0, 6705.0, 2275.0, 947.0, 498.0, 273.0, 117.0, 81.0, 70.0, 39.0, 22.0, 16.0, 10.0, 6.0, 9.0, 11.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-60.4375, -58.58349609375, -56.7294921875, -54.87548828125, -53.021484375, -51.16748046875, -49.3134765625, -47.45947265625, -45.60546875, -43.75146484375, -41.8974609375, -40.04345703125, -38.189453125, -36.33544921875, -34.4814453125, -32.62744140625, -30.7734375, -28.91943359375, -27.0654296875, -25.21142578125, -23.357421875, -21.50341796875, -19.6494140625, -17.79541015625, -15.94140625, -14.08740234375, -12.2333984375, -10.37939453125, -8.525390625, -6.67138671875, -4.8173828125, -2.96337890625, -1.109375, 0.74462890625, 2.5986328125, 4.45263671875, 6.306640625, 8.16064453125, 10.0146484375, 11.86865234375, 13.72265625, 15.57666015625, 17.4306640625, 19.28466796875, 21.138671875, 22.99267578125, 24.8466796875, 26.70068359375, 28.5546875, 30.40869140625, 32.2626953125, 34.11669921875, 35.970703125, 37.82470703125, 39.6787109375, 41.53271484375, 43.38671875, 45.24072265625, 47.0947265625, 48.94873046875, 50.802734375, 52.65673828125, 54.5107421875, 56.36474609375, 58.21875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 8.0, 4.0, 8.0, 14.0, 10.0, 14.0, 18.0, 24.0, 29.0, 25.0, 49.0, 58.0, 55.0, 56.0, 93.0, 71.0, 67.0, 66.0, 58.0, 45.0, 31.0, 33.0, 28.0, 21.0, 12.0, 16.0, 8.0, 8.0, 11.0, 10.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-42.25, -41.017578125, -39.78515625, -38.552734375, -37.3203125, -36.087890625, -34.85546875, -33.623046875, -32.390625, -31.158203125, -29.92578125, -28.693359375, -27.4609375, -26.228515625, -24.99609375, -23.763671875, -22.53125, -21.298828125, -20.06640625, -18.833984375, -17.6015625, -16.369140625, -15.13671875, -13.904296875, -12.671875, -11.439453125, -10.20703125, -8.974609375, -7.7421875, -6.509765625, -5.27734375, -4.044921875, -2.8125, -1.580078125, -0.34765625, 0.884765625, 2.1171875, 3.349609375, 4.58203125, 5.814453125, 7.046875, 8.279296875, 9.51171875, 10.744140625, 11.9765625, 13.208984375, 14.44140625, 15.673828125, 16.90625, 18.138671875, 19.37109375, 20.603515625, 21.8359375, 23.068359375, 24.30078125, 25.533203125, 26.765625, 27.998046875, 29.23046875, 30.462890625, 31.6953125, 32.927734375, 34.16015625, 35.392578125, 36.625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 12.0, 5.0, 11.0, 16.0, 27.0, 60.0, 82.0, 140.0, 268.0, 136.0, 101.0, 55.0, 38.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1242.4111328125, -1208.351806640625, -1174.29248046875, -1140.233154296875, -1106.173828125, -1072.114501953125, -1038.05517578125, -1003.9957885742188, -969.9364624023438, -935.8771362304688, -901.8178100585938, -867.7584838867188, -833.6990966796875, -799.6397705078125, -765.5804443359375, -731.5211181640625, -697.4617919921875, -663.4024658203125, -629.3431396484375, -595.2838134765625, -561.2244873046875, -527.1651611328125, -493.10577392578125, -459.04644775390625, -424.98712158203125, -390.92779541015625, -356.86846923828125, -322.8091125488281, -288.7497863769531, -254.69046020507812, -220.63111877441406, -186.57177734375, -152.5123291015625, -118.45299530029297, -84.39366149902344, -50.334327697753906, -16.274993896484375, 17.784332275390625, 51.84367370605469, 85.90301513671875, 119.96234130859375, 154.02166748046875, 188.0810089111328, 222.14035034179688, 256.1996765136719, 290.2590026855469, 324.318359375, 358.377685546875, 392.43701171875, 426.496337890625, 460.5556640625, 494.6150207519531, 528.67431640625, 562.733642578125, 596.7930297851562, 630.8523559570312, 664.9116821289062, 698.9710083007812, 733.0303344726562, 767.0896606445312, 801.1490478515625, 835.2083740234375, 869.2677001953125, 903.3270263671875, 937.3863525390625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 10.0, 5.0, 9.0, 12.0, 12.0, 14.0, 13.0, 18.0, 18.0, 25.0, 31.0, 26.0, 38.0, 34.0, 53.0, 69.0, 92.0, 98.0, 77.0, 48.0, 42.0, 30.0, 28.0, 28.0, 21.0, 21.0, 24.0, 15.0, 16.0, 9.0, 11.0, 12.0, 4.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-854.59912109375, -822.7855224609375, -790.971923828125, -759.1583251953125, -727.3446655273438, -695.5310668945312, -663.7174682617188, -631.9038696289062, -600.0902709960938, -568.2766723632812, -536.4630737304688, -504.6494445800781, -472.8358459472656, -441.022216796875, -409.2086181640625, -377.39501953125, -345.5813903808594, -313.7677917480469, -281.95416259765625, -250.14056396484375, -218.32696533203125, -186.5133514404297, -154.69973754882812, -122.88613891601562, -91.07252502441406, -59.25891876220703, -27.445308685302734, 4.3683013916015625, 36.181907653808594, 67.99551391601562, 99.80912780761719, 131.6227264404297, 163.43634033203125, 195.2499542236328, 227.0635528564453, 258.8771667480469, 290.6907653808594, 322.50439453125, 354.3179931640625, 386.131591796875, 417.9451904296875, 449.7587890625, 481.5724182128906, 513.385986328125, 545.1996459960938, 577.0132446289062, 608.8268432617188, 640.6404418945312, 672.4541015625, 704.2677001953125, 736.081298828125, 767.8948974609375, 799.7085571289062, 831.5221557617188, 863.3357543945312, 895.1493530273438, 926.9629516601562, 958.7765502929688, 990.5901489257812, 1022.40380859375, 1054.2174072265625, 1086.031005859375, 1117.8446044921875, 1149.658203125, 1181.4718017578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 8.0, 12.0, 22.0, 46.0, 71.0, 115.0, 180.0, 318.0, 575.0, 1184.0, 2464.0, 5941.0, 17941.0, 76239.0, 454744.0, 2179492.0, 1188717.0, 207356.0, 40038.0, 10766.0, 4077.0, 1853.0, 942.0, 513.0, 250.0, 166.0, 89.0, 59.0, 32.0, 19.0, 20.0, 9.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.78125, -57.15673828125, -54.5322265625, -51.90771484375, -49.283203125, -46.65869140625, -44.0341796875, -41.40966796875, -38.78515625, -36.16064453125, -33.5361328125, -30.91162109375, -28.287109375, -25.66259765625, -23.0380859375, -20.41357421875, -17.7890625, -15.16455078125, -12.5400390625, -9.91552734375, -7.291015625, -4.66650390625, -2.0419921875, 0.58251953125, 3.20703125, 5.83154296875, 8.4560546875, 11.08056640625, 13.705078125, 16.32958984375, 18.9541015625, 21.57861328125, 24.203125, 26.82763671875, 29.4521484375, 32.07666015625, 34.701171875, 37.32568359375, 39.9501953125, 42.57470703125, 45.19921875, 47.82373046875, 50.4482421875, 53.07275390625, 55.697265625, 58.32177734375, 60.9462890625, 63.57080078125, 66.1953125, 68.81982421875, 71.4443359375, 74.06884765625, 76.693359375, 79.31787109375, 81.9423828125, 84.56689453125, 87.19140625, 89.81591796875, 92.4404296875, 95.06494140625, 97.689453125, 100.31396484375, 102.9384765625, 105.56298828125, 108.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 6.0, 3.0, 9.0, 6.0, 11.0, 12.0, 26.0, 23.0, 19.0, 22.0, 22.0, 30.0, 37.0, 41.0, 41.0, 35.0, 38.0, 49.0, 59.0, 60.0, 57.0, 36.0, 40.0, 38.0, 36.0, 26.0, 35.0, 33.0, 29.0, 27.0, 15.0, 14.0, 15.0, 6.0, 5.0, 5.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.0625, -65.84765625, -63.6328125, -61.41796875, -59.203125, -56.98828125, -54.7734375, -52.55859375, -50.34375, -48.12890625, -45.9140625, -43.69921875, -41.484375, -39.26953125, -37.0546875, -34.83984375, -32.625, -30.41015625, -28.1953125, -25.98046875, -23.765625, -21.55078125, -19.3359375, -17.12109375, -14.90625, -12.69140625, -10.4765625, -8.26171875, -6.046875, -3.83203125, -1.6171875, 0.59765625, 2.8125, 5.02734375, 7.2421875, 9.45703125, 11.671875, 13.88671875, 16.1015625, 18.31640625, 20.53125, 22.74609375, 24.9609375, 27.17578125, 29.390625, 31.60546875, 33.8203125, 36.03515625, 38.25, 40.46484375, 42.6796875, 44.89453125, 47.109375, 49.32421875, 51.5390625, 53.75390625, 55.96875, 58.18359375, 60.3984375, 62.61328125, 64.828125, 67.04296875, 69.2578125, 71.47265625, 73.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 4.0, 17.0, 21.0, 47.0, 102.0, 253.0, 622.0, 2577.0, 24627.0, 3639374.0, 514231.0, 9854.0, 1638.0, 503.0, 206.0, 82.0, 39.0, 24.0, 12.0, 16.0, 6.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.0, -320.6015625, -310.203125, -299.8046875, -289.40625, -279.0078125, -268.609375, -258.2109375, -247.8125, -237.4140625, -227.015625, -216.6171875, -206.21875, -195.8203125, -185.421875, -175.0234375, -164.625, -154.2265625, -143.828125, -133.4296875, -123.03125, -112.6328125, -102.234375, -91.8359375, -81.4375, -71.0390625, -60.640625, -50.2421875, -39.84375, -29.4453125, -19.046875, -8.6484375, 1.75, 12.1484375, 22.546875, 32.9453125, 43.34375, 53.7421875, 64.140625, 74.5390625, 84.9375, 95.3359375, 105.734375, 116.1328125, 126.53125, 136.9296875, 147.328125, 157.7265625, 168.125, 178.5234375, 188.921875, 199.3203125, 209.71875, 220.1171875, 230.515625, 240.9140625, 251.3125, 261.7109375, 272.109375, 282.5078125, 292.90625, 303.3046875, 313.703125, 324.1015625, 334.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 14.0, 12.0, 31.0, 27.0, 71.0, 83.0, 197.0, 413.0, 741.0, 1001.0, 697.0, 327.0, 181.0, 96.0, 72.0, 35.0, 27.0, 16.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.625, -136.951171875, -130.27734375, -123.603515625, -116.9296875, -110.255859375, -103.58203125, -96.908203125, -90.234375, -83.560546875, -76.88671875, -70.212890625, -63.5390625, -56.865234375, -50.19140625, -43.517578125, -36.84375, -30.169921875, -23.49609375, -16.822265625, -10.1484375, -3.474609375, 3.19921875, 9.873046875, 16.546875, 23.220703125, 29.89453125, 36.568359375, 43.2421875, 49.916015625, 56.58984375, 63.263671875, 69.9375, 76.611328125, 83.28515625, 89.958984375, 96.6328125, 103.306640625, 109.98046875, 116.654296875, 123.328125, 130.001953125, 136.67578125, 143.349609375, 150.0234375, 156.697265625, 163.37109375, 170.044921875, 176.71875, 183.392578125, 190.06640625, 196.740234375, 203.4140625, 210.087890625, 216.76171875, 223.435546875, 230.109375, 236.783203125, 243.45703125, 250.130859375, 256.8046875, 263.478515625, 270.15234375, 276.826171875, 283.5]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 5.0, 13.0, 23.0, 53.0, 43.0, 90.0, 150.0, 162.0, 137.0, 100.0, 70.0, 40.0, 28.0, 21.0, 11.0, 15.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1168.4798583984375, -1135.7244873046875, -1102.9691162109375, -1070.2138671875, -1037.45849609375, -1004.703125, -971.94775390625, -939.1923828125, -906.4370727539062, -873.6817016601562, -840.9263916015625, -808.1710205078125, -775.4156494140625, -742.6603393554688, -709.9049682617188, -677.149658203125, -644.394287109375, -611.638916015625, -578.8836059570312, -546.1282348632812, -513.3729248046875, -480.6175537109375, -447.8621826171875, -415.1068420410156, -382.35150146484375, -349.5961608886719, -316.8408203125, -284.08544921875, -251.33010864257812, -218.57476806640625, -185.8194122314453, -153.06405639648438, -120.30865478515625, -87.55330657958984, -54.79795837402344, -22.04261016845703, 10.712738037109375, 43.46807861328125, 76.22343444824219, 108.97879028320312, 141.734130859375, 174.48947143554688, 207.2448272705078, 240.00018310546875, 272.7555236816406, 305.5108642578125, 338.2662353515625, 371.0215759277344, 403.77691650390625, 436.5322570800781, 469.28759765625, 502.04296875, 534.79833984375, 567.5536499023438, 600.3090209960938, 633.0643310546875, 665.8197021484375, 698.5750732421875, 731.3303833007812, 764.0857543945312, 796.841064453125, 829.596435546875, 862.351806640625, 895.107177734375, 927.8624877929688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 11.0, 7.0, 17.0, 20.0, 18.0, 25.0, 30.0, 39.0, 41.0, 50.0, 75.0, 83.0, 55.0, 64.0, 58.0, 56.0, 64.0, 55.0, 33.0, 37.0, 24.0, 16.0, 25.0, 17.0, 15.0, 15.0, 2.0, 9.0, 5.0, 11.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-965.2545166015625, -937.2748413085938, -909.2951049804688, -881.3154296875, -853.335693359375, -825.3560180664062, -797.3763427734375, -769.3966064453125, -741.4168701171875, -713.4371948242188, -685.4574584960938, -657.477783203125, -629.498046875, -601.5183715820312, -573.5386962890625, -545.5589599609375, -517.5792846679688, -489.5995788574219, -461.619873046875, -433.64019775390625, -405.66046142578125, -377.6807861328125, -349.7010803222656, -321.72137451171875, -293.7416687011719, -265.761962890625, -237.78225708007812, -209.8025665283203, -181.82286071777344, -153.84315490722656, -125.86346435546875, -97.88375854492188, -69.90399169921875, -41.92428970336914, -13.944587707519531, 14.035110473632812, 42.01481628417969, 69.99452209472656, 97.97421264648438, 125.95391845703125, 153.93362426757812, 181.913330078125, 209.89303588867188, 237.8727264404297, 265.8524169921875, 293.8321533203125, 321.81182861328125, 349.7915344238281, 377.771240234375, 405.7509460449219, 433.73065185546875, 461.7103271484375, 489.6900634765625, 517.6697387695312, 545.6494140625, 573.629150390625, 601.60888671875, 629.5885620117188, 657.5682983398438, 685.5479736328125, 713.5277099609375, 741.5073852539062, 769.487060546875, 797.466796875, 825.4464721679688]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 10.0, 22.0, 26.0, 50.0, 55.0, 114.0, 160.0, 302.0, 424.0, 775.0, 1321.0, 2372.0, 4587.0, 9057.0, 20227.0, 47293.0, 125805.0, 348342.0, 304453.0, 106614.0, 41377.0, 17624.0, 8302.0, 4219.0, 2123.0, 1161.0, 662.0, 409.0, 241.0, 157.0, 99.0, 56.0, 44.0, 22.0, 11.0, 11.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.6875, -89.8720703125, -87.056640625, -84.2412109375, -81.42578125, -78.6103515625, -75.794921875, -72.9794921875, -70.1640625, -67.3486328125, -64.533203125, -61.7177734375, -58.90234375, -56.0869140625, -53.271484375, -50.4560546875, -47.640625, -44.8251953125, -42.009765625, -39.1943359375, -36.37890625, -33.5634765625, -30.748046875, -27.9326171875, -25.1171875, -22.3017578125, -19.486328125, -16.6708984375, -13.85546875, -11.0400390625, -8.224609375, -5.4091796875, -2.59375, 0.2216796875, 3.037109375, 5.8525390625, 8.66796875, 11.4833984375, 14.298828125, 17.1142578125, 19.9296875, 22.7451171875, 25.560546875, 28.3759765625, 31.19140625, 34.0068359375, 36.822265625, 39.6376953125, 42.453125, 45.2685546875, 48.083984375, 50.8994140625, 53.71484375, 56.5302734375, 59.345703125, 62.1611328125, 64.9765625, 67.7919921875, 70.607421875, 73.4228515625, 76.23828125, 79.0537109375, 81.869140625, 84.6845703125, 87.5]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 8.0, 17.0, 15.0, 15.0, 18.0, 23.0, 15.0, 17.0, 27.0, 35.0, 33.0, 26.0, 38.0, 37.0, 38.0, 52.0, 45.0, 46.0, 53.0, 50.0, 45.0, 46.0, 29.0, 45.0, 32.0, 25.0, 28.0, 25.0, 22.0, 16.0, 9.0, 11.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.65625, -57.58056640625, -55.5048828125, -53.42919921875, -51.353515625, -49.27783203125, -47.2021484375, -45.12646484375, -43.05078125, -40.97509765625, -38.8994140625, -36.82373046875, -34.748046875, -32.67236328125, -30.5966796875, -28.52099609375, -26.4453125, -24.36962890625, -22.2939453125, -20.21826171875, -18.142578125, -16.06689453125, -13.9912109375, -11.91552734375, -9.83984375, -7.76416015625, -5.6884765625, -3.61279296875, -1.537109375, 0.53857421875, 2.6142578125, 4.68994140625, 6.765625, 8.84130859375, 10.9169921875, 12.99267578125, 15.068359375, 17.14404296875, 19.2197265625, 21.29541015625, 23.37109375, 25.44677734375, 27.5224609375, 29.59814453125, 31.673828125, 33.74951171875, 35.8251953125, 37.90087890625, 39.9765625, 42.05224609375, 44.1279296875, 46.20361328125, 48.279296875, 50.35498046875, 52.4306640625, 54.50634765625, 56.58203125, 58.65771484375, 60.7333984375, 62.80908203125, 64.884765625, 66.96044921875, 69.0361328125, 71.11181640625, 73.1875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 6.0, 8.0, 20.0, 27.0, 45.0, 75.0, 93.0, 136.0, 287.0, 512.0, 1048.0, 2917.0, 12828.0, 131012.0, 842090.0, 47045.0, 6710.0, 1904.0, 789.0, 398.0, 222.0, 122.0, 81.0, 53.0, 45.0, 25.0, 13.0, 13.0, 12.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-285.5, -277.4140625, -269.328125, -261.2421875, -253.15625, -245.0703125, -236.984375, -228.8984375, -220.8125, -212.7265625, -204.640625, -196.5546875, -188.46875, -180.3828125, -172.296875, -164.2109375, -156.125, -148.0390625, -139.953125, -131.8671875, -123.78125, -115.6953125, -107.609375, -99.5234375, -91.4375, -83.3515625, -75.265625, -67.1796875, -59.09375, -51.0078125, -42.921875, -34.8359375, -26.75, -18.6640625, -10.578125, -2.4921875, 5.59375, 13.6796875, 21.765625, 29.8515625, 37.9375, 46.0234375, 54.109375, 62.1953125, 70.28125, 78.3671875, 86.453125, 94.5390625, 102.625, 110.7109375, 118.796875, 126.8828125, 134.96875, 143.0546875, 151.140625, 159.2265625, 167.3125, 175.3984375, 183.484375, 191.5703125, 199.65625, 207.7421875, 215.828125, 223.9140625, 232.0]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 11.0, 16.0, 13.0, 14.0, 20.0, 21.0, 23.0, 34.0, 41.0, 51.0, 52.0, 55.0, 61.0, 66.0, 75.0, 68.0, 67.0, 49.0, 50.0, 30.0, 32.0, 28.0, 23.0, 12.0, 17.0, 15.0, 13.0, 5.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-348.25, -338.515625, -328.78125, -319.046875, -309.3125, -299.578125, -289.84375, -280.109375, -270.375, -260.640625, -250.90625, -241.171875, -231.4375, -221.703125, -211.96875, -202.234375, -192.5, -182.765625, -173.03125, -163.296875, -153.5625, -143.828125, -134.09375, -124.359375, -114.625, -104.890625, -95.15625, -85.421875, -75.6875, -65.953125, -56.21875, -46.484375, -36.75, -27.015625, -17.28125, -7.546875, 2.1875, 11.921875, 21.65625, 31.390625, 41.125, 50.859375, 60.59375, 70.328125, 80.0625, 89.796875, 99.53125, 109.265625, 119.0, 128.734375, 138.46875, 148.203125, 157.9375, 167.671875, 177.40625, 187.140625, 196.875, 206.609375, 216.34375, 226.078125, 235.8125, 245.546875, 255.28125, 265.015625, 274.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 14.0, 22.0, 29.0, 32.0, 36.0, 65.0, 90.0, 139.0, 204.0, 364.0, 677.0, 1200.0, 2155.0, 4635.0, 10729.0, 28651.0, 101497.0, 650064.0, 176914.0, 43486.0, 15080.0, 6183.0, 2884.0, 1403.0, 770.0, 428.0, 261.0, 174.0, 96.0, 79.0, 51.0, 37.0, 29.0, 20.0, 15.0, 9.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.95556640625, -28.9111328125, -27.86669921875, -26.822265625, -25.77783203125, -24.7333984375, -23.68896484375, -22.64453125, -21.60009765625, -20.5556640625, -19.51123046875, -18.466796875, -17.42236328125, -16.3779296875, -15.33349609375, -14.2890625, -13.24462890625, -12.2001953125, -11.15576171875, -10.111328125, -9.06689453125, -8.0224609375, -6.97802734375, -5.93359375, -4.88916015625, -3.8447265625, -2.80029296875, -1.755859375, -0.71142578125, 0.3330078125, 1.37744140625, 2.421875, 3.46630859375, 4.5107421875, 5.55517578125, 6.599609375, 7.64404296875, 8.6884765625, 9.73291015625, 10.77734375, 11.82177734375, 12.8662109375, 13.91064453125, 14.955078125, 15.99951171875, 17.0439453125, 18.08837890625, 19.1328125, 20.17724609375, 21.2216796875, 22.26611328125, 23.310546875, 24.35498046875, 25.3994140625, 26.44384765625, 27.48828125, 28.53271484375, 29.5771484375, 30.62158203125, 31.666015625, 32.71044921875, 33.7548828125, 34.79931640625, 35.84375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 14.0, 18.0, 32.0, 40.0, 62.0, 76.0, 99.0, 121.0, 146.0, 101.0, 76.0, 65.0, 32.0, 26.0, 15.0, 12.0, 12.0, 10.0, 11.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.01629638671875, -0.0156707763671875, -0.015045166015625, -0.0144195556640625, -0.0137939453125, -0.0131683349609375, -0.012542724609375, -0.0119171142578125, -0.01129150390625, -0.0106658935546875, -0.010040283203125, -0.0094146728515625, -0.0087890625, -0.0081634521484375, -0.007537841796875, -0.0069122314453125, -0.00628662109375, -0.0056610107421875, -0.005035400390625, -0.0044097900390625, -0.0037841796875, -0.0031585693359375, -0.002532958984375, -0.0019073486328125, -0.00128173828125, -0.0006561279296875, -3.0517578125e-05, 0.0005950927734375, 0.001220703125, 0.0018463134765625, 0.002471923828125, 0.0030975341796875, 0.00372314453125, 0.0043487548828125, 0.004974365234375, 0.0055999755859375, 0.0062255859375, 0.0068511962890625, 0.007476806640625, 0.0081024169921875, 0.00872802734375, 0.0093536376953125, 0.009979248046875, 0.0106048583984375, 0.01123046875, 0.0118560791015625, 0.012481689453125, 0.0131072998046875, 0.01373291015625, 0.0143585205078125, 0.014984130859375, 0.0156097412109375, 0.0162353515625, 0.0168609619140625, 0.017486572265625, 0.0181121826171875, 0.01873779296875, 0.0193634033203125, 0.019989013671875, 0.0206146240234375, 0.021240234375, 0.0218658447265625, 0.022491455078125, 0.0231170654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 9.0, 8.0, 11.0, 16.0, 41.0, 106.0, 201.0, 620.0, 2350.0, 20172.0, 854307.0, 161564.0, 7138.0, 1281.0, 390.0, 152.0, 84.0, 37.0, 27.0, 13.0, 11.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-107.6875, -104.5927734375, -101.498046875, -98.4033203125, -95.30859375, -92.2138671875, -89.119140625, -86.0244140625, -82.9296875, -79.8349609375, -76.740234375, -73.6455078125, -70.55078125, -67.4560546875, -64.361328125, -61.2666015625, -58.171875, -55.0771484375, -51.982421875, -48.8876953125, -45.79296875, -42.6982421875, -39.603515625, -36.5087890625, -33.4140625, -30.3193359375, -27.224609375, -24.1298828125, -21.03515625, -17.9404296875, -14.845703125, -11.7509765625, -8.65625, -5.5615234375, -2.466796875, 0.6279296875, 3.72265625, 6.8173828125, 9.912109375, 13.0068359375, 16.1015625, 19.1962890625, 22.291015625, 25.3857421875, 28.48046875, 31.5751953125, 34.669921875, 37.7646484375, 40.859375, 43.9541015625, 47.048828125, 50.1435546875, 53.23828125, 56.3330078125, 59.427734375, 62.5224609375, 65.6171875, 68.7119140625, 71.806640625, 74.9013671875, 77.99609375, 81.0908203125, 84.185546875, 87.2802734375, 90.375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 4.0, 12.0, 15.0, 24.0, 48.0, 79.0, 116.0, 133.0, 141.0, 120.0, 90.0, 78.0, 38.0, 31.0, 24.0, 10.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-87.6875, -85.2197265625, -82.751953125, -80.2841796875, -77.81640625, -75.3486328125, -72.880859375, -70.4130859375, -67.9453125, -65.4775390625, -63.009765625, -60.5419921875, -58.07421875, -55.6064453125, -53.138671875, -50.6708984375, -48.203125, -45.7353515625, -43.267578125, -40.7998046875, -38.33203125, -35.8642578125, -33.396484375, -30.9287109375, -28.4609375, -25.9931640625, -23.525390625, -21.0576171875, -18.58984375, -16.1220703125, -13.654296875, -11.1865234375, -8.71875, -6.2509765625, -3.783203125, -1.3154296875, 1.15234375, 3.6201171875, 6.087890625, 8.5556640625, 11.0234375, 13.4912109375, 15.958984375, 18.4267578125, 20.89453125, 23.3623046875, 25.830078125, 28.2978515625, 30.765625, 33.2333984375, 35.701171875, 38.1689453125, 40.63671875, 43.1044921875, 45.572265625, 48.0400390625, 50.5078125, 52.9755859375, 55.443359375, 57.9111328125, 60.37890625, 62.8466796875, 65.314453125, 67.7822265625, 70.25]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 14.0, 36.0, 68.0, 191.0, 424.0, 135.0, 67.0, 32.0, 11.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1262.30615234375, -1202.849365234375, -1143.3924560546875, -1083.9356689453125, -1024.4788818359375, -965.02197265625, -905.565185546875, -846.1083374023438, -786.6514892578125, -727.1946411132812, -667.7378540039062, -608.281005859375, -548.8241577148438, -489.3673400878906, -429.9105224609375, -370.45367431640625, -310.99688720703125, -251.54005432128906, -192.08322143554688, -132.62640380859375, -73.16957092285156, -13.712738037109375, 45.74407958984375, 105.200927734375, 164.65774536132812, 224.1145782470703, 283.5714111328125, 343.0282287597656, 402.48504638671875, 461.94189453125, 521.398681640625, 580.8555908203125, 640.3123779296875, 699.7692260742188, 759.2260131835938, 818.682861328125, 878.1397094726562, 937.5965576171875, 997.0533447265625, 1056.51025390625, 1115.967041015625, 1175.423828125, 1234.8807373046875, 1294.3375244140625, 1353.7943115234375, 1413.251220703125, 1472.7080078125, 1532.164794921875, 1591.62158203125, 1651.078369140625, 1710.5352783203125, 1769.9920654296875, 1829.4488525390625, 1888.90576171875, 1948.362548828125, 2007.8193359375, 2067.2763671875, 2126.733154296875, 2186.18994140625, 2245.64697265625, 2305.103759765625, 2364.560546875, 2424.017333984375, 2483.47412109375, 2542.930908203125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 9.0, 14.0, 9.0, 20.0, 24.0, 23.0, 22.0, 27.0, 28.0, 39.0, 46.0, 82.0, 185.0, 126.0, 71.0, 54.0, 38.0, 36.0, 25.0, 21.0, 26.0, 23.0, 10.0, 17.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1369.1583251953125, -1328.6373291015625, -1288.1162109375, -1247.59521484375, -1207.07421875, -1166.55322265625, -1126.0321044921875, -1085.5111083984375, -1044.989990234375, -1004.4689331054688, -963.9479370117188, -923.4268798828125, -882.9058837890625, -842.3848266601562, -801.86376953125, -761.3427734375, -720.82177734375, -680.3007202148438, -639.7797241210938, -599.2586669921875, -558.7376708984375, -518.2166137695312, -477.695556640625, -437.1745300292969, -396.65350341796875, -356.1324768066406, -315.6114501953125, -275.09039306640625, -234.56936645507812, -194.04833984375, -153.5272979736328, -113.00625610351562, -72.4853515625, -31.964317321777344, 8.556716918945312, 49.07775115966797, 89.59878540039062, 130.11981201171875, 170.64085388183594, 211.16189575195312, 251.68292236328125, 292.2039489746094, 332.7249755859375, 373.24603271484375, 413.7670593261719, 454.2880859375, 494.80914306640625, 535.3302001953125, 575.8511962890625, 616.3722534179688, 656.8932495117188, 697.414306640625, 737.935302734375, 778.4563598632812, 818.9774169921875, 859.4984130859375, 900.0194702148438, 940.54052734375, 981.0615234375, 1021.5825805664062, 1062.1036376953125, 1102.6246337890625, 1143.1456298828125, 1183.666748046875, 1224.187744140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 21.0, 19.0, 33.0, 33.0, 41.0, 61.0, 107.0, 151.0, 243.0, 430.0, 834.0, 1858.0, 4716.0, 13847.0, 56659.0, 426810.0, 2466978.0, 1060649.0, 124662.0, 24012.0, 7044.0, 2487.0, 1149.0, 562.0, 278.0, 187.0, 144.0, 75.0, 41.0, 48.0, 21.0, 22.0, 16.0, 13.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.625, -146.84375, -142.0625, -137.28125, -132.5, -127.71875, -122.9375, -118.15625, -113.375, -108.59375, -103.8125, -99.03125, -94.25, -89.46875, -84.6875, -79.90625, -75.125, -70.34375, -65.5625, -60.78125, -56.0, -51.21875, -46.4375, -41.65625, -36.875, -32.09375, -27.3125, -22.53125, -17.75, -12.96875, -8.1875, -3.40625, 1.375, 6.15625, 10.9375, 15.71875, 20.5, 25.28125, 30.0625, 34.84375, 39.625, 44.40625, 49.1875, 53.96875, 58.75, 63.53125, 68.3125, 73.09375, 77.875, 82.65625, 87.4375, 92.21875, 97.0, 101.78125, 106.5625, 111.34375, 116.125, 120.90625, 125.6875, 130.46875, 135.25, 140.03125, 144.8125, 149.59375, 154.375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 10.0, 5.0, 17.0, 18.0, 15.0, 30.0, 27.0, 27.0, 28.0, 34.0, 43.0, 44.0, 50.0, 45.0, 48.0, 48.0, 49.0, 43.0, 46.0, 45.0, 39.0, 35.0, 46.0, 38.0, 26.0, 22.0, 20.0, 15.0, 22.0, 17.0, 8.0, 10.0, 5.0, 6.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.5, -78.2666015625, -76.033203125, -73.7998046875, -71.56640625, -69.3330078125, -67.099609375, -64.8662109375, -62.6328125, -60.3994140625, -58.166015625, -55.9326171875, -53.69921875, -51.4658203125, -49.232421875, -46.9990234375, -44.765625, -42.5322265625, -40.298828125, -38.0654296875, -35.83203125, -33.5986328125, -31.365234375, -29.1318359375, -26.8984375, -24.6650390625, -22.431640625, -20.1982421875, -17.96484375, -15.7314453125, -13.498046875, -11.2646484375, -9.03125, -6.7978515625, -4.564453125, -2.3310546875, -0.09765625, 2.1357421875, 4.369140625, 6.6025390625, 8.8359375, 11.0693359375, 13.302734375, 15.5361328125, 17.76953125, 20.0029296875, 22.236328125, 24.4697265625, 26.703125, 28.9365234375, 31.169921875, 33.4033203125, 35.63671875, 37.8701171875, 40.103515625, 42.3369140625, 44.5703125, 46.8037109375, 49.037109375, 51.2705078125, 53.50390625, 55.7373046875, 57.970703125, 60.2041015625, 62.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 12.0, 17.0, 31.0, 75.0, 266.0, 1060.0, 16194.0, 4164208.0, 11096.0, 941.0, 239.0, 75.0, 39.0, 14.0, 9.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1395.0, -1358.7265625, -1322.453125, -1286.1796875, -1249.90625, -1213.6328125, -1177.359375, -1141.0859375, -1104.8125, -1068.5390625, -1032.265625, -995.9921875, -959.71875, -923.4453125, -887.171875, -850.8984375, -814.625, -778.3515625, -742.078125, -705.8046875, -669.53125, -633.2578125, -596.984375, -560.7109375, -524.4375, -488.1640625, -451.890625, -415.6171875, -379.34375, -343.0703125, -306.796875, -270.5234375, -234.25, -197.9765625, -161.703125, -125.4296875, -89.15625, -52.8828125, -16.609375, 19.6640625, 55.9375, 92.2109375, 128.484375, 164.7578125, 201.03125, 237.3046875, 273.578125, 309.8515625, 346.125, 382.3984375, 418.671875, 454.9453125, 491.21875, 527.4921875, 563.765625, 600.0390625, 636.3125, 672.5859375, 708.859375, 745.1328125, 781.40625, 817.6796875, 853.953125, 890.2265625, 926.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 12.0, 26.0, 31.0, 84.0, 179.0, 428.0, 1015.0, 1367.0, 504.0, 236.0, 87.0, 58.0, 25.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-692.0, -675.953125, -659.90625, -643.859375, -627.8125, -611.765625, -595.71875, -579.671875, -563.625, -547.578125, -531.53125, -515.484375, -499.4375, -483.390625, -467.34375, -451.296875, -435.25, -419.203125, -403.15625, -387.109375, -371.0625, -355.015625, -338.96875, -322.921875, -306.875, -290.828125, -274.78125, -258.734375, -242.6875, -226.640625, -210.59375, -194.546875, -178.5, -162.453125, -146.40625, -130.359375, -114.3125, -98.265625, -82.21875, -66.171875, -50.125, -34.078125, -18.03125, -1.984375, 14.0625, 30.109375, 46.15625, 62.203125, 78.25, 94.296875, 110.34375, 126.390625, 142.4375, 158.484375, 174.53125, 190.578125, 206.625, 222.671875, 238.71875, 254.765625, 270.8125, 286.859375, 302.90625, 318.953125, 335.0]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 7.0, 16.0, 32.0, 40.0, 67.0, 99.0, 138.0, 169.0, 145.0, 99.0, 67.0, 33.0, 31.0, 8.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2266.616943359375, -2194.469970703125, -2122.322998046875, -2050.176025390625, -1978.0291748046875, -1905.8822021484375, -1833.7353515625, -1761.58837890625, -1689.44140625, -1617.29443359375, -1545.1474609375, -1473.0006103515625, -1400.8536376953125, -1328.7066650390625, -1256.559814453125, -1184.412841796875, -1112.265869140625, -1040.118896484375, -967.9719848632812, -895.8250732421875, -823.6781005859375, -751.5311279296875, -679.3842163085938, -607.2373046875, -535.09033203125, -462.9433898925781, -390.79644775390625, -318.6495056152344, -246.5025634765625, -174.35562133789062, -102.20867919921875, -30.061737060546875, 42.085205078125, 114.23214721679688, 186.37908935546875, 258.5260314941406, 330.6729736328125, 402.8199157714844, 474.96685791015625, 547.11376953125, 619.2607421875, 691.40771484375, 763.5546264648438, 835.7015380859375, 907.8485107421875, 979.9954833984375, 1052.142333984375, 1124.289306640625, 1196.436279296875, 1268.583251953125, 1340.730224609375, 1412.8770751953125, 1485.0240478515625, 1557.1710205078125, 1629.31787109375, 1701.46484375, 1773.61181640625, 1845.7587890625, 1917.90576171875, 1990.0526123046875, 2062.19970703125, 2134.346435546875, 2206.493408203125, 2278.640380859375, 2350.787353515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 2.0, 8.0, 8.0, 7.0, 10.0, 8.0, 16.0, 12.0, 24.0, 16.0, 17.0, 25.0, 19.0, 22.0, 26.0, 31.0, 41.0, 50.0, 46.0, 42.0, 54.0, 37.0, 51.0, 43.0, 43.0, 37.0, 32.0, 36.0, 29.0, 28.0, 30.0, 21.0, 25.0, 20.0, 11.0, 12.0, 12.0, 10.0, 8.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1103.2652587890625, -1070.904052734375, -1038.54296875, -1006.1817626953125, -973.820556640625, -941.4593505859375, -909.0982055664062, -876.737060546875, -844.3758544921875, -812.0146484375, -779.6535034179688, -747.2923583984375, -714.93115234375, -682.5699462890625, -650.2088012695312, -617.84765625, -585.4864501953125, -553.125244140625, -520.7640991210938, -488.4029235839844, -456.041748046875, -423.6805725097656, -391.31939697265625, -358.9582214355469, -326.5970458984375, -294.2358703613281, -261.87469482421875, -229.51351928710938, -197.15234375, -164.79116821289062, -132.42999267578125, -100.06881713867188, -67.7076416015625, -35.346466064453125, -2.98529052734375, 29.375885009765625, 61.737060546875, 94.09823608398438, 126.45941162109375, 158.82058715820312, 191.1817626953125, 223.54293823242188, 255.90411376953125, 288.2652893066406, 320.62646484375, 352.9876403808594, 385.34881591796875, 417.7099914550781, 450.0711669921875, 482.4323425292969, 514.7935180664062, 547.1546630859375, 579.515869140625, 611.8770751953125, 644.2382202148438, 676.599365234375, 708.9605712890625, 741.32177734375, 773.6829223632812, 806.0440673828125, 838.4052734375, 870.7664794921875, 903.1276245117188, 935.48876953125, 967.8499755859375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 16.0, 16.0, 27.0, 25.0, 31.0, 47.0, 70.0, 104.0, 154.0, 258.0, 457.0, 765.0, 1356.0, 2606.0, 5341.0, 11515.0, 28246.0, 79388.0, 319286.0, 438819.0, 99121.0, 34393.0, 13667.0, 6168.0, 2956.0, 1486.0, 840.0, 505.0, 306.0, 209.0, 105.0, 67.0, 44.0, 33.0, 29.0, 19.0, 15.0, 15.0, 8.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-134.625, -130.6767578125, -126.728515625, -122.7802734375, -118.83203125, -114.8837890625, -110.935546875, -106.9873046875, -103.0390625, -99.0908203125, -95.142578125, -91.1943359375, -87.24609375, -83.2978515625, -79.349609375, -75.4013671875, -71.453125, -67.5048828125, -63.556640625, -59.6083984375, -55.66015625, -51.7119140625, -47.763671875, -43.8154296875, -39.8671875, -35.9189453125, -31.970703125, -28.0224609375, -24.07421875, -20.1259765625, -16.177734375, -12.2294921875, -8.28125, -4.3330078125, -0.384765625, 3.5634765625, 7.51171875, 11.4599609375, 15.408203125, 19.3564453125, 23.3046875, 27.2529296875, 31.201171875, 35.1494140625, 39.09765625, 43.0458984375, 46.994140625, 50.9423828125, 54.890625, 58.8388671875, 62.787109375, 66.7353515625, 70.68359375, 74.6318359375, 78.580078125, 82.5283203125, 86.4765625, 90.4248046875, 94.373046875, 98.3212890625, 102.26953125, 106.2177734375, 110.166015625, 114.1142578125, 118.0625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 14.0, 9.0, 26.0, 35.0, 47.0, 50.0, 54.0, 76.0, 76.0, 81.0, 83.0, 85.0, 79.0, 67.0, 39.0, 40.0, 35.0, 22.0, 13.0, 14.0, 15.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-212.75, -207.6630859375, -202.576171875, -197.4892578125, -192.40234375, -187.3154296875, -182.228515625, -177.1416015625, -172.0546875, -166.9677734375, -161.880859375, -156.7939453125, -151.70703125, -146.6201171875, -141.533203125, -136.4462890625, -131.359375, -126.2724609375, -121.185546875, -116.0986328125, -111.01171875, -105.9248046875, -100.837890625, -95.7509765625, -90.6640625, -85.5771484375, -80.490234375, -75.4033203125, -70.31640625, -65.2294921875, -60.142578125, -55.0556640625, -49.96875, -44.8818359375, -39.794921875, -34.7080078125, -29.62109375, -24.5341796875, -19.447265625, -14.3603515625, -9.2734375, -4.1865234375, 0.900390625, 5.9873046875, 11.07421875, 16.1611328125, 21.248046875, 26.3349609375, 31.421875, 36.5087890625, 41.595703125, 46.6826171875, 51.76953125, 56.8564453125, 61.943359375, 67.0302734375, 72.1171875, 77.2041015625, 82.291015625, 87.3779296875, 92.46484375, 97.5517578125, 102.638671875, 107.7255859375, 112.8125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 9.0, 17.0, 32.0, 35.0, 56.0, 112.0, 206.0, 388.0, 806.0, 2227.0, 8347.0, 75714.0, 919307.0, 33382.0, 5256.0, 1452.0, 560.0, 278.0, 147.0, 82.0, 37.0, 22.0, 23.0, 13.0, 11.0, 4.0, 4.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-377.5, -367.65625, -357.8125, -347.96875, -338.125, -328.28125, -318.4375, -308.59375, -298.75, -288.90625, -279.0625, -269.21875, -259.375, -249.53125, -239.6875, -229.84375, -220.0, -210.15625, -200.3125, -190.46875, -180.625, -170.78125, -160.9375, -151.09375, -141.25, -131.40625, -121.5625, -111.71875, -101.875, -92.03125, -82.1875, -72.34375, -62.5, -52.65625, -42.8125, -32.96875, -23.125, -13.28125, -3.4375, 6.40625, 16.25, 26.09375, 35.9375, 45.78125, 55.625, 65.46875, 75.3125, 85.15625, 95.0, 104.84375, 114.6875, 124.53125, 134.375, 144.21875, 154.0625, 163.90625, 173.75, 183.59375, 193.4375, 203.28125, 213.125, 222.96875, 232.8125, 242.65625, 252.5]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 3.0, 8.0, 13.0, 16.0, 10.0, 14.0, 24.0, 28.0, 45.0, 56.0, 60.0, 89.0, 110.0, 94.0, 95.0, 65.0, 46.0, 35.0, 28.0, 24.0, 19.0, 19.0, 16.0, 12.0, 13.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-627.0, -609.09375, -591.1875, -573.28125, -555.375, -537.46875, -519.5625, -501.65625, -483.75, -465.84375, -447.9375, -430.03125, -412.125, -394.21875, -376.3125, -358.40625, -340.5, -322.59375, -304.6875, -286.78125, -268.875, -250.96875, -233.0625, -215.15625, -197.25, -179.34375, -161.4375, -143.53125, -125.625, -107.71875, -89.8125, -71.90625, -54.0, -36.09375, -18.1875, -0.28125, 17.625, 35.53125, 53.4375, 71.34375, 89.25, 107.15625, 125.0625, 142.96875, 160.875, 178.78125, 196.6875, 214.59375, 232.5, 250.40625, 268.3125, 286.21875, 304.125, 322.03125, 339.9375, 357.84375, 375.75, 393.65625, 411.5625, 429.46875, 447.375, 465.28125, 483.1875, 501.09375, 519.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 8.0, 16.0, 26.0, 33.0, 30.0, 78.0, 118.0, 140.0, 238.0, 369.0, 525.0, 940.0, 1736.0, 3098.0, 6532.0, 14557.0, 36848.0, 125883.0, 731061.0, 78087.0, 26233.0, 11096.0, 4959.0, 2580.0, 1295.0, 757.0, 448.0, 314.0, 142.0, 105.0, 83.0, 57.0, 39.0, 36.0, 27.0, 16.0, 10.0, 10.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.73193359375, -30.8076171875, -29.88330078125, -28.958984375, -28.03466796875, -27.1103515625, -26.18603515625, -25.26171875, -24.33740234375, -23.4130859375, -22.48876953125, -21.564453125, -20.64013671875, -19.7158203125, -18.79150390625, -17.8671875, -16.94287109375, -16.0185546875, -15.09423828125, -14.169921875, -13.24560546875, -12.3212890625, -11.39697265625, -10.47265625, -9.54833984375, -8.6240234375, -7.69970703125, -6.775390625, -5.85107421875, -4.9267578125, -4.00244140625, -3.078125, -2.15380859375, -1.2294921875, -0.30517578125, 0.619140625, 1.54345703125, 2.4677734375, 3.39208984375, 4.31640625, 5.24072265625, 6.1650390625, 7.08935546875, 8.013671875, 8.93798828125, 9.8623046875, 10.78662109375, 11.7109375, 12.63525390625, 13.5595703125, 14.48388671875, 15.408203125, 16.33251953125, 17.2568359375, 18.18115234375, 19.10546875, 20.02978515625, 20.9541015625, 21.87841796875, 22.802734375, 23.72705078125, 24.6513671875, 25.57568359375, 26.5]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 10.0, 9.0, 16.0, 11.0, 17.0, 30.0, 32.0, 54.0, 60.0, 100.0, 102.0, 110.0, 114.0, 75.0, 45.0, 24.0, 18.0, 20.0, 23.0, 28.0, 10.0, 13.0, 6.0, 11.0, 6.0, 8.0, 2.0, 5.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0151824951171875, -0.014662981033325195, -0.01414346694946289, -0.013623952865600586, -0.013104438781738281, -0.012584924697875977, -0.012065410614013672, -0.011545896530151367, -0.011026382446289062, -0.010506868362426758, -0.009987354278564453, -0.009467840194702148, -0.008948326110839844, -0.008428812026977539, -0.007909297943115234, -0.00738978385925293, -0.006870269775390625, -0.00635075569152832, -0.005831241607666016, -0.005311727523803711, -0.004792213439941406, -0.0042726993560791016, -0.003753185272216797, -0.003233671188354492, -0.0027141571044921875, -0.002194643020629883, -0.0016751289367675781, -0.0011556148529052734, -0.0006361007690429688, -0.00011658668518066406, 0.0004029273986816406, 0.0009224414825439453, 0.00144195556640625, 0.0019614696502685547, 0.0024809837341308594, 0.003000497817993164, 0.0035200119018554688, 0.0040395259857177734, 0.004559040069580078, 0.005078554153442383, 0.0055980682373046875, 0.006117582321166992, 0.006637096405029297, 0.0071566104888916016, 0.007676124572753906, 0.008195638656616211, 0.008715152740478516, 0.00923466682434082, 0.009754180908203125, 0.01027369499206543, 0.010793209075927734, 0.011312723159790039, 0.011832237243652344, 0.012351751327514648, 0.012871265411376953, 0.013390779495239258, 0.013910293579101562, 0.014429807662963867, 0.014949321746826172, 0.015468835830688477, 0.01598834991455078, 0.016507863998413086, 0.01702737808227539, 0.017546892166137695, 0.01806640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 0.0, 8.0, 4.0, 6.0, 7.0, 10.0, 23.0, 32.0, 33.0, 45.0, 72.0, 105.0, 126.0, 184.0, 328.0, 541.0, 866.0, 1414.0, 2353.0, 4595.0, 9504.0, 21076.0, 58059.0, 628716.0, 239931.0, 45726.0, 17461.0, 8073.0, 4024.0, 2032.0, 1185.0, 673.0, 481.0, 277.0, 181.0, 122.0, 63.0, 49.0, 36.0, 44.0, 20.0, 21.0, 10.0, 10.0, 6.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.796875, -24.9619140625, -24.126953125, -23.2919921875, -22.45703125, -21.6220703125, -20.787109375, -19.9521484375, -19.1171875, -18.2822265625, -17.447265625, -16.6123046875, -15.77734375, -14.9423828125, -14.107421875, -13.2724609375, -12.4375, -11.6025390625, -10.767578125, -9.9326171875, -9.09765625, -8.2626953125, -7.427734375, -6.5927734375, -5.7578125, -4.9228515625, -4.087890625, -3.2529296875, -2.41796875, -1.5830078125, -0.748046875, 0.0869140625, 0.921875, 1.7568359375, 2.591796875, 3.4267578125, 4.26171875, 5.0966796875, 5.931640625, 6.7666015625, 7.6015625, 8.4365234375, 9.271484375, 10.1064453125, 10.94140625, 11.7763671875, 12.611328125, 13.4462890625, 14.28125, 15.1162109375, 15.951171875, 16.7861328125, 17.62109375, 18.4560546875, 19.291015625, 20.1259765625, 20.9609375, 21.7958984375, 22.630859375, 23.4658203125, 24.30078125, 25.1357421875, 25.970703125, 26.8056640625, 27.640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 3.0, 6.0, 6.0, 4.0, 13.0, 9.0, 5.0, 13.0, 8.0, 20.0, 25.0, 8.0, 36.0, 32.0, 29.0, 65.0, 60.0, 76.0, 75.0, 83.0, 72.0, 55.0, 59.0, 43.0, 27.0, 19.0, 21.0, 22.0, 13.0, 21.0, 4.0, 5.0, 11.0, 4.0, 7.0, 8.0, 2.0, 4.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-53.28125, -51.8720703125, -50.462890625, -49.0537109375, -47.64453125, -46.2353515625, -44.826171875, -43.4169921875, -42.0078125, -40.5986328125, -39.189453125, -37.7802734375, -36.37109375, -34.9619140625, -33.552734375, -32.1435546875, -30.734375, -29.3251953125, -27.916015625, -26.5068359375, -25.09765625, -23.6884765625, -22.279296875, -20.8701171875, -19.4609375, -18.0517578125, -16.642578125, -15.2333984375, -13.82421875, -12.4150390625, -11.005859375, -9.5966796875, -8.1875, -6.7783203125, -5.369140625, -3.9599609375, -2.55078125, -1.1416015625, 0.267578125, 1.6767578125, 3.0859375, 4.4951171875, 5.904296875, 7.3134765625, 8.72265625, 10.1318359375, 11.541015625, 12.9501953125, 14.359375, 15.7685546875, 17.177734375, 18.5869140625, 19.99609375, 21.4052734375, 22.814453125, 24.2236328125, 25.6328125, 27.0419921875, 28.451171875, 29.8603515625, 31.26953125, 32.6787109375, 34.087890625, 35.4970703125, 36.90625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 14.0, 21.0, 64.0, 132.0, 566.0, 121.0, 43.0, 18.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3842.87158203125, -3745.427734375, -3647.983642578125, -3550.53955078125, -3453.095703125, -3355.65185546875, -3258.207763671875, -3160.763671875, -3063.31982421875, -2965.8759765625, -2868.431884765625, -2770.98779296875, -2673.5439453125, -2576.10009765625, -2478.656005859375, -2381.2119140625, -2283.76806640625, -2186.32421875, -2088.880126953125, -1991.4361572265625, -1893.9921875, -1796.5482177734375, -1699.104248046875, -1601.6602783203125, -1504.21630859375, -1406.7723388671875, -1309.328369140625, -1211.8843994140625, -1114.4404296875, -1016.9964599609375, -919.552490234375, -822.1085205078125, -724.664794921875, -627.2208251953125, -529.77685546875, -432.3328857421875, -334.888916015625, -237.4449462890625, -140.0009765625, -42.5570068359375, 54.886962890625, 152.3309326171875, 249.77490234375, 347.2188720703125, 444.662841796875, 542.1068115234375, 639.55078125, 736.9947509765625, 834.438720703125, 931.8826904296875, 1029.32666015625, 1126.7706298828125, 1224.214599609375, 1321.6585693359375, 1419.1025390625, 1516.5465087890625, 1613.990478515625, 1711.4344482421875, 1808.87841796875, 1906.3223876953125, 2003.766357421875, 2101.21044921875, 2198.654296875, 2296.09814453125, 2393.542236328125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 6.0, 3.0, 11.0, 6.0, 10.0, 8.0, 14.0, 11.0, 18.0, 25.0, 22.0, 22.0, 22.0, 24.0, 33.0, 42.0, 101.0, 224.0, 131.0, 39.0, 28.0, 28.0, 24.0, 17.0, 16.0, 16.0, 15.0, 8.0, 22.0, 9.0, 4.0, 6.0, 5.0, 13.0, 3.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1208.075927734375, -1169.9229736328125, -1131.77001953125, -1093.6170654296875, -1055.464111328125, -1017.3110961914062, -979.1581420898438, -941.005126953125, -902.8521728515625, -864.69921875, -826.5462646484375, -788.393310546875, -750.2402954101562, -712.0873413085938, -673.9343872070312, -635.7813720703125, -597.6284790039062, -559.4755249023438, -521.3225708007812, -483.1695861816406, -445.0166015625, -406.8636474609375, -368.710693359375, -330.5577087402344, -292.4047546386719, -254.2517852783203, -216.09881591796875, -177.94586181640625, -139.7928924560547, -101.63992309570312, -63.486968994140625, -25.333984375, 12.8189697265625, 50.9719352722168, 89.1249008178711, 127.27786254882812, 165.4308319091797, 203.58380126953125, 241.73675537109375, 279.8897399902344, 318.0426940917969, 356.1956481933594, 394.3486328125, 432.5015869140625, 470.654541015625, 508.8075256347656, 546.96044921875, 585.1134643554688, 623.2664184570312, 661.4193725585938, 699.5723266601562, 737.725341796875, 775.8782958984375, 814.03125, 852.1842041015625, 890.337158203125, 928.4901123046875, 966.64306640625, 1004.7960205078125, 1042.948974609375, 1081.1019287109375, 1119.2548828125, 1157.407958984375, 1195.5609130859375, 1233.7138671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 11.0, 12.0, 14.0, 11.0, 22.0, 14.0, 20.0, 21.0, 24.0, 28.0, 34.0, 45.0, 62.0, 141.0, 155.0, 65.0, 45.0, 41.0, 25.0, 34.0, 22.0, 21.0, 29.0, 17.0, 22.0, 10.0, 7.0, 9.0, 7.0, 4.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.0, -124.71875, -121.4375, -118.15625, -114.875, -111.59375, -108.3125, -105.03125, -101.75, -98.46875, -95.1875, -91.90625, -88.625, -85.34375, -82.0625, -78.78125, -75.5, -72.21875, -68.9375, -65.65625, -62.375, -59.09375, -55.8125, -52.53125, -49.25, -45.96875, -42.6875, -39.40625, -36.125, -32.84375, -29.5625, -26.28125, -23.0, -19.71875, -16.4375, -13.15625, -9.875, -6.59375, -3.3125, -0.03125, 3.25, 6.53125, 9.8125, 13.09375, 16.375, 19.65625, 22.9375, 26.21875, 29.5, 32.78125, 36.0625, 39.34375, 42.625, 45.90625, 49.1875, 52.46875, 55.75, 59.03125, 62.3125, 65.59375, 68.875, 72.15625, 75.4375, 78.71875, 82.0]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 4.0, 16.0, 18.0, 24.0, 34.0, 46.0, 44.0, 61.0, 163.0, 252.0, 621.0, 1768.0, 7060.0, 399539.0, 7967438.0, 8207.0, 1950.0, 641.0, 266.0, 141.0, 94.0, 40.0, 46.0, 26.0, 17.0, 7.0, 7.0, 15.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-734.0562744140625, -713.1082763671875, -692.1602172851562, -671.212158203125, -650.26416015625, -629.316162109375, -608.3681030273438, -587.4200439453125, -566.4720458984375, -545.5240478515625, -524.5759887695312, -503.6279602050781, -482.679931640625, -461.7319030761719, -440.78387451171875, -419.8358459472656, -398.8878173828125, -377.9397888183594, -356.99176025390625, -336.0437316894531, -315.095703125, -294.1476745605469, -273.19964599609375, -252.25161743164062, -231.3035888671875, -210.35556030273438, -189.40753173828125, -168.45950317382812, -147.511474609375, -126.56344604492188, -105.61541748046875, -84.66738891601562, -63.7193603515625, -42.771331787109375, -21.82330322265625, -0.875274658203125, 20.07275390625, 41.020782470703125, 61.96881103515625, 82.91683959960938, 103.8648681640625, 124.81289672851562, 145.76092529296875, 166.70895385742188, 187.656982421875, 208.60501098632812, 229.55303955078125, 250.50106811523438, 271.4490966796875, 292.3971252441406, 313.34515380859375, 334.2931823730469, 355.2412109375, 376.1892395019531, 397.13726806640625, 418.0852966308594, 439.0333251953125, 459.9813537597656, 480.92938232421875, 501.8774108886719, 522.825439453125, 543.7734375, 564.7214965820312, 585.6695556640625, 606.6175537109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 5.0, 4.0, 2.0, 5.0, 3.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-653.5410766601562, -628.9877319335938, -604.434326171875, -579.8809814453125, -555.3275756835938, -530.7742309570312, -506.2208557128906, -481.66748046875, -457.1141052246094, -432.56072998046875, -408.0073547363281, -383.4539794921875, -358.900634765625, -334.34722900390625, -309.79388427734375, -285.2405090332031, -260.6871337890625, -236.13375854492188, -211.58038330078125, -187.0270233154297, -162.47364807128906, -137.92027282714844, -113.36691284179688, -88.81353759765625, -64.26016235351562, -39.706790924072266, -15.153419494628906, 9.399948120117188, 33.95332336425781, 58.50669860839844, 83.06005859375, 107.61343383789062, 132.166748046875, 156.72012329101562, 181.27349853515625, 205.8268585205078, 230.38023376464844, 254.93360900878906, 279.4869689941406, 304.04034423828125, 328.5937194824219, 353.1470947265625, 377.7004699707031, 402.25384521484375, 426.80718994140625, 451.360595703125, 475.9139404296875, 500.4673156738281, 525.0206909179688, 549.5740356445312, 574.12744140625, 598.6807861328125, 623.2341918945312, 647.7875366210938, 672.3409423828125, 696.894287109375, 721.4476318359375, 746.0009765625, 770.5543823242188, 795.1077270507812, 819.6611328125, 844.2144775390625, 868.767822265625, 893.3212280273438, 917.8746337890625]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 6.0, 10.0, 11.0, 32.0, 25.0, 33.0, 46.0, 56.0, 57.0, 58.0, 60.0, 53.0, 69.0, 61.0, 69.0, 51.0, 65.0, 50.0, 32.0, 36.0, 23.0, 24.0, 17.0, 9.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-103.1875, -100.443359375, -97.69921875, -94.955078125, -92.2109375, -89.466796875, -86.72265625, -83.978515625, -81.234375, -78.490234375, -75.74609375, -73.001953125, -70.2578125, -67.513671875, -64.76953125, -62.025390625, -59.28125, -56.537109375, -53.79296875, -51.048828125, -48.3046875, -45.560546875, -42.81640625, -40.072265625, -37.328125, -34.583984375, -31.83984375, -29.095703125, -26.3515625, -23.607421875, -20.86328125, -18.119140625, -15.375, -12.630859375, -9.88671875, -7.142578125, -4.3984375, -1.654296875, 1.08984375, 3.833984375, 6.578125, 9.322265625, 12.06640625, 14.810546875, 17.5546875, 20.298828125, 23.04296875, 25.787109375, 28.53125, 31.275390625, 34.01953125, 36.763671875, 39.5078125, 42.251953125, 44.99609375, 47.740234375, 50.484375, 53.228515625, 55.97265625, 58.716796875, 61.4609375, 64.205078125, 66.94921875, 69.693359375, 72.4375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 29.0, 36.0, 58.0, 111.0, 197.0, 379.0, 885.0, 1997.0, 5121.0, 14731.0, 46749.0, 157176.0, 199396.0, 65588.0, 19744.0, 7078.0, 2651.0, 1068.0, 579.0, 279.0, 162.0, 82.0, 54.0, 21.0, 17.0, 14.0, 7.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-595.0, -574.578125, -554.15625, -533.734375, -513.3125, -492.890625, -472.46875, -452.046875, -431.625, -411.203125, -390.78125, -370.359375, -349.9375, -329.515625, -309.09375, -288.671875, -268.25, -247.828125, -227.40625, -206.984375, -186.5625, -166.140625, -145.71875, -125.296875, -104.875, -84.453125, -64.03125, -43.609375, -23.1875, -2.765625, 17.65625, 38.078125, 58.5, 78.921875, 99.34375, 119.765625, 140.1875, 160.609375, 181.03125, 201.453125, 221.875, 242.296875, 262.71875, 283.140625, 303.5625, 323.984375, 344.40625, 364.828125, 385.25, 405.671875, 426.09375, 446.515625, 466.9375, 487.359375, 507.78125, 528.203125, 548.625, 569.046875, 589.46875, 609.890625, 630.3125, 650.734375, 671.15625, 691.578125, 712.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 6.0, 6.0, 4.0, 10.0, 11.0, 14.0, 11.0, 18.0, 16.0, 23.0, 26.0, 51.0, 46.0, 40.0, 48.0, 49.0, 37.0, 49.0, 53.0, 57.0, 54.0, 47.0, 36.0, 42.0, 42.0, 34.0, 26.0, 25.0, 17.0, 14.0, 17.0, 17.0, 10.0, 6.0, 4.0, 12.0, 6.0, 4.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.1875, -80.6728515625, -78.158203125, -75.6435546875, -73.12890625, -70.6142578125, -68.099609375, -65.5849609375, -63.0703125, -60.5556640625, -58.041015625, -55.5263671875, -53.01171875, -50.4970703125, -47.982421875, -45.4677734375, -42.953125, -40.4384765625, -37.923828125, -35.4091796875, -32.89453125, -30.3798828125, -27.865234375, -25.3505859375, -22.8359375, -20.3212890625, -17.806640625, -15.2919921875, -12.77734375, -10.2626953125, -7.748046875, -5.2333984375, -2.71875, -0.2041015625, 2.310546875, 4.8251953125, 7.33984375, 9.8544921875, 12.369140625, 14.8837890625, 17.3984375, 19.9130859375, 22.427734375, 24.9423828125, 27.45703125, 29.9716796875, 32.486328125, 35.0009765625, 37.515625, 40.0302734375, 42.544921875, 45.0595703125, 47.57421875, 50.0888671875, 52.603515625, 55.1181640625, 57.6328125, 60.1474609375, 62.662109375, 65.1767578125, 67.69140625, 70.2060546875, 72.720703125, 75.2353515625, 77.75]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 3.0, 6.0, 1.0, 5.0, 9.0, 20.0, 45.0, 53.0, 75.0, 69.0, 70.0, 32.0, 31.0, 13.0, 8.0, 6.0, 4.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-642.891845703125, -625.7798461914062, -608.6679077148438, -591.555908203125, -574.4439086914062, -557.3319091796875, -540.219970703125, -523.1079711914062, -505.9959716796875, -488.8840026855469, -471.7720031738281, -454.6600341796875, -437.54803466796875, -420.4360656738281, -403.3240966796875, -386.21209716796875, -369.1001281738281, -351.9881591796875, -334.87615966796875, -317.7641906738281, -300.6521911621094, -283.54022216796875, -266.42822265625, -249.31625366210938, -232.2042694091797, -215.09228515625, -197.9803009033203, -180.86831665039062, -163.75634765625, -146.64434814453125, -129.53237915039062, -112.42039489746094, -95.30838012695312, -78.19639587402344, -61.084415435791016, -43.972434997558594, -26.860450744628906, -9.748466491699219, 7.3635101318359375, 24.475494384765625, 41.58747863769531, 58.699462890625, 75.81144714355469, 92.92342376708984, 110.03540802001953, 127.14739227294922, 144.25936889648438, 161.37135314941406, 178.48333740234375, 195.59532165527344, 212.70730590820312, 229.81927490234375, 246.9312744140625, 264.0432434082031, 281.15521240234375, 298.2672119140625, 315.37921142578125, 332.4911804199219, 349.6031799316406, 366.71514892578125, 383.8271484375, 400.9391174316406, 418.05108642578125, 435.1630859375, 452.2750549316406]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 2.0, 0.0, 5.0, 5.0, 4.0, 4.0, 4.0, 8.0, 10.0, 20.0, 52.0, 59.0, 80.0, 79.0, 37.0, 23.0, 16.0, 16.0, 11.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-445.65655517578125, -431.13250732421875, -416.6084289550781, -402.0843811035156, -387.5603332519531, -373.0362548828125, -358.51220703125, -343.9881591796875, -329.464111328125, -314.9400634765625, -300.4159851074219, -285.8919372558594, -271.3678894042969, -256.84381103515625, -242.31976318359375, -227.79571533203125, -213.27163696289062, -198.74757385253906, -184.22352600097656, -169.699462890625, -155.1754150390625, -140.65135192871094, -126.12728881835938, -111.60323333740234, -97.07917785644531, -82.55512237548828, -68.03106689453125, -53.50700378417969, -38.982948303222656, -24.458892822265625, -9.934829711914062, 4.589225769042969, 19.11328125, 33.63733673095703, 48.16139602661133, 62.685455322265625, 77.20951080322266, 91.73356628417969, 106.25762939453125, 120.78168487548828, 135.3057403564453, 149.82980346679688, 164.35385131835938, 178.87791442871094, 193.4019775390625, 207.926025390625, 222.45008850097656, 236.97415161132812, 251.49819946289062, 266.0222473144531, 280.54632568359375, 295.07037353515625, 309.59442138671875, 324.11846923828125, 338.6425476074219, 353.1665954589844, 367.690673828125, 382.2147216796875, 396.7388000488281, 411.2628479003906, 425.7868957519531, 440.31097412109375, 454.83502197265625, 469.35906982421875, 483.88311767578125]}, "eval/loss": 0.717689573764801, "eval/wer": 0.12834192780642603, "eval/runtime": 818.6465, "eval/samples_per_second": 3.227, "eval/steps_per_second": 0.404, "train/train_runtime": 35320.0928, "train/train_samples_per_second": 20.2, "train/train_steps_per_second": 0.631, "train/total_flos": 0.0, "train/train_loss": 0.08645637407097047} \ No newline at end of file